From e12d6ba7862ff7f2b71771ff3559197b39e3029e Mon Sep 17 00:00:00 2001 From: Luke Hutton Date: Mon, 7 Mar 2022 15:27:21 +0000 Subject: [PATCH] [AOT] Use python temporary directory for AOT tests Uses a python temporary directory with a context manager in an effort to solve the flaky FVP tests raised in https://github.com/apache/tvm/issues/10300 and https://github.com/apache/tvm/issues/10314. Now that CI is becoming more and more parallelized, the thinking is that the python temporary directory implementation might be more stable than `utils.tempdir`. Removing the XFail markings off the affected tests, but keeping the work around implemented in https://github.com/apache/tvm/pull/10408 while we monitor with the above change. Change-Id: Id07869b51cd2278ec4885ef964bc1b23892ba235 --- .../contrib/test_ethosu/test_codegen.py | 6 - .../contrib/test_ethosu/test_lookup_table.py | 1 - tests/python/relay/aot/aot_test_utils.py | 239 +++++++++--------- 3 files changed, 120 insertions(+), 126 deletions(-) diff --git a/tests/python/contrib/test_ethosu/test_codegen.py b/tests/python/contrib/test_ethosu/test_codegen.py index 0413cbf08ec85..20f19af137e59 100644 --- a/tests/python/contrib/test_ethosu/test_codegen.py +++ b/tests/python/contrib/test_ethosu/test_codegen.py @@ -952,7 +952,6 @@ def concat_func(*inputs): _compare_tvm_with_tflite(concat_func, shapes, accel_type, output_tolerance=1) -@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300") @pytest.mark.parametrize("accel_type", ACCEL_TYPES) def test_tflite_sigmoid(accel_type): ifm_shape = [1, 135, 41, 6] @@ -1017,7 +1016,6 @@ def create_model(): _compare_ethosu_with_reference(ethosu_mod, input_data, output_data, accel_type) -@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300") @pytest.mark.parametrize("accel_type", ACCEL_TYPES) @pytest.mark.parametrize("ifm_shape,axis", [((2,), 0), ((1, 3, 3), 2)]) def test_tflite_expand_dims(accel_type, ifm_shape, axis): @@ -1057,7 +1055,6 @@ def resize_model(x): _compare_tvm_with_tflite(resize_model, [ifm_shape], accel_type) -@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300") @pytest.mark.parametrize("accel_type", ACCEL_TYPES) @pytest.mark.parametrize( "ifm_shape,size,align_corners", @@ -1082,7 +1079,6 @@ def resize_model(x): _compare_tvm_with_tflite(resize_model, [ifm_shape], accel_type, output_tolerance=1) -@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300") @pytest.mark.parametrize("accel_type", ACCEL_TYPES) @pytest.mark.parametrize( "ifm_shape,ofm_shape,kernel_shape,padding", @@ -1122,7 +1118,6 @@ def conv2d_transpose(x): _compare_tvm_with_tflite(conv2d_transpose, [ifm_shape], accel_type=accel_type) -@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300") @pytest.mark.parametrize("accel_type", ACCEL_TYPES) @pytest.mark.parametrize( "ifm_shapes,axis", @@ -1157,7 +1152,6 @@ def unpack_func(x): _compare_tvm_with_tflite(unpack_func, [ifm_shape], accel_type) -@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300") @pytest.mark.parametrize("accel_type", ACCEL_TYPES) @pytest.mark.parametrize("ifm_shape", [(1, 15, 15, 3), (1, 8, 9, 1)]) @pytest.mark.parametrize("alpha", [0.2, 0.634]) diff --git a/tests/python/contrib/test_ethosu/test_lookup_table.py b/tests/python/contrib/test_ethosu/test_lookup_table.py index 31ed56ae29984..ae9d4ee27c721 100644 --- a/tests/python/contrib/test_ethosu/test_lookup_table.py +++ b/tests/python/contrib/test_ethosu/test_lookup_table.py @@ -33,7 +33,6 @@ ACCEL_TYPES = ["ethos-u55-256", "ethos-u55-128", "ethos-u55-64", "ethos-u55-32"] -@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300") @pytest.mark.parametrize("accel_type", ACCEL_TYPES) def test_tflite_lut_activations(accel_type): diff --git a/tests/python/relay/aot/aot_test_utils.py b/tests/python/relay/aot/aot_test_utils.py index 9a62e2ee3f303..2c3675bee7594 100644 --- a/tests/python/relay/aot/aot_test_utils.py +++ b/tests/python/relay/aot/aot_test_utils.py @@ -27,6 +27,8 @@ import shutil import subprocess import tarfile +import tempfile +import contextlib from typing import Any, NamedTuple, Union, Optional, List, Dict import pytest @@ -731,130 +733,129 @@ def run_and_check( This method uses the original test data and compiled runtime.Modules to run in the test runner to verify the results. """ + tmpdir = tempfile.TemporaryDirectory() if test_dir is None else contextlib.surpress() + with tmpdir: + base_path = os.path.join(tmpdir.name, "test") if test_dir is None else test_dir + + cflags = f"-DTVM_RUNTIME_ALLOC_ALIGNMENT_BYTES={workspace_byte_alignment} " + # The calculated workspaces will not account for stack allocator tags used for debugging + if debug_calculated_workspaces: + cflags += "-DTVM_CRT_STACK_ALLOCATOR_ENABLE_LIFO_CHECK " + + base_path = os.path.abspath(base_path) + build_path = os.path.join(base_path, "build") + os.makedirs(build_path, exist_ok=True) + + include_path = os.path.join(base_path, "include") + os.mkdir(include_path) + crt_root = tvm.micro.get_standalone_crt_dir() + shutil.copy2( + os.path.join(crt_root, "template", "crt_config-template.h"), + os.path.join(include_path, "crt_config.h"), + ) - base_path = test_dir - if test_dir is None: - tmp_path = utils.tempdir() - tmp_dir = tmp_path.temp_dir - base_path = os.path.join(tmp_dir, "test") - - cflags = f"-DTVM_RUNTIME_ALLOC_ALIGNMENT_BYTES={workspace_byte_alignment} " - # The calculated workspaces will not account for stack allocator tags used for debugging - if debug_calculated_workspaces: - cflags += "-DTVM_CRT_STACK_ALLOCATOR_ENABLE_LIFO_CHECK " - - base_path = os.path.abspath(base_path) - build_path = os.path.join(base_path, "build") - os.makedirs(build_path, exist_ok=True) - - include_path = os.path.join(base_path, "include") - os.mkdir(include_path) - crt_root = tvm.micro.get_standalone_crt_dir() - shutil.copy2( - os.path.join(crt_root, "template", "crt_config-template.h"), - os.path.join(include_path, "crt_config.h"), - ) - - workspace_bytes = 0 - for compiled_model in models: - model = compiled_model.model - tar_file = os.path.join(base_path, f"{model.name}.tar") - export_model_library_format(compiled_model.executor_factory, tar_file) - t = tarfile.open(tar_file) - t.extractall(base_path) - - # Interface C APIs does not need compiler generated - # workspace to generate the test application, because - # workspace size is codegen'd as a macro to - # tvmgen_.h. - if interface_api != "c": - workspace_bytes += mlf_extract_workspace_size_bytes(tar_file) - - workspace_bytes += model.extra_memory_in_bytes - for key in model.inputs: - sanitized_tensor_name = re.sub(r"\W", "_", key) - create_header_file( - f'{mangle_name(model.name, "input_data")}_{sanitized_tensor_name}', - model.inputs[key], - include_path, - data_linkage, - ) - - for key in model.outputs: - sanitized_tensor_name = re.sub(r"\W", "_", key) - create_header_file( - f'{mangle_name(model.name, "output_data")}_{sanitized_tensor_name}', - np.zeros(model.outputs[key].shape, model.outputs[key].dtype), - include_path, - data_linkage, - ) - create_header_file( - f'{mangle_name(model.name, "expected_output_data")}_{sanitized_tensor_name}', - model.outputs[key], - include_path, - data_linkage, - ) - - use_usmp = runner.pass_config.get("tir.usmp.enable", False) - # We only need the stack allocator if USMP is not used - use_stack_allocator = not use_usmp - - create_main( - "test.c", - models, - build_path, - runner.includes, - runner.prologue, - runner.epilogue, - data_linkage, - interface_api, - workspace_bytes, - use_stack_allocator, - ) + workspace_bytes = 0 + for compiled_model in models: + model = compiled_model.model + tar_file = os.path.join(base_path, f"{model.name}.tar") + export_model_library_format(compiled_model.executor_factory, tar_file) + t = tarfile.open(tar_file) + t.extractall(base_path) + + # Interface C APIs does not need compiler generated + # workspace to generate the test application, because + # workspace size is codegen'd as a macro to + # tvmgen_.h. + if interface_api != "c": + workspace_bytes += mlf_extract_workspace_size_bytes(tar_file) + + workspace_bytes += model.extra_memory_in_bytes + for key in model.inputs: + sanitized_tensor_name = re.sub(r"\W", "_", key) + create_header_file( + f'{mangle_name(model.name, "input_data")}_{sanitized_tensor_name}', + model.inputs[key], + include_path, + data_linkage, + ) - # Verify that compiles fine - file_dir = os.path.dirname(os.path.abspath(__file__)) - codegen_path = os.path.join(base_path, "codegen") - makefile = os.path.join(file_dir, f"{runner.makefile}.mk") - fvp_dir = "/opt/arm/FVP_Corstone_SSE-300/models/Linux64_GCC-6.4/" - # TODO(@grant-arm): Remove once ci_cpu docker image has been updated to FVP_Corstone_SSE - if not os.path.isdir(fvp_dir): - fvp_dir = "/opt/arm/FVP_Corstone_SSE-300_Ethos-U55/models/Linux64_GCC-6.4/" - custom_params = " ".join([f" {param}='{value}'" for param, value in runner.parameters.items()]) - make_command = ( - f"make -f {makefile} build_dir={build_path}" - + f" CFLAGS='{cflags}'" - + f" TVM_ROOT={file_dir}/../../../.." - + f" AOT_TEST_ROOT={file_dir}" - + f" CODEGEN_ROOT={codegen_path}" - + f" STANDALONE_CRT_DIR={tvm.micro.get_standalone_crt_dir()}" - + f" FVP_DIR={fvp_dir}" - + custom_params - ) + for key in model.outputs: + sanitized_tensor_name = re.sub(r"\W", "_", key) + create_header_file( + f'{mangle_name(model.name, "output_data")}_{sanitized_tensor_name}', + np.zeros(model.outputs[key].shape, model.outputs[key].dtype), + include_path, + data_linkage, + ) + create_header_file( + f'{mangle_name(model.name, "expected_output_data")}_{sanitized_tensor_name}', + model.outputs[key], + include_path, + data_linkage, + ) - compile_log_path = os.path.join(build_path, "test_compile.log") - compile_command = f"{make_command} aot_test_runner" - if verbose: - print("Compile command:\n", compile_command) - subprocess_check_log_output(compile_command, ".", compile_log_path) + use_usmp = runner.pass_config.get("tir.usmp.enable", False) + # We only need the stack allocator if USMP is not used + use_stack_allocator = not use_usmp + + create_main( + "test.c", + models, + build_path, + runner.includes, + runner.prologue, + runner.epilogue, + data_linkage, + interface_api, + workspace_bytes, + use_stack_allocator, + ) - # Verify that runs fine - run_log_path = os.path.join(build_path, "test_run.log") - run_command = f"{make_command} run" - if verbose: - print("Run command:\n", run_command) + # Verify that compiles fine + file_dir = os.path.dirname(os.path.abspath(__file__)) + codegen_path = os.path.join(base_path, "codegen") + makefile = os.path.join(file_dir, f"{runner.makefile}.mk") + fvp_dir = "/opt/arm/FVP_Corstone_SSE-300/models/Linux64_GCC-6.4/" + # TODO(@grant-arm): Remove once ci_cpu docker image has been updated to FVP_Corstone_SSE + if not os.path.isdir(fvp_dir): + fvp_dir = "/opt/arm/FVP_Corstone_SSE-300_Ethos-U55/models/Linux64_GCC-6.4/" + custom_params = " ".join( + [f" {param}='{value}'" for param, value in runner.parameters.items()] + ) + make_command = ( + f"make -f {makefile} build_dir={build_path}" + + f" CFLAGS='{cflags}'" + + f" TVM_ROOT={file_dir}/../../../.." + + f" AOT_TEST_ROOT={file_dir}" + + f" CODEGEN_ROOT={codegen_path}" + + f" STANDALONE_CRT_DIR={tvm.micro.get_standalone_crt_dir()}" + + f" FVP_DIR={fvp_dir}" + + custom_params + ) - # TODO(lhutton1) This is a quick and dirty work around to help temporarily reduce - # the flakyness of the tests. Will remove once #10300 and #10314 are resolved. - try: - subprocess_check_log_output(run_command, build_path, run_log_path) - except RuntimeError as err: - print("Failed to run the module, having a second attempt...", file=sys.stderr) - print(err, file=sys.stderr) - subprocess_check_log_output(run_command, build_path, run_log_path) - - with open(run_log_path) as run_log: - assert AOT_SUCCESS_TOKEN in run_log.read() + compile_log_path = os.path.join(build_path, "test_compile.log") + compile_command = f"{make_command} aot_test_runner" + if verbose: + print("Compile command:\n", compile_command) + subprocess_check_log_output(compile_command, ".", compile_log_path) + + # Verify that runs fine + run_log_path = os.path.join(build_path, "test_run.log") + run_command = f"{make_command} run" + if verbose: + print("Run command:\n", run_command) + + # TODO(lhutton1) This is a quick and dirty work around to help temporarily reduce + # the flakyness of the tests. Will remove once #10300 and #10314 are resolved. + try: + subprocess_check_log_output(run_command, build_path, run_log_path) + except RuntimeError as err: + print("Failed to run the module, having a second attempt...", file=sys.stderr) + print(err, file=sys.stderr) + subprocess_check_log_output(run_command, build_path, run_log_path) + + with open(run_log_path) as run_log: + assert AOT_SUCCESS_TOKEN in run_log.read() def compile_and_run(