From 6dd9c7693e7b3b7719901641969aa6359258f922 Mon Sep 17 00:00:00 2001
From: Luke Hutton <luke.hutton@arm.com>
Date: Thu, 10 Mar 2022 06:29:57 +0000
Subject: [PATCH] [AOT] Use python temporary directory for AOT tests (#10518)

* [AOT] Use python temporary directory for AOT tests

Use Python's `tempfile.TemporaryDirectory` as a context manager in an
effort to fix the flaky FVP tests reported in
https://github.com/apache/tvm/issues/10300 and
https://github.com/apache/tvm/issues/10314. Now that CI is becoming
increasingly parallelized, the thinking is that Python's temporary
directory implementation might be more stable than `utils.tempdir`.
This removes the xfail markers from the affected tests, but keeps the
workaround implemented in https://github.com/apache/tvm/pull/10408
in place while we monitor the effect of the above change.

Change-Id: Id07869b51cd2278ec4885ef964bc1b23892ba235

* alter context manager usage to make it more readable

Change-Id: Iba0644db14e50648f6dc99a4ed0f455641c31912
---
 .../contrib/test_ethosu/test_codegen.py       |   6 -
 .../contrib/test_ethosu/test_lookup_table.py  |   1 -
 tests/python/relay/aot/aot_test_utils.py      | 240 +++++++++---------
 3 files changed, 122 insertions(+), 125 deletions(-)

diff --git a/tests/python/contrib/test_ethosu/test_codegen.py b/tests/python/contrib/test_ethosu/test_codegen.py
index 105f907e2209a..7ff7295fb0de1 100644
--- a/tests/python/contrib/test_ethosu/test_codegen.py
+++ b/tests/python/contrib/test_ethosu/test_codegen.py
@@ -965,7 +965,6 @@ def concat_func(*inputs):
     _compare_tvm_with_tflite(concat_func, shapes, accel_type, output_tolerance=1)
 
 
-@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300")
 @pytest.mark.parametrize("accel_type", ACCEL_TYPES)
 def test_tflite_sigmoid(accel_type):
     ifm_shape = [1, 135, 41, 6]
@@ -1030,7 +1029,6 @@ def create_model():
     _compare_ethosu_with_reference(ethosu_mod, input_data, output_data, accel_type)
 
 
-@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300")
 @pytest.mark.parametrize("accel_type", ACCEL_TYPES)
 @pytest.mark.parametrize("ifm_shape,axis", [((2,), 0), ((1, 3, 3), 2)])
 def test_tflite_expand_dims(accel_type, ifm_shape, axis):
@@ -1070,7 +1068,6 @@ def resize_model(x):
     _compare_tvm_with_tflite(resize_model, [ifm_shape], accel_type)
 
 
-@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300")
 @pytest.mark.parametrize("accel_type", ACCEL_TYPES)
 @pytest.mark.parametrize(
     "ifm_shape,size,align_corners",
@@ -1095,7 +1092,6 @@ def resize_model(x):
     _compare_tvm_with_tflite(resize_model, [ifm_shape], accel_type, output_tolerance=1)
 
 
-@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300")
 @pytest.mark.parametrize("accel_type", ACCEL_TYPES)
 @pytest.mark.parametrize(
     "ifm_shape,ofm_shape,kernel_shape,padding",
@@ -1135,7 +1131,6 @@ def conv2d_transpose(x):
     _compare_tvm_with_tflite(conv2d_transpose, [ifm_shape], accel_type=accel_type)
 
 
-@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300")
 @pytest.mark.parametrize("accel_type", ACCEL_TYPES)
 @pytest.mark.parametrize(
     "ifm_shapes,axis",
@@ -1170,7 +1165,6 @@ def unpack_func(x):
     _compare_tvm_with_tflite(unpack_func, [ifm_shape], accel_type)
 
 
-@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300")
 @pytest.mark.parametrize("accel_type", ACCEL_TYPES)
 @pytest.mark.parametrize("ifm_shape", [(1, 15, 15, 3), (1, 8, 9, 1)])
 @pytest.mark.parametrize("alpha", [0.2, 0.634])
diff --git a/tests/python/contrib/test_ethosu/test_lookup_table.py b/tests/python/contrib/test_ethosu/test_lookup_table.py
index 31ed56ae29984..ae9d4ee27c721 100644
--- a/tests/python/contrib/test_ethosu/test_lookup_table.py
+++ b/tests/python/contrib/test_ethosu/test_lookup_table.py
@@ -33,7 +33,6 @@
 ACCEL_TYPES = ["ethos-u55-256", "ethos-u55-128", "ethos-u55-64", "ethos-u55-32"]
 
 
-@pytest.mark.xfail(strict=False, reason="See https://github.com/apache/tvm/issues/10300")
 @pytest.mark.parametrize("accel_type", ACCEL_TYPES)
 def test_tflite_lut_activations(accel_type):
 
diff --git a/tests/python/relay/aot/aot_test_utils.py b/tests/python/relay/aot/aot_test_utils.py
index 9a62e2ee3f303..e8b1efa262e87 100644
--- a/tests/python/relay/aot/aot_test_utils.py
+++ b/tests/python/relay/aot/aot_test_utils.py
@@ -27,6 +27,7 @@
 import shutil
 import subprocess
 import tarfile
+import tempfile
 from typing import Any, NamedTuple, Union, Optional, List, Dict
 
 import pytest
@@ -732,129 +733,132 @@ def run_and_check(
     to run in the test runner to verify the results.
     """
 
-    base_path = test_dir
-    if test_dir is None:
-        tmp_path = utils.tempdir()
-        tmp_dir = tmp_path.temp_dir
-        base_path = os.path.join(tmp_dir, "test")
-
-    cflags = f"-DTVM_RUNTIME_ALLOC_ALIGNMENT_BYTES={workspace_byte_alignment} "
-    # The calculated workspaces will not account for stack allocator tags used for debugging
-    if debug_calculated_workspaces:
-        cflags += "-DTVM_CRT_STACK_ALLOCATOR_ENABLE_LIFO_CHECK "
-
-    base_path = os.path.abspath(base_path)
-    build_path = os.path.join(base_path, "build")
-    os.makedirs(build_path, exist_ok=True)
-
-    include_path = os.path.join(base_path, "include")
-    os.mkdir(include_path)
-    crt_root = tvm.micro.get_standalone_crt_dir()
-    shutil.copy2(
-        os.path.join(crt_root, "template", "crt_config-template.h"),
-        os.path.join(include_path, "crt_config.h"),
-    )
+    def run_and_check_body(base_path):
+        cflags = f"-DTVM_RUNTIME_ALLOC_ALIGNMENT_BYTES={workspace_byte_alignment} "
+        # The calculated workspaces will not account for stack allocator tags used for debugging
+        if debug_calculated_workspaces:
+            cflags += "-DTVM_CRT_STACK_ALLOCATOR_ENABLE_LIFO_CHECK "
+
+        base_path = os.path.abspath(base_path)
+        build_path = os.path.join(base_path, "build")
+        os.makedirs(build_path, exist_ok=True)
+
+        include_path = os.path.join(base_path, "include")
+        os.mkdir(include_path)
+        crt_root = tvm.micro.get_standalone_crt_dir()
+        shutil.copy2(
+            os.path.join(crt_root, "template", "crt_config-template.h"),
+            os.path.join(include_path, "crt_config.h"),
+        )
 
-    workspace_bytes = 0
-    for compiled_model in models:
-        model = compiled_model.model
-        tar_file = os.path.join(base_path, f"{model.name}.tar")
-        export_model_library_format(compiled_model.executor_factory, tar_file)
-        t = tarfile.open(tar_file)
-        t.extractall(base_path)
-
-        # Interface C APIs does not need compiler generated
-        # workspace to generate the test application, because
-        # workspace size is codegen'd as a macro to
-        # tvmgen_<model_name>.h.
-        if interface_api != "c":
-            workspace_bytes += mlf_extract_workspace_size_bytes(tar_file)
-
-        workspace_bytes += model.extra_memory_in_bytes
-        for key in model.inputs:
-            sanitized_tensor_name = re.sub(r"\W", "_", key)
-            create_header_file(
-                f'{mangle_name(model.name, "input_data")}_{sanitized_tensor_name}',
-                model.inputs[key],
-                include_path,
-                data_linkage,
-            )
-
-        for key in model.outputs:
-            sanitized_tensor_name = re.sub(r"\W", "_", key)
-            create_header_file(
-                f'{mangle_name(model.name, "output_data")}_{sanitized_tensor_name}',
-                np.zeros(model.outputs[key].shape, model.outputs[key].dtype),
-                include_path,
-                data_linkage,
-            )
-            create_header_file(
-                f'{mangle_name(model.name, "expected_output_data")}_{sanitized_tensor_name}',
-                model.outputs[key],
-                include_path,
-                data_linkage,
-            )
-
-    use_usmp = runner.pass_config.get("tir.usmp.enable", False)
-    # We only need the stack allocator if USMP is not used
-    use_stack_allocator = not use_usmp
-
-    create_main(
-        "test.c",
-        models,
-        build_path,
-        runner.includes,
-        runner.prologue,
-        runner.epilogue,
-        data_linkage,
-        interface_api,
-        workspace_bytes,
-        use_stack_allocator,
-    )
+        workspace_bytes = 0
+        for compiled_model in models:
+            model = compiled_model.model
+            tar_file = os.path.join(base_path, f"{model.name}.tar")
+            export_model_library_format(compiled_model.executor_factory, tar_file)
+            t = tarfile.open(tar_file)
+            t.extractall(base_path)
+
+            # Interface C APIs does not need compiler generated
+            # workspace to generate the test application, because
+            # workspace size is codegen'd as a macro to
+            # tvmgen_<model_name>.h.
+            if interface_api != "c":
+                workspace_bytes += mlf_extract_workspace_size_bytes(tar_file)
+
+            workspace_bytes += model.extra_memory_in_bytes
+            for key in model.inputs:
+                sanitized_tensor_name = re.sub(r"\W", "_", key)
+                create_header_file(
+                    f'{mangle_name(model.name, "input_data")}_{sanitized_tensor_name}',
+                    model.inputs[key],
+                    include_path,
+                    data_linkage,
+                )
 
-    # Verify that compiles fine
-    file_dir = os.path.dirname(os.path.abspath(__file__))
-    codegen_path = os.path.join(base_path, "codegen")
-    makefile = os.path.join(file_dir, f"{runner.makefile}.mk")
-    fvp_dir = "/opt/arm/FVP_Corstone_SSE-300/models/Linux64_GCC-6.4/"
-    # TODO(@grant-arm): Remove once ci_cpu docker image has been updated to FVP_Corstone_SSE
-    if not os.path.isdir(fvp_dir):
-        fvp_dir = "/opt/arm/FVP_Corstone_SSE-300_Ethos-U55/models/Linux64_GCC-6.4/"
-    custom_params = " ".join([f" {param}='{value}'" for param, value in runner.parameters.items()])
-    make_command = (
-        f"make -f {makefile} build_dir={build_path}"
-        + f" CFLAGS='{cflags}'"
-        + f" TVM_ROOT={file_dir}/../../../.."
-        + f" AOT_TEST_ROOT={file_dir}"
-        + f" CODEGEN_ROOT={codegen_path}"
-        + f" STANDALONE_CRT_DIR={tvm.micro.get_standalone_crt_dir()}"
-        + f" FVP_DIR={fvp_dir}"
-        + custom_params
-    )
+            for key in model.outputs:
+                sanitized_tensor_name = re.sub(r"\W", "_", key)
+                create_header_file(
+                    f'{mangle_name(model.name, "output_data")}_{sanitized_tensor_name}',
+                    np.zeros(model.outputs[key].shape, model.outputs[key].dtype),
+                    include_path,
+                    data_linkage,
+                )
+                create_header_file(
+                    f'{mangle_name(model.name, "expected_output_data")}_{sanitized_tensor_name}',
+                    model.outputs[key],
+                    include_path,
+                    data_linkage,
+                )
+
+        use_usmp = runner.pass_config.get("tir.usmp.enable", False)
+        # We only need the stack allocator if USMP is not used
+        use_stack_allocator = not use_usmp
+
+        create_main(
+            "test.c",
+            models,
+            build_path,
+            runner.includes,
+            runner.prologue,
+            runner.epilogue,
+            data_linkage,
+            interface_api,
+            workspace_bytes,
+            use_stack_allocator,
+        )
 
-    compile_log_path = os.path.join(build_path, "test_compile.log")
-    compile_command = f"{make_command} aot_test_runner"
-    if verbose:
-        print("Compile command:\n", compile_command)
-    subprocess_check_log_output(compile_command, ".", compile_log_path)
+        # Verify that compiles fine
+        file_dir = os.path.dirname(os.path.abspath(__file__))
+        codegen_path = os.path.join(base_path, "codegen")
+        makefile = os.path.join(file_dir, f"{runner.makefile}.mk")
+        fvp_dir = "/opt/arm/FVP_Corstone_SSE-300/models/Linux64_GCC-6.4/"
+        # TODO(@grant-arm): Remove once ci_cpu docker image has been updated to FVP_Corstone_SSE
+        if not os.path.isdir(fvp_dir):
+            fvp_dir = "/opt/arm/FVP_Corstone_SSE-300_Ethos-U55/models/Linux64_GCC-6.4/"
+        custom_params = " ".join(
+            [f" {param}='{value}'" for param, value in runner.parameters.items()]
+        )
+        make_command = (
+            f"make -f {makefile} build_dir={build_path}"
+            + f" CFLAGS='{cflags}'"
+            + f" TVM_ROOT={file_dir}/../../../.."
+            + f" AOT_TEST_ROOT={file_dir}"
+            + f" CODEGEN_ROOT={codegen_path}"
+            + f" STANDALONE_CRT_DIR={tvm.micro.get_standalone_crt_dir()}"
+            + f" FVP_DIR={fvp_dir}"
+            + custom_params
+        )
 
-    # Verify that runs fine
-    run_log_path = os.path.join(build_path, "test_run.log")
-    run_command = f"{make_command} run"
-    if verbose:
-        print("Run command:\n", run_command)
+        compile_log_path = os.path.join(build_path, "test_compile.log")
+        compile_command = f"{make_command} aot_test_runner"
+        if verbose:
+            print("Compile command:\n", compile_command)
+        subprocess_check_log_output(compile_command, ".", compile_log_path)
+
+        # Verify that runs fine
+        run_log_path = os.path.join(build_path, "test_run.log")
+        run_command = f"{make_command} run"
+        if verbose:
+            print("Run command:\n", run_command)
+
+        # TODO(lhutton1) This is a quick and dirty work around to help temporarily reduce
+        # the flakyness of the tests. Will remove once #10300 and #10314 are resolved.
+        try:
+            subprocess_check_log_output(run_command, build_path, run_log_path)
+        except RuntimeError as err:
+            print("Failed to run the module, having a second attempt...", file=sys.stderr)
+            print(err, file=sys.stderr)
+            subprocess_check_log_output(run_command, build_path, run_log_path)
+
+        with open(run_log_path) as run_log:
+            assert AOT_SUCCESS_TOKEN in run_log.read()
 
-    # TODO(lhutton1) This is a quick and dirty work around to help temporarily reduce
-    # the flakyness of the tests. Will remove once #10300 and #10314 are resolved.
-    try:
-        subprocess_check_log_output(run_command, build_path, run_log_path)
-    except RuntimeError as err:
-        print("Failed to run the module, having a second attempt...", file=sys.stderr)
-        print(err, file=sys.stderr)
-        subprocess_check_log_output(run_command, build_path, run_log_path)
-
-    with open(run_log_path) as run_log:
-        assert AOT_SUCCESS_TOKEN in run_log.read()
+    if test_dir is None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            run_and_check_body(os.path.join(tmpdir, "test"))
+    else:
+        run_and_check_body(test_dir)
 
 
 def compile_and_run(