diff --git a/build_tools/python/e2e_test_framework/models/model_groups.py b/build_tools/python/e2e_test_framework/models/model_groups.py index 8149ae47db75..75f52347e85a 100644 --- a/build_tools/python/e2e_test_framework/models/model_groups.py +++ b/build_tools/python/e2e_test_framework/models/model_groups.py @@ -41,15 +41,15 @@ # BERT-Large in various batch sizes. BERT_LARGE_TORCH_BATCHES = [ torch_models.BERT_LARGE_1X384_FP32_TORCH, - torch_models.BERT_LARGE_8X384_FP32_TORCH, torch_models.BERT_LARGE_16X384_FP32_TORCH, + torch_models.BERT_LARGE_24X384_FP32_TORCH, torch_models.BERT_LARGE_32X384_FP32_TORCH, + torch_models.BERT_LARGE_48X384_FP32_TORCH, torch_models.BERT_LARGE_64X384_FP32_TORCH, # Disabled due to https://github.com/openxla/iree/issues/12774. - #torch_models.BERT_LARGE_128X384_FP32_TORCH, - #torch_models.BERT_LARGE_256X384_FP32_TORCH, #torch_models.BERT_LARGE_512X384_FP32_TORCH, #torch_models.BERT_LARGE_1024X384_FP32_TORCH, + #torch_models.BERT_LARGE_1280X384_FP32_TORCH, ] RESNET50_TORCH_BATCHES = [ diff --git a/build_tools/python/e2e_test_framework/models/torch_models.py b/build_tools/python/e2e_test_framework/models/torch_models.py index 7c210d792dcf..f573c096f844 100644 --- a/build_tools/python/e2e_test_framework/models/torch_models.py +++ b/build_tools/python/e2e_test_framework/models/torch_models.py @@ -82,77 +82,67 @@ tags=["fp32", "transformer", "seqlen384", "batch-1"], source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_1/linalg.mlir", + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_1/linalg.mlir", entry_function="forward", input_types=["1x384xi64", "1x384xi64"]) -BERT_LARGE_8X384_FP32_TORCH = common_definitions.Model( - id=unique_ids.MODEL_BERT_LARGE_8X384_FP32_TORCH, - name="BertLargePTBatch8", - tags=["fp32", "transformer", "seqlen384", "batch-8"], - source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, - source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_8/linalg.mlir", - entry_function="forward", - input_types=["8x384xi64", "8x384xi64"]) - BERT_LARGE_16X384_FP32_TORCH = common_definitions.Model( id=unique_ids.MODEL_BERT_LARGE_16X384_FP32_TORCH, name="BertLargePTBatch16", tags=["fp32", "transformer", "seqlen384", "batch-16"], source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_16/linalg.mlir", + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_16/linalg.mlir", entry_function="forward", input_types=["16x384xi64", "16x384xi64"]) +BERT_LARGE_24X384_FP32_TORCH = common_definitions.Model( + id=unique_ids.MODEL_BERT_LARGE_24X384_FP32_TORCH, + name="BertLargePTBatch24", + tags=["fp32", "transformer", "seqlen384", "batch-24"], + source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, + source_url= + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_24/linalg.mlir", + entry_function="forward", + input_types=["24x384xi64", "24x384xi64"]) + BERT_LARGE_32X384_FP32_TORCH = common_definitions.Model( id=unique_ids.MODEL_BERT_LARGE_32X384_FP32_TORCH, name="BertLargePTBatch32", tags=["fp32", "transformer", "seqlen384", "batch-32"], source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_32/linalg.mlir", + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_32/linalg.mlir", entry_function="forward", input_types=["32x384xi64", "32x384xi64"]) +BERT_LARGE_48X384_FP32_TORCH = common_definitions.Model( + id=unique_ids.MODEL_BERT_LARGE_48X384_FP32_TORCH, + name="BertLargePTBatch48", + tags=["fp32", "transformer", "seqlen384", "batch-48"], + source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, + source_url= + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_48/linalg.mlir", + entry_function="forward", + input_types=["48x384xi64", "48x384xi64"]) + BERT_LARGE_64X384_FP32_TORCH = common_definitions.Model( id=unique_ids.MODEL_BERT_LARGE_64X384_FP32_TORCH, name="BertLargePTBatch64", tags=["fp32", "transformer", "seqlen384", "batch-64"], source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_64/linalg.mlir", + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_64/linalg.mlir", entry_function="forward", input_types=["64x384xi64", "64x384xi64"]) -BERT_LARGE_128X384_FP32_TORCH = common_definitions.Model( - id=unique_ids.MODEL_BERT_LARGE_128X384_FP32_TORCH, - name="BertLargePTBatch128", - tags=["fp32", "transformer", "seqlen384", "batch-128"], - source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, - source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_128/linalg.mlir", - entry_function="forward", - input_types=["128x384xi64", "128x384xi64"]) - -BERT_LARGE_256X384_FP32_TORCH = common_definitions.Model( - id=unique_ids.MODEL_BERT_LARGE_256X384_FP32_TORCH, - name="BertLargePTBatch256", - tags=["fp32", "transformer", "seqlen384", "batch-256"], - source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, - source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_256/linalg.mlir", - entry_function="forward", - input_types=["256x384xi64", "256x384xi64"]) - BERT_LARGE_512X384_FP32_TORCH = common_definitions.Model( id=unique_ids.MODEL_BERT_LARGE_512X384_FP32_TORCH, name="BertLargePTBatch512", tags=["fp32", "transformer", "seqlen384", "batch-512"], source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_512/linalg.mlir", + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_512/linalg.mlir", entry_function="forward", input_types=["512x384xi64", "512x384xi64"]) @@ -162,10 +152,20 @@ tags=["fp32", "transformer", "seqlen384", "batch-1024"], source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, source_url= - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_1024/linalg.mlir", + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_1024/linalg.mlir", entry_function="forward", input_types=["1024x384xi64", "1024x384xi64"]) +BERT_LARGE_1280X384_FP32_TORCH = common_definitions.Model( + id=unique_ids.MODEL_BERT_LARGE_1280X384_FP32_TORCH, + name="BertLargePTBatch1280", + tags=["fp32", "transformer", "seqlen384", "batch-1280"], + source_type=common_definitions.ModelSourceType.EXPORTED_LINALG_MLIR, + source_url= + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_1280/linalg.mlir", + entry_function="forward", + input_types=["1280x384xi64", "1280x384xi64"]) + # Converted from https://pytorch.org/vision/main/models/generated/torchvision.models.resnet50.html RESNET50_1X3X224X224_FP32_TORCH = common_definitions.Model( id=unique_ids.MODEL_RESNET50_1X3X224X224_FP32_TORCH, diff --git a/build_tools/python/e2e_test_framework/unique_ids.py b/build_tools/python/e2e_test_framework/unique_ids.py index 2dc5cce6c04d..7e015132d751 100644 --- a/build_tools/python/e2e_test_framework/unique_ids.py +++ b/build_tools/python/e2e_test_framework/unique_ids.py @@ -89,14 +89,14 @@ def hash_composite_id(keys: Sequence[str]) -> str: MODEL_EFFICIENTNET_B7_FP32_TORCH = "68caa96e-b8bb-48a2-bb08-a3044981a370" MODEL_BERT_LARGE_1X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-1" -MODEL_BERT_LARGE_8X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-8" MODEL_BERT_LARGE_16X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16" +MODEL_BERT_LARGE_24X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-24" MODEL_BERT_LARGE_32X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-32" +MODEL_BERT_LARGE_48X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-48" MODEL_BERT_LARGE_64X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-64" -MODEL_BERT_LARGE_128X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-128" -MODEL_BERT_LARGE_256X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-256" MODEL_BERT_LARGE_512X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-512" MODEL_BERT_LARGE_1024X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-1024" +MODEL_BERT_LARGE_1280X384_FP32_TORCH = "cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-1280" MODEL_RESNET50_1X3X224X224_FP32_TORCH = "fd05da43-5e37-4fa0-88f8-3ceec1682345-batch-1" MODEL_RESNET50_8X3X224X224_FP32_TORCH = "fd05da43-5e37-4fa0-88f8-3ceec1682345-batch-8" diff --git a/tests/e2e/test_artifacts/generated_e2e_test_fetch_models.cmake b/tests/e2e/test_artifacts/generated_e2e_test_fetch_models.cmake index 4b91285b051d..abf9cb7deae4 100644 --- a/tests/e2e/test_artifacts/generated_e2e_test_fetch_models.cmake +++ b/tests/e2e/test_artifacts/generated_e2e_test_fetch_models.cmake @@ -212,7 +212,7 @@ iree_fetch_artifact( NAME "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-1" SOURCE_URL - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_1/linalg.mlir" + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_1/linalg.mlir" OUTPUT "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-1_BertLargePTBatch1.mlir" UNPACK @@ -220,21 +220,21 @@ iree_fetch_artifact( iree_fetch_artifact( NAME - "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-8" + "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16" SOURCE_URL - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_8/linalg.mlir" + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_16/linalg.mlir" OUTPUT - "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-8_BertLargePTBatch8.mlir" + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16_BertLargePTBatch16.mlir" UNPACK ) iree_fetch_artifact( NAME - "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16" + "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-24" SOURCE_URL - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_16/linalg.mlir" + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_24/linalg.mlir" OUTPUT - "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16_BertLargePTBatch16.mlir" + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-24_BertLargePTBatch24.mlir" UNPACK ) @@ -242,17 +242,27 @@ iree_fetch_artifact( NAME "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-32" SOURCE_URL - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_32/linalg.mlir" + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_32/linalg.mlir" OUTPUT "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-32_BertLargePTBatch32.mlir" UNPACK ) +iree_fetch_artifact( + NAME + "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-48" + SOURCE_URL + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_48/linalg.mlir" + OUTPUT + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-48_BertLargePTBatch48.mlir" + UNPACK +) + iree_fetch_artifact( NAME "model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-64" SOURCE_URL - "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230321.784_1679461251/BERT_LARGE/batch_64/linalg.mlir" + "https://storage.googleapis.com/iree-model-artifacts/pytorch/torch_models_20230401.795_1680469670/BERT_LARGE/batch_64/linalg.mlir" OUTPUT "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-64_BertLargePTBatch64.mlir" UNPACK diff --git a/tests/e2e/test_artifacts/generated_e2e_test_iree_artifacts.cmake b/tests/e2e/test_artifacts/generated_e2e_test_iree_artifacts.cmake index a24feb8f1367..222a25ff6240 100644 --- a/tests/e2e/test_artifacts/generated_e2e_test_iree_artifacts.cmake +++ b/tests/e2e/test_artifacts/generated_e2e_test_iree_artifacts.cmake @@ -1008,33 +1008,33 @@ iree_bytecode_module( iree_bytecode_module( NAME - "iree-module-3d45f575f4e1de0a6f30bd2c0da39f6c6415e1ecd45ddbd77c94fe3672356842" + "iree-module-21a83414dc1feb2a3b5fb6afadc36c1022a0ab747380291dbb309637d5f32eab" SRC - "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-8_BertLargePTBatch8.mlir" + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16_BertLargePTBatch16.mlir" MODULE_FILE_NAME - "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch8_module_3d45f575f4e1de0a6f30bd2c0da39f6c6415e1ecd45ddbd77c94fe3672356842/module.vmfb" + "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch16_module_21a83414dc1feb2a3b5fb6afadc36c1022a0ab747380291dbb309637d5f32eab/module.vmfb" FLAGS "--iree-hal-target-backends=cuda" "--iree-input-type=none" "--iree-hal-cuda-llvm-target-arch=sm_80" FRIENDLY_NAME - "BertLargePTBatch8(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags]" + "BertLargePTBatch16(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags]" PUBLIC ) iree_bytecode_module( NAME - "iree-module-21a83414dc1feb2a3b5fb6afadc36c1022a0ab747380291dbb309637d5f32eab" + "iree-module-7d93a3e9b342045ed2546960ee3d08f60be237fd8974fe35447a41234f322148" SRC - "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16_BertLargePTBatch16.mlir" + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-24_BertLargePTBatch24.mlir" MODULE_FILE_NAME - "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch16_module_21a83414dc1feb2a3b5fb6afadc36c1022a0ab747380291dbb309637d5f32eab/module.vmfb" + "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch24_module_7d93a3e9b342045ed2546960ee3d08f60be237fd8974fe35447a41234f322148/module.vmfb" FLAGS "--iree-hal-target-backends=cuda" "--iree-input-type=none" "--iree-hal-cuda-llvm-target-arch=sm_80" FRIENDLY_NAME - "BertLargePTBatch16(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags]" + "BertLargePTBatch24(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags]" PUBLIC ) @@ -1054,6 +1054,22 @@ iree_bytecode_module( PUBLIC ) +iree_bytecode_module( + NAME + "iree-module-45ed9ca2efb9bb645316e856a5c464b76e56902e930ff1d4e54fdef38043b33f" + SRC + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-48_BertLargePTBatch48.mlir" + MODULE_FILE_NAME + "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch48_module_45ed9ca2efb9bb645316e856a5c464b76e56902e930ff1d4e54fdef38043b33f/module.vmfb" + FLAGS + "--iree-hal-target-backends=cuda" + "--iree-input-type=none" + "--iree-hal-cuda-llvm-target-arch=sm_80" + FRIENDLY_NAME + "BertLargePTBatch48(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags]" + PUBLIC +) + iree_bytecode_module( NAME "iree-module-8c26886533593b666597f8698e33c0e9c98b349bdf8ac01c3d122cc20b741def" @@ -3320,11 +3336,11 @@ iree_bytecode_module( iree_bytecode_module( NAME - "iree-module-be8bc043a1d039ecddfac6fda959b2739de49bda4478c53cf8a48baa6a9e8da3" + "iree-module-5176d0f5fa331fa047395186a866870fe4210f637472ef4bb0a3f1ba3a62a749" SRC - "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-8_BertLargePTBatch8.mlir" + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16_BertLargePTBatch16.mlir" MODULE_FILE_NAME - "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch8_module_be8bc043a1d039ecddfac6fda959b2739de49bda4478c53cf8a48baa6a9e8da3/module.vmfb" + "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch16_module_5176d0f5fa331fa047395186a866870fe4210f637472ef4bb0a3f1ba3a62a749/module.vmfb" FLAGS "--iree-hal-target-backends=cuda" "--iree-input-type=none" @@ -3332,17 +3348,17 @@ iree_bytecode_module( "--iree-vm-emit-polyglot-zip=true" "--iree-llvmcpu-debug-symbols=false" FRIENDLY_NAME - "BertLargePTBatch8(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags,compile-stats]" + "BertLargePTBatch16(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags,compile-stats]" PUBLIC ) iree_bytecode_module( NAME - "iree-module-5176d0f5fa331fa047395186a866870fe4210f637472ef4bb0a3f1ba3a62a749" + "iree-module-e67816e321544bb61b63ed8cd8b7faa8ff7d35cca15832b5fbc117f4693b3e78" SRC - "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16_BertLargePTBatch16.mlir" + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-24_BertLargePTBatch24.mlir" MODULE_FILE_NAME - "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch16_module_5176d0f5fa331fa047395186a866870fe4210f637472ef4bb0a3f1ba3a62a749/module.vmfb" + "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch24_module_e67816e321544bb61b63ed8cd8b7faa8ff7d35cca15832b5fbc117f4693b3e78/module.vmfb" FLAGS "--iree-hal-target-backends=cuda" "--iree-input-type=none" @@ -3350,7 +3366,7 @@ iree_bytecode_module( "--iree-vm-emit-polyglot-zip=true" "--iree-llvmcpu-debug-symbols=false" FRIENDLY_NAME - "BertLargePTBatch16(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags,compile-stats]" + "BertLargePTBatch24(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags,compile-stats]" PUBLIC ) @@ -3372,6 +3388,24 @@ iree_bytecode_module( PUBLIC ) +iree_bytecode_module( + NAME + "iree-module-439dab16cd6df449fc83eb3e1603fa86ad811e749bcad2c3e3176976c56848e5" + SRC + "${ROOT_ARTIFACTS_DIR}/model_cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-48_BertLargePTBatch48.mlir" + MODULE_FILE_NAME + "${ROOT_ARTIFACTS_DIR}/iree_BertLargePTBatch48_module_439dab16cd6df449fc83eb3e1603fa86ad811e749bcad2c3e3176976c56848e5/module.vmfb" + FLAGS + "--iree-hal-target-backends=cuda" + "--iree-input-type=none" + "--iree-hal-cuda-llvm-target-arch=sm_80" + "--iree-vm-emit-polyglot-zip=true" + "--iree-llvmcpu-debug-symbols=false" + FRIENDLY_NAME + "BertLargePTBatch48(linalg) [cuda-sm_80-linux_gnu-cuda][default-flags,compile-stats]" + PUBLIC +) + iree_bytecode_module( NAME "iree-module-815e44d1ac31402e86d0fef72e79474a25dfad3a5c15b8cdd3642e101274342d" @@ -4912,9 +4946,10 @@ add_dependencies(iree-benchmark-import-models ${PACKAGE_NAME}_model-340553d1-e6fe-41b6-b2c7-687c74ccec56 ${PACKAGE_NAME}_model-68caa96e-b8bb-48a2-bb08-a3044981a370 ${PACKAGE_NAME}_model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-1 - ${PACKAGE_NAME}_model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-8 ${PACKAGE_NAME}_model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-16 + ${PACKAGE_NAME}_model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-24 ${PACKAGE_NAME}_model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-32 + ${PACKAGE_NAME}_model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-48 ${PACKAGE_NAME}_model-cbc5e400-7c93-4844-aca8-bce8f1bf9948-batch-64 ${PACKAGE_NAME}_model-fd05da43-5e37-4fa0-88f8-3ceec1682345-batch-1 ${PACKAGE_NAME}_model-fd05da43-5e37-4fa0-88f8-3ceec1682345-batch-8 @@ -4967,9 +5002,10 @@ add_dependencies(iree-benchmark-suites ${PACKAGE_NAME}_iree-module-c8ec2db5ee884e0af17814e61b13d7f7f1f2d4f7028e8c1920d0d968c27de2bb ${PACKAGE_NAME}_iree-module-9470c46965ea67794da45496454c82eade29b5a519d8037b1314738621e02260 ${PACKAGE_NAME}_iree-module-154de838dc7742304c9e27a9f315645a915493bc4f84160e29b15b7fc6dc475e - ${PACKAGE_NAME}_iree-module-3d45f575f4e1de0a6f30bd2c0da39f6c6415e1ecd45ddbd77c94fe3672356842 ${PACKAGE_NAME}_iree-module-21a83414dc1feb2a3b5fb6afadc36c1022a0ab747380291dbb309637d5f32eab + ${PACKAGE_NAME}_iree-module-7d93a3e9b342045ed2546960ee3d08f60be237fd8974fe35447a41234f322148 ${PACKAGE_NAME}_iree-module-995595b7b80370d9c484413e9d06c2de928db32777101c91d3bac0d3797058ec + ${PACKAGE_NAME}_iree-module-45ed9ca2efb9bb645316e856a5c464b76e56902e930ff1d4e54fdef38043b33f ${PACKAGE_NAME}_iree-module-8c26886533593b666597f8698e33c0e9c98b349bdf8ac01c3d122cc20b741def ${PACKAGE_NAME}_iree-module-222490941c581c67f5ce710e9ea141482cd8074294a43a5dc67a01a127037cd4 ${PACKAGE_NAME}_iree-module-39556c12d84502be71243197b99b0f8c22949093c561c55c01ca906812a86288 @@ -5097,9 +5133,10 @@ add_dependencies(iree-e2e-compile-stats-suites ${PACKAGE_NAME}_iree-module-925cdb19f2aa31a1907c81b5a9e179d91280c77b08a039c1cbf146f71683dde9 ${PACKAGE_NAME}_iree-module-3c94ab45ad76bd8b2083729b65340b987da3247c854faf7d06431cb05a3b0a23 ${PACKAGE_NAME}_iree-module-999f2edcdf9fbc84e0969923f8605e9069810a63849973a5b74488f83d14a2fe - ${PACKAGE_NAME}_iree-module-be8bc043a1d039ecddfac6fda959b2739de49bda4478c53cf8a48baa6a9e8da3 ${PACKAGE_NAME}_iree-module-5176d0f5fa331fa047395186a866870fe4210f637472ef4bb0a3f1ba3a62a749 + ${PACKAGE_NAME}_iree-module-e67816e321544bb61b63ed8cd8b7faa8ff7d35cca15832b5fbc117f4693b3e78 ${PACKAGE_NAME}_iree-module-d746ecf3d747f18306b6dea4cb6b9e9dbf987fe7fd4d0b27b39a57a213e75dd9 + ${PACKAGE_NAME}_iree-module-439dab16cd6df449fc83eb3e1603fa86ad811e749bcad2c3e3176976c56848e5 ${PACKAGE_NAME}_iree-module-815e44d1ac31402e86d0fef72e79474a25dfad3a5c15b8cdd3642e101274342d ${PACKAGE_NAME}_iree-module-681f456f27dbb79e7d8d0266bf835866d9f29f87eafad7e867ac13c84602742f ${PACKAGE_NAME}_iree-module-3b0ae1403ef444d812f0c7b37fda7311e2cc4ea407850ee7b91e6984b9c86100