forked from iree-org/iree
-
Notifications
You must be signed in to change notification settings - Fork 11
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Enable MI300 CI testing. (iree-org#17842)
This commit enables MI300 GPU and model testing.

ci-exactly: build_all, test_amd_mi300, build_packages, regression_test

---------

Signed-off-by: saienduri <saimanas.enduri@amd.com>
Co-authored-by: Scott Todd <scott.todd0@gmail.com>
- Loading branch information
Showing
7 changed files
with
243 additions
and
3 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
28 changes: 28 additions & 0 deletions
28
build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx942.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,28 @@ | ||
{ | ||
"config_name": "gpu_rocm", | ||
"iree_compile_flags": [ | ||
"--iree-hal-target-backends=rocm", | ||
"--iree-rocm-target-chip=gfx942", | ||
"--iree-input-demote-f64-to-f32" | ||
], | ||
"iree_run_module_flags": [ | ||
"--device=hip" | ||
], | ||
"skip_compile_tests": [ | ||
"pytorch/models/sdxl-scheduled-unet-3-tank", | ||
"pytorch/models/sdxl-prompt-encoder-tank", | ||
"pytorch/models/sdxl-vae-decode-tank" | ||
], | ||
"skip_run_tests": [], | ||
"expected_compile_failures": [ | ||
// TODO(#17344): need to regenerate .mlirbc | ||
"pytorch/models/opt-125M", | ||
"pytorch/models/resnet50", | ||
"pytorch/models/sdxl-vae-decode-tank", | ||
| ||
// error: 'builtin.module' op failed to run transform dialect passes | ||
// (transform spec file is specific to SDXL?) | ||
"sharktank/llama/open-llama-3b-v2-f16" | ||
], | ||
"expected_run_failures": [] | ||
} |
25 changes: 25 additions & 0 deletions
25
build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx942_additional_flags.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,25 @@ | ||
{ | ||
"config_name": "gpu_rocm", | ||
"iree_compile_flags": [ | ||
"--iree-hal-target-backends=rocm", | ||
"--iree-rocm-target-chip=gfx942", | ||
"--iree-input-demote-f64-to-f32", | ||
"--iree-opt-const-eval=false", | ||
"--iree-codegen-transform-dialect-library=${IREE_TEST_PATH_EXTENSION}/attention_and_matmul_spec.mlir" | ||
], | ||
"iree_run_module_flags": [ | ||
"--device=hip" | ||
], | ||
"skip_compile_tests": [ | ||
"pytorch/models/sdxl-scheduled-unet-3-tank", | ||
"pytorch/models/sdxl-prompt-encoder-tank", | ||
"pytorch/models/sdxl-vae-decode-tank" | ||
], | ||
"skip_run_tests": [], | ||
"expected_compile_failures": [ | ||
// TODO(#17344): need to regenerate .mlirbc | ||
"pytorch/models/opt-125M", | ||
"pytorch/models/resnet50" | ||
], | ||
"expected_run_failures": [] | ||
} |
36 changes: 36 additions & 0 deletions
36
build_tools/pkgci/external_test_suite/sdxl_prompt_encoder_gpu_rocm_gfx942.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,36 @@ | ||
{ | ||
"config_name": "gpu_rocm", | ||
"iree_compile_flags": [ | ||
"--iree-hal-target-backends=rocm", | ||
"--iree-rocm-target-chip=gfx942", | ||
"--iree-input-type=torch", | ||
"--iree-opt-const-eval=false", | ||
"--iree-global-opt-propagate-transposes=true", | ||
"--iree-opt-outer-dim-concat=true", | ||
"--iree-rocm-waves-per-eu=2", | ||
"--iree-llvmgpu-enable-prefetch", | ||
"--iree-flow-enable-aggressive-fusion", | ||
"--iree-global-opt-enable-fuse-horizontal-contractions=true", | ||
"--iree-opt-aggressively-propagate-transposes=true", | ||
"--iree-codegen-llvmgpu-use-vector-distribution=true", | ||
"--iree-execution-model=async-external", | ||
"--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, util.func(iree-preprocessing-pad-to-intrinsics{pad-target-type=conv}))", | ||
"--iree-scheduling-dump-statistics-format=json", | ||
"--iree-scheduling-dump-statistics-file=compilation_info.json" | ||
], | ||
"iree_run_module_flags": [ | ||
"--device=hip", | ||
"--parameters=model=real_weights.irpa", | ||
"--input=1x64xi64=@inference_input.0.bin", | ||
"--input=1x64xi64=@inference_input.1.bin", | ||
"--input=1x64xi64=@inference_input.2.bin", | ||
"--input=1x64xi64=@inference_input.3.bin", | ||
"--expected_output=2x64x2048xf16=@inference_output.0.bin", | ||
"--expected_output=2x1280xf16=@inference_output.1.bin", | ||
"--expected_f16_threshold=1.0f" | ||
], | ||
"skip_compile_tests": [], | ||
"skip_run_tests": [], | ||
"expected_compile_failures": [], | ||
"expected_run_failures": [] | ||
} |
41 changes: 41 additions & 0 deletions
41
build_tools/pkgci/external_test_suite/sdxl_scheduled_unet_gpu_rocm_gfx942.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,41 @@ | ||
{ | ||
"config_name": "gpu_rocm", | ||
"iree_compile_flags" : [ | ||
"--iree-hal-target-backends=rocm", | ||
"--iree-rocm-target-chip=gfx942", | ||
"--iree-opt-const-eval=false", | ||
"--iree-codegen-transform-dialect-library=${IREE_TEST_PATH_EXTENSION}/attention_and_matmul_spec.mlir", | ||
"--iree-global-opt-propagate-transposes=true", | ||
"--iree-global-opt-enable-fuse-horizontal-contractions=true", | ||
"--iree-flow-enable-aggressive-fusion=true", | ||
"--iree-opt-aggressively-propagate-transposes=true", | ||
"--iree-opt-outer-dim-concat=true", | ||
"--iree-vm-target-truncate-unsupported-floats", | ||
"--iree-llvmgpu-enable-prefetch=true", | ||
"--iree-opt-data-tiling=false", | ||
"--iree-codegen-gpu-native-math-precision=true", | ||
"--iree-codegen-llvmgpu-use-vector-distribution", | ||
"--iree-rocm-waves-per-eu=2", | ||
"--iree-execution-model=async-external", | ||
"--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, util.func(iree-preprocessing-pad-to-intrinsics))", | ||
"--iree-scheduling-dump-statistics-format=json", | ||
"--iree-scheduling-dump-statistics-file=compilation_info.json" | ||
], | ||
"iree_run_module_flags": [ | ||
"--device=hip", | ||
"--parameters=model=real_weights.irpa", | ||
"--module=sdxl_scheduled_unet_pipeline_fp16_rocm.vmfb", | ||
"--input=1x4x128x128xf16=@inference_input.0.bin", | ||
"--input=2x64x2048xf16=@inference_input.1.bin", | ||
"--input=2x1280xf16=@inference_input.2.bin", | ||
"--input=1xf16=@inference_input.3.bin", | ||
"--expected_output=1x4x128x128xf16=@inference_output.0.bin", | ||
"--expected_f16_threshold=0.7f" | ||
], | ||
"skip_compile_tests": [], | ||
"skip_run_tests": [], | ||
"expected_compile_failures": [], | ||
"expected_run_failures": [ | ||
"pytorch/models/sdxl-scheduled-unet-3-tank" | ||
] | ||
} |
29 changes: 29 additions & 0 deletions
29
build_tools/pkgci/external_test_suite/sdxl_vae_decode_gpu_rocm_gfx942.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
{ | ||
"config_name": "gpu_rocm", | ||
"iree_compile_flags" : [ | ||
"--iree-hal-target-backends=rocm", | ||
"--iree-rocm-target-chip=gfx942", | ||
"--iree-opt-const-eval=false", | ||
"--iree-global-opt-propagate-transposes=true", | ||
"--iree-opt-outer-dim-concat=true", | ||
"--iree-llvmgpu-enable-prefetch=true", | ||
"--iree-rocm-waves-per-eu=2", | ||
"--iree-flow-enable-aggressive-fusion", | ||
"--iree-codegen-llvmgpu-use-vector-distribution=true", | ||
"--iree-execution-model=async-external", | ||
"--iree-preprocessing-pass-pipeline=builtin.module(iree-preprocessing-transpose-convolution-pipeline, util.func(iree-preprocessing-pad-to-intrinsics))", | ||
"--iree-scheduling-dump-statistics-format=json", | ||
"--iree-scheduling-dump-statistics-file=compilation_info.json" | ||
], | ||
"iree_run_module_flags": [ | ||
"--device=hip", | ||
"--parameters=model=real_weights.irpa", | ||
"--input=1x4x128x128xf16=@inference_input.0.bin", | ||
"--expected_output=1x3x1024x1024xf16=@inference_output.0.bin", | ||
"--expected_f16_threshold=0.4f" | ||
], | ||
"skip_compile_tests": [], | ||
"skip_run_tests": [], | ||
"expected_compile_failures": [], | ||
"expected_run_failures": [] | ||
} |