Skip to content

Commit

Permalink
Update flags for MI perf.
Browse files Browse the repository at this point in the history
  • Loading branch information
monorimet committed Mar 19, 2024
1 parent 4ed0bb6 commit 62a8364
Showing 1 changed file with 3 additions and 1 deletion.
4 changes: 3 additions & 1 deletion models/turbine_models/custom_models/sd_inference/utils.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -14,7 +14,7 @@
 "--iree-global-opt-propagate-transposes=true",
 "--iree-opt-const-eval=false",
 "--iree-opt-outer-dim-concat=true",
-"--iree-rocm-bc-dir=/opt/rocm/amdgcn/bitcode",
+"--iree-rocm-bc-dir=/home/eagarvey/2024-q1-sdxl-sprint/bitcode-2024-03-07",
 "--iree-vm-target-truncate-unsupported-floats",
 "--iree-llvmgpu-enable-prefetch=true",
 "--verify=false",
Expand All @@ -24,6 +24,8 @@
 ],
 "unet": [
 # "--iree-flow-split-matmul-reduction=5",
+"--iree-codegen-llvmgpu-use-conv-vector-distribute-pipeline",
+"--iree-codegen-llvmgpu-reduce-skinny-matmuls",
 "--iree-codegen-gpu-native-math-precision=true",
 "--iree-codegen-llvmgpu-use-vector-distribution",
 ],
Expand Down

0 comments on commit 62a8364

Please sign in to comment.