diff --git a/models/turbine_models/custom_models/torchbench/README.md b/models/turbine_models/custom_models/torchbench/README.md index fc821784..890f9070 100644 --- a/models/turbine_models/custom_models/torchbench/README.md +++ b/models/turbine_models/custom_models/torchbench/README.md @@ -17,7 +17,7 @@ These commands assume a few things about your machine/distro, so please read the docker build --platform linux/amd64 --tag shark_torchbench --file shark_torchbench.dockerfile . ``` ```shell -docker run -it --network=host --device=/dev/kfd --device=/dev/dri --group-add video --cap-add=SYS_PTRACE --security-opt seccomp=unconfined -v shark_torchbench:/SHARK-Turbine/models/turbine_models/custom_models/torchbench/outputs -w /SHARK-Turbine/models/turbine_models/custom_models/torchbench shark_torchbench:latest +docker run -it --network=host --device=/dev/kfd --device=/dev/dri --group-add video --cap-add=SYS_PTRACE --security-opt seccomp=unconfined -v ./shark_torchbench_outputs:/SHARK-Turbine/models/turbine_models/custom_models/torchbench/outputs -w /SHARK-Turbine/models/turbine_models/custom_models/torchbench shark_torchbench:latest ``` ```shell python3 ./export.py --target=gfx942 --device=rocm --compile_to=vmfb --performance --inference --precision=fp16 --float16 --external_weights=safetensors --external_weights_dir=./torchbench_weights/ --output_csv=./outputs/torchbench_results_SHARK.csv diff --git a/models/turbine_models/custom_models/torchbench/utils.py b/models/turbine_models/custom_models/torchbench/utils.py index 34b1caf5..d303e403 100644 --- a/models/turbine_models/custom_models/torchbench/utils.py +++ b/models/turbine_models/custom_models/torchbench/utils.py @@ -412,7 +412,7 @@ def get_mfma_spec_path(target_chip, save_dir, masked_attention=False, use_punet= url = "https://raw.githubusercontent.com/nod-ai/sdxl-scripts/main/int8-model/specs/attention_and_matmul_spec.mlir" elif not masked_attention: suffix = "" - url = "https://sharkpublic.blob.core.windows.net/sharkpublic/specs/no_pad/attention_and_matmul_spec_mfma.mlir" + url = "https://raw.githubusercontent.com/iree-org/iree/refs/heads/main/build_tools/pkgci/external_test_suite/attention_and_matmul_spec.mlir" else: suffix = "_pad" url = "https://sharkpublic.blob.core.windows.net/sharkpublic/specs/latest/attention_and_matmul_spec_gfx942.mlir"