
Commit 2189675

Adds instructions for exporting and benchmarking an example model
1 parent 174e73d commit 2189675

3 files changed: +43 additions, −42 deletions

models/turbine_models/custom_models/torchbench/README.md

Lines changed: 9 additions & 1 deletion
@@ -4,7 +4,7 @@
 
 - pip install torch+rocm packages:
 ```shell
-pip install --pre torch==2.5.0.dev20240801+rocm6.1 torchvision==0.20.0.dev20240801+rocm6.1 torchaudio==2.4.0.dev20240801%2Brocm6.1 --index-url https://download.pytorch.org/whl/nightly/rocm6.1
+pip install torch==2.5.0.dev20240801+rocm6.1 torchvision==0.20.0.dev20240801+rocm6.1 torchaudio==2.4.0.dev20240801+rocm6.1 --index-url https://download.pytorch.org/whl/nightly/rocm6.1
 
 ```
 - Workaround amdsmi error in pre-release pytorch+rocm:
@@ -33,4 +33,12 @@ cd ..
 
 ```shell
 python ./export.py --target=gfx942 --device=rocm --compile_to=vmfb --performance --inference --precision=fp16 --float16 --external_weights=safetensors --external_weights_dir=./torchbench_weights/
+```
+
+### Example (hf_Albert)
+
+```shell
+python ./export.py --target=gfx942 --device=rocm --compile_to=vmfb --performance --inference --precision=fp16 --float16 --external_weights=safetensors --external_weights_dir=./torchbench_weights/ --model_id=hf_Albert
+
+iree-benchmark-module --module=hf_Albert_32_fp16_gfx942.vmfb --input=@input0.npy --parameters=model=./torchbench_weights/hf_Albert_fp16.irpa --device=hip://0 --device_allocator=caching --function=main --benchmark_repetitions=10
 ```
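
Note: the `input0.npy` consumed by `--input=@input0.npy` is produced by the `np.save` loop this commit adds to export.py (see the export.py diff below). Before benchmarking, it can help to confirm the expected artifacts exist and look plausible; a minimal sanity-check sketch, assuming the hf_Albert export above was run from the current directory:

```python
# Sanity-check the artifacts from the hf_Albert example before benchmarking.
# Assumes export.py was run from the current directory as shown above.
import os

import numpy as np

for path in [
    "hf_Albert_32_fp16_gfx942.vmfb",
    "./torchbench_weights/hf_Albert_fp16.irpa",
    "input0.npy",
]:
    assert os.path.exists(path), f"missing artifact: {path}"

# input0.npy holds the first forward argument dumped by export.py; its
# shape and dtype should match what the compiled module expects.
arr = np.load("input0.npy")
print(arr.shape, arr.dtype)
```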

models/turbine_models/custom_models/torchbench/cmd_opts.py

Lines changed: 1 addition & 1 deletion
@@ -68,7 +68,7 @@ def is_valid_file(arg):
 p.add_argument(
     "--external_weights",
     type=str,
-    default=None,
+    default="irpa",
     choices=["safetensors", "irpa", "gguf", None],
     help="Externalizes model weights from the torch dialect IR and its successors",
 )
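
With the default flipped from None to "irpa", callers that omit --external_weights now get weights externalized to an .irpa parameter archive instead of inlined into the module. A standalone sketch of just this option (the repo's parser defines many more arguments):

```python
# Standalone sketch of the changed option, not the repo's full parser.
import argparse

p = argparse.ArgumentParser()
p.add_argument(
    "--external_weights",
    type=str,
    default="irpa",
    choices=["safetensors", "irpa", "gguf", None],
    help="Externalizes model weights from the torch dialect IR and its successors",
)

print(p.parse_args([]).external_weights)  # irpa (was None before this commit)
print(p.parse_args(["--external_weights=safetensors"]).external_weights)  # safetensors
```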

models/turbine_models/custom_models/torchbench/export.py

Lines changed: 33 additions & 40 deletions
@@ -48,22 +48,21 @@
         "dim": 32,
         "buffer_prefix": "albert"
     },
-    "hf_Bart": {
-        "dim": 16,
-        "buffer_prefix": "bart"
-    },
-    "hf_Bert": {
-        "dim": 16,
-        "buffer_prefix": "bert"
-    },
-    "hf_GPT2": {
-        "dim": 16,
-        "buffer_prefix": "gpt2"
-    },
-    "hf_T5": {
-        "dim": 4,
-        "buffer_prefix": "t5"
-    },
+    # "hf_Bart": {
+    #     "dim": 16,
+    # },
+    # "hf_Bert": {
+    #     "dim": 16,
+    #     "buffer_prefix": "bert"
+    # },
+    # "hf_GPT2": {
+    #     "dim": 16,
+    #     "buffer_prefix": "gpt2"
+    # },
+    # "hf_T5": {
+    #     "dim": 4,
+    #     "buffer_prefix": "t5"
+    # },
     "mnasnet1_0": {
         "dim": 256,
     },
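
How these entries are consumed is only partly visible in this commit: a later hunk reads buffer_prefix via torchbench_models_dict[model_id]["buffer_prefix"], and the README's hf_Albert_32_fp16_gfx942.vmfb filename suggests dim (32 for hf_Albert) feeds the artifact name. A hypothetical lookup sketch under those assumptions:

```python
# Hypothetical sketch of how an entry appears to be consumed; the exact
# logic lives in parts of export.py outside this diff.
torchbench_models_dict = {
    "hf_Albert": {"dim": 32, "buffer_prefix": "albert"},
    "mnasnet1_0": {"dim": 256},
}

model_id, precision, target = "hf_Albert", "fp16", "gfx942"
settings = torchbench_models_dict[model_id]
print(f"{model_id}_{settings['dim']}_{precision}_{target}.vmfb")

# Not every entry carries a buffer_prefix (e.g. mnasnet1_0), so guard lookups.
prefix = settings.get("buffer_prefix")
```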
@@ -182,30 +181,21 @@ def export_torchbench_model(
 
     _, model_name, model, forward_args, _ = get_model_and_inputs(model_id, batch_size, tb_dir, tb_args)
 
+    for idx, i in enumerate(forward_args.values()):
+        np.save(f"input{idx}", i.clone().detach().cpu())
     if dtype == torch.float16:
         model = model.half()
     model.to("cuda:0")
 
     if not isinstance(forward_args, dict):
         forward_args = [i.type(dtype) for i in forward_args]
-    elif "hf" in model_id:
-        forward_args["head_mask"] = torch.zeros(model.config.num_hidden_layers, device="cuda:0")
 
     mapper = {}
     if (external_weights_dir is not None):
         if not os.path.exists(external_weights_dir):
             os.mkdir(external_weights_dir)
-        external_weight_path = os.path.join(external_weights_dir, f"{model_id}_{precision}.{external_weights}")
-        if os.path.exists(external_weight_path):
-            print("External weights for this module already exist at {external_weight_path}. Will not overwrite.")
-        utils.save_external_weights(
-            mapper,
-            model,
-            external_weights,
-            external_weight_path,
-        )
-        if weights_only:
-            return external_weight_path
+        external_weight_path = os.path.join(external_weights_dir, f"{model_id}_{precision}.irpa")
+
 
     decomp_list = [torch.ops.aten.reflection_pad2d]
     if decomp_attn == True:
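
The added np.save loop relies on Python dicts preserving insertion order, so input0.npy, input1.npy, ... line up with the order in which get_model_and_inputs built forward_args — which is what the README's --input=@input0.npy flags assume. A standalone sketch of the pattern:

```python
# Standalone sketch of the input-dumping pattern added above.
import numpy as np
import torch

forward_args = {
    "input_ids": torch.ones(32, 128, dtype=torch.int64),
    "attention_mask": torch.ones(32, 128, dtype=torch.int64),
}

# Dicts preserve insertion order, so input0.npy, input1.npy, ... match
# the positional order of the model's forward arguments.
for idx, i in enumerate(forward_args.values()):
    # .clone().detach().cpu() makes a host-side copy that is safe to
    # hand to numpy even when the original tensor lives on the GPU.
    np.save(f"input{idx}", i.clone().detach().cpu())
```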
@@ -225,18 +215,20 @@ def __init__(self, model):
             self.mod = model
 
         def forward(self, inp):
-            return self.mod(**inp, return_dict=False)
-    # In transformers, the position ids buffer is registered as non-persistent,
-    # which makes it fail to globalize in the FX import.
-    # Add them manually to the state dict here.
-
-    prefix = torchbench_models_dict[model_id]["buffer_prefix"]
-    getattr(model, prefix).embeddings.register_buffer(
-        "position_ids",
-        getattr(model, prefix).embeddings.position_ids,
-        persistent=True,
-    )
+            return self.mod(**inp)
+
+    if "Bart" not in model_id:
+        # In some transformers models, the position ids buffer is registered as non-persistent,
+        # which makes it fail to globalize in the FX import.
+        # Add them manually to the state dict here.
 
+        prefix = torchbench_models_dict[model_id]["buffer_prefix"]
+        getattr(model, prefix).embeddings.register_buffer(
+            "position_ids",
+            getattr(model, prefix).embeddings.position_ids,
+            persistent=True,
+        )
+    breakpoint()
     fxb = FxProgramsBuilder(HF_M(model))
     @fxb.export_program(args=(forward_args,))
     def _forward(module: HF_M(model), inputs):
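
The comment in this hunk describes a real transformers quirk: position_ids is registered as a non-persistent buffer, so it never appears in state_dict() and cannot be globalized during FX import. A standalone illustration (not repo code) of why re-registering with persistent=True fixes that:

```python
# Non-persistent buffers are excluded from state_dict(); re-registering
# the same tensor with persistent=True puts it back, which is exactly
# what the buffer workaround above does for transformers embeddings.
import torch


class Embeddings(torch.nn.Module):
    def __init__(self):
        super().__init__()
        self.register_buffer(
            "position_ids", torch.arange(128).unsqueeze(0), persistent=False
        )


m = Embeddings()
print("position_ids" in m.state_dict())  # False: non-persistent

m.register_buffer("position_ids", m.position_ids, persistent=True)
print("position_ids" in m.state_dict())  # True: now globalizable
```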
@@ -252,6 +244,7 @@ class CompiledTorchbenchModel(CompiledModule):
 
     if external_weights:
         externalize_module_parameters(model)
+        save_module_parameters(external_weight_path, model)
 
     inst = CompiledTorchbenchModel(context=Context(), import_to="IMPORT")
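
externalize_module_parameters marks the weights as externally supplied, so the compiled .vmfb references them as named parameters instead of inlining them; the added save_module_parameters call then writes those weights to the .irpa archive that iree-benchmark-module loads via --parameters=model=<...>.irpa. A minimal sketch, assuming both helpers come from shark_turbine.aot (their import is outside this diff):

```python
# Minimal sketch of externalize-then-save; assumes shark_turbine.aot
# provides these helpers (the import is not shown in this commit).
import torch
from shark_turbine.aot import externalize_module_parameters, save_module_parameters

model = torch.nn.Linear(4, 4)

# Mark parameters as externally supplied rather than inlined.
externalize_module_parameters(model)
# Write them to an IREE parameter archive, usable with
# iree-benchmark-module --parameters=model=linear_fp32.irpa
save_module_parameters("linear_fp32.irpa", model)
```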