Update quantized-matmul reassociation flags for CPU llama2: pass each flag to `extra_args.extend` as a single-item list instead of a bare string (extending with a string would append its individual characters).

This commit is contained in:
Ean Garvey
2024-01-10 14:57:44 -06:00
committed by GitHub
parent d35288e893
commit 97e112091f

View File

@@ -2076,8 +2076,8 @@ class UnshardedVicuna(VicunaBase):
f"{'://' + str(self.device_id) if self.device_id is not None else ''}"
)
if "cpu" in self.device:
self.extra_args.extend("--iree-llvmcpu-enable-quantized-matmul-reassociation")
self.extra_args.extend("--iree-global-opt-enable-quantized-matmul-reassociation")
self.extra_args.extend(["--iree-llvmcpu-enable-quantized-matmul-reassociation"])
self.extra_args.extend(["--iree-global-opt-enable-quantized-matmul-reassociation"])
shark_module = SharkInference(
mlir_module=combined_module,