mirror of
https://github.com/nod-ai/AMD-SHARK-Studio.git
synced 2026-04-03 03:00:17 -04:00
Relocate quantized matmul reassociation flag (#2047)
* Remove quantized matmul reassociation flag. This flag should be a model- or use-case-specific addition, not a default CPU compile flag.
This commit is contained in:
@@ -106,6 +106,7 @@ class LanguageModel:
|
||||
frontend="torch",
|
||||
external_weight_file=self.external_weight_file,
|
||||
write_to=self.vmfb_name,
|
||||
extra_args=["--iree-global-opt-enable-quantized-matmul-reassociation"],
|
||||
)
|
||||
# TODO: delete the temp file
|
||||
|
||||
|
||||
Reference in New Issue
Block a user