fix: improve gguf performance with torch.compile

PyTorch 2.7's `torch.compile` does not implement `set.__contains__`, so make `TORCH_COMPATIBLE_QTYPES` a list instead of a set. See https://github.com/pytorch/pytorch/issues/145761
2026-04-23 03:00:31 -04:00 · 2025-05-21 18:03:51 -07:00
parent f3e2a3c384
commit 8bd52ed744
1 changed files with 2 additions and 1 deletions
--- a/invokeai/backend/quantization/gguf/utils.py
+++ b/invokeai/backend/quantization/gguf/utils.py
@@ -5,7 +5,8 @@ from typing import Callable, Optional, Union
 import gguf
 import torch

-TORCH_COMPATIBLE_QTYPES = {None, gguf.GGMLQuantizationType.F32, gguf.GGMLQuantizationType.F16}
+# Keep this a list rather than a set until this is resolved: https://github.com/pytorch/pytorch/issues/145761
+TORCH_COMPATIBLE_QTYPES = [None, gguf.GGMLQuantizationType.F32, gguf.GGMLQuantizationType.F16]

 # K Quants #
 QK_K = 256