Skip to content

Commit 1a1634d

Browse files
authored
GGUF: torch.compile cannot trace sets
torch.compile fails to trace a membership test against a set, e.g. `s = { ... }` followed by `if x in s:`; it can trace the same test against a list.
1 parent 84e1657 commit 1a1634d

File tree

1 file changed

+7
-7
lines changed

1 file changed

+7
-7
lines changed

src/diffusers/quantizers/gguf/utils.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -41,23 +41,23 @@
4141
else:
4242
ops = None
4343

44-
UNQUANTIZED_TYPES = {gguf.GGMLQuantizationType.F32, gguf.GGMLQuantizationType.F16, gguf.GGMLQuantizationType.BF16}
45-
STANDARD_QUANT_TYPES = {
44+
UNQUANTIZED_TYPES = [gguf.GGMLQuantizationType.F32, gguf.GGMLQuantizationType.F16, gguf.GGMLQuantizationType.BF16]
45+
STANDARD_QUANT_TYPES = [
4646
gguf.GGMLQuantizationType.Q4_0,
4747
gguf.GGMLQuantizationType.Q4_1,
4848
gguf.GGMLQuantizationType.Q5_0,
4949
gguf.GGMLQuantizationType.Q5_1,
5050
gguf.GGMLQuantizationType.Q8_0,
5151
gguf.GGMLQuantizationType.Q8_1,
52-
}
53-
KQUANT_TYPES = {
52+
]
53+
KQUANT_TYPES = [
5454
gguf.GGMLQuantizationType.Q2_K,
5555
gguf.GGMLQuantizationType.Q3_K,
5656
gguf.GGMLQuantizationType.Q4_K,
5757
gguf.GGMLQuantizationType.Q5_K,
5858
gguf.GGMLQuantizationType.Q6_K,
59-
}
60-
IMATRIX_QUANT_TYPES = {
59+
]
60+
IMATRIX_QUANT_TYPES = [
6161
gguf.GGMLQuantizationType.IQ1_M,
6262
gguf.GGMLQuantizationType.IQ1_S,
6363
gguf.GGMLQuantizationType.IQ2_XXS,
@@ -67,7 +67,7 @@
6767
gguf.GGMLQuantizationType.IQ3_S,
6868
gguf.GGMLQuantizationType.IQ4_XS,
6969
gguf.GGMLQuantizationType.IQ4_NL,
70-
}
70+
]
7171
# TODO(Isotr0py): Currently, we don't have MMQ kernel for I-Matrix quantization.
7272
# Consolidate DEQUANT_TYPES, MMVQ_QUANT_TYPES and MMQ_QUANT_TYPES after we add
7373
# MMQ kernel for I-Matrix quantization.

0 commit comments

Comments
 (0)