File tree Expand file tree Collapse file tree 1 file changed +14
-11
lines changed
src/compressed_tensors/quantization/lifecycle Expand file tree Collapse file tree 1 file changed +14
-11
lines changed Original file line number Diff line number Diff line change 45
45
"initialize_module_for_quantization" ,
46
46
"is_attention_module" ,
47
47
"KVCacheScaleType" ,
48
+ "ALL_QPARAM_KEYS" ,
48
49
]
49
50
50
51
@@ -56,6 +57,18 @@ class KVCacheScaleType(Enum):
56
57
VALUE = "v_scale"
57
58
58
59
60
+ ALL_QPARAM_KEYS = [KVCacheScaleType .KEY .value , KVCacheScaleType .VALUE .value ] + [
61
+ f"{base_name}_{suffix}"
62
+ for base_name in ("input" , "weight" , "output" )
63
+ for suffix in (
64
+ "global_scale" ,
65
+ "scale" ,
66
+ "zero_point" ,
67
+ "g_idx" ,
68
+ )
69
+ ]
70
+
71
+
59
72
def initialize_module_for_quantization (
60
73
module : Module ,
61
74
scheme : Optional [QuantizationScheme ] = None ,
@@ -146,17 +159,7 @@ def _clear_all_qparams(
146
159
147
160
:param module: module to clear qparams from
148
161
"""
149
- keys = [KVCacheScaleType .KEY .value , KVCacheScaleType .VALUE .value ] + [
150
- f"{base_name}_{suffix}"
151
- for base_name in ("input" , "weight" , "output" )
152
- for suffix in (
153
- "global_scale" ,
154
- "scale" ,
155
- "zero_point" ,
156
- "g_idx" ,
157
- )
158
- ]
159
- for key in keys :
162
+ for key in ALL_QPARAM_KEYS :
160
163
if hasattr (module , key ):
161
164
delete_offload_parameter (module , key )
162
165
You can’t perform that action at this time.
0 commit comments