File tree Expand file tree Collapse file tree 1 file changed +21
-0
lines changed
src/llmcompressor/modifiers/awq Expand file tree Collapse file tree 1 file changed +21
-0
lines changed Original file line number Diff line number Diff line change @@ -132,7 +132,28 @@ class AWQMapping:
132
132
AWQMapping ("re:.*up_proj$" , ["re:.*down_proj$" ]),
133
133
]
134
134
135
# AWQ mappings registered under "BloomForCausalLM". Each AWQMapping pairs one
# "re:"-prefixed module-name pattern with a list of such patterns; see the
# AWQMapping class for how the two arguments are interpreted.
_bloom_mappings = [
    AWQMapping("re:.*input_layernorm$", ["re:.*query_key_value$"]),
    AWQMapping("re:.*post_attention_layernorm$", ["re:.*dense_h_to_4h$"]),
    AWQMapping("re:.*gelu_impl$", ["re:.*dense_4h_to_h$"]),
    # Deliberately left out: AutoAWQ excludes the query_key_value -> dense
    # mapping, based on the researcher's post in
    # https://github.com/mit-han-lab/llm-awq/issues/2#issuecomment-1606297469
    # AWQMapping("re:.*query_key_value$", ["re:.*dense$"]),
]
135
155
AWQ_MAPPING_REGISTRY : Dict [str , list [AWQMapping ]] = {
156
+ "BloomForCausalLM" : _bloom_mappings ,
136
157
"CohereForCausalLM" : _cohere_mappings ,
137
158
"Cohere2ForCausalLM" : _cohere_mappings ,
138
159
"DeepseekV3ForCausalLM" : _deepseek_mappings ,
You can’t perform that action at this time.
0 commit comments