We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f5f49d6 commit 842aead (Copy full SHA for 842aead)
fms_mo/utils/dq_utils.py
@@ -115,5 +115,15 @@ def config_quantize_smooth_layers(qcfg: dict):
115
qcfg["smoothq_act_scale_path"] = "./act_scales/graniteCodeHF_34b_base12.pt"
116
if "granite-34b-code-instruct" in qcfg["model"]:
117
118
+ elif "roberta" in qcfg["model"]:
119
+ qcfg["act_scale_path"] = "./act_scales"
120
+ qcfg["scale_layers"] = [
121
+ "attention.self.query",
122
+ "attention.self.key",
123
+ "attention.self.value",
124
+ "intermediate.dense",
125
+ ]
126
+ qcfg["qskip_layer_name"] = []
127
+ qcfg["qlayer_name_pattern"] = ["roberta.encoder"]
128
else:
129
raise ValueError("The model architecture is not supported for DQ.")
0 commit comments