Skip to content

Commit 47ec10e

Browse files
yiliu30 and HDCharles authored
Upgrade autoround 0.10.2 (#2410)
Signed-off-by: yiliu30 <yi4.liu@intel.com>

SUMMARY: "please provide a brief summary"

TEST PLAN: "please outline how the changes were tested"

cc @hshen14 @thuang6 @chensuyue

---------

Signed-off-by: yiliu30 <yi4.liu@intel.com>
Co-authored-by: HDCharles <39544797+HDCharles@users.noreply.github.com>
1 parent 04dea55 commit 47ec10e

File tree

2 files changed

+4 -5 lines changed

2 files changed

+4 -5 lines changed

setup.py

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -129,10 +129,9 @@ def localversion_func(version: ScmVersion) -> str:
129129
),
130130
("datasets>=4.0.0,<=4.6.0" if BUILD_TYPE == "release" else "datasets>=4.0.0"),
131131
(
132-
# auto-round 0.9.1 cannot work with accelerate <1.10.0
133-
"auto-round>=0.9.6,<=0.10.2"
132+
"auto-round>=0.10.2,<=0.10.2"
134133
if BUILD_TYPE == "release"
135-
else "auto-round>=0.9.6"
134+
else "auto-round>=0.10.2"
136135
),
137136
(
138137
"accelerate>=1.6.0,<=1.12.0"

src/llmcompressor/modifiers/autoround/base.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -262,7 +262,7 @@ def apply_autoround(self, state, subgraph):
262262

263263
# Build kwargs for AutoRound initialization
264264
ar_quant_scheme = self._mapping_config_to_autoround()
265-
fp_layers = self.get_unquantized_layer_names(decoding_layer)
265+
ignore_layers = self.get_unquantized_layer_names(decoding_layer)
266266
kwargs = {
267267
"tokenizer": "", # A placeholder
268268
"scheme": ar_quant_scheme,
@@ -271,7 +271,7 @@ def apply_autoround(self, state, subgraph):
271271
"enable_torch_compile": self.enable_torch_compile,
272272
"batch_size": self.batch_size,
273273
"device_map": self.device_ids,
274-
"fp_layers": ",".join(fp_layers) if fp_layers else "",
274+
"ignore_layers": ",".join(ignore_layers) if ignore_layers else "",
275275
}
276276

277277
llmc_registered_qparams = self._preprocess_qparams(decoding_layer)

0 commit comments

Comments
 (0)