We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent dc0141f, commit 9ace086 (Copy full SHA for 9ace086)
swift/llm/export/quant.py
@@ -208,6 +208,7 @@ def gptq_model_quantize(self):
208
with self._patch_gptq():
209
gptq_quantizer = GPTQQuantizer(
210
bits=args.quant_bits,
211
+ group_size=args.group_size,
212
dataset=','.join(args.dataset),
213
batch_size=args.quant_batch_size,
214
block_name_to_quantize=self.get_block_name_to_quantize(self.model, args.model_type))
0 commit comments