Skip to content

Commit 5f7570b

Browse files
Merge branch 'main' into build
Signed-off-by: Thara Palanivel <[email protected]>
2 parents cc3f730 + 1e7856e commit 5f7570b

File tree

1 file changed

+3
-4
lines changed

1 file changed

+3
-4
lines changed

fms_mo/run_quant.py

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -74,11 +74,10 @@ def quantize(
7474
the model
7575
data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
7676
tokenized dataset
77+
opt_args (fms_mo.training_args.OptArguments): Generic optimization related arguments
7778
fms_mo_args (fms_mo.training_args.FMSMOArguments): Parameters to use for PTQ quantization
7879
gptq_args (fms_mo.training_args.GPTQArguments): Parameters to use for GPTQ quantization
7980
fp8_args (fms_mo.training_args.FP8Arguments): Parameters to use for FP8 quantization
80-
quant_method (str): Quantization technique, options are gptq, fp8 and dq
81-
output_dir (str) Output directory to write to
8281
"""
8382

8483
logger = set_log_level(opt_args.log_level, "fms_mo.quantize")
@@ -120,8 +119,8 @@ def run_gptq(model_args, data_args, opt_args, gptq_args):
120119
the model
121120
data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
122121
tokenized dataset
122+
opt_args (fms_mo.training_args.OptArguments): Generic optimization related arguments
123123
gptq_args (fms_mo.training_args.GPTQArguments): Parameters to use for GPTQ quantization
124-
output_dir (str) Output directory to write to
125124
"""
126125

127126
# Third Party
@@ -187,8 +186,8 @@ def run_fp8(model_args, data_args, opt_args, fp8_args):
187186
the model
188187
data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
189188
tokenized dataset
189+
opt_args (fms_mo.training_args.OptArguments): Generic optimization related arguments
190190
fp8_args (fms_mo.training_args.FP8Arguments): Parameters to use for FP8 quantization
191-
output_dir (str) Output directory to write to
192191
"""
193192

194193
# Third Party

0 commit comments

Comments (0)