@@ -74,11 +74,10 @@ def quantize(
7474 the model
7575 data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
7676 tokenized dataset
77+ opt_args (fms_mo.training_args.OptArguments): Generic optimization-related arguments
7778 fms_mo_args (fms_mo.training_args.FMSMOArguments): Parameters to use for PTQ quantization
7879 gptq_args (fms_mo.training_args.GPTQArguments): Parameters to use for GPTQ quantization
7980 fp8_args (fms_mo.training_args.FP8Arguments): Parameters to use for FP8 quantization
80- quant_method (str): Quantization technique, options are gptq, fp8 and dq
81- output_dir (str) Output directory to write to
8281 """
8382
8483 logger = set_log_level (opt_args .log_level , "fms_mo.quantize" )
@@ -120,8 +119,8 @@ def run_gptq(model_args, data_args, opt_args, gptq_args):
120119 the model
121120 data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
122121 tokenized dataset
122+ opt_args (fms_mo.training_args.OptArguments): Generic optimization-related arguments
123123 gptq_args (fms_mo.training_args.GPTQArguments): Parameters to use for GPTQ quantization
124- output_dir (str) Output directory to write to
125124 """
126125
127126 # Third Party
@@ -187,8 +186,8 @@ def run_fp8(model_args, data_args, opt_args, fp8_args):
187186 the model
188187 data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
189188 tokenized dataset
189+ opt_args (fms_mo.training_args.OptArguments): Generic optimization-related arguments
190190 fp8_args (fms_mo.training_args.FP8Arguments): Parameters to use for FP8 quantization
191- output_dir (str) Output directory to write to
192191 """
193192
194193 # Third Party
0 commit comments