@@ -64,11 +64,10 @@ def quantize(
6464 the model
6565 data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
6666 tokenized dataset
67+ opt_args (fms_mo.training_args.OptArguments): Generic optimization-related arguments
6768 fms_mo_args (fms_mo.training_args.FMSMOArguments): Parameters to use for PTQ quantization
6869 gptq_args (fms_mo.training_args.GPTQArguments): Parameters to use for GPTQ quantization
6970 fp8_args (fms_mo.training_args.FP8Arguments): Parameters to use for FP8 quantization
70- quant_method (str): Quantization technique, options are gptq, fp8 and dq
71- output_dir (str) Output directory to write to
7271 """
7372
7473 logger .info (f"{ fms_mo_args } \n { opt_args .quant_method } \n " )
@@ -108,8 +107,8 @@ def run_gptq(model_args, data_args, opt_args, gptq_args):
108107 the model
109108 data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
110109 tokenized dataset
110+ opt_args (fms_mo.training_args.OptArguments): Generic optimization-related arguments
111111 gptq_args (fms_mo.training_args.GPTQArguments): Parameters to use for GPTQ quantization
112- output_dir (str) Output directory to write to
113112 """
114113
115114 # Third Party
@@ -171,8 +170,8 @@ def run_fp8(model_args, data_args, opt_args, fp8_args):
171170 the model
172171 data_args (fms_mo.training_args.DataArguments): Data arguments to be used when loading the
173172 tokenized dataset
173+ opt_args (fms_mo.training_args.OptArguments): Generic optimization-related arguments
174174 fp8_args (fms_mo.training_args.FP8Arguments): Parameters to use for FP8 quantization
175- output_dir (str) Output directory to write to
176175 """
177176
178177 # Third Party
0 commit comments