1 file changed: +3 -3 lines changed
Original file line number | Diff line number | Diff line change
@@ -325,6 +325,9 @@ def main(args):
325
325
model = model .language_model
326
326
model_type = get_model_type (model )
327
327
328
+ if model_type == "phi4mm" :
329
+ warnings .warn ("Please set the default input_mode to InputMode.LANGUAGE before quantizing." )
330
+
328
331
if args .sparsity_fmt != "dense" :
329
332
if args .batch_size == 0 :
330
333
# Sparse algorithm takes more GPU memory so we reduce the batch_size by 4.
@@ -475,9 +478,6 @@ def main(args):
475
478
quant_cfg ["quant_cfg" ]["*audio*" ] = {"enable" : False }
476
479
quant_cfg ["quant_cfg" ]["*image*" ] = {"enable" : False }
477
480
quant_cfg ["quant_cfg" ]["*vision*" ] = {"enable" : False }
478
- warnings .warn (
479
- "Please set the default input_mode to InputMode.LANGUAGE before quantizing."
480
- )
481
481
482
482
if not model_is_already_quantized or calibration_only :
483
483
# Only run single sample for preview
You can’t perform that action at this time.
0 commit comments