2 files changed, +2 −2
File tree: modelopt/torch/_deploy/utils

@@ -123,7 +123,7 @@ def main():
         "--batch_size",
         type=int,
         default=1,
-        help="Batch size for calibration.",
+        help="Batch size for calibration and ONNX model export.",
     )
 
     args = parser.parse_args()
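For quick context, here is a minimal, runnable sketch of the updated flag in isolation, assuming a standard argparse setup (the surrounding `parser` construction is not part of this hunk and is assumed here):

```python
import argparse

# Only the --batch_size definition comes from the diff above; the
# parser construction and the example invocation are assumptions.
parser = argparse.ArgumentParser()
parser.add_argument(
    "--batch_size",
    type=int,
    default=1,
    help="Batch size for calibration and ONNX model export.",
)

args = parser.parse_args(["--batch_size", "4"])
print(args.batch_size)  # -> 4
```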

@@ -486,7 +486,7 @@ def get_onnx_bytes_and_metadata(
     param_dtype = torch.float32
     if weights_dtype in ["fp16", "bf16"] and param_dtype == torch.float32:
         if is_mxfp8_quantized(model) or is_int4_quantized(model):
-            assert weights_dtype == "fp16", "BF16 + MXFP8 mixed precision is not supported yet"
+            assert weights_dtype == "fp16", "BF16 + MXFP8/INT4 mixed precision is not supported yet"
         onnx_opt_graph = convert_float_to_float16(
             onnx_opt_graph,
             keep_io_types=False,
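A self-contained sketch of what this assertion guards, with `is_mxfp8_quantized`/`is_int4_quantized` replaced by hypothetical stubs and the guard wrapped in a hypothetical `check_mixed_precision` helper; only the condition and the message come from the hunk:

```python
import torch

# Hypothetical stubs standing in for modelopt's real helpers; the
# real checks inspect the model's quantizer configuration.
def is_mxfp8_quantized(model):
    return getattr(model, "quant_mode", None) == "mxfp8"

def is_int4_quantized(model):
    return getattr(model, "quant_mode", None) == "int4"

def check_mixed_precision(model, weights_dtype, param_dtype=torch.float32):
    # Mirrors the guard from the hunk: when exporting an fp32-parameter
    # model to fp16/bf16, MXFP8- or INT4-quantized models must use fp16.
    if weights_dtype in ["fp16", "bf16"] and param_dtype == torch.float32:
        if is_mxfp8_quantized(model) or is_int4_quantized(model):
            assert weights_dtype == "fp16", (
                "BF16 + MXFP8/INT4 mixed precision is not supported yet"
            )

class _Int4Model:
    quant_mode = "int4"

check_mixed_precision(_Int4Model(), "fp16")  # passes silently
try:
    check_mixed_precision(_Int4Model(), "bf16")
except AssertionError as e:
    print(e)  # BF16 + MXFP8/INT4 mixed precision is not supported yet
```

The widened message matches the condition that was already there: the old text mentioned only MXFP8, even though the `is_int4_quantized` branch also triggers the assertion.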