Skip to content

Commit 82d26ec

Browse files
committed
Update assertion and argument description
Signed-off-by: ajrasane <[email protected]>
1 parent 3a45ff5 commit 82d26ec

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

examples/onnx_ptq/torch_quant_to_onnx.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -123,7 +123,7 @@ def main():
123123
"--batch_size",
124124
type=int,
125125
default=1,
126-
help="Batch size for calibration.",
126+
help="Batch size for calibration and ONNX model export.",
127127
)
128128

129129
args = parser.parse_args()

modelopt/torch/_deploy/utils/torch_onnx.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -486,7 +486,7 @@ def get_onnx_bytes_and_metadata(
486486
param_dtype = torch.float32
487487
if weights_dtype in ["fp16", "bf16"] and param_dtype == torch.float32:
488488
if is_mxfp8_quantized(model) or is_int4_quantized(model):
489-
assert weights_dtype == "fp16", "BF16 + MXFP8 mixed precision is not supported yet"
489+
assert weights_dtype == "fp16", "BF16 + MXFP8/INT4 mixed precision is not supported yet"
490490
onnx_opt_graph = convert_float_to_float16(
491491
onnx_opt_graph,
492492
keep_io_types=False,

0 commit comments

Comments (0)