File tree (expand / collapse): 2 files changed, +2 -2 lines changed
py/torch_tensorrt/dynamo/conversion/impl (expand / collapse file tree): 2 files changed, +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -34,7 +34,7 @@ def compile_model(
34
34
enabled_precisions = {torch .float4_e2m1fn_x2 }
35
35
ptq_config = mtq .NVFP4_DEFAULT_CFG
36
36
if args .fp4_mha :
37
- from modelopt .core . torch .quantization .config import NVFP4_FP8_MHA_CONFIG
37
+ from modelopt .torch .quantization .config import NVFP4_FP8_MHA_CONFIG
38
38
39
39
ptq_config = NVFP4_FP8_MHA_CONFIG
40
40
Original file line number | Diff line number | Diff line change
@@ -209,7 +209,7 @@ def _static_double_quantize(
209
209
quantized data tensor in fp4
210
210
"""
211
211
212
- import modelopt .core . torch .quantization .qtensor .nvfp4_tensor as nvfp4_tensor
212
+ import modelopt .torch .quantization .qtensor .nvfp4_tensor as nvfp4_tensor
213
213
214
214
if weights_tensor .dtype == torch .float16 :
215
215
original_dtype = trt .DataType .HALF
You can’t perform that action at this time.
0 commit comments