We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4d1eb0c · commit c391942 (Copy full SHA for c391942)
modelopt/torch/quantization/qtensor/nvfp4_tensor.py
@@ -19,7 +19,6 @@
19
20
from ..backends.utils import fp4_compatible
21
from ..qtensor.base_qtensor import BaseQuantizedTensor
22
-from ..triton.fp4_kernel import fp4_dequantize
23
from ..utils import reduce_amax, reduce_block_amax, reduce_block_padding
24
25
# Define conversion tables
@@ -266,6 +265,8 @@ def _unpack_tensor(input: torch.Tensor):
266
265
) from e
267
268
if fast:
+ from ..triton.fp4_kernel import fp4_dequantize
269
+
270
return fp4_dequantize(
271
self._quantized_data,
272
kwarg["scale"],
0 commit comments