
Commit 595228c

drop frozen scale_dtype post-merge
Signed-off-by: Brian Dellabetta <[email protected]>
1 parent dd87f23

File tree

1 file changed: +1 addition, -12 deletions
  • src/compressed_tensors/quantization/lifecycle/apply.py


src/compressed_tensors/quantization/lifecycle/apply.py

Lines changed: 1 addition & 12 deletions
@@ -213,18 +213,7 @@ def apply_quantization_status(module: Module, status: QuantizationStatus):
 
     force_zero_point_init = status != QuantizationStatus.COMPRESSED
 
-    # When decompressing, we set the scale_dtype as the model's dtype
-    # This is because the normal workflow of using the weight's dtype
-    # will be incorrect as the model weight will be compressed
-    # Therefore, use the dtype set by the user using the PretrainedModel
-    scale_dtype = None
-    if status == QuantizationStatus.FROZEN:
-        if hasattr(module, "dtype"):
-            scale_dtype = module.dtype
-
-    initialize_module_for_quantization(
-        module, force_zero_point=force_zero_point_init, scale_dtype=scale_dtype
-    )
+    initialize_module_for_quantization(module, force_zero_point=force_zero_point_init)
 
     module.quantization_status = status
 
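For context, here is a minimal sketch of how the affected portion of apply_quantization_status reads after this commit. Only the lines visible in the hunk above are reproduced; the import paths and the elided earlier body are assumptions for illustration, not taken from this commit.

    from torch.nn import Module

    # Assumed import path for illustration; the names below appear in the hunk,
    # but their actual locations in this repository may differ.
    from compressed_tensors.quantization import (
        QuantizationStatus,
        initialize_module_for_quantization,
    )


    def apply_quantization_status(module: Module, status: QuantizationStatus):
        # ... earlier body elided (not shown in the hunk) ...

        # Zero points are force-initialized unless the module is already compressed.
        force_zero_point_init = status != QuantizationStatus.COMPRESSED

        # After this commit, no FROZEN-specific scale_dtype is passed to the initializer.
        initialize_module_for_quantization(module, force_zero_point=force_zero_point_init)

        module.quantization_status = status

With the FROZEN branch removed, the call site no longer selects or passes a scale_dtype explicitly, matching the single-line call shown in the added line of the hunk.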
