File tree: 4 files changed, +9 −9 lines changed
Changed paths include test/quantization/quantize_/workflows/int4

@@ -24,7 +24,7 @@ Inference APIs for quantize_
     :nosignatures:
 
     Int4WeightOnlyConfig
-    Float8ActivationInt4WeightConfig
+    Float8DynamicActivationInt4WeightConfig
     Float8DynamicActivationFloat8WeightConfig
     Float8WeightOnlyConfig
     Float8StaticActivationFloat8WeightConfig
@@ -16,7 +16,7 @@
 )
 
 from torchao.quantization import (
-    Float8ActivationInt4WeightConfig,
+    Float8DynamicActivationInt4WeightConfig,
     Int4WeightOnlyConfig,
     quantize_,
 )
@@ -33,7 +33,7 @@
     VERSION=2,
 )
 
-FP8_ACT_CONFIG = Float8ActivationInt4WeightConfig(
+FP8_ACT_CONFIG = Float8DynamicActivationInt4WeightConfig(
     group_size=128,
     packing_format="preshuffled",
 )
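For reference, a minimal usage sketch of the renamed config outside the test harness. It assumes a CUDA device and the fbgemm kernels that back the "preshuffled" packing format; the model and tensor shapes are illustrative, not taken from the test.

import torch

from torchao.quantization import (
    Float8DynamicActivationInt4WeightConfig,
    quantize_,
)

# Illustrative model; any module with nn.Linear children works with quantize_.
model = torch.nn.Sequential(torch.nn.Linear(1024, 1024)).to(torch.bfloat16).cuda()

# Same arguments the test uses for FP8_ACT_CONFIG.
config = Float8DynamicActivationInt4WeightConfig(
    group_size=128,
    packing_format="preshuffled",
)
quantize_(model, config)  # float8 dynamic per-row activations, int4 per-group weights

x = torch.randn(2, 1024, dtype=torch.bfloat16, device="cuda")
y = model(x)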
@@ -44,9 +44,9 @@
 from .quant_api import (
     CutlassInt4PackedLayout,
     FbgemmConfig,
-    Float8ActivationInt4WeightConfig,
     Float8DynamicActivationFloat8SemiSparseWeightConfig,
     Float8DynamicActivationFloat8WeightConfig,
+    Float8DynamicActivationInt4WeightConfig,
     Float8MMConfig,
     Float8StaticActivationFloat8WeightConfig,
     Float8WeightOnlyConfig,
@@ -143,7 +143,7 @@
     "Int8DynamicActivationInt8WeightConfig",
     "Int8DynamicActivationIntxWeightConfig",
     "Int4WeightOnlyConfig",
-    "Float8ActivationInt4WeightConfig",
+    "Float8DynamicActivationInt4WeightConfig",
     "Int8WeightOnlyConfig",
     "Float8WeightOnlyConfig",
     "Float8DynamicActivationFloat8WeightConfig",
@@ -1252,7 +1252,7 @@ def _int4_weight_only_transform(
 
 
 @dataclass
-class Float8ActivationInt4WeightConfig(AOBaseConfig):
+class Float8DynamicActivationInt4WeightConfig(AOBaseConfig):
     """Configuration for apply float8 dynamic per row quantization and int4
     per group weight quantization to linear
 
@@ -1265,9 +1265,9 @@ class Float8ActivationInt4WeightConfig(AOBaseConfig):
     packing_format: PackingFormat = "preshuffled"
 
 
-@register_quantize_module_handler(Float8ActivationInt4WeightConfig)
-def _float8_activation_int4_weight_transform(
-    module: torch.nn.Module, config: Float8ActivationInt4WeightConfig
+@register_quantize_module_handler(Float8DynamicActivationInt4WeightConfig)
+def _float8_dynamic_activation_int4_weight_transform(
+    module: torch.nn.Module, config: Float8DynamicActivationInt4WeightConfig
 ) -> torch.nn.Module:
     assert hasattr(module, "weight"), (
         "applying int8 weight only quant requires module to have weight attribute"