
Commit f0f6392

fix kv cache test
Signed-off-by: Kyle Sayers <kylesayrs@gmail.com>
1 parent: 80a2639

File tree: 2 files changed (+8 −3 lines)

src/llmcompressor/modifiers/quantization/gptq/base.py
Lines changed: 2 additions & 2 deletions

@@ -158,8 +158,8 @@ def on_start(self, state: State, event: Event, **kwargs):
 
         if not added_hook:
             raise ValueError(
-                "GPTQModifier requires a quantization config be specified by this "
-                "modifier or a modifier preceding it"
+                "GPTQModifier requires a weight quantization config be specified by "
+                "this modifier or a modifier preceding it"
            )
 
     def on_event(self, state: State, event: Event, **kwargs):
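
For reference, a minimal sketch of a recipe that satisfies the requirement named in the new error message. It assumes the public llmcompressor oneshot API with an illustrative model id and calibration dataset; it is not part of this commit.

# Sketch only: GPTQModifier carries its own weight quantization scheme (W4A16),
# so on_start finds a weight config and the ValueError above is never raised.
from llmcompressor import oneshot
from llmcompressor.modifiers.quantization import GPTQModifier

recipe = GPTQModifier(targets="Linear", scheme="W4A16", ignore=["lm_head"])

oneshot(
    model="TinyLlama/TinyLlama-1.1B-Chat-v1.0",  # illustrative model id
    dataset="open_platypus",                     # illustrative calibration dataset
    recipe=recipe,
    max_seq_length=512,
    num_calibration_samples=64,
)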

tests/llmcompressor/transformers/kv_cache/test_kv_cache.py
Lines changed: 6 additions & 1 deletion

@@ -7,6 +7,7 @@
 from compressed_tensors.quantization.utils.helpers import iter_named_quantizable_modules
 from datasets import load_dataset
 from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
+from transformers.utils.quantization_config import CompressedTensorsConfig
 
 from llmcompressor import oneshot
 from llmcompressor.core import reset_session
@@ -236,7 +237,11 @@ def test_kv_cache_gptq_model_state_dict_attr(kv_cache_fixture, tmp_path):
     output_dir, _ = next(kv_cache_fixture(recipe, tmp_path))
 
     with init_empty_weights():
-        model = AutoModelForCausalLM.from_pretrained(output_dir)
+        # There is a bug in `apply_quantization_config`
+        model = AutoModelForCausalLM.from_pretrained(
+            output_dir,
+            quantization_config=CompressedTensorsConfig(run_compressed=False),
+        )
 
     counts = 0
     for name, submodule in iter_named_quantizable_modules(
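
For context, a minimal sketch of the load pattern the test now uses: run_compressed=False asks transformers to decompress the compressed-tensors weights at load time, working around the apply_quantization_config bug noted in the diff. The checkpoint path below is hypothetical.

# Sketch only: load a compressed-tensors checkpoint with weights decompressed.
from accelerate import init_empty_weights
from transformers import AutoModelForCausalLM
from transformers.utils.quantization_config import CompressedTensorsConfig

with init_empty_weights():  # build the model without allocating real weight memory
    model = AutoModelForCausalLM.from_pretrained(
        "path/to/kv_cache_checkpoint",  # hypothetical output_dir from the fixture
        quantization_config=CompressedTensorsConfig(run_compressed=False),
    )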
