2 files changed: +10 −3

- src/llmcompressor/modifiers/transform/quip
- tests/llmcompressor/modifiers/transform

src/llmcompressor/modifiers/transform/quip:

```diff
@@ -45,6 +45,7 @@ class QuIPModifier(Modifier):
     )
     randomize: bool = Field(default=False, exclude=True)
     learnable: bool = Field(default=False, exclude=True)
+    precision:
     ignore: Union[str, List[str]] = Field(default="lm_head", exclude=True)
 
     # optional override for more fine-grained control
```
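The added `precision` field is truncated in this capture; only `precision:` survives. Judging from the neighboring field declarations, it presumably selects the dtype used for the transform arithmetic, which would also explain the tightened MSE thresholds in the test change below. A minimal sketch of what such a field could look like, where the `torch.dtype` annotation and the `torch.float64` default are assumptions rather than text read from the diff:

```python
from typing import List, Union

import torch
from pydantic import BaseModel, Field


class QuIPModifier(BaseModel):
    """Stand-in for the real modifier (which extends llm-compressor's
    Modifier base class); only the fields visible in the diff are shown."""

    # torch.dtype is not a pydantic-native type, so arbitrary types
    # must be allowed for the annotation below to validate
    model_config = {"arbitrary_types_allowed": True}

    randomize: bool = Field(default=False, exclude=True)
    learnable: bool = Field(default=False, exclude=True)
    # Hypothetical completion of the truncated "+ precision:" line:
    # the dtype used when constructing/applying the Hadamard transforms.
    # Annotation and default are assumptions, not confirmed by the diff.
    precision: torch.dtype = Field(default=torch.float64, exclude=True)
    ignore: Union[str, List[str]] = Field(default="lm_head", exclude=True)


print(QuIPModifier().precision)  # torch.float64 under the assumed default
```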
tests/llmcompressor/modifiers/transform:

```diff
@@ -1,3 +1,4 @@
+import os
 import pytest
 import torch
 from transformers import AutoModelForCausalLM
@@ -8,16 +9,20 @@
 
 
 @requires_gpu
+# @pytest.mark.skipif(
+#     (not os.getenv("HF_TOKEN")),
+#     reason="Skipping tracing tests requiring gated model access",
+# )
 @pytest.mark.parametrize(
     "dtype,exp_mse",
     [
-        (torch.bfloat16, 1e-2),
-        (torch.float32, 1e-9),
+        (torch.bfloat16, 5e-3),
+        (torch.float32, 5e-11),
     ],
 )
 def test_apply_correctness(dtype, exp_mse):
     model = AutoModelForCausalLM.from_pretrained(
-        "meta-llama/Meta-Llama-3-8B-Instruct", device_map="cuda", torch_dtype=dtype
+        "meta-llama/Llama-3.2-1B-Instruct", device_map="cuda", torch_dtype=dtype
     )
     state = State(model=model)
     modifier = QuIPModifier(transform_type="random-hadamard")
@@ -32,4 +37,5 @@ def test_apply_correctness(dtype, exp_mse):
     with torch.no_grad():
         output = model(**input)
 
+    print(torch.nn.MSELoss()(output.logits, true_output.logits))
     assert torch.nn.MSELoss()(output.logits, true_output.logits) <= exp_mse
```
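The stretch of the test between constructing the `QuIPModifier` and the final comparison (old lines 24–31) is collapsed out of the diff. For orientation, here is a sketch of the overall shape of the correctness check; the import paths are inferred from the file tree above, and the lifecycle calls (`on_initialize`/`on_start`) and the `dummy_inputs` usage are assumptions about the hidden lines, not part of the diff:

```python
import torch
from transformers import AutoModelForCausalLM

# Import paths inferred from the file tree above; not shown in the diff
from llmcompressor.core import State
from llmcompressor.modifiers.transform import QuIPModifier

# The PR swaps the 8B model for this much smaller one
model = AutoModelForCausalLM.from_pretrained(
    "meta-llama/Llama-3.2-1B-Instruct", device_map="cuda", torch_dtype=torch.float32
)
state = State(model=model)
modifier = QuIPModifier(transform_type="random-hadamard")

# Reference logits before any transforms are applied (dummy_inputs usage
# is an assumption about the elided middle of the test)
input = {k: v.to("cuda") for k, v in model.dummy_inputs.items()}
with torch.no_grad():
    true_output = model(**input)

# Assumed lifecycle calls: apply the rotation transforms in place
modifier.on_initialize(state)
modifier.on_start(state, None)

with torch.no_grad():
    output = model(**input)

# Paired Hadamard rotations cancel analytically, so the transformed model
# should reproduce the original logits up to floating-point error; the PR
# tightens this bound to 5e-11 for fp32 (and 5e-3 for bf16), consistent
# with the transform math running at higher precision.
mse = torch.nn.MSELoss()(output.logits, true_output.logits)
assert mse <= 5e-11
```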