Commit a21648d

prepare for merge without spinquant
Signed-off-by: Kyle Sayers <[email protected]>
1 parent: a5d3ddc

9 files changed (+21, -478 lines)


examples/transform/quip_example.py

Lines changed: 1 addition & 1 deletion
@@ -7,7 +7,7 @@
 from llmcompressor.utils import dispatch_for_generation

 # Select model and load it.
-MODEL_ID = "meta-llama/Meta-Llama-3-8B-Instruct"
+MODEL_ID = "meta-llama/Llama-3.1-8B-Instruct"

 model = AutoModelForCausalLM.from_pretrained(
     MODEL_ID,
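
For orientation, a minimal sketch of how the example loads the new checkpoint; only MODEL_ID comes from this hunk, and the remaining from_pretrained arguments are assumptions:

    from transformers import AutoModelForCausalLM, AutoTokenizer

    MODEL_ID = "meta-llama/Llama-3.1-8B-Instruct"

    # Load the model and tokenizer named by the example (dtype handling here
    # is illustrative, not taken from the diff).
    model = AutoModelForCausalLM.from_pretrained(MODEL_ID, torch_dtype="auto")
    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)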

examples/transform/spinquant_example.py

Lines changed: 0 additions & 86 deletions
This file was deleted.

src/llmcompressor/modifiers/transform/__init__.py

Lines changed: 0 additions & 1 deletion

@@ -1,4 +1,3 @@
 # flake8: noqa

 from .quip import QuIPModifier
-from .spinquant import SpinQuantModifier
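
With this line removed, QuIPModifier is the only transform modifier the package exports. A quick sanity check of the post-commit import surface (a sketch, not part of the diff):

    from llmcompressor.modifiers.transform import QuIPModifier  # still exported

    # from llmcompressor.modifiers.transform import SpinQuantModifier
    # -> ImportError after this commit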

src/llmcompressor/modifiers/transform/quip/base.py

Lines changed: 7 additions & 3 deletions
@@ -21,7 +21,7 @@ class QuIPModifier(Modifier):
     [QuIP: 2-Bit Quantization of Large Language Models With Guarantees](https://arxiv.org/abs/2307.13304) # noqa: E501

     Transforms (rotations) are extra layers added to a model which reduce the accuracy
-    loss induced by quantization. This is achived through "rotating" weights and
+    loss induced by quantization. This is achieved through "rotating" weights and
     activations into a space with a smaller dynamic range of values, thus decreasing
     the range of scales required for quantization.
@@ -31,7 +31,7 @@ class QuIPModifier(Modifier):
     :param transform_type: The type of transform to apply to the model.
         `"hadamard"` has the least performance cost but only supports sizes which are
         powers of two.
-        `"random-matrix"` has more performance cost, but supports a much larger set of
+        `"random-hadamard"` has more performance cost, but supports a much larger set of
         sizes.
         `"random-matrix"` has the greatest performance cost, but supports any size
     :param randomize: If true, create distinct transforms for each application
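
The corrected docstring maps to three constructor choices. A sketch of the documented cost/coverage trade-off (constructor usage is illustrative, not from this commit):

    from llmcompressor.modifiers.transform import QuIPModifier

    QuIPModifier(transform_type="hadamard")         # least cost; power-of-two sizes only
    QuIPModifier(transform_type="random-hadamard")  # more cost; a much larger set of sizes
    QuIPModifier(transform_type="random-matrix")    # greatest cost; any size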
@@ -53,7 +53,9 @@ class QuIPModifier(Modifier):

     @field_validator("randomize", "learnable", mode="before")
     def validate_not_implemented(cls, value, info: ValidationInfo):
-        raise NotImplementedError(f"{info.field_name} is not supported right now")
+        if value:
+            raise NotImplementedError(f"{info.field_name} is not supported right now")
+        return value

     def on_initialize(self, state: State, **kwargs) -> bool:
         if self.transform_config is not None:
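
Before this fix the validator raised unconditionally, so even the defaults randomize=False and learnable=False could not pass validation; now only truthy values are rejected. A sketch of the fixed behavior (argument values are illustrative):

    from llmcompressor.modifiers.transform import QuIPModifier

    QuIPModifier(transform_type="hadamard")                  # defaults pass: falsy values are returned
    QuIPModifier(transform_type="hadamard", randomize=True)  # still raises NotImplementedError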
@@ -102,6 +104,7 @@ def _create_config(self) -> TransformConfig:
                 TransformArgs(
                     targets=["Linear"],
                     location="weight_input",
+                    # location="input",
                     inverse=True,
                     ignore=self.ignore,
                 ),
@@ -115,6 +118,7 @@
                 TransformArgs(
                     targets=["Linear"],
                     location="weight_output",
+                    # location="output",
                     ignore=self.ignore,
                 ),
                 TransformArgs(
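
The commented-out location="input" / location="output" lines appear to note alternative activation-side placements, while the merged config keeps rotations fused into weights. Either way, each transform is paired with its inverse so the layer computes the same function before quantization is applied. A minimal numerical sketch of that invariance (PyTorch; names and sizes are illustrative):

    import torch

    d = 8
    W = torch.randn(d, d)  # a Linear layer's weight
    x = torch.randn(d)     # an incoming activation

    # Stand-in orthogonal rotation (QR of a random matrix); the real modifier
    # builds Hadamard or random matrices according to transform_type.
    H, _ = torch.linalg.qr(torch.randn(d, d))

    y = W @ x
    y_rot = (W @ H) @ (H.T @ x)  # rotate the weight's input dim, invert on x
    assert torch.allclose(y, y_rot, atol=1e-5)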

src/llmcompressor/modifiers/transform/spinquant/__init__.py

Lines changed: 0 additions & 3 deletions
This file was deleted.

src/llmcompressor/modifiers/transform/spinquant/base.py

Lines changed: 0 additions & 235 deletions
This file was deleted.
