Fix svdquant restore

kevalmorabia97 · kevalmorabia97 · commit acecdb5ba659 · 2025-05-09T09:37:59.000+05:30
diff --git a/examples/llm_ptq/README.md b/examples/llm_ptq/README.md
@@ -117,7 +117,8 @@ ChatGLM2, 3 6B | No | No | Yes | No | -
 Bloom | Yes | Yes | Yes | Yes | -
 Phi-1,2,3,4 | Yes | Yes | Yes | Yes<sup>3</sup> |
 Phi-3.5 MOE | Yes | No | No | No | -
-Llama-Nemotron Super/Ultra | Yes | No | No | No | Yes
+Llama-Nemotron Super | Yes | No | No | No | Yes
+Llama-Nemotron Ultra | Yes | No | No | No | No
 Nemotron 8B | Yes | No | Yes | No | -
 Gemma 2B, 7B | Yes | No | Yes | Yes | -
 Gemma 2 9B, 27B | Yes<sup>2</sup> | No | Yes | No | -
diff --git a/modelopt/torch/quantization/conversion.py b/modelopt/torch/quantization/conversion.py
@@ -143,6 +143,7 @@ def create_and_replace_svdquant_linear_on_the_fly(model):
 def restore_svdquant_model(model: nn.Module, config: QuantizeConfig, metadata: MetadataDict):
     """Restore the svdquant states from the given state dict."""
     create_and_replace_svdquant_linear_on_the_fly(model)
+    restore_quantizer_state(model, config, metadata)
     return model
 
 
diff --git a/modelopt/torch/speculative/config.py b/modelopt/torch/speculative/config.py
@@ -134,7 +134,7 @@ class EagleConfig(ModeloptBaseConfig):
     ffn_hidden_size: int = ModeloptField(
         default=0,
         description=(
-            "ffn_hidden_size of the eagle module. Using base model's ffn_hidden_size is set to None."
+            "ffn_hidden_size of the eagle module. Using base model's ffn_hidden_size is set to 0."
         ),
     )
 
diff --git a/tests/_test_utils/torch_quantization/checkpointing.py b/tests/_test_utils/torch_quantization/checkpointing.py
@@ -22,10 +22,12 @@ def format_modelopt_checkpoint_by_version(modelopt_state: dict, version: str):
     if Version(version) >= Version("0.29"):
         return modelopt_state
     modelopt_state = copy.deepcopy(modelopt_state)
+    modelopt_state["modelopt_version"] = version
     for mode, state in modelopt_state["modelopt_state_dict"]:
         if "quantizer_state" not in state["metadata"]:
             continue
         for quantizer_name, quantizer_state in state["metadata"]["quantizer_state"].items():
+            quantizer_state["_mopt_ckpt_versn"] = version
             pyt_states = quantizer_state.pop("_pytorch_state_metadata", None)
             if pyt_states is None:
                 continue

Original file line number	Diff line number	Diff line change
`@@ -134,7 +134,7 @@ class EagleConfig(ModeloptBaseConfig):`
`134`	`134`	`ffn_hidden_size: int = ModeloptField(`
`135`	`135`	`default=0,`
`136`	`136`	`description=(`
`137`		`- "ffn_hidden_size of the eagle module. Using base model's ffn_hidden_size is set to None."`
	`137`	`+ "ffn_hidden_size of the eagle module. Using base model's ffn_hidden_size is set to 0."`
`138`	`138`	`),`
`139`	`139`	`)`
`140`	`140`