diff --git a/examples/llm_ptq/example_utils.py b/examples/llm_ptq/example_utils.py index 28d4fcf2c..014eb9625 100755 --- a/examples/llm_ptq/example_utils.py +++ b/examples/llm_ptq/example_utils.py @@ -526,10 +526,10 @@ def copy_custom_model_files(source_path: str, export_path: str, trust_remote_cod # Common patterns for custom model files that need to be copied custom_file_patterns = [ "configuration_*.py", - "modeling_*.py", + "modeling*.py", "tokenization_*.py", "processing_*.py", - "image_processing_*.py", + "image_processing*.py", "feature_extraction_*.py", "*.json", ] diff --git a/modelopt/torch/export/quant_utils.py b/modelopt/torch/export/quant_utils.py index 3e99a0e0a..b39f70748 100755 --- a/modelopt/torch/export/quant_utils.py +++ b/modelopt/torch/export/quant_utils.py @@ -849,6 +849,11 @@ def postprocess_state_dict(state_dict: dict, maxbound: float, quantization: str post_state_dict = {} for key, value in state_dict.items(): + # Skip problematic parameters for specific model architectures, e.g., Nemotron Nano VL models + if key == "vision_model.radio_model.summary_idxs": + logger.info(f"Removing problematic parameter: {key}") + continue + # Skip keys not related to quantizers if ( "output_quantizer" not in key