copy over json files in export path as well

Edwardf0t1 · Edwardf0t1 · commit 21fa47f5c44a · 2025-09-25T18:41:02.000Z
Signed-off-by: Zhiyu Cheng <zhiyuc@nvidia.com>
diff --git a/examples/llm_ptq/example_utils.py b/examples/llm_ptq/example_utils.py
@@ -345,7 +345,11 @@ def _resolve_model_path(model_name_or_path: str, trust_remote_code: bool = False
 
 
 def copy_custom_model_files(source_path: str, export_path: str, trust_remote_code: bool = False):
-    """Copy custom model files (configuration_*.py, modeling_*.py, etc.) from source to export directory.
+    """Copy custom model files (configuration_*.py, modeling_*.py, *.json, etc.) from source to export directory.
+
+    This function copies custom Python files and JSON configuration files that are needed for
+    models with custom code. It excludes config.json and model.safetensors.index.json as these
+    are typically handled separately by the model export process.
 
     Args:
         source_path: Path to the original model directory or HuggingFace model ID
@@ -383,12 +387,16 @@ def copy_custom_model_files(source_path: str, export_path: str, trust_remote_cod
         "processing_*.py",
         "image_processing_*.py",
         "feature_extraction_*.py",
+        "*.json",
     ]
 
     copied_files = []
     for pattern in custom_file_patterns:
         for file_path in source_dir.glob(pattern):
             if file_path.is_file():
+                # Skip config.json and model.safetensors.index.json as they're handled separately
+                if file_path.name in ["config.json", "model.safetensors.index.json"]:
+                    continue
                 dest_path = export_dir / file_path.name
                 try:
                     shutil.copy2(file_path, dest_path)
diff --git a/examples/llm_ptq/hf_ptq.py b/examples/llm_ptq/hf_ptq.py
@@ -612,7 +612,7 @@ def output_decode(generated_ids, input_shape):
                 inference_pipeline_parallel=args.inference_pipeline_parallel,
             )
 
-            # Copy custom model files for TensorRT-LLM export as well
+            # Copy custom model files (Python files and JSON configs) for TensorRT-LLM export
             copy_custom_model_files(args.pyt_ckpt_path, export_path, args.trust_remote_code)
         else:
             # Check arguments for unified_hf export format and set to default if unsupported arguments are provided
@@ -631,7 +631,7 @@ def output_decode(generated_ids, input_shape):
                 export_dir=export_path,
             )
 
-        # Copy custom model files (configuration_*.py, modeling_*.py, etc.) if trust_remote_code is used
+        # Copy custom model files (Python files and JSON configs) if trust_remote_code is used
         copy_custom_model_files(args.pyt_ckpt_path, export_path, args.trust_remote_code)
 
         # Restore default padding and export the tokenizer as well.

Original file line number	Diff line number	Diff line change
`@@ -612,7 +612,7 @@ def output_decode(generated_ids, input_shape):`
`612`	`612`	`inference_pipeline_parallel=args.inference_pipeline_parallel,`
`613`	`613`	`)`
`614`	`614`
`615`		`- # Copy custom model files for TensorRT-LLM export as well`
	`615`	`+ # Copy custom model files (Python files and JSON configs) for TensorRT-LLM export`
`616`	`616`	`copy_custom_model_files(args.pyt_ckpt_path, export_path, args.trust_remote_code)`
`617`	`617`	`else:`
`618`	`618`	`# Check arguments for unified_hf export format and set to default if unsupported arguments are provided`
`@@ -631,7 +631,7 @@ def output_decode(generated_ids, input_shape):`
`631`	`631`	`export_dir=export_path,`
`632`	`632`	`)`
`633`	`633`
`634`		`- # Copy custom model files (configuration_*.py, modeling_*.py, etc.) if trust_remote_code is used`
	`634`	`+ # Copy custom model files (Python files and JSON configs) if trust_remote_code is used`
`635`	`635`	`copy_custom_model_files(args.pyt_ckpt_path, export_path, args.trust_remote_code)`
`636`	`636`
`637`	`637`	`# Restore default padding and export the tokenizer as well.`