thuml · Haodong-Lei-Ray · Mar 14, 2025
diff --git a/inference/predict.py b/inference/predict.py
@@ -11,7 +11,7 @@
 from ivideogpt.vq_model import CompressiveVQModel
 from ivideogpt.transformer import HeadModelWithAction
 from utils import NPZParser
-
+from huggingface_hub import hf_hub_download
 device = 'cuda'
 
 
@@ -104,7 +104,9 @@ def main():
                                     tokens_num_per_dyna=tokens_per_dyna, 
                                     context=args.context_length,
                                     segment_length=args.segment_length).to(device)
-        state_dict = load_file(os.path.join(args.pretrained_model_name_or_path, 'transformer', 'model.safetensors'))
+        local_file_path = hf_hub_download(repo_id=args.pretrained_model_name_or_path, filename="transformer/model.safetensors")
+        state_dict = load_file(local_file_path)
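+        # NOTE(review): pretrained_model_name_or_path is now passed as a Hub repo id; the previous code read <path>/transformer/model.safetensors from a local directory -- confirm whether local paths must still be supported.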
         model.load_state_dict(state_dict, strict=True)
         assert model.llm.config.vocab_size == tokenizer.num_vq_embeddings + tokenizer.num_dyn_embeddings + 2
     else: