@@ -587,9 +587,9 @@ namespace vl
587587 int media_end_token_id;
588588 int media_pad_token_id;
589589
590- int video_max_frames = 20 ;
591- bool arbitrary_resolution = false ;
592- double fps = 1.0 ;
590+ int video_max_frames = 20 ;
591+ bool native_resolution = false ;
592+ double fps = 1.0 ;
593593 };
594594
595595 void ChatHistoryEncoder::append_ai (int round_idx, const std::string &ai, std::vector<int > &ids) const
@@ -686,7 +686,7 @@ namespace vl
686686 {
687687 Tokenizer *tok = dynamic_cast <Tokenizer *>(tokenizer);
688688 tok->video_max_frames = utils::get_opt (args, " video_max_frames" , tok->video_max_frames );
689- tok->arbitrary_resolution = utils::get_opt (args, " arbitrary_resolution " , false );
689+ tok->native_resolution = utils::get_opt (args, " native_resolution " , tok-> native_resolution );
690690 tok->fps = utils::get_opt (args, " fps" , tok->fps );
691691 }
692692
@@ -714,7 +714,7 @@ namespace vl
714714 std::unique_ptr<vision::Resize> resize;
715715 std::unique_ptr<vision::PreMaxImageSize> max_size;
716716
717- if (!tok->arbitrary_resolution )
717+ if (!tok->native_resolution )
718718 resize.reset (new vision::Resize (896 , 896 ));
719719
720720 // expand video into images
0 commit comments