@@ -133,7 +133,8 @@ static void common_params_handle_model_default(
133133 const std::string & model_url,
134134 std::string & hf_repo,
135135 std::string & hf_file,
136- const std::string & hf_token) {
136+ const std::string & hf_token,
137+ const std::string & model_default) {
137138 if (!hf_repo.empty ()) {
138139 // short-hand to avoid specifying --hf-file -> default it to --model
139140 if (hf_file.empty ()) {
@@ -163,7 +164,7 @@ static void common_params_handle_model_default(
163164 model = fs_get_cache_file (string_split<std::string>(f, ' /' ).back ());
164165 }
165166 } else if (model.empty ()) {
166- model = DEFAULT_MODEL_PATH ;
167+ model = model_default ;
167168 }
168169}
169170
@@ -299,8 +300,9 @@ static bool common_params_parse_ex(int argc, char ** argv, common_params_context
299300 }
300301
301302 // TODO: refactor model params in a common struct
302- common_params_handle_model_default (params.model , params.model_url , params.hf_repo , params.hf_file , params.hf_token );
303- common_params_handle_model_default (params.vocoder .model , params.vocoder .model_url , params.vocoder .hf_repo , params.vocoder .hf_file , params.hf_token );
303+ common_params_handle_model_default (params.model , params.model_url , params.hf_repo , params.hf_file , params.hf_token , DEFAULT_MODEL_PATH);
304+ common_params_handle_model_default (params.speculative .model , params.speculative .model_url , params.speculative .hf_repo , params.speculative .hf_file , params.hf_token , " " );
305+ common_params_handle_model_default (params.vocoder .model , params.vocoder .model_url , params.vocoder .hf_repo , params.vocoder .hf_file , params.hf_token , " " );
304306
305307 if (params.escape ) {
306308 string_process_escapes (params.prompt );
@@ -1637,6 +1639,13 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
16371639 params.hf_repo = value;
16381640 }
16391641 ).set_env (" LLAMA_ARG_HF_REPO" ));
1642+ add_opt (common_arg (
1643+ {" -hfd" , " -hfrd" , " --hf-repo-draft" }, " <user>/<model>[:quant]" ,
1644+ " Same as --hf-repo, but for the draft model (default: unused)" ,
1645+ [](common_params & params, const std::string & value) {
1646+ params.speculative .hf_repo = value;
1647+ }
1648+ ).set_env (" LLAMA_ARG_HFD_REPO" ));
16401649 add_opt (common_arg (
16411650 {" -hff" , " --hf-file" }, " FILE" ,
16421651 " Hugging Face model file. If specified, it will override the quant in --hf-repo (default: unused)" ,
@@ -2282,6 +2291,13 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
22822291 params.vocoder .model = value;
22832292 }
22842293 ).set_examples ({LLAMA_EXAMPLE_TTS, LLAMA_EXAMPLE_SERVER}));
2294+ add_opt (common_arg (
2295+ {" --tts-use-guide-tokens" },
2296+ " Use guide tokens to improve TTS word recall" ,
2297+ [](common_params & params) {
2298+ params.vocoder .use_guide_tokens = true ;
2299+ }
2300+ ).set_examples ({LLAMA_EXAMPLE_TTS, LLAMA_EXAMPLE_SERVER}));
22852301
22862302 // model-specific
22872303 add_opt (common_arg (
0 commit comments