@@ -674,7 +674,7 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
674674 ));
675675 add_opt (common_arg (
676676 {" --no-context-shift" },
677- string_format (" disables context shift on inifinite text generation (default: %s)" , params.ctx_shift ? " disabled" : " enabled" ),
677+ string_format (" disables context shift on infinite text generation (default: %s)" , params.ctx_shift ? " disabled" : " enabled" ),
678678 [](common_params & params) {
679679 params.ctx_shift = false ;
680680 }
@@ -2341,5 +2341,47 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
23412341 }
23422342 ).set_examples ({LLAMA_EXAMPLE_TTS}));
23432343
2344+ add_opt (common_arg (
2345+ {" --embd-bge-small-en-default" },
2346+ string_format (" use default bge-small-en-v1.5 model (note: can download weights from the internet)" ),
2347+ [](common_params & params) {
2348+ params.hf_repo = " ggml-org/bge-small-en-v1.5-Q8_0-GGUF" ;
2349+ params.hf_file = " bge-small-en-v1.5-q8_0.gguf" ;
2350+ params.pooling_type = LLAMA_POOLING_TYPE_NONE;
2351+ params.embd_normalize = 2 ;
2352+ params.n_ctx = 512 ;
2353+ params.verbose_prompt = true ;
2354+ params.embedding = true ;
2355+ }
2356+ ).set_examples ({LLAMA_EXAMPLE_EMBEDDING, LLAMA_EXAMPLE_SERVER}));
2357+
2358+ add_opt (common_arg (
2359+ {" --embd-e5-small-en-default" },
2360+ string_format (" use default e5-small-v2 model (note: can download weights from the internet)" ),
2361+ [](common_params & params) {
2362+ params.hf_repo = " ggml-org/e5-small-v2-Q8_0-GGUF" ;
2363+ params.hf_file = " e5-small-v2-q8_0.gguf" ;
2364+ params.pooling_type = LLAMA_POOLING_TYPE_NONE;
2365+ params.embd_normalize = 2 ;
2366+ params.n_ctx = 512 ;
2367+ params.verbose_prompt = true ;
2368+ params.embedding = true ;
2369+ }
2370+ ).set_examples ({LLAMA_EXAMPLE_EMBEDDING, LLAMA_EXAMPLE_SERVER}));
2371+
2372+ add_opt (common_arg (
2373+ {" --embd-gte-small-default" },
2374+ string_format (" use default gte-small model (note: can download weights from the internet)" ),
2375+ [](common_params & params) {
2376+ params.hf_repo = " ggml-org/gte-small-Q8_0-GGUF" ;
2377+ params.hf_file = " gte-small-q8_0.gguf" ;
2378+ params.pooling_type = LLAMA_POOLING_TYPE_NONE;
2379+ params.embd_normalize = 2 ;
2380+ params.n_ctx = 512 ;
2381+ params.verbose_prompt = true ;
2382+ params.embedding = true ;
2383+ }
2384+ ).set_examples ({LLAMA_EXAMPLE_EMBEDDING, LLAMA_EXAMPLE_SERVER}));
2385+
23442386 return ctx_arg;
23452387}
0 commit comments