Skip to content

Commit e07000b

Browse files
committed
squash! common : add default embeddings presets [no ci]
Default to Q8_0 quantization.
1 parent 19f2ff1 commit e07000b

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

common/arg.cpp

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -2329,7 +2329,7 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
2329 2329
string_format("use default bge-small-en-v1.5 model (note: can download weights from the internet)"),
2330 2330
[](common_params & params) {
2331 2331
params.hf_repo = "CompendiumLabs/bge-small-en-v1.5-gguf";
2332-
params.hf_file = "bge-small-en-v1.5-q4_k_m.gguf";
2332+
params.hf_file = "bge-small-en-v1.5-q8_0.gguf";
2333 2333
params.pooling_type = LLAMA_POOLING_TYPE_NONE;
2334 2334
params.embd_normalize = 2;
2335 2335
params.n_ctx = 512;
@@ -2343,7 +2343,7 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
2343 2343
string_format("use default e5-small-v2 model (note: can download weights from the internet)"),
2344 2344
[](common_params & params) {
2345 2345
params.hf_repo = "ChristianAzinn/e5-small-v2-gguf";
2346-
params.hf_file = "e5-small-v2.Q4_K_M.gguf";
2346+
params.hf_file = "e5-small-v2.Q8_0.gguf";
2347 2347
params.pooling_type = LLAMA_POOLING_TYPE_NONE;
2348 2348
params.embd_normalize = 2;
2349 2349
params.n_ctx = 512;
@@ -2357,7 +2357,7 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
2357 2357
string_format("use default gte-small model (note: can download weights from the internet)"),
2358 2358
[](common_params & params) {
2359 2359
params.hf_repo = "ChristianAzinn/gte-small-gguf";
2360-
params.hf_file = "gte-small.Q4_K_M.gguf";
2360+
params.hf_file = "gte-small.Q8_0.gguf";
2361 2361
params.pooling_type = LLAMA_POOLING_TYPE_NONE;
2362 2362
params.embd_normalize = 2;
2363 2363
params.n_ctx = 512;

0 commit comments

Comments
 (0)