2 files changed: +2 -1 lines changed
@@ -965,6 +965,7 @@ extern "C" {
965965 LLAMA_API int32_t llama_n_threads_batch (struct llama_context * ctx);
966966
967967 // Set whether the context outputs embeddings or not
968+ // TODO: rename to avoid confusion with llama_get_embeddings()
968969 LLAMA_API void llama_set_embeddings (struct llama_context * ctx, bool embeddings);
969970
970971 // Set whether to use causal attention or not
@@ -1933,7 +1933,7 @@ struct server_context {
19331933 // also we cannot split if the pooling would require any past tokens
19341934 bool can_split () const {
19351935 return
1936- !llama_get_embeddings (ctx) ||
1936+ !params_base. embedding ||
19371937 (llama_get_memory (ctx) && llama_pooling_type (ctx) == LLAMA_POOLING_TYPE_LAST);
19381938 }
19391939
You can’t perform that action at this time.
0 commit comments