Skip to content

Commit 23323cd

Browse files
committed
server : use 4 slots + unified KV by default
1 parent 290f6a9 commit 23323cd

File tree

1 file changed

+7
-0
lines changed

1 file changed

+7
-0
lines changed

tools/server/server.cpp

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4432,6 +4432,13 @@ int main(int argc, char ** argv) {
4432 4432
return 1;
4433 4433
}
4434 4434

4435+
if (params.n_parallel == 1 && params.kv_unified == false) {
4436+
LOG_WRN("%s: setting n_parallel = 4 and kv_unified = true\n", __func__);
4437+
4438+
params.n_parallel = 4;
4439+
params.kv_unified = true;
4440+
}
4441+
4435 4442
common_init();
4436 4443

4437 4444
// struct that contains llama context and inference

0 commit comments

Comments
 (0)