We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ba1aed3 commit 8826cf5 (Copy full SHA for 8826cf5)
examples/server/server.cpp
@@ -1331,8 +1331,8 @@ struct server_slot {
1331
}
1332
n_remaining = INT32_MAX;
1333
1334
- // The request or server have finite limits on the number of tokens to generate.
1335
- if ((params.n_predict != -1 && params.n_predict != -2) || (global_params.n_predict != -1 && global_params.n_predict != -2)) {
+ // The request or the server has specified a limit on the number of tokens to generate.
+ if ((params.n_predict >= 0) || (global_params.n_predict >= 0)) {
1336
n_remaining = std::min(n_remaining, params.n_predict - n_decoded);
1337
1338
0 commit comments