We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5fe8d72, commit b8000fd (Copy full SHA for b8000fd)
tools/server/server.cpp
@@ -3256,7 +3256,8 @@ struct server_context {
3256
3257
// entire prompt has been processed
3258
if (slot.n_past == slot.n_prompt_tokens) {
3259
- GGML_ASSERT(slot.cache_tokens.size() == slot.prompt_tokens.size());
+ // TODO @ngxson : this assertion fails sometimes, why?
3260
+ // GGML_ASSERT(slot.cache_tokens.size() == slot.prompt_tokens.size());
3261
3262
slot.state = SLOT_STATE_DONE_PROMPT;
3263
0 commit comments