Skip to content

Commit 689035c

Browse files
committed
on prompt processing done, assert cache_tokens.size
1 parent f10fc56 commit 689035c

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

tools/server/server.cpp

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -3256,6 +3256,8 @@ struct server_context {
32563256

32573257
// entire prompt has been processed
32583258
if (slot.n_past == slot.n_prompt_tokens) {
3259+
GGML_ASSERT(slot.cache_tokens.size() == slot.prompt_tokens.size());
3260+
32593261
slot.state = SLOT_STATE_DONE_PROMPT;
32603262

32613263
GGML_ASSERT(batch.n_tokens > 0);

0 commit comments

Comments
 (0)