Skip to content

Commit b7f9010

Browse files
authored
server : disable checkpoints with mtmd (ggml-org#17045)
1 parent 4882f0f commit b7f9010

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

tools/server/server.cpp

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3832,7 +3832,9 @@ struct server_context {
 // the largest pos_min required for a checkpoint to be useful
 const auto pos_min_thold = std::max(0, n_past - n_swa);
 
-if (n_past > 0 && n_past < slot.prompt.n_tokens()) {
+// note: disallow with mtmd contexts for now
+// https://github.com/ggml-org/llama.cpp/issues/17043
+if (!mctx && n_past > 0 && n_past < slot.prompt.n_tokens()) {
     const auto pos_min = llama_memory_seq_pos_min(llama_get_memory(ctx), slot.id);
     if (pos_min == -1) {
         SLT_ERR(slot, "n_past = %d, slot.prompt.tokens.size() = %d, seq_id = %d, pos_min = %d\n", n_past, (int) slot.prompt.tokens.size(), slot.id, pos_min);

0 commit comments

Comments
 (0)