From: Georgi Gerganov
Date: Thu, 6 Nov 2025 10:09:29 +0000 (+0200)
Subject: server : disable checkpoints with mtmd (#17045)
X-Git-Tag: upstream/0.0.7011~44
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=b7f9010d24766792d8887c227a883ed3b315d2be;p=pkg%2Fggml%2Fsources%2Fllama.cpp

server : disable checkpoints with mtmd (#17045)
---

diff --git a/tools/server/server.cpp b/tools/server/server.cpp
index f5089bef..0e1a9afc 100644
--- a/tools/server/server.cpp
+++ b/tools/server/server.cpp
@@ -3832,7 +3832,9 @@ struct server_context {
  // the largest pos_min required for a checkpoint to be useful
  const auto pos_min_thold = std::max(0, n_past - n_swa);
 
- if (n_past > 0 && n_past < slot.prompt.n_tokens()) {
+ // note: disallow with mtmd contexts for now
+ // https://github.com/ggml-org/llama.cpp/issues/17043
+ if (!mctx && n_past > 0 && n_past < slot.prompt.n_tokens()) {
      const auto pos_min = llama_memory_seq_pos_min(llama_get_memory(ctx), slot.id);
      if (pos_min == -1) {
          SLT_ERR(slot, "n_past = %d, slot.prompt.tokens.size() = %d, seq_id = %d, pos_min = %d\n", n_past, (int) slot.prompt.tokens.size(), slot.id, pos_min);