git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
server : send partial stop string when <EOG> is reached (#15007)
author matteo <redacted>
Thu, 23 Oct 2025 09:32:24 +0000 (11:32 +0200)
committer GitHub <redacted>
Thu, 23 Oct 2025 09:32:24 +0000 (12:32 +0300)
tools/server/server.cpp

index 8737fba124d50ffd7d24439a535c960e299c1528..85849e160e2b0fe278ecfa4fea7a2e945160a030 100644 (file)
@@ -2839,7 +2839,7 @@ struct server_context {
                     slot.generated_text.begin() + pos + stop_pos,
                     slot.generated_text.end());
                 pos = std::min(slot.n_sent_text, slot.generated_text.size());
-            } else if (slot.has_next_token) {
+            } else if (slot.has_next_token && !llama_vocab_is_eog(vocab, result.tok) ) {
                 stop_pos = slot.find_stopping_strings(str_test, token_str.size(), false);
                 send_text = stop_pos == std::string::npos;
             }