From: Georgi Gerganov Date: Fri, 12 Sep 2025 14:02:55 +0000 (+0300) Subject: server : adjust prompt similarity thold + add logs (#15913) X-Git-Tag: upstream/0.0.6527~72 X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=f088b6a84f6aed0abb619dbb9d375e726fc888a6;p=pkg%2Fggml%2Fsources%2Fllama.cpp server : adjust prompt similarity thold + add logs (#15913) ggml-ci --- diff --git a/common/common.h b/common/common.h index 85b3b879..74016874 100644 --- a/common/common.h +++ b/common/common.h @@ -452,7 +452,7 @@ struct common_params { std::string slot_save_path; - float slot_prompt_similarity = 0.5f; + float slot_prompt_similarity = 0.1f; // batched-bench params bool is_pp_shared = false; diff --git a/tools/server/server.cpp b/tools/server/server.cpp index 39ef439e..160b97cf 100644 --- a/tools/server/server.cpp +++ b/tools/server/server.cpp @@ -2372,7 +2372,7 @@ struct server_context { } if (ret != nullptr) { - SLT_DBG(*ret, "selected slot by lcs similarity, lcs_len = %d, similarity = %f\n", lcs_len, similarity); + SLT_INF(*ret, "selected slot by lcs similarity, lcs_len = %d, similarity = %.3f (> %.3f thold)\n", lcs_len, similarity, slot_prompt_similarity); } } @@ -2394,7 +2394,7 @@ struct server_context { } if (ret != nullptr) { - SLT_DBG(*ret, "selected slot by lru, t_last = %" PRId64 "\n", t_last); + SLT_INF(*ret, "selected slot by LRU, t_last = %" PRId64 "\n", t_last); } }