git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
server : fix duplicated n_predict key in the generation_settings (#8994)
author: Riceball LEE <redacted>
Thu, 15 Aug 2024 07:28:05 +0000 (15:28 +0800)
committer: GitHub <redacted>
Thu, 15 Aug 2024 07:28:05 +0000 (10:28 +0300)
examples/server/server.cpp

index 3fe0e6558b0874b33a8a28496a0d98dfb40bd97d..e073f5813d459f0a5f60548fde0e0871bc4072f9 100644 (file)
@@ -1321,7 +1321,7 @@ struct server_context {
 
         return json {
             {"n_ctx",                     slot.n_ctx},
-            {"n_predict",                 slot.n_predict},
+            {"n_predict",                 slot.n_predict},     // Server configured n_predict
             {"model",                     params.model_alias},
             {"seed",                      slot.sparams.seed},
             {"temperature",               slot.sparams.temp},
@@ -1343,7 +1343,7 @@ struct server_context {
             {"mirostat_eta",              slot.sparams.mirostat_eta},
             {"penalize_nl",               slot.sparams.penalize_nl},
             {"stop",                      slot.params.antiprompt},
-            {"n_predict",                 slot.params.n_predict}, // TODO: fix duplicate key n_predict
+            {"max_tokens",                slot.params.n_predict}, // User configured n_predict
             {"n_keep",                    slot.params.n_keep},
             {"n_discard",                 slot.params.n_discard},
             {"ignore_eos",                ignore_eos},