git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
Server: Handle n_keep parameter in the request (#6174)
author Karthick <redacted>
Wed, 20 Mar 2024 11:02:34 +0000 (16:32 +0530)
committer GitHub <redacted>
Wed, 20 Mar 2024 11:02:34 +0000 (12:02 +0100)
examples/server/utils.hpp

index 2ddb2cd21f8d6c4ce641125e6e7799294fecf7f9..cc5fce6918b07683a66156bd22d4a4ee881de9f4 100644 (file)
@@ -371,6 +371,7 @@ static json oaicompat_completion_params_parse(
     llama_params["repeat_last_n"]     = json_value(body,   "repeat_last_n",     default_sparams.penalty_last_n);
     llama_params["ignore_eos"]        = json_value(body,   "ignore_eos",        false);
     llama_params["tfs_z"]             = json_value(body,   "tfs_z",             default_sparams.tfs_z);
+    llama_params["n_keep"]            = json_value(body,   "n_keep",            0);
 
     if (body.count("grammar") != 0) {
         llama_params["grammar"] = json_value(body, "grammar", json::object());