git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
server : return error on too large embedding input (#7389)
author Georgi Gerganov <redacted>
Mon, 20 May 2024 05:56:05 +0000 (08:56 +0300)
committer GitHub <redacted>
Mon, 20 May 2024 05:56:05 +0000 (08:56 +0300)
examples/server/server.cpp

index 7978f979dde6670c10093735bdfc0f40e3a8b22d..6af5cb96e6d131a466cb026c524f553de9e0ec16 100644 (file)
@@ -1981,8 +1981,7 @@ struct server_context {
                                 slot.state = SLOT_STATE_PROCESSING;
                                 slot.command = SLOT_COMMAND_NONE;
                                 slot.release();
-                                slot.print_timings();
-                                send_final_response(slot);
+                                send_error(slot, "input is too large to process. increase the physical batch size", ERROR_TYPE_SERVER);
                                 continue;
                             }
                         } else {