From: Daniel Bevenius
Date: Wed, 14 May 2025 13:22:05 +0000 (+0200)
Subject: server : add --flash-attn usage output (#3152)
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=3882a099e18c9149efe0d8d046be3300f709e889;p=pkg%2Fggml%2Fsources%2Fwhisper.cpp

server : add --flash-attn usage output (#3152)

This commit adds the `--flash-attn` option to the usage output of the
server example.

The motivation for this change is that while it is possible to set this
option it is not printed in the usage output.
---

diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index 14462707..bf81f792 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -139,6 +139,7 @@ void whisper_print_usage(int /*argc*/, char ** argv, const whisper_params & para
     fprintf(stderr, " -nth N, --no-speech-thold N [%-7.2f] no speech threshold\n", params.no_speech_thold);
     fprintf(stderr, " -nc, --no-context [%-7s] do not use previous audio context\n", params.no_context ? "true" : "false");
     fprintf(stderr, " -ng, --no-gpu [%-7s] do not use gpu\n", params.use_gpu ? "false" : "true");
+    fprintf(stderr, " -fa, --flash-attn [%-7s] flash attention\n", params.flash_attn ? "true" : "false");
     fprintf(stderr, "\n");
 }