git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
llama : bump max seq limit from 64 to 256 (#15916)
author: Georgi Gerganov <redacted>
Thu, 18 Sep 2025 09:47:56 +0000 (12:47 +0300)
committer: GitHub <redacted>
Thu, 18 Sep 2025 09:47:56 +0000 (12:47 +0300)
ggml-ci

src/llama-cparams.h

index dbbaba9f6274cb0a5a96113e1f42396344c897e4..eae7b839f4857da2df56be6cd8d4d9a5fe362b7a 100644 (file)
@@ -4,7 +4,7 @@
 
 #include <cstdint>
 
-#define LLAMA_MAX_SEQ 64
+#define LLAMA_MAX_SEQ 256
 
 struct llama_cparams {
     uint32_t n_ctx;           // context size used during inference