From: Georgi Gerganov
Date: Fri, 24 Mar 2023 16:23:56 +0000 (+0200)
Subject: Temporary bump the memory buffer size - hopefully fix issues from 483bab2e
X-Git-Tag: gguf-v0.4.0~1124
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=31572d966531f7d768eb773322016ab78eb6e835;p=pkg%2Fggml%2Fsources%2Fllama.cpp

Temporary bump the memory buffer size - hopefully fix issues from 483bab2e
---

diff --git a/llama.cpp b/llama.cpp
index cdb86282..9a93409c 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -632,7 +632,7 @@ static bool llama_eval_internal(
     auto & mem_per_token = lctx.mem_per_token;
 
     // TODO: fix this hardcoded size
-    static size_t buf_size = 512u*1024*1024;
+    static size_t buf_size = 2048u*1024*1024; // TMP !!!
     static void * buf = malloc(buf_size);
 
     if (mem_per_token > 0 && mem_per_token*N > buf_size) {