From: klosax
Date: Wed, 7 Jun 2023 16:15:50 +0000 (+0200)
Subject: gpt-neox : fix ctx size calculation (#228)
X-Git-Tag: upstream/0.0.1642~1415
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=93a9af7d9828e0663bdb6c0f229885de6fbec766;p=pkg%2Fggml%2Fsources%2Fggml

gpt-neox : fix ctx size calculation (#228)
---

diff --git a/examples/gpt-neox/main.cpp b/examples/gpt-neox/main.cpp
index a53f98d5..2910da73 100644
--- a/examples/gpt-neox/main.cpp
+++ b/examples/gpt-neox/main.cpp
@@ -156,10 +156,10 @@ bool gpt_neox_model_load(const std::string & fname, gpt_neox_model & model, gpt_
     {
         const auto & hparams = model.hparams;
 
-        const int n_embd = hparams.n_embd;
-        const int n_layer = hparams.n_layer;
-        const int n_ctx = hparams.n_ctx;
-        const int n_vocab = hparams.n_vocab;
+        const size_t n_embd = hparams.n_embd;
+        const size_t n_layer = hparams.n_layer;
+        const size_t n_ctx = hparams.n_ctx;
+        const size_t n_vocab = hparams.n_vocab;
 
         ctx_size += n_embd*ggml_type_sizef(GGML_TYPE_F32); // ln_f_g
         ctx_size += n_embd*ggml_type_sizef(GGML_TYPE_F32); // ln_f_b
@@ -190,7 +190,7 @@ bool gpt_neox_model_load(const std::string & fname, gpt_neox_model & model, gpt_
         ctx_size += n_ctx*n_layer*n_embd*ggml_type_sizef(GGML_TYPE_F32); // memory_k
         ctx_size += n_ctx*n_layer*n_embd*ggml_type_sizef(GGML_TYPE_F32); // memory_v
 
-        ctx_size += (6 + 16*n_layer)*512; // object overhead
+        ctx_size += (6 + 16*n_layer)*1024; // object overhead
 
         printf("%s: ggml ctx size = %6.2f MB\n", __func__, ctx_size/(1024.0*1024.0));
     }
@@ -806,4 +806,4 @@ int main(int argc, char ** argv) {
     ggml_free(model.ctx);
 
     return 0;
-}
\ No newline at end of file
+}