git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
llama : print size and type of overridden tensors (#13364)
author Diego Devesa <redacted>
Thu, 8 May 2025 11:15:15 +0000 (13:15 +0200)
committer GitHub <redacted>
Thu, 8 May 2025 11:15:15 +0000 (13:15 +0200)
src/llama-model.cpp

index 7b66e2a03e38ec96415f2a40df0378cb5fc03ed0..1603eae1292c9eea376761ebffdd8f17aff472eb 100644 (file)
@@ -1651,8 +1651,11 @@ bool llama_model::load_tensors(llama_model_loader & ml) {
                 for (const auto * overrides = ml.tensor_buft_overrides; overrides->pattern != nullptr; ++overrides) {
                     std::regex pattern(overrides->pattern);
                     if (std::regex_search(tensor_name, pattern)) {
-                        LLAMA_LOG_DEBUG("tensor %s buffer type overriden to %s\n", tensor_name.c_str(), ggml_backend_buft_name(overrides->buft));
                         buft = overrides->buft;
+                        LLAMA_LOG_DEBUG("tensor %s (%zu MiB %s) buffer type overridden to %s\n",
+                                tensor_name.c_str(),
+                                ggml_nbytes(t_meta) / 1024 / 1024, ggml_type_name(t_meta->type),
+                                ggml_backend_buft_name(buft));
                         break;
                     }
                 }