git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
quantize : fix using combined imatrix GGUFs (multiple datasets) (#14973)
author Ed Addario <redacted>
Wed, 30 Jul 2025 19:11:56 +0000 (20:11 +0100)
committer GitHub <redacted>
Wed, 30 Jul 2025 19:11:56 +0000 (21:11 +0200)
tools/quantize/quantize.cpp

index 45c59ecb6fffe108b6ba74245fda11f73489ed2b..0e89a2b81b2a84b2fd5d0cae8cf69c1e2c8b2262 100644 (file)
@@ -311,7 +311,7 @@ static int load_imatrix(const std::string & imatrix_file, std::vector<std::strin
     int64_t n_datasets = gguf_get_arr_n(ctx_gguf, dataset_idx);
     imatrix_datasets.reserve(n_datasets);
     for (int64_t i = 0; i < n_datasets; ++i) {
-        imatrix_datasets.push_back(gguf_get_val_str(ctx_gguf, dataset_idx));
+        imatrix_datasets.push_back(gguf_get_arr_str(ctx_gguf, dataset_idx, i));
     }
     printf("%s: imatrix datasets=['%s'", __func__, imatrix_datasets[0].c_str());
     for (size_t i = 1; i < imatrix_datasets.size(); ++i) {