git.djapps.eu Git - pkg/ggml/sources/whisper.cpp/commitdiff
Corrected: changed s13 = src1->nb[3] instead of nb[2] (llama/18724)
author Michael Wand <redacted>
Sat, 10 Jan 2026 09:16:07 +0000 (01:16 -0800)
committer Georgi Gerganov <redacted>
Wed, 14 Jan 2026 07:11:59 +0000 (09:11 +0200)
ggml/src/ggml-cuda/mmq.cu

index ceb95758d20505d73527dcaeaedcdd742fd09c5b..c9aa7024a9c6b887b8ec882f03271302192bb861 100644 (file)
@@ -190,7 +190,7 @@ void ggml_cuda_mul_mat_q(
     {
         const int64_t s11 = src1->nb[1] / ts_src1;
         const int64_t s12 = src1->nb[2] / ts_src1;
-        const int64_t s13 = src1->nb[2] / ts_src1;
+        const int64_t s13 = src1->nb[3] / ts_src1;
 
         if (use_native_mxfp4) {
             quantize_mmq_mxfp4_cuda(src1_d, ids_src1.get(), src1_q8_1.get(), src0->type, ne10, s11, s12, s13,