git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
ggml : fix scalar implementation of Q4_1 dot
author Georgi Gerganov <redacted>
Sat, 20 May 2023 07:13:19 +0000 (10:13 +0300)
committer Georgi Gerganov <redacted>
Sat, 20 May 2023 07:13:19 +0000 (10:13 +0300)
ggml.c

diff --git a/ggml.c b/ggml.c
index 1cb89636a0b21e0e886d59bf13d28973a19d91e6..101cb733b29eb82687bbd9e4555a7696fb5c75ae 100644 (file)
--- a/ggml.c
+++ b/ggml.c
@@ -2481,7 +2481,7 @@ static void ggml_vec_dot_q4_1_q8_1(const int n, float * restrict s, const void *
             sumi += (v0 * y[i].qs[j]) + (v1 * y[i].qs[j + qk/2]);
         }
 
-        sumf += (GGML_FP16_TO_FP32(x[i]).d*y[i].d)*sumi + GGML_FP16_TO_FP32(x[i].m)*y[i].s;
+        sumf += (GGML_FP16_TO_FP32(x[i].d)*y[i].d)*sumi + GGML_FP16_TO_FP32(x[i].m)*y[i].s;
     }
 
     *s = sumf;