From: Georgi Gerganov
Date: Sat, 20 May 2023 07:13:19 +0000 (+0300)
Subject: ggml : fix scalar implementation of Q4_1 dot
X-Git-Tag: gguf-v0.4.0~738
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=4fd3e29297e3246a7be291932c115636fadb0f52;p=pkg%2Fggml%2Fsources%2Fllama.cpp

ggml : fix scalar implementation of Q4_1 dot
---

diff --git a/ggml.c b/ggml.c
index 1cb89636..101cb733 100644
--- a/ggml.c
+++ b/ggml.c
@@ -2481,7 +2481,7 @@ static void ggml_vec_dot_q4_1_q8_1(const int n, float * restrict s, const void *
             sumi += (v0 * y[i].qs[j]) + (v1 * y[i].qs[j + qk/2]);
         }
 
-        sumf += (GGML_FP16_TO_FP32(x[i]).d*y[i].d)*sumi + GGML_FP16_TO_FP32(x[i].m)*y[i].s;
+        sumf += (GGML_FP16_TO_FP32(x[i].d)*y[i].d)*sumi + GGML_FP16_TO_FP32(x[i].m)*y[i].s;
     }
 
     *s = sumf;