]> git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
Fix GGML_F32Cx8_STORE in AVX without F16C path (#619)
author: slaren <redacted>
Thu, 30 Mar 2023 09:16:30 +0000 (11:16 +0200)
committer: GitHub <redacted>
Thu, 30 Mar 2023 09:16:30 +0000 (11:16 +0200)
ggml.c

diff --git a/ggml.c b/ggml.c
index 02675ee67072d7668c3c018733cda1ca18927688..b7d79ab96fa6d44bc565872293e604dc09832a85 100644 (file)
--- a/ggml.c
+++ b/ggml.c
@@ -1297,7 +1297,7 @@ static inline void __avx_f32cx8_store(ggml_fp16_t *x, __m256 y) {
     _mm256_storeu_ps(arr, y);
 
     for (int i = 0; i < 8; i++)
-        x[i] = GGML_FP16_TO_FP32(arr[i]);
+        x[i] = GGML_FP32_TO_FP16(arr[i]);
 }
 #define GGML_F32Cx8_LOAD(x)     __avx_f32cx8_load(x)
 #define GGML_F32Cx8_STORE(x, y) __avx_f32cx8_store(x, y)