From: Georgi Gerganov
Date: Sat, 2 Mar 2024 18:00:49 +0000 (+0200)
Subject: ggml : fix IQ3_S AVX implementation (llama/5834)
X-Git-Tag: upstream/1.7.4~926
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=bd26876267b88a98447f7caf0faece3512636952;p=pkg%2Fggml%2Fsources%2Fwhisper.cpp

ggml : fix IQ3_S AVX implementation (llama/5834)

ggml-ci
---

diff --git a/ggml-quants.c b/ggml-quants.c
index 492a1b9a..2a8881d7 100644
--- a/ggml-quants.c
+++ b/ggml-quants.c
@@ -10231,7 +10231,7 @@ void ggml_vec_dot_iq3_s_q8_K (int n, float * GGML_RESTRICT s, size_t bs, const v
 //const __m256i q2_2 = _mm256_i32gather_epi32((const int *)iq3s_grid, idx.vec[1], 4);
 const __m256i q2_1 = _mm256_set_epi32(
     iq3s_grid[idx.index[7]], iq3s_grid[idx.index[6]], iq3s_grid[idx.index[5]], iq3s_grid[idx.index[4]],
-    iq3s_grid[idx.index[3]], iq3s_grid[idx.index[1]], iq3s_grid[idx.index[1]], iq3s_grid[idx.index[0]]
+    iq3s_grid[idx.index[3]], iq3s_grid[idx.index[2]], iq3s_grid[idx.index[1]], iq3s_grid[idx.index[0]]
 );
 const __m256i q2_2 = _mm256_set_epi32(
     iq3s_grid[idx.index[15]], iq3s_grid[idx.index[14]], iq3s_grid[idx.index[13]], iq3s_grid[idx.index[12]],