From: Georgi Gerganov
Date: Sat, 13 May 2023 14:40:58 +0000 (+0300)
Subject: cuda : fix convert function (#1412)
X-Git-Tag: gguf-v0.4.0~760
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=08737ef720f0510c7ec2aa84d7f70c691073c35d;p=pkg%2Fggml%2Fsources%2Fllama.cpp

cuda : fix convert function (#1412)
---

diff --git a/ggml-cuda.cu b/ggml-cuda.cu
index b6a7754d..eb9f0df5 100644
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -414,7 +414,7 @@ static dequantize_mul_mat_vec_cuda_t ggml_get_dequantize_mul_mat_vec_cuda(ggml_t
         case GGML_TYPE_Q8_0:
             return dequantize_mul_mat_vec_q8_0_cuda;
         case GGML_TYPE_F16:
-            return dequantize_mul_mat_vec_q8_0_cuda;
+            return convert_mul_mat_vec_f16_cuda;
         default:
             return nullptr;
     }