From: slaren
Date: Mon, 25 Mar 2024 14:43:22 +0000 (+0100)
Subject: cuda : fix LLAMA_CUDA_F16 build (#6298)
X-Git-Tag: upstream/0.0.4488~1958
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=2f34b865b62b1d2b5eb8a27885e4de220deeacbd;p=pkg%2Fggml%2Fsources%2Fllama.cpp

cuda : fix LLAMA_CUDA_F16 build (#6298)
---

diff --git a/ggml-cuda/dmmv.cu b/ggml-cuda/dmmv.cu
index f91732df..7156c921 100644
--- a/ggml-cuda/dmmv.cu
+++ b/ggml-cuda/dmmv.cu
@@ -1,5 +1,6 @@
 #include "dmmv.cuh"
 #include "dequantize.cuh"
+#include "convert.cuh"
 
 // dmmv = dequantize_mul_mat_vec
 #ifndef GGML_CUDA_DMMV_X