From 964c96b2dad1555973c8e84f38dba89aa2044d7e Mon Sep 17 00:00:00 2001
From: slaren
Date: Mon, 25 Mar 2024 15:43:22 +0100
Subject: [PATCH] cuda : fix LLAMA_CUDA_F16 build (#6298)

---
 ggml-cuda/dmmv.cu | 1 +
 1 file changed, 1 insertion(+)

diff --git a/ggml-cuda/dmmv.cu b/ggml-cuda/dmmv.cu
index f91732df56143..7156c9219e31e 100644
--- a/ggml-cuda/dmmv.cu
+++ b/ggml-cuda/dmmv.cu
@@ -1,5 +1,6 @@
 #include "dmmv.cuh"
 #include "dequantize.cuh"
+#include "convert.cuh"
 
 // dmmv = dequantize_mul_mat_vec
 #ifndef GGML_CUDA_DMMV_X