diff --git a/ggml-cuda/dmmv.cu b/ggml-cuda/dmmv.cu index f91732df56143..7156c9219e31e 100644 --- a/ggml-cuda/dmmv.cu +++ b/ggml-cuda/dmmv.cu @@ -1,5 +1,6 @@ #include "dmmv.cuh" #include "dequantize.cuh" +#include "convert.cuh" // dmmv = dequantize_mul_mat_vec #ifndef GGML_CUDA_DMMV_X