From 210e4691149d694ecdd8f5e7eb8a96855ef98a28 Mon Sep 17 00:00:00 2001
From: slaren
Date: Mon, 25 Mar 2024 15:31:10 +0100
Subject: [PATCH] cuda : fix LLAMA_CUDA_F16 build

---
 ggml-cuda/dmmv.cu | 1 +
 1 file changed, 1 insertion(+)

diff --git a/ggml-cuda/dmmv.cu b/ggml-cuda/dmmv.cu
index f91732df5..7156c9219 100644
--- a/ggml-cuda/dmmv.cu
+++ b/ggml-cuda/dmmv.cu
@@ -1,5 +1,6 @@
 #include "dmmv.cuh"
 #include "dequantize.cuh"
+#include "convert.cuh"
 
 // dmmv = dequantize_mul_mat_vec
 #ifndef GGML_CUDA_DMMV_X