cuda : fix LLAMA_CUDA_F16 build

This commit is contained in:
slaren 2024-03-25 15:31:10 +01:00
parent ae1f211ce2
commit 210e469114

View File

@@ -1,5 +1,6 @@
#include "dmmv.cuh"
#include "dequantize.cuh"
#include "convert.cuh"
// dmmv = dequantize_mul_mat_vec
#ifndef GGML_CUDA_DMMV_X