cuda : fix LLAMA_CUDA_F16 build (#6298)

This commit is contained in:
slaren 2024-03-25 15:43:22 +01:00 committed by GitHub
parent ae1f211ce2
commit 2f34b865b6
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -1,5 +1,6 @@
#include "dmmv.cuh" #include "dmmv.cuh"
#include "dequantize.cuh" #include "dequantize.cuh"
#include "convert.cuh"
// dmmv = dequantize_mul_mat_vec // dmmv = dequantize_mul_mat_vec
#ifndef GGML_CUDA_DMMV_X #ifndef GGML_CUDA_DMMV_X