Mirror of https://github.com/ggerganov/llama.cpp.git (synced 2025-01-13 13:52:22 +01:00)
cuda : fix LLAMA_CUDA_F16 build
This commit is contained in:
parent
ae1f211ce2
commit
210e469114
@@ -1,5 +1,6 @@
|
||||
#include "dmmv.cuh"
|
||||
#include "dequantize.cuh"
|
||||
#include "convert.cuh"
|
||||
|
||||
// dmmv = dequantize_mul_mat_vec
|
||||
#ifndef GGML_CUDA_DMMV_X
|
||||
|
Loading…
x
Reference in New Issue
Block a user