mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-13 13:52:22 +01:00
cuda : fix LLAMA_CUDA_F16 build
This commit is contained in:
parent
ae1f211ce2
commit
210e469114
@ -1,5 +1,6 @@
|
|||||||
#include "dmmv.cuh"
|
#include "dmmv.cuh"
|
||||||
#include "dequantize.cuh"
|
#include "dequantize.cuh"
|
||||||
|
#include "convert.cuh"
|
||||||
|
|
||||||
// dmmv = dequantize_mul_mat_vec
|
// dmmv = dequantize_mul_mat_vec
|
||||||
#ifndef GGML_CUDA_DMMV_X
|
#ifndef GGML_CUDA_DMMV_X
|
||||||
|
Loading…
x
Reference in New Issue
Block a user