mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-25 13:58:46 +01:00
cuda : fix convert function (#1412)
This commit is contained in:
parent
bda4d7c215
commit
08737ef720
@@ -414,7 +414,7 @@ static dequantize_mul_mat_vec_cuda_t ggml_get_dequantize_mul_mat_vec_cuda(ggml_t
         case GGML_TYPE_Q8_0:
             return dequantize_mul_mat_vec_q8_0_cuda;
         case GGML_TYPE_F16:
-            return dequantize_mul_mat_vec_q8_0_cuda;
+            return convert_mul_mat_vec_f16_cuda;
         default:
             return nullptr;
     }
Loading…
Reference in New Issue
Block a user