cuda : fix convert function (#1412)

This commit is contained in:
Georgi Gerganov 2023-05-13 17:40:58 +03:00
parent bda4d7c215
commit 08737ef720

View File

@ -414,7 +414,7 @@ static dequantize_mul_mat_vec_cuda_t ggml_get_dequantize_mul_mat_vec_cuda(ggml_t
case GGML_TYPE_Q8_0: case GGML_TYPE_Q8_0:
return dequantize_mul_mat_vec_q8_0_cuda; return dequantize_mul_mat_vec_q8_0_cuda;
case GGML_TYPE_F16: case GGML_TYPE_F16:
return dequantize_mul_mat_vec_q8_0_cuda; return convert_mul_mat_vec_f16_cuda;
default: default:
return nullptr; return nullptr;
} }