cuda : re-add q4_0

This commit is contained in:
Georgi Gerganov 2024-08-14 13:37:03 +03:00
parent 503983a69a
commit 62d7b6c87f
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735
2 changed files with 8 additions and 3 deletions

View File

@ -29,9 +29,9 @@ void ggml_cuda_op_mul_mat_q(
const mmq_args args = {src0_dd_i, src1_ddq_i, dst_dd_i, ne00, row_diff, stride00, src1_padded_row_size, src1_ncols, ne11, nrows_dst};
switch (src0->type) {
// case GGML_TYPE_Q4_0:
// mul_mat_q_case<GGML_TYPE_Q4_0>(ctx, args, stream);
// break;
case GGML_TYPE_Q4_0:
mul_mat_q_case<GGML_TYPE_Q4_0>(ctx, args, stream);
break;
// case GGML_TYPE_Q4_1:
// mul_mat_q_case<GGML_TYPE_Q4_1>(ctx, args, stream);
// break;

View File

@ -0,0 +1,5 @@
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
// Any lasting change to this file belongs in generate_cu_files.py, since manual edits
// would be lost the next time the generator runs.
// DECL_MMQ_CASE is defined outside this file (pulled in via ../mmq.cuh below).
#include "../mmq.cuh"
// NOTE(review): presumably this provides the mul_mat_q_case<GGML_TYPE_Q4_0> instance
// that the GGML_TYPE_Q4_0 branch of ggml_cuda_op_mul_mat_q dispatches to — confirm
// against the DECL_MMQ_CASE definition in mmq.cuh.
DECL_MMQ_CASE(GGML_TYPE_Q4_0);