ggml-cpu: fix typo in gemv/gemm iq4_nl_4_4 (#10580)

This commit is contained in:
Shupei Fan 2024-11-29 21:49:02 +08:00 committed by GitHub
parent 0f77aae560
commit 4b3242bbea
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -1020,7 +1020,7 @@ void ggml_gemv_iq4_nl_4x4_q8_0(int n, float * restrict s, size_t bs, const void
float * res_ptr = s; float * res_ptr = s;
for (int x = 0; x < nc / ncols_interleaved; x++) { for (int x = 0; x < nc / ncols_interleaved; x++) {
const block_q4_0x4 * b_ptr = (const block_q4_0x4 *) vx + (x * nb); const block_iq4_nlx4 * b_ptr = (const block_iq4_nlx4 *) vx + (x * nb);
float32x4_t sumf = vdupq_n_f32(0); float32x4_t sumf = vdupq_n_f32(0);
for (int l = 0; l < nb; l++) { for (int l = 0; l < nb; l++) {
@@ -3507,7 +3507,7 @@ void ggml_gemm_iq4_nl_4x4_q8_0(int n, float * restrict s, size_t bs, const void
for (int y = 0; y < nr / 4; y++) { for (int y = 0; y < nr / 4; y++) {
const block_q8_0x4 * a_ptr = (const block_q8_0x4 *) vy + (y * nb); const block_q8_0x4 * a_ptr = (const block_q8_0x4 *) vy + (y * nb);
for (int x = 0; x < nc / ncols_interleaved; x++) { for (int x = 0; x < nc / ncols_interleaved; x++) {
const block_q4_0x4 * b_ptr = (const block_q4_0x4 *) vx + (x * nb); const block_iq4_nlx4 * b_ptr = (const block_iq4_nlx4 *) vx + (x * nb);
float32x4_t sumf[4]; float32x4_t sumf[4];
for (int m = 0; m < 4; m++) { for (int m = 0; m < 4; m++) {