mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-26 14:20:31 +01:00
ggml-cpu: fix typo in gemv/gemm iq4_nl_4_4 (#10580)
This commit is contained in:
parent
0f77aae560
commit
4b3242bbea
@@ -1020,7 +1020,7 @@ void ggml_gemv_iq4_nl_4x4_q8_0(int n, float * restrict s, size_t bs, const void
|
|||||||
float * res_ptr = s;
|
float * res_ptr = s;
|
||||||
|
|
||||||
for (int x = 0; x < nc / ncols_interleaved; x++) {
|
for (int x = 0; x < nc / ncols_interleaved; x++) {
|
||||||
const block_q4_0x4 * b_ptr = (const block_q4_0x4 *) vx + (x * nb);
|
const block_iq4_nlx4 * b_ptr = (const block_iq4_nlx4 *) vx + (x * nb);
|
||||||
|
|
||||||
float32x4_t sumf = vdupq_n_f32(0);
|
float32x4_t sumf = vdupq_n_f32(0);
|
||||||
for (int l = 0; l < nb; l++) {
|
for (int l = 0; l < nb; l++) {
|
||||||
@@ -3507,7 +3507,7 @@ void ggml_gemm_iq4_nl_4x4_q8_0(int n, float * restrict s, size_t bs, const void
|
|||||||
for (int y = 0; y < nr / 4; y++) {
|
for (int y = 0; y < nr / 4; y++) {
|
||||||
const block_q8_0x4 * a_ptr = (const block_q8_0x4 *) vy + (y * nb);
|
const block_q8_0x4 * a_ptr = (const block_q8_0x4 *) vy + (y * nb);
|
||||||
for (int x = 0; x < nc / ncols_interleaved; x++) {
|
for (int x = 0; x < nc / ncols_interleaved; x++) {
|
||||||
const block_q4_0x4 * b_ptr = (const block_q4_0x4 *) vx + (x * nb);
|
const block_iq4_nlx4 * b_ptr = (const block_iq4_nlx4 *) vx + (x * nb);
|
||||||
|
|
||||||
float32x4_t sumf[4];
|
float32x4_t sumf[4];
|
||||||
for (int m = 0; m < 4; m++) {
|
for (int m = 0; m < 4; m++) {
|
||||||
|
Loading…
Reference in New Issue
Block a user