iq3_s_mult: back to blocks of 32

2025-01-30 05:43:03 +01:00 · 2024-03-03 18:50:26 +02:00 · 2024-03-03 18:50:26 +02:00 · e5e72562c5
commit e5e72562c5
parent f4cb4eac45
1 changed file with 1 addition and 1 deletion
--- a/ggml-quants.h
+++ b/ggml-quants.h
@@ -201,7 +201,7 @@ typedef struct {
 static_assert(sizeof(block_iq3_xxs) == sizeof(ggml_fp16_t) + 3*(QK_K/8), "wrong iq3_xxs block size/padding");

 // 3.4375 bpw
-#define IQ3S_BLOCK_SIZE 16
+#define IQ3S_BLOCK_SIZE 32
 #if QK_K == 64
 #define IQ3S_N_SCALE 2
 #else