mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-01 00:39:00 +01:00
iq3_s_mult: another alternative multiplier
This commit is contained in:
parent
8b713a987e
commit
dbe98dfe70
@ -2374,8 +2374,8 @@ static __global__ void dequantize_block_iq3_xxs(const void * __restrict__ vx, ds
|
|||||||
// Better (lower PPL), but requires more bit twiddling, so slower
|
// Better (lower PPL), but requires more bit twiddling, so slower
|
||||||
#define IQ3S_MULTIPLIER 190842953LL
|
#define IQ3S_MULTIPLIER 190842953LL
|
||||||
#else
|
#else
|
||||||
//#define IQ3S_MULTIPLIER 898886
|
#define IQ3S_MULTIPLIER 898886
|
||||||
#define IQ3S_MULTIPLIER 842866
|
//#define IQ3S_MULTIPLIER 842866
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
template<typename dst_t>
|
template<typename dst_t>
|
||||||
|
@ -4125,8 +4125,8 @@ void dequantize_row_iq3_xxs(const block_iq3_xxs * restrict x, float * restrict y
|
|||||||
// Best PPL
|
// Best PPL
|
||||||
#define IQ3S_MULTIPLIER 190842953
|
#define IQ3S_MULTIPLIER 190842953
|
||||||
#else
|
#else
|
||||||
//#define IQ3S_MULTIPLIER 898886
|
#define IQ3S_MULTIPLIER 898886
|
||||||
#define IQ3S_MULTIPLIER 842866
|
//#define IQ3S_MULTIPLIER 842866
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
#define IQ3S_BITS 3
|
#define IQ3S_BITS 3
|
||||||
|
Loading…
Reference in New Issue
Block a user