mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-13 05:42:22 +01:00
Single load for half2
This commit is contained in:
parent
4a481556e6
commit
cb3fb42046
@ -4321,8 +4321,9 @@ static void dequantize_block_q4_K(const void * __restrict__ vx, dst_t * __restri
|
|||||||
|
|
||||||
dst_t * y = yy + i*QK_K + 64*il + n*ir;
|
dst_t * y = yy + i*QK_K + 64*il + n*ir;
|
||||||
|
|
||||||
const float dall = x[i].dm[0];
|
const sycl::half2 dm = x[i].dm;
|
||||||
const float dmin = x[i].dm[1];
|
const float dall = dm[0];
|
||||||
|
const float dmin = dm[1];
|
||||||
|
|
||||||
const uint8_t * q = x[i].qs + 32*il + n*ir;
|
const uint8_t * q = x[i].qs + 32*il + n*ir;
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user