mirror of https://github.com/ggerganov/llama.cpp.git (synced 2024-12-26 14:20:31 +01:00)
parent 8a56075b07
commit eedd42e376
@@ -10702,7 +10702,7 @@ static void llama_kv_cache_defrag_internal(struct llama_context & lctx) {
     // each move requires 6*n_layer tensors (see build_defrag)
     //   - source view, destination view, copy operation
     //   - x2 for keys and values
-    const uint32_t max_moves = LLAMA_MAX_NODES/(6*n_layer);
+    const uint32_t max_moves = (LLAMA_MAX_NODES - 2*n_layer)/(6*n_layer);
 
     // determine which KV cells to move where
     //
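The new formula reserves 2*n_layer nodes of headroom out of the graph-node budget before dividing the remainder among moves, so the defrag graph stays under the limit. Below is a minimal sketch of that arithmetic, assuming LLAMA_MAX_NODES is 8192 and an 80-layer model; both values are illustrative assumptions, not taken from the commit.

#include <cstdint>
#include <cstdio>

// Illustrative values only -- not taken from the commit.
#define LLAMA_MAX_NODES 8192          // assumed graph-node limit
static const uint32_t n_layer = 80;   // e.g. a large, 80-layer model (assumption)

int main() {
    // before: divide the whole node budget by the 6*n_layer tensors per move
    const uint32_t max_moves_old = LLAMA_MAX_NODES/(6*n_layer);
    // after: subtract 2*n_layer first, leaving that many nodes of headroom
    const uint32_t max_moves_new = (LLAMA_MAX_NODES - 2*n_layer)/(6*n_layer);

    // with these values the old count plus 2*n_layer extra nodes exceeds the
    // limit, while the new count stays within it
    std::printf("old: %u moves -> %u move nodes + %u extra = %u (limit %u)\n",
                max_moves_old, 6*n_layer*max_moves_old, 2*n_layer,
                6*n_layer*max_moves_old + 2*n_layer, (uint32_t) LLAMA_MAX_NODES);
    std::printf("new: %u moves -> %u move nodes + %u reserved = %u (limit %u)\n",
                max_moves_new, 6*n_layer*max_moves_new, 2*n_layer,
                6*n_layer*max_moves_new + 2*n_layer, (uint32_t) LLAMA_MAX_NODES);
    return 0;
}

With these assumed numbers the old formula allows 17 moves (8160 + 160 = 8320 nodes, over the 8192 limit), while the new one allows 16 moves (7680 + 160 = 7840 nodes, within the limit).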