Compare commits

...
Sign in to create a new pull request.

1 commit

Author SHA1 Message Date
Pierrick HYMBERT
eedd42e376 KV Cache defrag hash overflow - TMP Fix by @slaren
#6685
2024-04-16 10:24:34 +02:00

View file

@@ -10702,7 +10702,7 @@ static void llama_kv_cache_defrag_internal(struct llama_context & lctx) {
// each move requires 6*n_layer tensors (see build_defrag)
// - source view, destination view, copy operation
// - x2 for keys and values
-const uint32_t max_moves = LLAMA_MAX_NODES/(6*n_layer);
+const uint32_t max_moves = (LLAMA_MAX_NODES - 2*n_layer)/(6*n_layer);
// determine which KV cells to move where
//