From 60781f0a2bd8ec3aa8444b453cca978de27e24ef Mon Sep 17 00:00:00 2001
From: Pierrick HYMBERT <pierrick.hymbert@gmail.com>
Date: Sat, 24 Feb 2024 11:13:31 +0100
Subject: [PATCH] server: tests - add explanation about KV Cache.

---
 examples/server/tests/features/server.feature | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/examples/server/tests/features/server.feature b/examples/server/tests/features/server.feature
index a98d92c09..fedcfe5ae 100644
--- a/examples/server/tests/features/server.feature
+++ b/examples/server/tests/features/server.feature
@@ -6,6 +6,9 @@ Feature: llama.cpp server
     And   a model file stories260K.gguf
     And   a model alias tinyllama-2
     And   42 as server seed
+      # The KV cache size is the total number of tokens that can be
+      # stored across all independent sequences (see #4130).
+      # See also the --ctx-size option and #5568.
     And   32 KV cache size
     And   1 slots
     And   embeddings extraction