mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-11-11 10:36:54 +00:00
context : prepare kv_cache_read/write to be moved to kv_cache
ggml-ci
This commit is contained in:
@@ -44,6 +44,7 @@ struct llama_kv_cache_slot_info {
 // ring-buffer of cached KV data
 // TODO: pimpl
 // TODO: add notion of max sequences
 struct llama_kv_cache {
     bool has_shift = false;
     bool do_defrag = false;

Reference in New Issue
Block a user