mirror of https://github.com/ggml-org/llama.cpp.git
cont : update todos [no ci]
@@ -2699,7 +2699,7 @@ struct server_context {
     // return true if at least one slot has been purged
     // TODO: improve logic
-    //       - smarter decision which slot to purge
-    //       - move slot to level 2 cache instead of removing?
+    //       - smarter decision which slot to purge (LRU or longest prompt?)
+    //       - instead of purging, try to store and resume later?
     bool try_purge_idle_slots() {
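The updated TODO names two candidate criteria for picking the purge victim: least-recently-used order and prompt length. Below is a minimal standalone sketch of such a heuristic. The slot_info struct, its fields, and pick_slot_to_purge are hypothetical stand-ins for the server's real slot bookkeeping, not llama.cpp API:

// Sketch of the "smarter purge decision" the TODO hints at.
// slot_info is a hypothetical simplification of a server slot.
#include <cstdint>
#include <cstdio>
#include <vector>

struct slot_info {
    int     id;
    bool    is_idle;         // holds a cached prompt but no active request
    int64_t t_last_used_us;  // timestamp of last activity
    size_t  n_prompt_tokens; // size of the cached prompt
};

// Pick the idle slot to purge: least-recently-used first; among equally
// old slots, prefer the longest prompt, since purging it frees the most
// KV-cache memory.
static int pick_slot_to_purge(const std::vector<slot_info> & slots) {
    int best = -1;
    for (size_t i = 0; i < slots.size(); ++i) {
        const auto & s = slots[i];
        if (!s.is_idle) {
            continue;
        }
        if (best < 0 ||
            s.t_last_used_us <  slots[best].t_last_used_us ||
            (s.t_last_used_us == slots[best].t_last_used_us &&
             s.n_prompt_tokens > slots[best].n_prompt_tokens)) {
            best = (int) i;
        }
    }
    return best; // -1 if no idle slot exists
}

int main() {
    std::vector<slot_info> slots = {
        {0, true,  100,  512},
        {1, false,  50,  900}, // busy: never purged
        {2, true,  100, 2048}, // as old as slot 0 but larger -> preferred
    };
    printf("purge slot %d\n", pick_slot_to_purge(slots)); // prints 2
    return 0;
}

The tie-break toward the longest prompt matches the trade-off the TODO raises: each purge should recover as much KV-cache memory as possible, while the LRU ordering protects slots most likely to be reused.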
@@ -4159,7 +4159,7 @@ struct server_context {
                     std::string err;

                     if (n_batch == 1 && ret == 1) {
-                        // TODO: try to terminate only the largest active slot and continue
+                        // TODO: try to terminate only the largest active slot/sequence and continue with the rest
                        // need to remove the tokens from the current batch too
                        err = "Context size has been exceeded.";
                    }
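The second TODO sketches a finer-grained recovery path: instead of failing everything when the context is exceeded, terminate only the largest active slot/sequence and, as the follow-up comment notes, remove its tokens from the current batch before continuing with the rest. A minimal sketch of that batch filtering, assuming a simplified batch_entry type in place of the real llama_batch:

// Sketch of evicting the largest sequence from a pending batch so the
// remaining sequences can still be decoded. batch_entry is a hypothetical
// simplification, not llama.cpp's batch API.
#include <algorithm>
#include <cstdio>
#include <map>
#include <vector>

struct batch_entry {
    int token;
    int seq_id; // which slot/sequence this token belongs to
};

// Remove all tokens of the sequence contributing the most tokens to the
// batch; return that sequence id (or -1 if the batch is empty).
static int evict_largest_sequence(std::vector<batch_entry> & batch) {
    std::map<int, size_t> counts;
    for (const auto & e : batch) {
        counts[e.seq_id]++;
    }
    int    victim = -1;
    size_t best   = 0;
    for (const auto & [seq, n] : counts) {
        if (n > best) {
            best   = n;
            victim = seq;
        }
    }
    batch.erase(std::remove_if(batch.begin(), batch.end(),
        [victim](const batch_entry & e) { return e.seq_id == victim; }),
        batch.end());
    return victim;
}

int main() {
    std::vector<batch_entry> batch = {
        {1, 0}, {2, 0}, {3, 1}, {4, 1}, {5, 1}, {6, 2},
    };
    const int victim = evict_largest_sequence(batch);
    printf("terminated seq %d, %zu tokens left\n", victim, batch.size());
    // -> terminated seq 1, 3 tokens left; the caller would then report
    //    "Context size has been exceeded." for that slot only and retry
    //    decoding the reduced batch.
    return 0;
}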