Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-11-16 11:27:03 +00:00)
server : fix "can batch with" bug (#17263)
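Previously, `slot_batched` was assigned to the first processing slot the loop encountered, before the remaining checks in the loop body had a chance to `continue` past it. A slot that ended up contributing nothing to the batch could therefore become the reference slot, and later slots would be rejected by `can_batch_with()` against it. The fix moves the assignment to the end of the loop body, so only a slot that made it through the whole iteration becomes the reference for subsequent compatibility checks.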
@@ -3591,13 +3591,13 @@ struct server_context {
         // next, batch any pending prompts without exceeding n_batch
         if (params_base.cont_batching || batch.n_tokens == 0) {
             for (auto & slot : slots) {
+                if (!slot.is_processing()) {
+                    continue;
+                }
+
                 // check if we can batch this slot with the previous one
-                if (slot.is_processing()) {
-                    if (!slot_batched) {
-                        slot_batched = &slot;
-                    } else if (!slot_batched->can_batch_with(slot)) {
-                        continue;
-                    }
+                if (slot_batched && !slot_batched->can_batch_with(slot)) {
+                    continue;
                 }
 
                 // this slot still has a prompt to be processed
@@ -4028,6 +4028,10 @@ struct server_context {
                     }
                 }
 
+                if (!slot_batched) {
+                    slot_batched = &slot;
+                }
+
                 if (batch.n_tokens >= n_batch) {
                     break;
                 }
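To make the behavioral change concrete, below is a minimal, self-contained C++ sketch of the scheduling pattern the fix establishes. Everything in it (`Slot`, `seq_group`, `can_batch_with` as a free function, the `pending_tokens` skip) is a hypothetical stand-in for the server's real types and checks, not the actual API:

#include <cstdio>
#include <vector>

// Hypothetical stand-ins for the server's slot/batch state.
struct Slot {
    int  id;
    int  seq_group;      // slots are assumed batchable only within the same group
    bool processing;
    int  pending_tokens;
};

static bool can_batch_with(const Slot & a, const Slot & b) {
    return a.seq_group == b.seq_group;
}

int main() {
    std::vector<Slot> slots = {
        { 0, /*seq_group=*/1, /*processing=*/true, /*pending_tokens=*/0 }, // nothing to add
        { 1, /*seq_group=*/2, true, 8 },
        { 2, /*seq_group=*/2, true, 8 },
    };

    const int n_batch = 16;
    int n_tokens = 0;

    const Slot * slot_batched = nullptr;

    for (auto & slot : slots) {
        if (!slot.processing) {
            continue;
        }

        // compare against the reference slot, but only if one has actually
        // contributed to this batch (the fixed behavior)
        if (slot_batched && !can_batch_with(*slot_batched, slot)) {
            continue;
        }

        if (slot.pending_tokens == 0) {
            continue; // stand-in for the elided mid-loop skip conditions
        }

        n_tokens += slot.pending_tokens;
        printf("batched slot %d (%d tokens)\n", slot.id, slot.pending_tokens);

        // record the reference slot only after the slot really joined the batch
        if (!slot_batched) {
            slot_batched = &slot;
        }

        if (n_tokens >= n_batch) {
            break;
        }
    }
}

Under the old logic, slot 0 would have become the reference slot despite contributing nothing, and the group-2 slots would then be skipped by the compatibility check; with the assignment deferred, slots 1 and 2 batch together as intended.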