kv-cache : fix find_slot to not search for continuous slot (#15638)

ggml-ci
This commit is contained in:
Georgi Gerganov
2025-08-28 17:09:05 +03:00
committed by GitHub
parent 84ab83cc0b
commit c8d0d14e77

View File

@@ -540,7 +540,7 @@ llama_kv_cache::slot_info_vec_t llama_kv_cache::prepare(const std::vector<llama_
for (const auto & ubatch : ubatches) {
// only find a suitable slot for the ubatch. don't modify the cells yet
-const auto sinfo_new = find_slot(ubatch, true);
+const auto sinfo_new = find_slot(ubatch, false);
if (sinfo_new.empty()) {
success = false;
break;