batch : fix consistency checks for the input positions (#16890)

commit 8da3c0e200 (parent c22473b580)
Author: Georgi Gerganov
Date:   2025-10-31 13:50:33 +02:00 (committed by GitHub)


@@ -261,6 +261,7 @@ bool llama_batch_allocr::init(
             const llama_pos p0 = memory ? memory->seq_pos_max(s) : -1;
+            if (batch.token) {
                 if (p0 >= 0 && p0 >= seq_pos_min(s)) {
                     LLAMA_LOG_ERROR(
                             "%s: the tokens of sequence %d in the input batch have inconsistent sequence positions:\n"
@@ -271,6 +272,19 @@ bool llama_batch_allocr::init(
                     return false;
                 }
+            } else {
+                // embedding inputs can have overlapping positions
+                if (p0 >= 0 && p0 > seq_pos_min(s)) {
+                    LLAMA_LOG_ERROR(
+                            "%s: the tokens of sequence %d in the input batch have inconsistent sequence positions:\n"
+                            " - the last position stored in the memory module of the context (i.e. the KV cache) for sequence %d is X = %d\n"
+                            " - the tokens for sequence %d in the input batch have a starting position of Y = %d\n"
+                            " for M-RoPE, it is required that the position satisfies: X <= Y\n",
+                            __func__, s, s, p0, s, seq_pos_min(s));
+                    return false;
+                }
+            }
         }
     } else {
         for (uint32_t s = 0; s < n_seq_max; ++s) {
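For context, the rule the changed hunk enforces can be summarized as: token inputs must start strictly after the last position already stored for the sequence in the memory module (X < Y), while embedding inputs (the M-RoPE case) may overlap the last cached position (X <= Y). Below is a minimal standalone sketch of that rule, not the llama.cpp implementation; the helper name positions_consistent and its parameters are assumptions made for illustration only.

// Minimal illustrative sketch (not the actual llama.cpp code).
// p0 stands for the last position X already stored in the KV cache for a
// sequence; seq_pos_min stands for the smallest position Y that the sequence
// uses in the incoming batch.
#include <cstdio>

static bool positions_consistent(int p0, int seq_pos_min, bool is_token_batch) {
    if (p0 < 0) {
        return true; // nothing cached yet for this sequence - any start is fine
    }
    if (is_token_batch) {
        // token inputs must continue strictly after the cached positions: X < Y
        return p0 < seq_pos_min;
    }
    // embedding inputs (e.g. M-RoPE vision embeddings) may overlap the last
    // cached position, so only X <= Y is required
    return p0 <= seq_pos_min;
}

int main() {
    // last cached position X = 10, batch starts at Y = 10
    std::printf("token batch,     X=10, Y=10 -> %s\n", positions_consistent(10, 10, true)  ? "ok" : "error");
    std::printf("embedding batch, X=10, Y=10 -> %s\n", positions_consistent(10, 10, false) ? "ok" : "error");
    // batch starts at Y = 11 - consistent for both kinds of input
    std::printf("token batch,     X=10, Y=11 -> %s\n", positions_consistent(10, 11, true)  ? "ok" : "error");
    return 0;
}

With these inputs the sketch reports an error only for the token batch that starts at the already-cached position, which matches the distinction the patch introduces between the token and embedding branches.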