graph : fix reuse check for recurrent inputs

This commit is contained in:
Georgi Gerganov
2025-10-10 10:44:41 +03:00
parent 12a9751d46
commit a126bc48a7
2 changed files with 14 additions and 1 deletions

View File

@@ -234,6 +234,10 @@ public:
ggml_tensor * s_copy_extra; // I32 [n_rs - n_seqs]
const llama_memory_recurrent_context * mctx;
// used in view offsets; these must match for valid graph reuse
uint32_t head;
int32_t rs_z;
};
class llm_graph_input_cross_embd : public llm_graph_input_i {