llama : remove implicit recurrent state rollbacks

This commit is contained in:
Francis Couture-Harpin
2024-11-24 20:35:30 -05:00
parent 124c222f76
commit 8006f3b3c8
25 changed files with 411 additions and 1119 deletions

View File

@@ -111,7 +111,7 @@ if llama_decode(context, batch) != 0 {
}
for i in 1 ..< n_parallel {
-llama_past_seq_cp(context, 0, Int32(i), -1, -1)
+llama_kv_cache_seq_cp(context, 0, Int32(i), -1, -1)
}
if n_parallel > 1 {