Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-10-30 08:42:00 +00:00)
llama : add new llama_decode() API that works with llama_batch
@@ -434,7 +434,7 @@ struct llama_server_context
             {
                 n_eval = params.n_batch;
             }
-            if (llama_eval(ctx, &embd[n_past], n_eval, n_past, params.n_threads))
+            if (llama_decode(ctx, llama_batch_get_one(&embd[n_past], n_eval, n_past, 0), params.n_threads))
             {
                 LOG_ERROR("failed to eval", {
                     {"n_eval", n_eval},
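
For readers migrating their own code, a minimal sketch of the evaluation loop around this change, using the signatures exactly as they appear in the diff: llama_batch_get_one(tokens, n_tokens, pos_0, seq_id) and a llama_decode that still takes n_threads (in later versions the thread count moved out of this call and into the context). The function name eval_tokens and its parameter list are illustrative, not part of this commit:

#include <vector>
#include "llama.h"

// Sketch only: decode a pending token buffer in chunks of at most n_batch
// tokens, the pattern this commit migrates the server loop to. A nonzero
// llama_decode return is treated as failure, as in the diff above.
static bool eval_tokens(llama_context * ctx, std::vector<llama_token> & embd,
                        int & n_past, int n_batch, int n_threads) {
    while (n_past < (int) embd.size()) {
        int n_eval = (int) embd.size() - n_past;
        if (n_eval > n_batch) {
            n_eval = n_batch;
        }
        // Wrap the next n_eval tokens, starting at position n_past on
        // sequence 0, into a single-sequence llama_batch and decode it,
        // replacing the old llama_eval(ctx, tokens, n_tokens, n_past, n_threads).
        if (llama_decode(ctx, llama_batch_get_one(&embd[n_past], n_eval, n_past, 0), n_threads)) {
            return false; // decode failed
        }
        n_past += n_eval;
    }
    return true;
}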