rework, targeting llama-server

2025-11-02 09:12:03 +00:00 · 2025-02-14 18:16:49 +01:00
parent 4ed4fe75ed
commit f2e59a8eb9
10 changed files with 191 additions and 136 deletions
--- a/src/llama-batch.h
+++ b/src/llama-batch.h
@@ -20,6 +20,8 @@
 //
 struct llama_batch {
    int32_t n_tokens;
+    int32_t max_tokens;
+    bool is_view;

    llama_token  *  token;
    float        *  embd;