rework, targeting llama-server

This commit is contained in:
Xuan Son Nguyen
2025-02-14 18:16:49 +01:00
parent 4ed4fe75ed
commit f2e59a8eb9
10 changed files with 191 additions and 136 deletions

View File

@@ -20,6 +20,8 @@
//
struct llama_batch {
int32_t n_tokens;
int32_t max_tokens;
bool is_view;
llama_token * token;
float * embd;