llama : bump max seq limit from 64 to 256 (#15916)

ggml-ci
commit e58174cecb
parent b213fce89b
Author: Georgi Gerganov (committed by GitHub)
Date: 2025-09-18 12:47:56 +03:00


--- a/src/llama-cparams.h
+++ b/src/llama-cparams.h
@@ -4,7 +4,7 @@
 
 #include <cstdint>
 
-#define LLAMA_MAX_SEQ 64
+#define LLAMA_MAX_SEQ 256
 
 struct llama_cparams {
     uint32_t n_ctx;           // context size used during inference
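
For context, a minimal sketch (not part of this commit) of how a caller could take advantage of the raised limit through the public API. The field n_seq_max and the functions llama_context_default_params and llama_init_from_model are from llama.h; the concrete values chosen below are illustrative assumptions, and the exact validation of out-of-range n_seq_max values is not shown in this diff:

    #include "llama.h"

    // Create a context that multiplexes up to 256 parallel sequences,
    // a value the previous LLAMA_MAX_SEQ of 64 would have rejected.
    // Assumes `model` is an already loaded llama_model.
    llama_context * make_parallel_ctx(llama_model * model) {
        llama_context_params cparams = llama_context_default_params();
        cparams.n_ctx     = 8192; // total context shared across sequences (illustrative)
        cparams.n_seq_max = 256;  // now within the LLAMA_MAX_SEQ = 256 cap
        return llama_init_from_model(model, cparams);
    }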