	llama-run : fix context size (#11094)
Set `n_ctx` equal to `n_batch` in the `Opt` class. The context size now defaults to a more reasonable 2048.

Signed-off-by: Eric Curtin <ecurtin@redhat.com>
@@ -83,6 +83,7 @@ class Opt {
         }
 
         ctx_params.n_batch        = context_size >= 0 ? context_size : context_size_default;
+        ctx_params.n_ctx          = ctx_params.n_batch;
         model_params.n_gpu_layers = ngl >= 0 ? ngl : ngl_default;
         temperature               = temperature >= 0 ? temperature : temperature_default;
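For readers outside the llama-run source, here is a minimal standalone sketch of the pattern the patch applies, using the public `llama.h` API. The helper name `make_ctx_params` is hypothetical, and the 2048 default comes from the commit message; the surrounding code in llama-run's `Opt` class differs in detail.

#include "llama.h"

// Hypothetical helper illustrating the fix: derive n_batch from the
// requested context size (or a 2048 default), then keep n_ctx in sync
// with n_batch instead of leaving it at the library default.
llama_context_params make_ctx_params(int context_size /* < 0 = use default */) {
    const int context_size_default = 2048;

    llama_context_params params = llama_context_default_params();
    params.n_batch = context_size >= 0 ? context_size : context_size_default;
    params.n_ctx   = params.n_batch;  // the one-line fix from this commit
    return params;
}

Before the fix, `n_ctx` was never set, so the context kept the library default regardless of the requested batch size; tying it to `n_batch` makes the two consistent.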