speculative : add --draft CLI arg

2025-11-15 11:17:31 +00:00 · 2023-09-03 13:51:07 +03:00
parent a15ca746c7
commit 847896aba7
3 changed files with 11 additions and 3 deletions
--- a/examples/speculative/speculative.cpp
+++ b/examples/speculative/speculative.cpp
@@ -84,7 +84,7 @@ int main(int argc, char ** argv) {
    //GGML_ASSERT(n_vocab == llama_n_vocab(ctx_dft));

    // how many tokens to draft each time
-    const int n_draft = 16;
+    const int n_draft = params.n_draft;

    int n_predict = 0;
    int n_drafted = 0;