parallel : example for serving multiple users in parallel

2025-11-03 09:22:01 +00:00 · 2023-09-18 20:30:05 +03:00
parent 1f17ea631c
commit 0161372b9a
9 changed files with 262 additions and 13 deletions
--- a/examples/perplexity/perplexity.cpp
+++ b/examples/perplexity/perplexity.cpp
@@ -681,7 +681,7 @@ int main(int argc, char ** argv) {
        return 1;
    }

-    params.perplexity = true;
+    params.logits_all = true;
    params.n_batch = std::min(params.n_batch, params.n_ctx);

    if (params.ppl_stride > 0) {