export llama_timings as struct and expose them in server

2025-11-01 09:01:57 +00:00 · 2023-07-04 21:52:04 -04:00
parent a76ce02a6c
commit 30d973dc42
7 changed files with 1631 additions and 1309 deletions
--- a/examples/server/public/completion.js
+++ b/examples/server/public/completion.js
@@ -72,6 +72,9 @@ export async function* llama(prompt, params = {}, config = {}) {

      // if we got a stop token from server, we will break here
      if (result.data.stop) {
+        if (result.data.generation_settings) {
+          generation_settings = result.data.generation_settings;
+        }
        break;
      }
    }