llama: print memory breakdown on exit (#15860)

* llama: print memory breakdown on exit
2025-10-27 08:21:30 +00:00 · 2025-09-24 16:53:48 +02:00
parent f2a789e334
commit e789095502
18 changed files with 243 additions and 12 deletions
--- a/src/llama-kv-cache.h
+++ b/src/llama-kv-cache.h
@@ -121,6 +121,8 @@ public:
    llama_pos seq_pos_min(llama_seq_id seq_id) const override;
    llama_pos seq_pos_max(llama_seq_id seq_id) const override;

+    std::map<ggml_backend_buffer_type_t, size_t> memory_breakdown() const override;
+
    // state write/load

    void state_write(llama_io_write_i & io, llama_seq_id seq_id = -1, llama_state_seq_flags flags = 0) const override;