ggml : add ggml_flash_attn_ext_get_prec

2025-11-14 11:07:10 +00:00 · 2024-11-06 15:09:47 +02:00
parent 5c333e0140
commit 22a9311a1a
3 changed files with 17 additions and 5 deletions
--- a/ggml/include/ggml.h
+++ b/ggml/include/ggml.h
@@ -1746,6 +1746,9 @@ extern "C" {
            struct ggml_tensor * a,
            enum ggml_prec       prec);

+    GGML_API enum ggml_prec ggml_flash_attn_ext_get_prec( // NOTE(review): presumably reports the precision previously configured on flash-attn-ext tensor `a` - confirm against the definition
+            const struct ggml_tensor * a);                // `a` is taken through a pointer-to-const: the declaration does not permit writing through it
+
    // TODO: needs to be adapted to ggml_flash_attn_ext
    GGML_API struct ggml_tensor * ggml_flash_attn_back(
           struct ggml_context * ctx,