diff --git a/ggml/include/ggml.h b/ggml/include/ggml.h index c1ed1a21c8..25916b2847 100644 --- a/ggml/include/ggml.h +++ b/ggml/include/ggml.h @@ -2220,7 +2220,7 @@ extern "C" { struct ggml_tensor * a, int k); -#define GGML_KQ_MASK_PAD 64 +#define GGML_KQ_MASK_PAD 1 // q: [n_embd_k, n_batch, n_head, ne3 ] // k: [n_embd_k, n_kv, n_head_kv, ne3 ]