diff --git a/ggml/include/ggml.h b/ggml/include/ggml.h index 36b23dc6d0..95d47aa168 100644 --- a/ggml/include/ggml.h +++ b/ggml/include/ggml.h @@ -2152,7 +2152,7 @@ extern "C" { struct ggml_tensor * a, int k); -#define GGML_KQ_MASK_PAD 64 +#define GGML_KQ_MASK_PAD 1 // q: [n_embd_k, n_batch, n_head, ne3 ] // k: [n_embd_k, n_kv, n_head_kv, ne3 ]