mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-10-28 08:31:25 +00:00
ggml : remove KQ mask padding
This commit is contained in:
@@ -2152,7 +2152,7 @@ extern "C" {
|
|||||||
struct ggml_tensor * a,
|
struct ggml_tensor * a,
|
||||||
int k);
|
int k);
|
||||||
|
|
||||||
#define GGML_KQ_MASK_PAD 64
|
#define GGML_KQ_MASK_PAD 1
|
||||||
|
|
||||||
// q: [n_embd_k, n_batch, n_head, ne3 ]
|
// q: [n_embd_k, n_batch, n_head, ne3 ]
|
||||||
// k: [n_embd_k, n_kv, n_head_kv, ne3 ]
|
// k: [n_embd_k, n_kv, n_head_kv, ne3 ]
|
||||||
|
|||||||
Reference in New Issue
Block a user