context : reuse build_attn_mha

ggml-ci
This commit is contained in:
Georgi Gerganov
2025-02-24 11:18:40 +02:00
parent a5a85a3bc0
commit 4a1054b552
5 changed files with 109 additions and 167 deletions

View File

@@ -107,13 +107,10 @@ public:
// Virtual hook for building attention; returns a ggml_tensor pointer.
// The definition is not visible here, so the parameter notes below are
// inferred from names and types only and must be confirmed against it.
//
//   ctx0, gf            - ggml context and compute graph handed to the builder
//   wo, wo_b            - presumably the output projection weight and its bias
//   q_cur, k_cur, v_cur - presumably the current query / key / value tensors
//   kq_b                - presumably a bias tensor for the K*Q product
//   n_tokens            - presumably the number of tokens being processed
//   kq_scale            - presumably the scale applied to the K*Q product
//   il                  - presumably the layer index
//
// NOTE(review): this listing comes from a diff hunk (-107,13 +107,10) whose
// +/- markers are not visible, so the parameter list may combine removed and
// added lines - verify against the actual header before relying on it.
virtual ggml_tensor * build_attn(
ggml_context * ctx0,
ggml_cgraph * gf,
ggml_tensor * wo,
ggml_tensor * wo_b,
ggml_tensor * q_cur,
ggml_tensor * k_cur,
ggml_tensor * v_cur,
ggml_tensor * kq_b,
int32_t n_tokens,
float kq_scale,
int il);