diff --git a/src/llama-model.cpp b/src/llama-model.cpp index 38e8c2812f..8e579d8e88 100644 --- a/src/llama-model.cpp +++ b/src/llama-model.cpp @@ -9741,7 +9741,7 @@ struct llm_build_context { struct ggml_tensor * kq_b = build_pos_bias(pos_bucket_enc, attn_rel_b); cur = build_attn_with_kq_b(gf, - model.layers[il].wo, model.layers[il].bo, + model.layers[il].wo_enc, nullptr, Qcur, Kcur, Vcur, kq_b, n_tokens, 1.0f, il); cb(cur, "kqv_out", il); }