mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-11-01 09:01:57 +00:00
metal : fix unused warning
This commit is contained in:
@@ -2175,7 +2175,7 @@ kernel void kernel_flash_attn_ext_f16(
|
|||||||
|
|
||||||
const short D4 = D/4;
|
const short D4 = D/4;
|
||||||
const short D8 = D/8;
|
const short D8 = D/8;
|
||||||
const short Q8 = Q/8;
|
//const short Q8 = Q/8;
|
||||||
const short NW = N_SIMDWIDTH;
|
const short NW = N_SIMDWIDTH;
|
||||||
const short SH = (C + Q); // shared memory per simdgroup in (half)
|
const short SH = (C + Q); // shared memory per simdgroup in (half)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user