mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	metal : fix unused warning
This commit is contained in:
		| @@ -2175,7 +2175,7 @@ kernel void kernel_flash_attn_ext_f16( | ||||
|  | ||||
|     const short D4 = D/4; | ||||
|     const short D8 = D/8; | ||||
|-    const short Q8 = Q/8; | ||||
|+  //const short Q8 = Q/8; | ||||
|     const short NW = N_SIMDWIDTH; | ||||
|     const short SH = (C + Q); // shared memory per simdgroup in (half) | ||||
|  | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Georgi Gerganov
					Georgi Gerganov