mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	metal : enable mat-vec kernels for bs <= 4 (#10491)
This commit is contained in:
@@ -1927,7 +1927,7 @@ static void ggml_metal_encode_node(
 
                 // find the break-even point where the matrix-matrix kernel becomes more efficient compared
                 // to the matrix-vector kernel
-                int ne11_mm_min = 1;
+                int ne11_mm_min = 4;
 
 #if 0
                 // the numbers below are measured on M2 Ultra for 7B and 13B models
		Reference in New Issue
	
	Block a user
	 Georgi Gerganov
					Georgi Gerganov