mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-11-03 09:22:01 +00:00 
			
		
		
		
	sycl : offload of get_rows set to 0 (#10432)
This commit is contained in:
		
				
					committed by
					
						
						GitHub
					
				
			
			
				
	
			
			
			
						parent
						
							266b8519ee
						
					
				
				
					commit
					0f77aae560
				
			@@ -4493,7 +4493,7 @@ static bool ggml_backend_sycl_device_supports_buft(ggml_backend_dev_t dev, ggml_
 | 
			
		||||
static int64_t get_op_batch_size(const ggml_tensor * op) {
 | 
			
		||||
    switch (op->op) {
 | 
			
		||||
        case GGML_OP_GET_ROWS:
 | 
			
		||||
            return op->ne[1]; // this will increase the speed of prefill in test
 | 
			
		||||
            return 0;
 | 
			
		||||
        case GGML_OP_MUL_MAT:
 | 
			
		||||
            return op->ne[1];
 | 
			
		||||
        case GGML_OP_MUL_MAT_ID:
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user