mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	
							
								
								
									
										5
									
								
								ggml.c
									
									
									
									
									
								
							
							
						
						
									
										5
									
								
								ggml.c
									
									
									
									
									
								
							| @@ -15629,7 +15629,6 @@ static int ggml_get_n_tasks(struct ggml_tensor * node, int n_threads) { | ||||
|             } break; | ||||
|         case GGML_OP_DIAG_MASK_ZERO: | ||||
|         case GGML_OP_DIAG_MASK_INF: | ||||
|         case GGML_OP_SOFT_MAX: | ||||
|         case GGML_OP_SOFT_MAX_BACK: | ||||
|         case GGML_OP_ROPE: | ||||
|         case GGML_OP_ROPE_BACK: | ||||
| @@ -15645,6 +15644,10 @@ static int ggml_get_n_tasks(struct ggml_tensor * node, int n_threads) { | ||||
|             { | ||||
|                 n_tasks = 1; //TODO | ||||
|             } break; | ||||
|         case GGML_OP_SOFT_MAX: | ||||
|             { | ||||
|                 n_tasks = MIN(MIN(4, n_threads), ggml_nrows(node->src[0])); | ||||
|             } break; | ||||
|         case GGML_OP_CONV_TRANSPOSE_1D: | ||||
|             { | ||||
|                 n_tasks = n_threads; | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Georgi Gerganov
					Georgi Gerganov