mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	Define non-positive temperature behavior (#720)
This commit is contained in:
		
							
								
								
									
										14
									
								
								llama.cpp
									
									
									
									
									
								
							
							
						
						
									
										14
									
								
								llama.cpp
									
									
									
									
									
								
							| @@ -1194,6 +1194,20 @@ static llama_vocab::id llama_sample_top_p_top_k( | ||||
|     const auto & logits = lctx.logits; | ||||
|     const auto * plogits = logits.data() + logits.size() - n_logits; | ||||
|  | ||||
|     if (temp <= 0) { | ||||
|         // select the token with the highest logit directly | ||||
|         float max_logit = plogits[0]; | ||||
|         llama_vocab::id max_id = 0; | ||||
|  | ||||
|         for (int i = 1; i < n_logits; ++i) { | ||||
|             if (plogits[i] > max_logit) { | ||||
|                 max_logit = plogits[i]; | ||||
|                 max_id = i; | ||||
|             } | ||||
|         } | ||||
|         return max_id; | ||||
|     } | ||||
|  | ||||
|     std::vector<std::pair<float, llama_vocab::id>> logits_id; | ||||
|     logits_id.reserve(n_logits); | ||||
|  | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Ivan Stepanov
					Ivan Stepanov