mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	llama : add option for greedy sampling with probs (#3813)
* llama : add option for greedy sampling with probs
* llama : add comment about llama_sample_token_greedy() missing probs
* sampling : temp == 0.0 -> no probs, temp < 0.0 -> probs
This commit is contained in:
		| @@ -148,7 +148,7 @@ int main(int argc, char ** argv) { | ||||
|     std::vector<seq_draft> drafts(n_seq_dft); | ||||
|  | ||||
|     params.sparams.grammar.clear(); // the draft samplers will copy the target sampler's grammar | ||||
|-    params.sparams.temp = std::max(0.01f, params.sparams.temp); | ||||
|+    params.sparams.temp = -1.0f;    // force greedy sampling with probs for the draft model | ||||
|  | ||||
|     for (int s = 0; s < n_seq_dft; ++s) { | ||||
|         drafts[s].ctx_sampling = llama_sampling_init(params.sparams); | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Georgi Gerganov
					Georgi Gerganov