Mirror of https://github.com/ggml-org/llama.cpp.git (last synced 2025-10-30 08:42:00 +00:00)
			
		
		
		
	Fix speculative decoding build on Windows (#5874)
This commit is contained in:
		Jeffrey Quesnelle, committed by GitHub
					
				
			
			
				
	
			
			
			 GitHub
						GitHub
					
				
			
						parent
						
							1d41d6f7c2
						
					
				
				
					commit
					29eee40474
				
			| @@ -226,7 +226,7 @@ int main(int argc, char ** argv) { | |||||||
|  |  | ||||||
|                     while (active_seqs.size() > 0) { |                     while (active_seqs.size() > 0) { | ||||||
|                         // randomly select a sequence to verify from active sequences |                         // randomly select a sequence to verify from active sequences | ||||||
|                         std::uniform_int_distribution<u_int> u_int_dist(0, active_seqs.size() - 1); |                         std::uniform_int_distribution<unsigned int> u_int_dist(0, active_seqs.size() - 1); | ||||||
|                         int s = *std::next(active_seqs.begin(), u_int_dist(rng)); |                         int s = *std::next(active_seqs.begin(), u_int_dist(rng)); | ||||||
|                         if (i_dft >= (int) drafts[s].tokens.size()) { |                         if (i_dft >= (int) drafts[s].tokens.size()) { | ||||||
|                             drafts[s].active = false; |                             drafts[s].active = false; | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user