mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-11-03 09:22:01 +00:00 
			
		
		
		
	bench: server add stop word for PHI-2 (#6916)
This commit is contained in:
		@@ -90,7 +90,8 @@ export default function () {
 | 
			
		||||
        "model": model,
 | 
			
		||||
        "stream": true,
 | 
			
		||||
        "seed": 42,
 | 
			
		||||
        "max_tokens": max_tokens
 | 
			
		||||
        "max_tokens": max_tokens,
 | 
			
		||||
        "stop": ["<|im_end|>"] // This is temporary for phi-2 base (i.e. not instructed) since the server expects that the model always to emit BOS
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    const params = {method: 'POST', body: JSON.stringify(payload)};
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user