mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	bench: server add stop word for PHI-2 (#6916)
This commit is contained in:
		| @@ -90,7 +90,8 @@ export default function () { | |||||||
|         "model": model, |         "model": model, | ||||||
|         "stream": true, |         "stream": true, | ||||||
|         "seed": 42, |         "seed": 42, | ||||||
|         "max_tokens": max_tokens |         "max_tokens": max_tokens, | ||||||
|  |         "stop": ["<|im_end|>"] // This is temporary for phi-2 base (i.e. not instructed), since the server expects the model to always emit BOS | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     const params = {method: 'POST', body: JSON.stringify(payload)}; |     const params = {method: 'POST', body: JSON.stringify(payload)}; | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Pierrick Hymbert
					Pierrick Hymbert