mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-28 08:31:25 +00:00 
			
		
		
		
	* Added Phi-4-mini-instruct support
	* Update regex per ngxson
	* Change the vocab base to Xenova/gpt-4o
	* fix conversion update script
	* no need to check longrope
	* minor style fix
	* fix python style

	---------

	Co-authored-by: Nicholas Sparks <nisparks@microsoft.com>
This commit is contained in:
		| @@ -109,6 +109,7 @@ models = [ | ||||
|     {"name": "megrez",           "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/Infinigence/Megrez-3B-Instruct"}, | ||||
|     {"name": "deepseek-v3",      "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/deepseek-ai/DeepSeek-V3"}, | ||||
|     {"name": "deepseek-r1-qwen", "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B"}, | ||||
|     {"name": "gpt-4o",           "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/Xenova/gpt-4o", }, | ||||
| ] | ||||
|  | ||||
|  | ||||
| @@ -131,6 +132,10 @@ def download_model(model): | ||||
|  | ||||
|     files = ["config.json", "tokenizer.json", "tokenizer_config.json"] | ||||
|  | ||||
|     if name == "gpt-4o": | ||||
|         # Xenova/gpt-4o is tokenizer-only, it does not contain config.json | ||||
|         files = ["tokenizer.json", "tokenizer_config.json"] | ||||
|  | ||||
|     if tokt == TOKENIZER_TYPE.SPM: | ||||
|         files.append("tokenizer.model") | ||||
|  | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Xuan-Son Nguyen
					Xuan-Son Nguyen