mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	gguf : add tokenization constants
This commit is contained in:
		
							
								
								
									
										13
									
								
								constants.py
									
									
									
									
									
								
							
							
						
						
									
										13
									
								
								constants.py
									
									
									
									
									
								
							| @@ -31,3 +31,16 @@ KEY_ATTENTION_CLAMP_KQV          = "{llm}.attention.clamp_kqv" | |||||||
| # RoPE | # RoPE | ||||||
| KEY_ROPE_DIMENSION_COUNT         = "{llm}.rope.dimension_count" | KEY_ROPE_DIMENSION_COUNT         = "{llm}.rope.dimension_count" | ||||||
| KEY_ROPE_SCALE                   = "{llm}.rope.scale" | KEY_ROPE_SCALE                   = "{llm}.rope.scale" | ||||||
|  |  | ||||||
|  | # tokenization | ||||||
|  | KEY_TOKENIZER_MODEL   = "tokenizer.ggml.model" | ||||||
|  | KEY_TOKENIZER_LIST    = "tokenizer.ggml.tokens" | ||||||
|  | KEY_TOKENIZER_SCORES  = "tokenizer.ggml.scores" | ||||||
|  | KEY_TOKENIZER_MERGES  = "tokenizer.ggml.merges" | ||||||
|  | KEY_TOKENIZER_BOS_ID  = "tokenizer.ggml.bos_token_id" | ||||||
|  | KEY_TOKENIZER_EOS_ID  = "tokenizer.ggml.eos_token_id" | ||||||
|  | KEY_TOKENIZER_UNK_ID  = "tokenizer.ggml.unknown_token_id" | ||||||
|  | KEY_TOKENIZER_SEP_ID  = "tokenizer.ggml.seperator_token_id" | ||||||
|  | KEY_TOKENIZER_PAD_ID  = "tokenizer.ggml.padding_token_id" | ||||||
|  | KEY_TOKENIZER_HF_JSON = "tokenizer.huggingface.json" | ||||||
|  | KEY_TOKENIZER_RWKV    = "tokenizer.rwkv.world" | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 M. Yusuf Sarıgöz
					M. Yusuf Sarıgöz