mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-11-03 09:22:01 +00:00 
			
		
		
		
	fix head count kv
This commit is contained in:
		@@ -109,6 +109,7 @@ gguf_writer.add_max_position_embeddings(hparams["n_positions"])
 | 
				
			|||||||
gguf_writer.add_feed_forward_length(4 * hparams["n_embd"])
 | 
					gguf_writer.add_feed_forward_length(4 * hparams["n_embd"])
 | 
				
			||||||
gguf_writer.add_block_count(block_count)
 | 
					gguf_writer.add_block_count(block_count)
 | 
				
			||||||
gguf_writer.add_head_count(hparams["n_head"])
 | 
					gguf_writer.add_head_count(hparams["n_head"])
 | 
				
			||||||
 | 
					gguf_writer.add_head_count_kv(1)
 | 
				
			||||||
gguf_writer.add_layer_norm_eps(hparams["layer_norm_epsilon"])
 | 
					gguf_writer.add_layer_norm_eps(hparams["layer_norm_epsilon"])
 | 
				
			||||||
gguf_writer.add_file_type(ftype)
 | 
					gguf_writer.add_file_type(ftype)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 
 | 
				
			|||||||
		Reference in New Issue
	
	Block a user