mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	convert-hf : support Mini-Jamba conversion
This commit is contained in:
		| @@ -207,6 +207,7 @@ class TensorNameMap: | ||||
|             "model.layers.{bid}.ffn_norm",                                   # internlm2 | ||||
|             "transformer.decoder_layer.{bid}.rms_norm_2",                    # Grok | ||||
|             "model.layers.{bid}.pre_ff_layernorm",                           # jamba | ||||
|             "model.layers.{bid}.pre_moe_layernorm",                          # mini-jamba | ||||
|         ), | ||||
|  | ||||
|         MODEL_TENSOR.FFN_GATE_INP: ( | ||||
| @@ -390,10 +391,12 @@ class TensorNameMap: | ||||
|  | ||||
|         MODEL_TENSOR.SSM_B_NORM: ( | ||||
|             "model.layers.{bid}.mamba.b_layernorm",  # jamba | ||||
|             "model.layers.{bid}.mamba.B_layernorm",  # mini-jamba | ||||
|         ), | ||||
|  | ||||
|         MODEL_TENSOR.SSM_C_NORM: ( | ||||
|             "model.layers.{bid}.mamba.c_layernorm",  # jamba | ||||
|             "model.layers.{bid}.mamba.C_layernorm",  # mini-jamba | ||||
|         ), | ||||
|  | ||||
|         MODEL_TENSOR.SSM_D: ( | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Francis Couture-Harpin
					Francis Couture-Harpin