mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	model : add SmolLM3 (#14581)
* Init - first pass.
* Model -> ModelBase.
* fix errors in conversion.
* Update the graph.
* up.
* up.
* wip
* cgraph ok
* rm redundant code

---------

Co-authored-by: Vaibhavs10 <vaibhavs10@gmail.com>
This commit is contained in:
		| @@ -79,6 +79,7 @@ static const std::map<llm_arch, const char *> LLM_ARCH_NAMES = { | ||||
|     { LLM_ARCH_ARCEE,            "arcee"            }, | ||||
|     { LLM_ARCH_ERNIE4_5,         "ernie4_5"         }, | ||||
|     { LLM_ARCH_HUNYUAN_MOE,      "hunyuan-moe"      }, | ||||
|     { LLM_ARCH_SMOLLM3,          "smollm3"          }, | ||||
|     { LLM_ARCH_UNKNOWN,          "(unknown)"        }, | ||||
| }; | ||||
|  | ||||
| @@ -1724,6 +1725,23 @@ static const std::map<llm_arch, std::map<llm_tensor, const char *>> LLM_TENSOR_N | ||||
|             { LLM_TENSOR_TOKEN_EMBD,      "token_embd" }, | ||||
|         }, | ||||
|     }, | ||||
|     { | ||||
|         LLM_ARCH_SMOLLM3, | ||||
|         { | ||||
|             { LLM_TENSOR_TOKEN_EMBD,     "token_embd"            }, | ||||
|             { LLM_TENSOR_OUTPUT_NORM,    "output_norm"           }, | ||||
|             { LLM_TENSOR_OUTPUT,         "output"                }, | ||||
|             { LLM_TENSOR_ATTN_NORM,      "blk.%d.attn_norm"      }, | ||||
|             { LLM_TENSOR_ATTN_Q,         "blk.%d.attn_q"         }, | ||||
|             { LLM_TENSOR_ATTN_K,         "blk.%d.attn_k"         }, | ||||
|             { LLM_TENSOR_ATTN_V,         "blk.%d.attn_v"         }, | ||||
|             { LLM_TENSOR_ATTN_OUT,       "blk.%d.attn_output"    }, | ||||
|             { LLM_TENSOR_FFN_NORM,       "blk.%d.ffn_norm"       }, | ||||
|             { LLM_TENSOR_FFN_GATE,       "blk.%d.ffn_gate"       }, | ||||
|             { LLM_TENSOR_FFN_DOWN,       "blk.%d.ffn_down"       }, | ||||
|             { LLM_TENSOR_FFN_UP,         "blk.%d.ffn_up"         }, | ||||
|         }, | ||||
|     }, | ||||
| }; | ||||
|  | ||||
| static const std::map<llm_tensor, llm_tensor_info> LLM_TENSOR_INFOS = { | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Xuan-Son Nguyen
					Xuan-Son Nguyen