mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-28 08:31:25 +00:00 
			
		
		
		
	llama : add OLMo November 2024 support (#10394)
* Add OLMo November 2024 constants
* Add OLMo November 2024 converter
* Add loading of OLMo November 2024 tensors and hyper parameters
* Add building of OLMo November 2024 model
This commit is contained in:
		| @@ -243,6 +243,7 @@ class MODEL_ARCH(IntEnum): | ||||
|     COMMAND_R    = auto() | ||||
|     DBRX         = auto() | ||||
|     OLMO         = auto() | ||||
|     OLMO_1124    = auto() | ||||
|     OLMOE        = auto() | ||||
|     OPENELM      = auto() | ||||
|     ARCTIC       = auto() | ||||
| @@ -404,6 +405,7 @@ MODEL_ARCH_NAMES: dict[MODEL_ARCH, str] = { | ||||
|     MODEL_ARCH.COMMAND_R:      "command-r", | ||||
|     MODEL_ARCH.DBRX:           "dbrx", | ||||
|     MODEL_ARCH.OLMO:           "olmo", | ||||
|     MODEL_ARCH.OLMO_1124:      "olmo_1124", | ||||
|     MODEL_ARCH.OLMOE:          "olmoe", | ||||
|     MODEL_ARCH.OPENELM:        "openelm", | ||||
|     MODEL_ARCH.ARCTIC:         "arctic", | ||||
| @@ -1069,6 +1071,22 @@ MODEL_TENSORS: dict[MODEL_ARCH, list[MODEL_TENSOR]] = { | ||||
|         MODEL_TENSOR.FFN_DOWN, | ||||
|         MODEL_TENSOR.FFN_UP, | ||||
|     ], | ||||
|     MODEL_ARCH.OLMO_1124: [ | ||||
|         MODEL_TENSOR.TOKEN_EMBD, | ||||
|         MODEL_TENSOR.OUTPUT_NORM, | ||||
|         MODEL_TENSOR.OUTPUT, | ||||
|         MODEL_TENSOR.ATTN_Q, | ||||
|         MODEL_TENSOR.ATTN_K, | ||||
|         MODEL_TENSOR.ATTN_V, | ||||
|         MODEL_TENSOR.ATTN_OUT, | ||||
|         MODEL_TENSOR.ATTN_POST_NORM, | ||||
|         MODEL_TENSOR.ATTN_Q_NORM, | ||||
|         MODEL_TENSOR.ATTN_K_NORM, | ||||
|         MODEL_TENSOR.FFN_POST_NORM, | ||||
|         MODEL_TENSOR.FFN_GATE, | ||||
|         MODEL_TENSOR.FFN_DOWN, | ||||
|         MODEL_TENSOR.FFN_UP, | ||||
|     ], | ||||
|     MODEL_ARCH.OLMOE: [ | ||||
|         MODEL_TENSOR.TOKEN_EMBD, | ||||
|         MODEL_TENSOR.OUTPUT_NORM, | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Shane A
					Shane A