mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-11-04 09:32:00 +00:00
Merge branch 'add-fh1-rebased' of https://github.com/tiiuae/llama.cpp-public into add-fh1-rebased
This commit is contained in:
@@ -583,6 +583,7 @@ class TensorNameMap:
|
|||||||
),
|
),
|
||||||
|
|
||||||
MODEL_TENSOR.SSM_NORM: (
|
MODEL_TENSOR.SSM_NORM: (
|
||||||
|
"model.layers.{bid}.mamba.norm", # falcon-h1
|
||||||
"backbone.layers.{bid}.mixer.norm", # mamba2
|
"backbone.layers.{bid}.mixer.norm", # mamba2
|
||||||
),
|
),
|
||||||
|
|
||||||
@@ -1177,10 +1178,6 @@ class TensorNameMap:
|
|||||||
"resampler.attn.out_proj",
|
"resampler.attn.out_proj",
|
||||||
),
|
),
|
||||||
|
|
||||||
MODEL_TENSOR.SSM_NORM: (
|
|
||||||
"model.layers.{bid}.mamba.norm",
|
|
||||||
),
|
|
||||||
|
|
||||||
MODEL_TENSOR.V_RESMPL_KV: (
|
MODEL_TENSOR.V_RESMPL_KV: (
|
||||||
"resampler.kv_proj",
|
"resampler.kv_proj",
|
||||||
),
|
),
|
||||||
|
|||||||
@@ -1951,8 +1951,7 @@ bool llm_arch_is_recurrent(const llm_arch & arch) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
bool llm_arch_is_hybrid(const llm_arch & arch) {
|
bool llm_arch_is_hybrid(const llm_arch & arch) {
|
||||||
// TODO: There are currently no hybrid models! Once there are, this will be
|
// List all mamba-attention hybrid models here
|
||||||
// the place to identify them
|
|
||||||
switch (arch) {
|
switch (arch) {
|
||||||
case LLM_ARCH_FALCON_H1:
|
case LLM_ARCH_FALCON_H1:
|
||||||
return true;
|
return true;
|
||||||
|
|||||||
Reference in New Issue
Block a user