Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-10-31 08:51:55 +00:00)

Commit: llama : fix Gemma rope type (#5691)

This commit is contained in:
@@ -12089,7 +12089,6 @@ enum llama_rope_type llama_rope_type(const struct llama_model * model) {
         case LLM_ARCH_ORION:
         case LLM_ARCH_INTERNLM2:
         case LLM_ARCH_MINICPM:
-        case LLM_ARCH_GEMMA:
             return LLAMA_ROPE_TYPE_NORM;

         // the pairs of head values are offset by n_rot/2
@@ -12101,6 +12100,7 @@ enum llama_rope_type llama_rope_type(const struct llama_model * model) {
         case LLM_ARCH_QWEN:
         case LLM_ARCH_QWEN2:
         case LLM_ARCH_PHI2:
+        case LLM_ARCH_GEMMA:
             return LLAMA_ROPE_TYPE_NEOX;

         // all model arches should be listed explicitly here
Reference in New Issue · Block a user

Author: Georgi Gerganov