Split the fused q_proj weight into separate query and attention-gate tensors

2025-10-27 08:21:30 +00:00 · 2025-09-20 12:00:14 +07:00
parent 178230ee21
commit 46110e0630
6 changed files with 31 additions and 21 deletions
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -3767,8 +3767,12 @@ class Qwen3NextModel(Qwen3MoeModel):
            name = name.rpartition(".dt_bias")[0] + ".dt_proj.bias"
        elif "conv1d" in name:
            data_torch = data_torch.squeeze()
+        elif "q_proj.weight" in name:
+            q_proj, gate = data_torch.chunk(2, dim=0)
+            yield (self.format_tensor_name(gguf.MODEL_TENSOR.ATTN_GATE, bid), gate)
+            data_torch = q_proj

-        return Qwen2MoeModel.modify_tensors(self, data_torch, name, bid)
+        yield from Qwen2MoeModel.modify_tensors(self, data_torch, name, bid)


@ModelBase.register("GPT2LMHeadModel")