convert : fix jamba conv1d shape squeezing

2025-11-01 09:01:57 +00:00 · 2025-07-02 23:49:12 -04:00
parent 2bcaf64e8e
commit 908e6559d6
1 changed file with 3 additions and 0 deletions
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -5055,6 +5055,9 @@ class JambaModel(TextModel):

        new_name = self.map_tensor_name(name)

+        if self.match_model_tensor_name(new_name, gguf.MODEL_TENSOR.SSM_CONV1D, bid):
+            data_torch = data_torch.squeeze()
+
        if name.endswith(".A_log"):
            logger.debug("A_log --> A ==> " + new_name)
            data_torch = -torch.exp(data_torch)