Create mup_vector as float64

2025-11-04 09:32:00 +00:00 · 2025-07-07 14:25:32 +04:00
parent 49d7420964
commit 97011d7a1f
1 changed files with 1 additions and 1 deletions
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -6591,7 +6591,7 @@ class FalconH1Model(Mamba2Model):
        groups_time_state_size = self.hparams["mamba_n_groups"] * self.hparams["mamba_d_state"]
        vector_shape = (2 * intermediate_size + 2 * groups_time_state_size + self.hparams["mamba_n_heads"])

-        mup_vector = torch.ones(1, 1, vector_shape)
+        mup_vector = torch.ones(1, 1, vector_shape, dtype=torch.float64)
        mup_vector[:, :, :intermediate_size] *= zxbcdt_multipliers[0]
        mup_vector[:, :, intermediate_size:2 * intermediate_size] *= zxbcdt_multipliers[1]
        mup_vector[:, :, 2 * intermediate_size:2 * intermediate_size + groups_time_state_size] *= zxbcdt_multipliers[2]