From 97011d7a1fbb1fdd3cee46c1eaa4bfb3d70ba6ad Mon Sep 17 00:00:00 2001 From: ibrahimkhadraoui Date: Mon, 7 Jul 2025 14:25:32 +0400 Subject: [PATCH] mup_vec create as float64 --- convert_hf_to_gguf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py index 46df230dd3..5ef225d247 100755 --- a/convert_hf_to_gguf.py +++ b/convert_hf_to_gguf.py @@ -6591,7 +6591,7 @@ class FalconH1Model(Mamba2Model): groups_time_state_size = self.hparams["mamba_n_groups"] * self.hparams["mamba_d_state"] vector_shape = (2 * intermediate_size + 2 * groups_time_state_size + self.hparams["mamba_n_heads"]) - mup_vector = torch.ones(1, 1, vector_shape) + mup_vector = torch.ones(1, 1, vector_shape, dtype=torch.float64) mup_vector[:, :, :intermediate_size] *= zxbcdt_multipliers[0] mup_vector[:, :, intermediate_size:2 * intermediate_size] *= zxbcdt_multipliers[1] mup_vector[:, :, 2 * intermediate_size:2 * intermediate_size + groups_time_state_size] *= zxbcdt_multipliers[2]