diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py index 94527c14fa..f9e279b8f3 100755 --- a/convert_hf_to_gguf.py +++ b/convert_hf_to_gguf.py @@ -6649,6 +6649,7 @@ class FalconH1Model(Mamba2Model): self.gguf_writer.add_block_count(self.block_count) self.gguf_writer.add_context_length(self.hparams.get("max_position_embeddings", 0)) self.gguf_writer.add_vocab_size(self.hparams["vocab_size"]) + self.gguf_writer.add_add_bos_token(False) self.gguf_writer.add_feed_forward_length(self.hparams["intermediate_size"]) ## Mamba mixer params ##