mpt : do not duplicate token_embd.weight on disk (#5670)
@@ -622,11 +622,6 @@ class MPTModel(Model):
 
             self.gguf_writer.add_tensor(new_name, data)
 
-            # note: MPT output is tied to (same as) wte in original model;
-            # for easier implementation in llama.cpp it's duplicated in GGUF, though :/
-            if new_name == "token_embd.weight":
-                self.gguf_writer.add_tensor("output.weight", data)
-
 
 class OrionModel(Model):
     def set_vocab(self):
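The removed lines show why the duplication existed in the first place: MPT ties its output projection to the token embedding (wte), and the converter wrote the same data twice so an "output.weight" tensor was always present in the GGUF file. With the duplication gone, whatever loads the resulting file has to fall back to "token_embd.weight" itself. Below is a minimal sketch of that fallback, assuming a plain name-to-array tensor map; the resolve_output_weight helper is hypothetical and not part of the script above or of llama.cpp.

import numpy as np

def resolve_output_weight(tensors: dict[str, np.ndarray]) -> np.ndarray:
    """Return the output projection, falling back to the tied token embedding.

    After this commit, MPT GGUF files no longer carry a separate
    "output.weight"; a reader is expected to reuse "token_embd.weight"
    instead, mirroring the weight tying in the original model.
    """
    if "output.weight" in tensors:
        return tensors["output.weight"]      # older files with the duplicated tensor
    return tensors["token_embd.weight"]      # tied embeddings (files written after this change)

# Usage example with dummy data (shape is illustrative only).
tensors = {"token_embd.weight": np.zeros((50432, 4096), dtype=np.float32)}
output = resolve_output_weight(tensors)
assert output is tensors["token_embd.weight"]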