mpt : do not duplicate token_embd.weight on disk (#5670)
This commit is contained in:
parent
96633eeca1
commit
15499eb942
2 changed files with 4 additions and 7 deletions
|
@@ -622,11 +622,6 @@ class MPTModel(Model):
|
|||
|
||||
self.gguf_writer.add_tensor(new_name, data)
|
||||
|
||||
# note: MPT output is tied to (same as) wte in original model;
|
||||
# for easier implementation in llama.cpp it's duplicated in GGUF, though :/
|
||||
if new_name == "token_embd.weight":
|
||||
self.gguf_writer.add_tensor("output.weight", data)
|
||||
|
||||
|
||||
class OrionModel(Model):
|
||||
def set_vocab(self):
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue