diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py index 2f0f4d5fb..5d48980eb 100755 --- a/convert_hf_to_gguf.py +++ b/convert_hf_to_gguf.py @@ -2742,8 +2742,8 @@ class RwkvModel(Model): toktypes.append(gguf.TokenType.NORMAL) remainder = vocab_size - len(tokens) assert remainder >= 0 - for i in range(remainder): - tokens.append(f"".encode("utf-8")) + for i in range(len(tokens), vocab_size): + tokens.append(f"[PAD{i}]".encode("utf-8")) toktypes.append(gguf.TokenType.UNUSED) self.gguf_writer.add_tokenizer_model("rwkv")