Cebtenzzre 2023-10-01 17:04:01 -04:00
parent f18cfeab62
commit 02fbbf9099
3 changed files with 3 additions and 3 deletions


@@ -144,7 +144,7 @@ for i in range(vocab_size):
         print(f"Key {i} not in tokenizer vocabulary. Padding with an arbitrary token.")
         pad_token = f"[PAD{i}]".encode("utf8")
         text = bytearray(pad_token)
-    elif i in added_tokens:
+    elif i in added_token_ids:
         # these tokens are not encoded, see https://github.com/huggingface/transformers/issues/1133
         text = bytearray(reverse_vocab[i].encode('utf-8'))
     else:


@@ -140,7 +140,7 @@ for i in range(vocab_size):
         print(f"Key {i} not in tokenizer vocabulary. Padding with an arbitrary token.")
         pad_token = f"[PAD{i}]".encode("utf8")
         text = bytearray(pad_token)
-    elif i in added_tokens:
+    elif i in added_token_ids:
         # these tokens are not encoded, see https://github.com/huggingface/transformers/issues/1133
         text = bytearray(reverse_vocab[i].encode('utf-8'))
     else:


@@ -128,7 +128,7 @@ for i in range(vocab_size):
         print(f"Key {i} not in tokenizer vocabulary. Padding with an arbitrary token.")
         pad_token = f"[PAD{i}]".encode("utf8")
         text = bytearray(pad_token)
-    elif i in added_tokens:
+    elif i in added_token_ids:
         # these tokens are not encoded, see https://github.com/huggingface/transformers/issues/1133
         text = bytearray(reverse_vocab[i].encode('utf-8'))
     else:
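
The rename makes it explicit that the membership test is against a set of token ids, not the {token string: id} mapping that HuggingFace's get_added_vocab() returns. Below is a minimal standalone sketch of how such a loop fits together; it is an illustration only, not the convert scripts touched by this commit, and the model path plus the exact construction of reverse_vocab and added_token_ids are assumptions.

    # Illustrative sketch only -- not the convert script changed in this commit.
    from transformers import AutoTokenizer

    dir_model = "path/to/hf-model"  # placeholder path for this sketch

    tokenizer = AutoTokenizer.from_pretrained(dir_model)
    vocab_size = len(tokenizer.get_vocab())

    # id -> token string for every token the tokenizer knows about
    reverse_vocab = {token_id: token for token, token_id in tokenizer.get_vocab().items()}

    # get_added_vocab() returns {token string: id}; keep only the ids,
    # since the loop below indexes by id -- hence the name "added_token_ids"
    added_token_ids = set(tokenizer.get_added_vocab().values())

    tokens = []
    for i in range(vocab_size):
        if i not in reverse_vocab:
            print(f"Key {i} not in tokenizer vocabulary. Padding with an arbitrary token.")
            text = bytearray(f"[PAD{i}]".encode("utf8"))
        elif i in added_token_ids:
            # added tokens are not encoded, see https://github.com/huggingface/transformers/issues/1133
            text = bytearray(reverse_vocab[i].encode("utf-8"))
        else:
            text = bytearray(tokenizer.decode([i]).encode("utf-8"))
        tokens.append(text)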