From 5d52192f73cec14cdbb95fb10e64e8dfa1039245 Mon Sep 17 00:00:00 2001 From: goerch Date: Sun, 6 Aug 2023 13:51:26 +0200 Subject: [PATCH] Remove inactive code. --- convert.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/convert.py b/convert.py index ba1522990..5dd0762bd 100755 --- a/convert.py +++ b/convert.py @@ -267,8 +267,6 @@ class SentencePieceVocab: byte_encoder = tokenization_gpt2.bytes_to_unicode() byte_decoder = {v: k for k, v in byte_encoder.items()} for i, item in enumerate(tokenizer): - # text: bytes - # text = b''.join([x.to_bytes(1, byteorder='big') for x in [byte_decoder[y] for y in item]]) text: bytes = item.encode("utf-8") score: float = -i yield text, score