Fix typo
This commit is contained in:
parent
ac793a21e8
commit
8c9d1e781e
1 changed file with 1 addition and 1 deletion
|
@@ -231,7 +231,7 @@ class SentencePieceVocab:
|
|||
def sentencepiece_tokens(self) -> Iterable[Tuple[bytes, float]]:
|
||||
tokenizer = self.sentencepiece_tokenizer
|
||||
for i in range(tokenizer.vocab_size()):
|
||||
# TODO: How do we want to support is_unknown, is_control, is_byte and is_unused(i)?
|
||||
# TODO: How do we want to support is_unknown, is_control, is_byte and is_unused?
|
||||
piece = tokenizer.id_to_piece(i)
|
||||
text: bytes = piece.encode("utf-8")
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue