Fix vocab space conversion logic
This commit is contained in:
parent
f7e61fd1a9
commit
08959c88c2
1 changed file with 1 addition and 1 deletion
|
@@ -182,7 +182,7 @@ class GGMLToGGUF:
|
||||||
toktypes = []
|
toktypes = []
|
||||||
for (tokid, (vbytes, vscore)) in enumerate(self.model.vocab.items):
|
for (tokid, (vbytes, vscore)) in enumerate(self.model.vocab.items):
|
||||||
tt = 1
|
tt = 1
|
||||||
if len(vbytes) > 1 and vbytes[0] == 32:
|
if len(vbytes) > 0 and vbytes[0] == 32:
|
||||||
vbytes = vbytes.replace(b' ', b'\xe2\x96\x81')
|
vbytes = vbytes.replace(b' ', b'\xe2\x96\x81')
|
||||||
elif len(vbytes) == 0:
|
elif len(vbytes) == 0:
|
||||||
tt = 3
|
tt = 3
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue