llama : fix Viking pre-tokenizer regex
The order of the pre-tokenizer regex expressions was previously wrong, which caused failures in some tests.
This commit is contained in:
parent
f9d42c598b
commit
31a1b0eeaa
1 changed file with 1 addition and 1 deletion
|
@@ -15440,8 +15440,8 @@ struct llm_tokenizer_bpe {
|
|||
break;
|
||||
case LLAMA_VOCAB_PRE_TYPE_VIKING:
|
||||
regex_exprs = {
|
||||
"\\p{N}",
|
||||
" ?[^(\\s|.,!?…。,、।۔،)]+",
|
||||
"\\p{N}",
|
||||
};
|
||||
break;
|
||||
default:
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue