llama : add support for Deepseek-R1-Qwen distill model (#11310)

* llama : add support for Deepseek-R1-Qwen distill model

* coding style
This commit is contained in:
Xuan Son Nguyen 2025-01-20 14:35:07 +01:00 committed by GitHub
parent ef6dada60c
commit ec7f3ac9ab
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
6 changed files with 208 additions and 45 deletions

View file

@@ -1523,7 +1523,8 @@ void llama_vocab::impl::load(llama_model_loader & ml, const LLM_KV & kv) {
pre_type = LLAMA_VOCAB_PRE_TYPE_COMMAND_R;
clean_spaces = false;
} else if (
- tokenizer_pre == "qwen2") {
+ tokenizer_pre == "qwen2" ||
+ tokenizer_pre == "deepseek-r1-qwen") {
pre_type = LLAMA_VOCAB_PRE_TYPE_QWEN2;
clean_spaces = false;
} else if (