llama : Use token_to_id map find() method instead of iterating over all tokens.

2024-08-04 20:47:47 +02:00 · 2024-08-04 20:47:47 +02:00 · 0b7211387e
commit 0b7211387e
parent 3878b397a9
1 changed files with 3 additions and 5 deletions
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -5647,11 +5647,9 @@ static void llm_load_vocab(
        // TODO: convert scripts should provide this token through the KV metadata LLAMA_KV_TOKENIZER_EOM_ID
        //       for now, we apply this workaround to find the EOM token based on its text
        if (vocab.special_eom_id == -1) {
-            for (const auto & t : vocab.token_to_id) {
+            const auto & t = vocab.token_to_id.find("<|eom_id|>");
-                if (t.first == "<|eom_id|>") {
+            if (t != vocab.token_to_id.end()) {
-                    vocab.special_eom_id = t.second;
+                vocab.special_eom_id = t->second;
-                    break;
-                }
            }
        }