impl::load change map bpe_ranks to onordered map for reduce time of impl::load on 30%

2025-01-27 15:09:34 +04:00 · 2025-01-27 15:09:34 +04:00 · 5144a18e67
commit 5144a18e67
parent acd38efee3
1 changed files with 7 additions and 2 deletions
--- a/src/llama-vocab.cpp
+++ b/src/llama-vocab.cpp
@ -1245,8 +1245,13 @@ struct llama_vocab::impl {
    std::vector<llama_token> cache_special_tokens;
    std::vector<std::string> cache_token_to_piece; // llama_token_to_piece(special = true);
-
+    struct PairHash {
-    std::map<std::pair<std::string, std::string>, int> bpe_ranks;
+        size_t operator()(const std::pair<std::string, std::string>& p) const {
            return std::hash<std::string>{}(p.first) ^  //create some hash for pair
                   (std::hash<std::string>{}(p.second) << 1);
        }
    };
    std::unordered_map<std::pair<std::string, std::string>, int, PairHash> bpe_ranks;
    // set of all tokens that cause "end of generation"
    std::set<llama_token> special_eog_ids;