diff --git a/llama.cpp b/llama.cpp index 5e469dc6f..2ca572a6b 100644 --- a/llama.cpp +++ b/llama.cpp @@ -8,6 +8,7 @@ #include #include #include +#include // determine number of model parts based on the dimension static const std::unordered_map LLAMA_N_PARTS = {