diff --git a/chat.cpp b/chat.cpp
index 5ee86ce78..4bdd214ad 100644
--- a/chat.cpp
+++ b/chat.cpp
@@ -30,7 +30,7 @@
 // determine number of model parts based on the dimension
 static const std::map<int, int> LLAMA_N_PARTS = {
     { 4096, 1 },
-    { 5120, 2 },
+    { 5120, 1 },
     { 6656, 4 },
     { 8192, 8 },
 };