diff --git a/chat.cpp b/chat.cpp index 38b39771a..087290feb 100644 --- a/chat.cpp +++ b/chat.cpp @@ -32,8 +32,8 @@ static const std::map LLAMA_N_PARTS = { { 4096, 1 }, { 5120, 1 }, - { 6656, 4 }, - { 8192, 8 }, + { 6656, 1 }, + { 8192, 1 }, }; // default hparams (LLaMA 7B)