Improve detection for the 70B model.

2023-08-07 10:43:06 +08:00 · 2023-08-07 10:43:06 +08:00 · 0e41b94f40
commit 0e41b94f40
parent fb44d72a78
1 changed file with 1 addition and 1 deletion
--- a/llama.cpp
+++ b/llama.cpp
@@ -1076,7 +1076,7 @@ static void llama_model_load_internal(
        // LLaMAv2
        // TODO: temporary until GGUF
        //patch for llama2 gqa
-        if (model.type == e_model::MODEL_65B && hparams.n_mult >= 4096) {
+        if (model.type == e_model::MODEL_65B && hparams.n_mult == 4096) {
            fprintf(stderr, "%s: Applying KCPP Patch for 70B model, setting GQA to 8\n", __func__);
            n_gqa = 8;
        }