From 2913e5ff1ef2c0c9a2cc7cc886f24f2dfaeda281 Mon Sep 17 00:00:00 2001
From: Xuan Son Nguyen
Date: Sat, 10 Aug 2024 11:24:50 +0200
Subject: [PATCH] double check swa

---
 src/llama.cpp | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/src/llama.cpp b/src/llama.cpp
index 390c6bf62..b236bf040 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -4912,7 +4912,10 @@ static void llm_load_hparams(
                     // default value for Phi-3-medium-128k-instruct
                     hparams.n_swa = 131072;
                 }
-                ml.get_key(LLM_KV_ATTENTION_SLIDING_WINDOW, hparams.n_swa, false);
+                bool found_swa = ml.get_key(LLM_KV_ATTENTION_SLIDING_WINDOW, hparams.n_swa, false);
+                if (!found_swa && hparams.n_swa == 0) {
+                    throw std::runtime_error("invalid value for sliding_window");
+                }
             } break;
         case LLM_ARCH_PLAMO:
             {