diff --git a/src/llama-grammar.cpp b/src/llama-grammar.cpp index 501b0037b..2eae29bb9 100644 --- a/src/llama-grammar.cpp +++ b/src/llama-grammar.cpp @@ -1156,7 +1156,7 @@ void llama_grammar_accept_impl(struct llama_grammar & grammar, llama_token token GGML_ASSERT(grammar.vocab != nullptr); const auto & piece = grammar.vocab->token_to_piece(token); - + if (grammar.awaiting_trigger) { if (std::find(grammar.trigger_tokens.begin(), grammar.trigger_tokens.end(), token) != grammar.trigger_tokens.end()) { grammar.awaiting_trigger = false;