Use --reasoning-format, remove forced thinking for now

2025-02-08 17:58:33 +00:00 · 2025-02-08 17:58:33 +00:00 · c0f972bb45
commit c0f972bb45
parent cc2c712cf9
10 changed files with 184 additions and 246 deletions
--- a/common/common.h
+++ b/common/common.h
@ -202,6 +202,11 @@ struct common_params_vocoder {
    bool use_guide_tokens = false; // enable guide tokens to improve TTS accuracy            // NOLINT
 };

+enum common_reasoning_format {
+    COMMON_REASONING_FORMAT_NONE,
+    COMMON_REASONING_FORMAT_DEEPSEEK, // Extract thinking tag contents and return as `message.reasoning_content`
+};
+
 struct common_params {
    int32_t n_predict             =    -1; // new tokens to predict
    int32_t n_ctx                 =  4096; // context size
@ -346,7 +351,7 @@ struct common_params {
    std::string chat_template = "";                                                                         // NOLINT
    bool use_jinja = false;                                                                                 // NOLINT
    bool enable_chat_template = true;
-    bool think                = false;     // return reasoning_content, force model to think unless it supports native <think> tags.
+    common_reasoning_format reasoning_format = COMMON_REASONING_FORMAT_DEEPSEEK;

    std::vector<std::string> api_keys;