diff --git a/tools/server/server.cpp b/tools/server/server.cpp index 160b97cf7d2c9..519704fad7930 100644 --- a/tools/server/server.cpp +++ b/tools/server/server.cpp @@ -2313,7 +2313,7 @@ struct server_context { // thinking is enabled if: // 1. It's not explicitly disabled (reasoning_budget == 0) // 2. The chat template supports it - const bool enable_thinking = params_base.reasoning_budget != 0 && common_chat_templates_support_enable_thinking(chat_templates.get()); + const bool enable_thinking = params_base.use_jinja && params_base.reasoning_budget != 0 && common_chat_templates_support_enable_thinking(chat_templates.get()); SRV_INF("Enable thinking? %d\n", enable_thinking); oai_parser_opt = {