server: allow API calls to set a lower thinking budget if a global budget is set

2026-06-09 07:16:44 +02:00 · 2026-05-30 08:51:06 +02:00
parent 1738129bee
commit 926b94a1bc
1 changed files with 5 additions and 2 deletions
@@ -1123,8 +1123,11 @@ json oaicompat_chat_params_parse(
    // Reasoning budget: pass parameters through to sampling layer
    {
        int reasoning_budget = opt.reasoning_budget;
-        if (reasoning_budget == -1 && body.contains("thinking_budget_tokens")) {
-            reasoning_budget = json_value(body, "thinking_budget_tokens", -1);
+        if (body.contains("thinking_budget_tokens")) {
+            int req_budget = json_value(body, "thinking_budget_tokens", -1);
+            if (reasoning_budget == -1 || (req_budget != -1 && req_budget < reasoning_budget)) {
+                reasoning_budget = req_budget;
+            }
        }

        if (!chat_params.thinking_end_tag.empty()) {