From d37113850c62713f5bb70c1a14cd794f9f771588 Mon Sep 17 00:00:00 2001 From: Debanjum Date: Fri, 27 Jun 2025 00:34:22 -0700 Subject: [PATCH] Let reasoning Gemini models dynamically set their thinking budget All Gemini 2.5 series models support a dynamic thinking budget, which is enabled by setting thinking_budget to -1. This replaces the fixed MAX_REASONING_TOKENS_GEMINI budget previously passed for reasoning models. --- src/khoj/processor/conversation/google/utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/khoj/processor/conversation/google/utils.py b/src/khoj/processor/conversation/google/utils.py index 18ab33cc..a513fdab 100644 --- a/src/khoj/processor/conversation/google/utils.py +++ b/src/khoj/processor/conversation/google/utils.py @@ -195,7 +195,7 @@ async def gemini_chat_completion_with_backoff( thinking_config = None if deepthought and is_reasoning_model(model_name): - thinking_config = gtypes.ThinkingConfig(thinking_budget=MAX_REASONING_TOKENS_GEMINI, include_thoughts=True) + thinking_config = gtypes.ThinkingConfig(thinking_budget=-1, include_thoughts=True) max_output_tokens = MAX_OUTPUT_TOKENS_FOR_STANDARD_GEMINI if is_reasoning_model(model_name):