Set Gemini max output tokens well above max reasoning tokens to avoid early response termination.

2026-03-02 21:19:12 +00:00 · 2025-05-18 14:40:57 -07:00
parent 73e28666b5
commit 31dcc44c20
1 changed file with 3 additions and 1 deletion
--- a/src/khoj/processor/conversation/google/utils.py
+++ b/src/khoj/processor/conversation/google/utils.py
@@ -36,7 +36,9 @@ logger = logging.getLogger(__name__)
 gemini_clients: Dict[str, genai.Client] = {}
-MAX_OUTPUT_TOKENS_GEMINI = 8192
+# Output tokens should be more than reasoning tokens.
+# This avoids premature response termination.
+MAX_OUTPUT_TOKENS_GEMINI = 20000
 MAX_REASONING_TOKENS_GEMINI = 10000
 SAFETY_SETTINGS = [