mirror of
https://github.com/khoaliber/khoj.git
synced 2026-03-02 13:18:18 +00:00
Fix max thinking budget for gemini models to generate final response
This commit is contained in:
@@ -326,7 +326,7 @@ async def gemini_chat_completion_with_backoff(
|
||||
|
||||
thinking_config = None
|
||||
if deepthought and is_reasoning_model(model_name):
|
||||
- thinking_config = gtypes.ThinkingConfig(thinking_budget=-1, include_thoughts=True)
+ thinking_config = gtypes.ThinkingConfig(thinking_budget=MAX_REASONING_TOKENS_GEMINI, include_thoughts=True)
|
||||
|
||||
max_output_tokens = MAX_OUTPUT_TOKENS_FOR_STANDARD_GEMINI
|
||||
if is_reasoning_model(model_name):
|
||||
|
||||
Reference in New Issue
Block a user