From 222cc19b7ffa197406471a735bc3434f34c68552 Mon Sep 17 00:00:00 2001 From: Debanjum Date: Mon, 18 Aug 2025 23:24:00 -0700 Subject: [PATCH] Use subscriber type specific context window to generate response --- src/khoj/routers/helpers.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/src/khoj/routers/helpers.py b/src/khoj/routers/helpers.py index f8807047..ffd384b3 100644 --- a/src/khoj/routers/helpers.py +++ b/src/khoj/routers/helpers.py @@ -1625,6 +1625,7 @@ async def agenerate_chat_response( deepthought = True chat_model = await ConversationAdapters.aget_valid_chat_model(user, conversation, is_subscribed) + max_prompt_size = await ConversationAdapters.aget_max_context_size(chat_model, user) vision_available = chat_model.vision_enabled if not vision_available and query_images: vision_enabled_config = await ConversationAdapters.aget_vision_enabled_config() @@ -1656,7 +1657,7 @@ async def agenerate_chat_response( model=chat_model_name, api_key=api_key, api_base_url=openai_chat_config.api_base_url, - max_prompt_size=chat_model.max_prompt_size, + max_prompt_size=max_prompt_size, tokenizer_name=chat_model.tokenizer, agent=agent, vision_available=vision_available, @@ -1687,7 +1688,7 @@ async def agenerate_chat_response( model=chat_model.name, api_key=api_key, api_base_url=api_base_url, - max_prompt_size=chat_model.max_prompt_size, + max_prompt_size=max_prompt_size, tokenizer_name=chat_model.tokenizer, agent=agent, vision_available=vision_available, @@ -1717,7 +1718,7 @@ async def agenerate_chat_response( model=chat_model.name, api_key=api_key, api_base_url=api_base_url, - max_prompt_size=chat_model.max_prompt_size, + max_prompt_size=max_prompt_size, tokenizer_name=chat_model.tokenizer, agent=agent, vision_available=vision_available,