Track Gemini 2.0 Flash-Lite cost. Reduce max prompt size for gpt-4o-mini

2026-03-09 13:25:11 +00:00 · 2025-05-13 13:03:35 -06:00
parent e125e299a7
commit 417ab42206
2 changed files with 2 additions and 1 deletions
--- a/src/khoj/processor/conversation/utils.py
+++ b/src/khoj/processor/conversation/utils.py
@@ -51,7 +51,7 @@ except ImportError:
 model_to_prompt_size = {
    # OpenAI Models
    "gpt-4o": 60000,
-    "gpt-4o-mini": 120000,
+    "gpt-4o-mini": 60000,
    "gpt-4.1": 60000,
    "gpt-4.1-mini": 120000,
    "gpt-4.1-nano": 120000,
--- a/src/khoj/utils/constants.py
+++ b/src/khoj/utils/constants.py
@@ -52,6 +52,7 @@ model_to_cost: Dict[str, Dict[str, float]] = {
    "gemini-1.5-pro": {"input": 1.25, "output": 5.00},
    "gemini-1.5-pro-002": {"input": 1.25, "output": 5.00},
    "gemini-2.0-flash": {"input": 0.10, "output": 0.40},
+    "gemini-2.0-flash-lite": {"input": 0.0075, "output": 0.30},
    "gemini-2.5-flash-preview-04-17": {"input": 0.15, "output": 0.60, "thought": 3.50},
    "gemini-2.5-pro-preview-03-25": {"input": 1.25, "output": 10.0},
    # Anthropic Pricing: https://www.anthropic.com/pricing#anthropic-api