mirror of
https://github.com/khoaliber/khoj.git
synced 2026-03-09 13:25:11 +00:00
Track gemini 2.0 flash lite cost. Reduce max prompt size for 4o-mini
This commit is contained in:
@@ -51,7 +51,7 @@ except ImportError:
|
|||||||
model_to_prompt_size = {
|
model_to_prompt_size = {
|
||||||
# OpenAI Models
|
# OpenAI Models
|
||||||
"gpt-4o": 60000,
|
"gpt-4o": 60000,
|
||||||
"gpt-4o-mini": 120000,
|
"gpt-4o-mini": 60000,
|
||||||
"gpt-4.1": 60000,
|
"gpt-4.1": 60000,
|
||||||
"gpt-4.1-mini": 120000,
|
"gpt-4.1-mini": 120000,
|
||||||
"gpt-4.1-nano": 120000,
|
"gpt-4.1-nano": 120000,
|
||||||
|
|||||||
@@ -52,6 +52,7 @@ model_to_cost: Dict[str, Dict[str, float]] = {
|
|||||||
"gemini-1.5-pro": {"input": 1.25, "output": 5.00},
|
"gemini-1.5-pro": {"input": 1.25, "output": 5.00},
|
||||||
"gemini-1.5-pro-002": {"input": 1.25, "output": 5.00},
|
"gemini-1.5-pro-002": {"input": 1.25, "output": 5.00},
|
||||||
"gemini-2.0-flash": {"input": 0.10, "output": 0.40},
|
"gemini-2.0-flash": {"input": 0.10, "output": 0.40},
|
||||||
|
"gemini-2.0-flash-lite": {"input": 0.0075, "output": 0.30},
|
||||||
"gemini-2.5-flash-preview-04-17": {"input": 0.15, "output": 0.60, "thought": 3.50},
|
"gemini-2.5-flash-preview-04-17": {"input": 0.15, "output": 0.60, "thought": 3.50},
|
||||||
"gemini-2.5-pro-preview-03-25": {"input": 1.25, "output": 10.0},
|
"gemini-2.5-pro-preview-03-25": {"input": 1.25, "output": 10.0},
|
||||||
# Anthropic Pricing: https://www.anthropic.com/pricing#anthropic-api
|
# Anthropic Pricing: https://www.anthropic.com/pricing#anthropic-api
|
||||||
|
|||||||
Reference in New Issue
Block a user