Track Gemini 2.0 Flash-Lite cost. Reduce max prompt size for gpt-4o-mini

This commit is contained in:
Debanjum
2025-05-13 13:03:35 -06:00
parent e125e299a7
commit 417ab42206
2 changed files with 2 additions and 1 deletion

View File

@@ -51,7 +51,7 @@ except ImportError:
model_to_prompt_size = {
# OpenAI Models
"gpt-4o": 60000,
"gpt-4o-mini": 120000,
"gpt-4o-mini": 60000,
"gpt-4.1": 60000,
"gpt-4.1-mini": 120000,
"gpt-4.1-nano": 120000,

View File

@@ -52,6 +52,7 @@ model_to_cost: Dict[str, Dict[str, float]] = {
"gemini-1.5-pro": {"input": 1.25, "output": 5.00},
"gemini-1.5-pro-002": {"input": 1.25, "output": 5.00},
"gemini-2.0-flash": {"input": 0.10, "output": 0.40},
"gemini-2.0-flash-lite": {"input": 0.0075, "output": 0.30},
"gemini-2.5-flash-preview-04-17": {"input": 0.15, "output": 0.60, "thought": 3.50},
"gemini-2.5-pro-preview-03-25": {"input": 1.25, "output": 10.0},
# Anthropic Pricing: https://www.anthropic.com/pricing#anthropic-api