mirror of
https://github.com/khoaliber/khoj.git
synced 2026-03-04 21:29:12 +00:00
Default to gpt-4o-mini instead of gpt-3.5-turbo in tests, func args
GPT-4o-mini is cheaper and smarter, and can hold more context than GPT-3.5-turbo. In production we also default to gpt-4o-mini, so it makes sense to upgrade the defaults and tests to work with it.
This commit is contained in:
@@ -112,7 +112,7 @@ def converse(
     user_query,
     online_results: Optional[Dict[str, Dict]] = None,
     conversation_log={},
-    model: str = "gpt-3.5-turbo",
+    model: str = "gpt-4o-mini",
     api_key: Optional[str] = None,
     api_base_url: Optional[str] = None,
     temperature: float = 0.2,
@@ -23,6 +23,7 @@ model_to_prompt_size = {
     "gpt-3.5-turbo-0125": 12000,
     "gpt-4-0125-preview": 20000,
     "gpt-4-turbo-preview": 20000,
+    "gpt-4o-mini": 20000,
     "TheBloke/Mistral-7B-Instruct-v0.2-GGUF": 3500,
     "NousResearch/Hermes-2-Pro-Mistral-7B-GGUF": 3500,
     "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF": 20000,
@@ -136,7 +137,7 @@ def generate_chatml_messages_with_context(
     user_message,
     system_message=None,
     conversation_log={},
-    model_name="gpt-3.5-turbo",
+    model_name="gpt-4o-mini",
     loaded_model: Optional[Llama] = None,
     max_prompt_size=None,
     tokenizer_name=None,
@@ -89,7 +89,7 @@ class SearchConfig(ConfigBase):


 class OpenAIProcessorConfig(ConfigBase):
     api_key: str
-    chat_model: Optional[str] = "gpt-3.5-turbo"
+    chat_model: Optional[str] = "gpt-4o-mini"


 class OfflineChatProcessorConfig(ConfigBase):
Reference in New Issue
Block a user