Add Vision Support (#889)

# Summary of Changes * New UI to show preview of image uploads * ChatML message changes to support gpt-4o vision based responses on images * AWS S3 image uploads for persistent image context in conversations * Database changes to have `vision_enabled` option in server admin panel while configuring models * Render previously uploaded images in the chat history, show uploaded images for pending msgs * Pass the uploaded_image_url through to subqueries * Allow image to render upon first message from the homepage * Add rendering support for images to shared chat as well * Fix some UI/functionality bugs in the share page * Convert user attached images for chat to webp format before upload * Use placeholder to attached image for data source, response mode actors * Update all clients to call /api/chat as a POST instead of GET request * Fix copying chat messages with images to clipboard TLDR; Add vision support for openai models on Khoj via the web UI! --------- Co-authored-by: sabaimran <narmiabas@gmail.com> Co-authored-by: Debanjum Singh Solanky <debanjum@gmail.com>
2026-03-02 13:18:18 +00:00 · 2024-09-09 17:22:18 -05:00
parent b553bba1d8
commit 549686a7a4
33 changed files with 740 additions and 417 deletions
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -462,8 +462,8 @@ async def test_chat_with_unauthenticated_user(chat_client_with_auth, api_user2:
    headers = {"Authorization": f"Bearer {api_user2.token}"}

    # Act
-    auth_response = chat_client_with_auth.get(f'/api/chat?q="Hello!"', headers=headers)
-    no_auth_response = chat_client_with_auth.get(f'/api/chat?q="Hello!"')
+    auth_response = chat_client_with_auth.post(f'/api/chat?q="Hello!"', headers=headers)
+    no_auth_response = chat_client_with_auth.post(f'/api/chat?q="Hello!"')

    # Assert
    assert auth_response.status_code == 200