Support image upload with "vision" purpose in chat

chriscarrollsmith · chriscarrollsmith · commit a508405c8ae4 · 2026-03-11T19:36:54.000-04:00
diff --git a/routers/chat.py b/routers/chat.py
@@ -7,7 +7,7 @@
 from typing import AsyncGenerator, Dict, Any, Callable, cast
 from pydantic import ValidationError
 from fastapi.templating import Jinja2Templates
-from fastapi import APIRouter, Form, Depends, Request
+from fastapi import APIRouter, Form, Depends, Request, UploadFile, File
 from fastapi.responses import StreamingResponse, HTMLResponse
 from openai.types.responses import (
     ResponseCreatedEvent, ResponseOutputItemAddedEvent,
@@ -57,23 +57,42 @@ async def send_message(
     request: Request,
     conversation_id: str,
     userInput: str = Form(...),
+    image: UploadFile | None = File(None),
     client: AsyncOpenAI = Depends(lambda: AsyncOpenAI())
 ) -> HTMLResponse:
+    # Build multimodal content array
+    content: list[dict[str, str]] = [{
+        "type": "input_text",
+        "text": f"System: Today's date is {datetime.today().strftime('%Y-%m-%d')}\n{userInput}"
+    }]
+
+    # If an image was uploaded, send it to OpenAI and add to content
+    image_file_id: str | None = None
+    if image and image.filename and image.size:
+        image_bytes = await image.read()
+        if image_bytes:
+            openai_file = await client.files.create(
+                file=(image.filename, image_bytes),
+                purpose="vision"
+            )
+            image_file_id = openai_file.id
+            content.append({
+                "type": "input_image",
+                "file_id": image_file_id,
+            })
+
     # Create a new conversation item for the user's message
     await client.conversations.items.create(
         conversation_id=conversation_id,
         items=[{
             "type": "message",
             "role": "user",
-            "content": [{
-                "type": "input_text",
-                "text": f"System: Today's date is {datetime.today().strftime('%Y-%m-%d')}\n{userInput}"
-            }]
+            "content": content
         }]
     )
 
     user_message_html = templates.get_template("components/user-message.html").render(
-        request=request, user_input=userInput
+        request=request, user_input=userInput, image_file_id=image_file_id
     )
     assistant_run_html = templates.get_template("components/assistant-run.html").render(
         request=request, conversation_id=conversation_id
diff --git a/static/stream-md.js b/static/stream-md.js
@@ -259,3 +259,46 @@ window.removeNetworkError = function() {
         console.warn('removeNetworkError failed:', e);
     }
 };
+
+// Image upload preview helpers
+
+/**
+ * Show a thumbnail of the file chosen in the image <input>.
+ *
+ * When the selection is empty (e.g. the picker was cancelled, which clears
+ * the input in some browsers) any stale thumbnail is removed instead.
+ *
+ * @param {HTMLInputElement} input - The file input whose selection changed.
+ */
+window.previewImage = function(input) {
+    const file = input && input.files && input.files[0];
+    if (!file) {
+        // Nothing is attached any more, so the old thumbnail would be misleading.
+        window.clearImagePreview();
+        return;
+    }
+    const preview = document.getElementById('imagePreview');
+    const previewImg = document.getElementById('imagePreviewImg');
+    if (!preview || !previewImg) return;  // Preview markup absent; the upload still works.
+    const reader = new FileReader();
+    reader.onload = function(e) {
+        // Ignore a late read if the selection changed or was cleared meanwhile.
+        if (!input.files || input.files[0] !== file) return;
+        previewImg.src = e.target.result;
+        preview.style.display = 'flex';
+    };
+    reader.readAsDataURL(file);
+};
+
+/**
+ * Hide the thumbnail and detach the selected image from the form.
+ * Missing elements are skipped, so this is safe on pages without the widget.
+ */
+window.clearImagePreview = function() {
+    const preview = document.getElementById('imagePreview');
+    const previewImg = document.getElementById('imagePreviewImg');
+    const imageInput = document.getElementById('imageInput');
+    if (preview) preview.style.display = 'none';
+    if (previewImg) previewImg.src = '';
+    if (imageInput) imageInput.value = '';
+};
diff --git a/static/styles.css b/static/styles.css
@@ -407,13 +407,104 @@ pre {
 
 .inputForm {
   display: flex;
-  align-items: flex-end;
+  flex-direction: column;
   width: 100%;
   padding: 10px;
   padding-bottom: 40px;
   order: 1;
 }
 
+.inputRow {
+  display: flex;
+  align-items: flex-end;
+  width: 100%;
+}
+
+/* Image upload button */
+.imageUploadLabel {
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  width: 40px;
+  height: calc(1em + 32px + 4px);
+  cursor: pointer;
+  color: #666;
+  flex-shrink: 0;
+  border-radius: 50%;
+  transition: color 0.2s;
+}
+
+.imageUploadLabel:hover,
+.imageUploadLabel:focus-within {
+  color: #000;
+}
+
+/* Show keyboard focus on the label; the input inside it is not painted. */
+.imageUploadLabel:focus-within {
+  outline: 2px solid currentColor;
+  outline-offset: 2px;
+}
+
+/*
+ * Hide the native file input visually but keep it focusable.
+ * `display: none` would drop it from the tab order, leaving the
+ * attach-image control unreachable from the keyboard.
+ */
+.imageUploadInput {
+  position: absolute;
+  width: 1px;
+  height: 1px;
+  margin: -1px;
+  padding: 0;
+  border: 0;
+  overflow: hidden;
+  clip: rect(0 0 0 0);
+  clip-path: inset(50%);
+  white-space: nowrap;
+}
+
+/* Image preview above the input row */
+.imagePreview {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  padding: 8px;
+  margin-bottom: 8px;
+  background: #f5f5f5;
+  border-radius: 8px;
+  width: fit-content;
+}
+
+.imagePreview img {
+  max-height: 80px;
+  max-width: 120px;
+  border-radius: 6px;
+  object-fit: cover;
+}
+
+.imagePreviewRemove {
+  background: none;
+  border: none;
+  font-size: 1.2em;
+  cursor: pointer;
+  color: #999;
+  padding: 4px 8px;
+  line-height: 1;
+}
+
+.imagePreviewRemove:hover {
+  color: #333;
+}
+
+/* Thumbnail in user messages */
+.userImageThumb {
+  max-height: 120px;
+  max-width: 200px;
+  border-radius: 8px;
+  margin-bottom: 8px;
+  display: block;
+}
+
 .input {
   flex-grow: 1;
   padding: 16px 24px;
diff --git a/templates/components/user-message.html b/templates/components/user-message.html
@@ -1,2 +1,7 @@
 <!-- user-message.html -->
-<div class="userMessage">{{ user_input }}</div>
+<div class="userMessage">
+  {% if image_file_id %}
+  <img src="/files/{{ image_file_id }}/content" alt="Uploaded image" class="userImageThumb" />
+  {% endif %}
+  {{ user_input }}
+</div>
diff --git a/templates/index.html b/templates/index.html
@@ -24,33 +24,51 @@
             {% endfor %}
           </div>
           <form id="chatForm" class="inputForm clearfix"
-                hx-on::after-request="this.reset()"
-                hx-on::before-request="removeNetworkError(); disableSendButton()">
-            <textarea
-              class="input"
-              name="userInput"
-              placeholder="Enter your question"
-              id="userInput"
-              autocomplete="off"
-              rows="1" {# Start with one row, will expand with CSS #}
-              oninput="this.style.height = 'auto'; this.style.height = (this.scrollHeight) + 'px';"
-              hx-on:keydown="if (event.key === 'Enter' && !event.shiftKey) { event.preventDefault(); this.form.querySelector('button[type=submit]').click(); }"
-              required
-            ></textarea>
-            <button
-              id="sendButton"
-              type="submit"
-              class="button"
-              hx-post="/chat/{{ conversation_id }}/send"
-              hx-target="#messages"
-              hx-swap="beforeend"
-              {% if inputDisabled %}disabled{% endif %}
-            >
-              <span class="button__text">Send</span>
-              <span class="button__loader" style="display: none;">
-                <span class="loading-dot"></span><span class="loading-dot"></span><span class="loading-dot"></span>
-              </span>
-            </button>
+                hx-on::after-request="this.reset(); clearImagePreview();"
+                hx-on::before-request="removeNetworkError(); disableSendButton()"
+                hx-encoding="multipart/form-data">
+            <div id="imagePreview" class="imagePreview" style="display:none;">
+              <img id="imagePreviewImg" src="" alt="Preview" />
+              <button type="button" class="imagePreviewRemove" onclick="clearImagePreview()">&times;</button>
+            </div>
+            <div class="inputRow">
+              <label class="imageUploadLabel" title="Attach image">
+                <svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><rect x="3" y="3" width="18" height="18" rx="2" ry="2"/><circle cx="8.5" cy="8.5" r="1.5"/><polyline points="21 15 16 10 5 21"/></svg>
+                <input
+                  type="file"
+                  name="image"
+                  id="imageInput"
+                  accept="image/png,image/jpeg,image/webp,image/gif"
+                  class="imageUploadInput"
+                  onchange="previewImage(this)"
+                />
+              </label>
+              <textarea
+                class="input"
+                name="userInput"
+                placeholder="Enter your question"
+                id="userInput"
+                autocomplete="off"
+                rows="1" {# Start with one row, will expand with CSS #}
+                oninput="this.style.height = 'auto'; this.style.height = (this.scrollHeight) + 'px';"
+                hx-on:keydown="if (event.key === 'Enter' && !event.shiftKey) { event.preventDefault(); this.form.querySelector('button[type=submit]').click(); }"
+                required
+              ></textarea>
+              <button
+                id="sendButton"
+                type="submit"
+                class="button"
+                hx-post="/chat/{{ conversation_id }}/send"
+                hx-target="#messages"
+                hx-swap="beforeend"
+                {% if inputDisabled %}disabled{% endif %}
+              >
+                <span class="button__text">Send</span>
+                <span class="button__loader" style="display: none;">
+                  <span class="loading-dot"></span><span class="loading-dot"></span><span class="loading-dot"></span>
+                </span>
+              </button>
+            </div>
           </form>
         </div>
 {% endblock %}
diff --git a/tests/test_image_upload.py b/tests/test_image_upload.py
diff --git a/tests/test_image_upload_live.py b/tests/test_image_upload_live.py