stackhpc · Banh-Canh · May 7, 2026
diff --git a/.github/workflows/build-push-images.yml b/.github/workflows/build-push-images.yml
@@ -19,6 +19,7 @@ jobs:
           - chat
           - image-analysis
           - flux-image-gen
+          - omni
     permissions:
       contents: read
       id-token: write         # needed for signing the images with GitHub OIDC Token

diff --git a/charts/azimuth-omni-backend/.helmignore b/charts/azimuth-omni-backend/.helmignore
@@ -0,0 +1,33 @@
+# Patterns to ignore when building packages.
+# This supports shell glob matching, relative path matching, and
+# negation (prefixed with !). Only one pattern per line.
+.DS_Store
+# Common VCS dirs
+.git/
+.gitignore
+.bzr/
+.bzrignore
+.hg/
+.hgignore
+.svn/
+# Common backup files
+*.swp
+*.bak
+*.tmp
+*.orig
+*~
+# Various IDEs
+.project
+.idea/
+*.tmproj
+.vscode/
+
+# Others (the kubeconfig glob covers both .yml and .yaml)
+README.md
+Dockerfile
+*kubeconfig.y*ml
+venv/
+__pycache__/
+images/
+*.secret
+ci/
diff --git a/charts/azimuth-omni-backend/Chart.yaml b/charts/azimuth-omni-backend/Chart.yaml
@@ -0,0 +1,16 @@
+apiVersion: v2
+name: azimuth-llm-omni-backend
+description: >-
+  In-cluster vLLM backends for the Omni multimodal interface
+  (text-to-text / chat, text-to-speech, text-to-image).
+maintainers:
+  - name: "Victor HANG"
+    email: victor@stackhpc.com
+
+type: application
+
+# The version and appVersion are updated by the chart build script
+version: 0.1.0
+appVersion: local
+
+icon: https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg
diff --git a/charts/azimuth-omni-backend/ci/test-values.yaml b/charts/azimuth-omni-backend/ci/test-values.yaml
@@ -0,0 +1,13 @@
+# CI values: enable just the TTT backend, backed by the smallest possible model.
+tts:
+  enabled: false
+tti:
+  enabled: false
+ttt:
+  enabled: true
+  api:
+    gpus: 0
+    monitoring:
+      enabled: false
+  huggingface:
+    model: HuggingFaceTB/SmolLM2-135M-Instruct
diff --git a/charts/azimuth-omni-backend/templates/NOTES.txt b/charts/azimuth-omni-backend/templates/NOTES.txt
@@ -0,0 +1,18 @@
+Azimuth Omni backends provide one or more in-cluster vLLM model deployments
+(text-to-text / chat, text-to-speech, text-to-image) for the Omni interface.
+
+Backends in this release:
+{{- /* One line per backend alias: its model and in-cluster URL when enabled, otherwise a hint on how to enable it. A missing alias falls back to an empty dict and is reported as disabled. */}}
+{{- range $alias := list "ttt" "tts" "tti" }}
+{{- $sub := index $.Values $alias | default dict }}
+{{- if $sub.enabled }}
+  - {{ $alias }}: {{ $sub.huggingface.model }} (in-cluster at http://{{ $.Release.Name }}-{{ $alias }}.{{ $.Release.Namespace }}.svc)
+{{- else }}
+  - {{ $alias }}: disabled (toggle with `{{ $alias }}.enabled=true`)
+{{- end }}
+{{- end }}
+
+Each enabled backend downloads its model weights from HuggingFace on first
+start, which can take a while.
+
+Release notes: https://github.com/stackhpc/azimuth-llm/releases