[feat] Activate Dreamverse LTX2 integration

Davids048 · SolitaryThinker · RandNMR73 · Davids048 · commit d325f2ddf629 · 2026-05-11T17:24:48.000-07:00
Apply Dreamverse monorepo changes for stack slice 13/13 from the source branch. Source-Branch: will/dreamverse-monorepo Source-SHA: 03d3e61 Dreamverse-Stack: 13/13 Co-authored-by: SolitaryThinker <wlsaidhi@gmail.com> Co-authored-by: Matthew Noto <99706358+RandNMR73@users.noreply.github.com> Co-authored-by: XOR-op <17672363+XOR-op@users.noreply.github.com> Co-authored-by: Zhang Peiyuan <42993249+jzhang38@users.noreply.github.com>
diff --git a/docs/contributing/dreamverse-development.md b/docs/contributing/dreamverse-development.md
@@ -0,0 +1,100 @@
+# Dreamverse Development
+
+Dreamverse lives under `apps/dreamverse/` as a product app inside the
+FastVideo monorepo. Backend code uses the local FastVideo workspace package;
+frontend tooling remains standalone under `apps/dreamverse/web/`.
+
+## Backend tests
+
+Run CPU-safe backend tests from the FastVideo repository root:
+
+```bash
+uv run --locked --package dreamverse --extra test pytest apps/dreamverse/server/tests/ -m 'not gpu' -q
+```
+
+## Backend launch
+
+Launch the migrated backend through the installed console commands:
+
+```bash
+dreamverse-server --port 8009
+dreamverse-mock-server --port 8009
+```
+
+If `dreamverse-server` is missing, install FastVideo with the `dreamverse`
+extra from the checkout:
+
+```bash
+uv pip install -e ".[dreamverse]"
+```
+
+## Frontend build and tests
+
+Run frontend commands from the standalone web app:
+
+```bash
+cd apps/dreamverse/web
+pnpm install --frozen-lockfile
+pnpm run build
+pnpm run test
+```
+
+Playwright is intentionally run against a live backend as part of the GPU4
+manual verification flow, not in the Phase 3 migration gate.
+
+## Local GPU4 verification hook
+
+Use physical GPU 4 for migration smoke tests. `CUDA_VISIBLE_DEVICES=4` makes
+that GPU appear as logical GPU 0 inside the process, preserving the previous
+Dreamverse deployment behavior.
+
+```bash
+CUDA_VISIBLE_DEVICES=4 dreamverse-server --host 0.0.0.0 --port 8009
+```
+
+In another shell, verify the service:
+
+```bash
+curl -s http://localhost:8009/healthz
+```
+
+Phase 4 adds the public `/healthz`, `/readyz`, `/status`,
+`/prompt-system-config`, and `/curated-presets` route coverage needed for the
+full Playwright suite.
+
+## Phase 0 production-equivalent prerequisites
+
+For the production-equivalent NVFP4 path, install these dependencies
+in the FastVideo `.venv` before GPU smoke tests:
+
+```bash
+uv pip install --python .venv/bin/python \
+  flashinfer-python flash-attn cerebras-cloud-sdk openai \
+  --no-build-isolation
+```
+
+| Package | Why |
+|---|---|
+| `flashinfer-python` | Required for NVFP4 quantization. Without it, model load fails with `ImportError: NVFP4 quantization requires flashinfer`. |
+| `flash-attn` | Optional but recommended; without it attention falls back to Torch SDPA (functional but slower). |
+| `cerebras-cloud-sdk` | Required by the migrated prompt enhancer for the default `cerebras` provider. |
+| `openai` | Required by the prompt enhancer's OpenAI-compatible providers + downstream rewrites. |
+
+### B200 / sm_100a + gcc-15 conda toolchain (flashinfer JIT workaround)
+
+On hosts where the conda toolchain ships gcc-15 (which nvcc rejects with
+`#error -- unsupported GNU version! gcc versions later than 14 are not
+supported!`), set these env vars before launching anything that triggers
+flashinfer's JIT kernel build:
+
+```bash
+export CC=/usr/bin/gcc-13
+export CXX=/usr/bin/g++-13
+export CUDAHOSTCXX=/usr/bin/g++-13
+export NVCC_PREPEND_FLAGS="-ccbin /usr/bin/gcc-13 -allow-unsupported-compiler"
+```
+
+`dreamverse-server` does NOT set these — they need to come from the launching
+shell. The `dreamverse-deploy` skill
+([`.agents/skills/dreamverse-deploy/`](../../.agents/skills/dreamverse-deploy/SKILL.md))
+sets them for you and is the recommended local-deploy path.
diff --git a/fastvideo/models/registry.py b/fastvideo/models/registry.py
@@ -115,6 +115,8 @@
 _UPSAMPLERS = {
     "SRTo720pUpsampler": ("upsamplers", "hunyuan15", "SRTo720pUpsampler"),
     "SRTo1080pUpsampler": ("upsamplers", "hunyuan15", "SRTo1080pUpsampler"),
+    "LTX2LatentUpsampler":
+    ("upsamplers", "ltx2_upsampler", "LTX2LatentUpsampler"),
 }
 
 _LEGACY_FAST_VIDEO_MODELS = {
diff --git a/fastvideo/registry.py b/fastvideo/registry.py
@@ -212,35 +212,42 @@ def _get_config_info(
 
 
 def _register_configs() -> None:
-    # LTX-2 (base)
+    # LTX-2 (distilled) — registered FIRST so its detector wins over
+    # the base detector when both fire. The detector loop in
+    # ``get_model_name_for_path`` ORs the path-based check with a
+    # pipeline-name check (``ltx2pipeline``) which the base detector's
+    # "distilled not in path" predicate matches as True (the
+    # pipeline_name string contains no "distilled" marker), so the
+    # less-specific BASE detector would otherwise win when the
+    # input is the absolute path of the distilled checkpoint.
     register_configs(
         sampling_param_cls=None,
         pipeline_config_cls=LTX2T2VConfig,
         workload_types=(WorkloadType.T2V, ),
         hf_model_paths=[
-            "Lightricks/LTX-2",
-            "FastVideo/LTX2-base",
-            "FastVideo/LTX2-Diffusers",
+            "FastVideo/LTX2-Distilled-Diffusers",
         ],
         model_detectors=[
-            lambda path: ("ltx2" in path.lower() or "ltx-2" in path.lower()) and "distilled" not in path.lower(),
+            lambda path: ("ltx2" in path.lower() or "ltx-2" in path.lower()) and "distilled" in path.lower(),
         ],
         model_family="ltx2",
-        default_preset="ltx2_base",
+        default_preset="ltx2_distilled",
     )
-    # LTX-2 (distilled)
+    # LTX-2 (base)
     register_configs(
         sampling_param_cls=None,
         pipeline_config_cls=LTX2T2VConfig,
         workload_types=(WorkloadType.T2V, ),
         hf_model_paths=[
-            "FastVideo/LTX2-Distilled-Diffusers",
+            "Lightricks/LTX-2",
+            "FastVideo/LTX2-base",
+            "FastVideo/LTX2-Diffusers",
         ],
         model_detectors=[
-            lambda path: ("ltx2" in path.lower() or "ltx-2" in path.lower()) and "distilled" in path.lower(),
+            lambda path: ("ltx2" in path.lower() or "ltx-2" in path.lower()) and "distilled" not in path.lower(),
         ],
         model_family="ltx2",
-        default_preset="ltx2_distilled",
+        default_preset="ltx2_base",
     )
 
     # Stable Audio Open (text-to-audio). Both variants must be loaded
diff --git a/mkdocs.yml b/mkdocs.yml
@@ -161,6 +161,11 @@ nav:
   - Design:
     - Overview: design/overview.md
     - Training Architecture: design/training_architecture.md
+    - Server Contracts:
+      - Overview: design/server_contracts/index.md
+      - OpenAI HTTP: design/server_contracts/openai.md
+      - Streaming WebSocket: design/server_contracts/streaming.md
+      - Dynamo Integration: design/server_contracts/dynamo.md
   - Developer Guide:
     - Overview: contributing/overview.md
     - Developer Environment:
@@ -172,6 +177,7 @@ nav:
     - Testing: contributing/testing.md
     - Profiling: contributing/profiling.md
     - Coding Agents: contributing/coding_agents.md
+    - Dreamverse Development: contributing/dreamverse-development.md
     - Attention Backend Development: contributing/attention_backend.md
   - API Reference:
     - FastVideo: api/fastvideo.md

Original file line number	Diff line number	Diff line change
`@@ -115,6 +115,8 @@`
`115`	`115`	`_UPSAMPLERS = {`
`116`	`116`	`"SRTo720pUpsampler": ("upsamplers", "hunyuan15", "SRTo720pUpsampler"),`
`117`	`117`	`"SRTo1080pUpsampler": ("upsamplers", "hunyuan15", "SRTo1080pUpsampler"),`
	`118`	`+ "LTX2LatentUpsampler":`
	`119`	`+ ("upsamplers", "ltx2_upsampler", "LTX2LatentUpsampler"),`
`118`	`120`	`}`
`119`	`121`
`120`	`122`	`_LEGACY_FAST_VIDEO_MODELS = {`