Partha-dev01
diff --git a/‎DOCS.md‎
Lines changed: 31 additions & 0 deletions b/‎DOCS.md‎
Lines changed: 31 additions & 0 deletions
diff --git a/‎app/api/chat/generate-words/route.ts‎
Lines changed: 281 additions & 0 deletions b/‎app/api/chat/generate-words/route.ts‎
Lines changed: 281 additions & 0 deletions
@@ -409,6 +409,9 @@ npx playwright test    # Run all 30 tests
 | R12 | **CI Playwright failures — AWS SDK "Region is missing"** | `next.config.ts` inlines env vars at build time with `?? ""` defaults. On CI (no `.env.local`), `BEDROCK_REGION`/`POLLY_REGION` resolved to `""` (empty string). Nullish coalescing (`??`) doesn't catch empty strings, so `process.env.BEDROCK_REGION ?? "us-east-1"` → `""`. AWS SDK threw `Error: Region is missing` outside try/catch → uncaught 500. Fix: changed `??` to `||` in all 4 API routes (summary, clinical, tts, conversation) and moved client creation inside try/catch blocks. TTS error status changed from 500 → 503. |
 | R13 | **Step 7 auto-advances without verifying motor actions** | Voice agent spoke motor instructions ("touch your nose", "wave") but immediately moved on without checking if the child performed the action. Also, agent text wasn't displayed prominently. Fix: added camera-based motor action verification using existing YOLO pose detection pipeline. Motor turns activate camera → YOLO extracts 17 keypoints → rule-based ActionDetector checks keypoint geometry → ActionTracker requires 5 consecutive positive frames → confirmed. Agent text now displayed in large centered speech bubble with domain emoji headers. |
 | R14 | **Stage 10 worker URL parse error** | `Failed to execute 'fetch' on 'WorkerGlobalScope': Failed to parse URL from /models/yolo26n-pose-int8.onnx`. ONNX model paths were relative URLs (`/models/...`) which fail inside Web Workers because relative paths resolve against the worker script URL (blob: or /_next/static/), not the page origin. Fix: prefixed all 4 model paths with `${self.location.origin}` in PipelineOrchestrator.ts and MultimodalOrchestrator.ts. |
+| R15 | **Stages 4, 7, 9 overlap and lack differentiation** | Stage 4 (Communication) and Stage 9 (Audio) were both simple speech echo tests with hardcoded word lists. Stage 7 (Preparation) mixed motor actions with LLM conversation. Fix: Stage 4 → pure Word Echo with LLM-generated age-appropriate words + Polly TTS. Stage 7 → pure Motor Action Challenge with fixed 6-action sequence + live YOLO detection feedback (confidence bar, 5-dot frame counter, color-coded borders). Stage 9 → Sentence Echo + Comprehension (Part A: sentence repetition with word-overlap scoring, Part B: audio instruction following). |
+| R16 | **Stage 10 camera fails on mobile** | `getUserMedia()` with fixed resolution constraints fails on many mobile browsers. Also: no HTTPS check (required for camera on mobile), generic error messages, no retry mechanism. Fix: 3-tier progressive constraint negotiation (ideal 320×240 → facingMode only → any video). HTTPS early check. Specific error messages per DOMException type (NotAllowedError, NotFoundError, NotReadableError, SecurityError). Retry Camera + Skip buttons on failure. Shared `cameraUtils.ts` reused by Stage 7 and Stage 10. |
+| R17 | **Stages auto-advance without criteria verification** | Some stages allowed proceeding even when insufficient data was collected. Fix: minimum criteria gates on Stages 4 (2/6 words), 7 (3/6 actions), 9 (2/7 items), 10 (5 samples + 30s). Stages show "Let's try again!" card with Try Again/Skip buttons when criteria not met. |
 
 ---
 
@@ -538,3 +541,31 @@ npx playwright test    # Run all 30 tests
 - Updated: `app/api/chat/conversation/route.ts` (action field in metadata)
 - Fixed: `app/lib/inference/PipelineOrchestrator.ts` (absolute model URLs)
 - Fixed: `app/lib/inference/MultimodalOrchestrator.ts` (absolute model URLs)
+
+### v1.5.0 — 2026-03-04 (Stage Differentiation, Dynamic Content, Mobile Camera, Criteria Gates)
+
+**Major Changes:**
+- **Stage 4 → Word Echo**: Dynamic LLM-generated (Bedrock Nova Lite) age-appropriate words spoken via Polly TTS. Child echoes back, matched via Web Speech API. 6 words per session from age-stratified pools (18-36mo, 36-60mo, 60+mo). Falls back to curated word pools when Bedrock unavailable.
+- **Stage 7 → Action Challenge**: Pure motor action test — fixed sequence of 6 actions (wave, touch nose, clap, raise arms, touch head, touch ears). Camera + YOLO pose detection with **live feedback**: confidence bar, color-coded camera border (red/blue/green), 5-dot frame counter showing consecutive detection progress, contextual status text ("Step into view", "Getting closer!", "Almost there!"). No LLM/TTS/STT — purely visual.
+- **Stage 9 → Speech & Comprehension**: Two-part test. Part A: 4 LLM-generated sentences with word-overlap matching (threshold 0.4). Part B: 3 audio instructions testing comprehension (any verbal response = engaged). Both spoken via Polly TTS.
+
+**New:**
+- `POST /api/chat/generate-words` — Shared endpoint for dynamic content generation. Modes: `words`, `sentences`, `instructions`. Falls back to curated age-stratified pools (20 words, 6 sentences, 5 instructions per bracket).
+- `app/lib/camera/cameraUtils.ts` — Shared camera utility: 3-tier progressive `getUserMedia` constraint negotiation (ideal 320×240 → facingMode only → any camera). HTTPS early check. Specific error messages per DOMException type.
+- `consecutiveHits` exposed from ActionTracker and useActionCamera hook for real-time frame progress display.
+
+**Fixed:**
+- **Mobile camera failures**: Progressive constraint fallback handles devices that can't satisfy resolution constraints. HTTPS check prevents silent failures on mobile HTTP. Specific error messages for NotFoundError, NotReadableError, OverconstrainedError, SecurityError. Retry Camera + Skip buttons added to Stage 10.
+- **Stages auto-advance without verification**: Minimum criteria gates added — Stage 4 (2/6 words), Stage 7 (3/6 actions), Stage 9 (2/7 items), Stage 10 (5 samples + 30s). Shows retry/skip menu when criteria not met.
+
+**Files:**
+- Created: `app/api/chat/generate-words/route.ts`
+- Created: `app/lib/camera/cameraUtils.ts`
+- Rewritten: `app/intake/communication/page.tsx` (Word Echo)
+- Rewritten: `app/intake/preparation/page.tsx` (Action Challenge)
+- Rewritten: `app/intake/audio/page.tsx` (Speech & Comprehension)
+- Updated: `app/intake/video-capture/page.tsx` (mobile camera + criteria gate)
+- Updated: `app/hooks/useActionCamera.ts` (consecutiveHits + cameraUtils)
+- Updated: `app/lib/actions/actionDetector.ts` (consecutiveHits in tracker return)
+- Updated: `tests/intake-flow.spec.ts` (Step 4, 7, 9 test assertions)
+- Updated: `tests/app-pages.spec.ts` (generate-words API test)
@@ -0,0 +1,281 @@
+/**
+ * POST /api/chat/generate-words
+ *
+ * Generates age-appropriate words, sentences, or instructions for
+ * speech echo and comprehension stages. Falls back to curated
+ * age-stratified pools when Bedrock is unavailable.
+ *
+ * Request body:
+ *   { ageMonths: number, count?: number, mode: "words"|"sentences"|"instructions" }
+ *
+ * Response:
+ *   { items: Array<{ text: string, emoji: string }>, fallback: boolean }
+ */
+
+import { NextRequest, NextResponse } from "next/server";
+import {
+  BedrockRuntimeClient,
+  InvokeModelCommand,
+} from "@aws-sdk/client-bedrock-runtime";
+
+/* ------------------------------------------------------------------ */
+/*  Types                                                              */
+/* ------------------------------------------------------------------ */
+
+type Mode = "words" | "sentences" | "instructions"; // Kind of content to generate; selects both the prompt template and the fallback pool.
+
+interface GenerateRequest { // JSON body read by the POST handler, which supplies a default for any field left undefined.
+  ageMonths: number; // Child's age in months; the handler defaults it to 36.
+  count?: number; // Number of items wanted; the handler defaults it to 6 and clamps it to 1–10.
+  mode: Mode; // Content kind; the handler defaults it to "words".
+}
+
+interface GeneratedItem { // One entry of the response `items` array, whether model-generated or drawn from a fallback pool.
+  text: string; // The word, sentence, or instruction itself.
+  emoji: string; // Emoji paired with the text.
+}
+
+/* ------------------------------------------------------------------ */
+/*  Bedrock client                                                     */
+/* ------------------------------------------------------------------ */
+
+/**
+ * AWS region used for Bedrock calls.
+ *
+ * `||` rather than `??` is deliberate: the env var can be inlined as an empty
+ * string at build time, and an empty region makes the AWS SDK fail with
+ * "Region is missing". An empty value must therefore also fall back.
+ */
+const BEDROCK_REGION = process.env.BEDROCK_REGION || "us-east-1";
+
+/** Lazily created client, reused by every request served by this module instance. */
+let cachedBedrockClient: BedrockRuntimeClient | undefined;
+
+/**
+ * Returns the Bedrock runtime client for `BEDROCK_REGION`.
+ *
+ * The client is constructed on first use and then reused, so that requests
+ * share one client instead of building a new one each time. Construction still
+ * happens inside the caller's try/catch; if it throws, nothing is cached and
+ * the next call retries.
+ *
+ * @returns The shared `BedrockRuntimeClient`.
+ */
+function getBedrockClient(): BedrockRuntimeClient {
+  if (!cachedBedrockClient) {
+    cachedBedrockClient = new BedrockRuntimeClient({ region: BEDROCK_REGION });
+  }
+  return cachedBedrockClient;
+}
+
+/* ------------------------------------------------------------------ */
+/*  Fallback pools — curated, age-stratified                           */
+/* ------------------------------------------------------------------ */
+
+const WORD_EMOJIS: Record<string, string> = { // Emoji for each word in FALLBACK_WORDS; pickFallbackWords substitutes "🔤" for any word not listed here.
+  mama: "👩", dada: "👨", ball: "⚽", dog: "🐶", cat: "🐱", milk: "🥛",
+  more: "➕", up: "⬆️", bye: "👋", hi: "🙋", book: "📖", shoe: "👟",
+  hat: "🎩", cup: "🥤", fish: "🐟", duck: "🦆", apple: "🍎", baby: "👶",
+  car: "🚗", bird: "🐦", banana: "🍌", elephant: "🐘", butterfly: "🦋",
+  dinosaur: "🦕", rainbow: "🌈", chocolate: "🍫", hello: "👋", purple: "🟣",
+  circle: "⭕", triangle: "🔺", giraffe: "🦒", penguin: "🐧", rocket: "🚀",
+  princess: "👸", monster: "👹", umbrella: "☂️", pumpkin: "🎃",
+  strawberry: "🍓", airplane: "✈️", crocodile: "🐊", computer: "💻",
+  adventure: "🗺️", incredible: "🌟", beautiful: "🌸", discovery: "🔍",
+  astronaut: "🧑‍🚀", magnificent: "✨", helicopter: "🚁", wonderful: "💫",
+  caterpillar: "🐛", watermelon: "🍉", constellation: "⭐", basketball: "🏀",
+  trampoline: "🤸", hippopotamus: "🦛", refrigerator: "🧊", thermometer: "🌡️",
+  xylophone: "🎵", vocabulary: "📝", harmonica: "🎶",
+};
+
+const FALLBACK_WORDS: Record<string, string[]> = { // Curated single-word pools (20 each), keyed by the bracket name getAgeBracket returns.
+  young: ["mama", "dada", "ball", "dog", "cat", "milk", "more", "up", "bye", "hi", // ageMonths < 36
+          "book", "shoe", "hat", "cup", "fish", "duck", "apple", "baby", "car", "bird"],
+  mid:   ["banana", "elephant", "butterfly", "dinosaur", "rainbow", "chocolate", "hello", // 36 <= ageMonths < 60
+          "purple", "circle", "triangle", "giraffe", "penguin", "rocket", "princess",
+          "monster", "umbrella", "pumpkin", "strawberry", "airplane", "crocodile"],
+  old:   ["computer", "adventure", "incredible", "beautiful", "discovery", "astronaut", // every other age (60 months and up)
+          "magnificent", "helicopter", "wonderful", "caterpillar", "watermelon",
+          "constellation", "basketball", "trampoline", "hippopotamus", "refrigerator",
+          "thermometer", "xylophone", "vocabulary", "harmonica"],
+};
+
+const FALLBACK_SENTENCES: Record<string, GeneratedItem[]> = { // Curated sentence pools (6 each), keyed by the bracket name getAgeBracket returns.
+  young: [ // ageMonths < 36
+    { text: "The cat is big", emoji: "🐱" },
+    { text: "I like dogs", emoji: "🐶" },
+    { text: "My ball is red", emoji: "⚽" },
+    { text: "I see a bird", emoji: "🐦" },
+    { text: "The sun is hot", emoji: "☀️" },
+    { text: "I want milk", emoji: "🥛" },
+  ],
+  mid: [ // 36 <= ageMonths < 60
+    { text: "The butterfly is very pretty", emoji: "🦋" },
+    { text: "I want to go outside and play", emoji: "🏃" },
+    { text: "My favorite color is blue", emoji: "🔵" },
+    { text: "The dog is running in the park", emoji: "🐶" },
+    { text: "I can count to ten", emoji: "🔢" },
+    { text: "The moon comes out at night", emoji: "🌙" },
+  ],
+  old: [ // every other age (60 months and up)
+    { text: "The elephant walked through the tall jungle", emoji: "🐘" },
+    { text: "Can you tell me about your favorite game", emoji: "🎮" },
+    { text: "The beautiful rainbow appeared after the rain", emoji: "🌈" },
+    { text: "I like to read books before bedtime", emoji: "📚" },
+    { text: "The spaceship flew high into the sky", emoji: "🚀" },
+    { text: "My friend and I played at the park today", emoji: "🏞️" },
+  ],
+};
+
+const FALLBACK_INSTRUCTIONS: Record<string, GeneratedItem[]> = { // Curated instruction pools (5 each), keyed by the bracket name getAgeBracket returns.
+  young: [ // ageMonths < 36
+    { text: "Clap your hands", emoji: "👏" },
+    { text: "Wave bye bye", emoji: "👋" },
+    { text: "Say your name", emoji: "🗣️" },
+    { text: "Touch your nose", emoji: "👃" },
+    { text: "Say mama", emoji: "👩" },
+  ],
+  mid: [ // 36 <= ageMonths < 60
+    { text: "Clap your hands two times", emoji: "👏" },
+    { text: "Say hello and then wave", emoji: "👋" },
+    { text: "Count to three out loud", emoji: "🔢" },
+    { text: "Tell me something that is red", emoji: "🔴" },
+    { text: "Say the word butterfly", emoji: "🦋" },
+  ],
+  old: [ // every other age (60 months and up)
+    { text: "Clap your hands then touch your head", emoji: "👏" },
+    { text: "Say your name and how old you are", emoji: "🗣️" },
+    { text: "Count backwards from five", emoji: "🔢" },
+    { text: "Tell me your favorite animal and why", emoji: "🐾" },
+    { text: "Say a long word like hippopotamus", emoji: "🦛" },
+  ],
+};
+
+/* ------------------------------------------------------------------ */
+/*  Helpers                                                            */
+/* ------------------------------------------------------------------ */
+
+/**
+ * Maps an age in months to the key used by the fallback pools.
+ *
+ * @param ageMonths - Child's age in months.
+ * @returns "young" below 36 months, "mid" from 36 up to (but not including)
+ *   60 months, and "old" for everything else.
+ */
+function getAgeBracket(ageMonths: number): string {
+  return ageMonths < 36 ? "young" : ageMonths < 60 ? "mid" : "old";
+}
+
+/**
+ * Returns a randomly reordered copy of `arr` (Fisher–Yates); the input array
+ * itself is left untouched.
+ *
+ * @param arr - Items to shuffle.
+ * @returns A new array holding the same items in random order.
+ */
+function shuffle<T>(arr: T[]): T[] {
+  const copy = Array.from(arr);
+  let last = copy.length;
+  // Walk from the end, swapping each slot with a random slot at or before it.
+  while (last > 1) {
+    last -= 1;
+    const pick = Math.floor(Math.random() * (last + 1));
+    const held = copy[last];
+    copy[last] = copy[pick];
+    copy[pick] = held;
+  }
+  return copy;
+}
+
+/**
+ * Draws up to `count` random words from the curated pool for the child's age
+ * bracket and pairs each with its emoji.
+ *
+ * @param ageMonths - Child's age in months; selects the pool.
+ * @param count - Maximum number of words to return.
+ * @returns Word items; a word with no entry in WORD_EMOJIS gets "🔤".
+ */
+function pickFallbackWords(ageMonths: number, count: number): GeneratedItem[] {
+  const candidates = shuffle(FALLBACK_WORDS[getAgeBracket(ageMonths)]);
+  const chosen: GeneratedItem[] = [];
+  for (const word of candidates.slice(0, count)) {
+    chosen.push({ text: word, emoji: WORD_EMOJIS[word] || "🔤" });
+  }
+  return chosen;
+}
+
+/**
+ * Draws up to `count` random sentences from the curated pool for the child's
+ * age bracket.
+ *
+ * @param ageMonths - Child's age in months; selects the pool.
+ * @param count - Maximum number of sentences to return.
+ * @returns Sentence items in random order.
+ */
+function pickFallbackSentences(ageMonths: number, count: number): GeneratedItem[] {
+  const pool = FALLBACK_SENTENCES[getAgeBracket(ageMonths)];
+  const randomized = shuffle(pool);
+  return randomized.slice(0, count);
+}
+
+/**
+ * Draws up to `count` random instructions from the curated pool for the
+ * child's age bracket.
+ *
+ * @param ageMonths - Child's age in months; selects the pool.
+ * @param count - Maximum number of instructions to return.
+ * @returns Instruction items in random order.
+ */
+function pickFallbackInstructions(ageMonths: number, count: number): GeneratedItem[] {
+  const pool = FALLBACK_INSTRUCTIONS[getAgeBracket(ageMonths)];
+  const randomized = shuffle(pool);
+  return randomized.slice(0, count);
+}
+
+/**
+ * Picks curated fallback items for the requested mode.
+ *
+ * @param mode - Which kind of content to return.
+ * @param ageMonths - Child's age in months; selects the age bracket.
+ * @param count - Maximum number of items to return.
+ * @returns Randomly chosen items from the matching curated pool.
+ * @throws Error if `mode` is not one of the supported modes, instead of
+ *   silently returning `undefined`.
+ */
+function pickFallback(mode: Mode, ageMonths: number, count: number): GeneratedItem[] {
+  switch (mode) {
+    case "words":
+      return pickFallbackWords(ageMonths, count);
+    case "sentences":
+      return pickFallbackSentences(ageMonths, count);
+    case "instructions":
+      return pickFallbackInstructions(ageMonths, count);
+    default: {
+      // Compile-time exhaustiveness check; at runtime, fail loudly on bad input.
+      const unexpected: never = mode;
+      throw new Error(`Unsupported mode: ${String(unexpected)}`);
+    }
+  }
+}
+
+/* ------------------------------------------------------------------ */
+/*  Bedrock generation                                                 */
+/* ------------------------------------------------------------------ */
+
+/**
+ * Describes the child for use inside a prompt, e.g. "a child aged 3 years and
+ * 2 months". Months are rounded to a whole number and clamped at zero, units
+ * are pluralised correctly, and a zero-year part is omitted. A non-finite age
+ * yields the generic "a young child".
+ */
+function describeChild(ageMonths: number): string {
+  if (!Number.isFinite(ageMonths)) return "a young child";
+
+  const totalMonths = Math.max(0, Math.round(ageMonths));
+  const years = Math.floor(totalMonths / 12);
+  const months = totalMonths % 12;
+
+  const parts: string[] = [];
+  if (years > 0) parts.push(`${years} ${years === 1 ? "year" : "years"}`);
+  if (months > 0 || years === 0) parts.push(`${months} ${months === 1 ? "month" : "months"}`);
+  return `a child aged ${parts.join(" and ")}`;
+}
+
+/**
+ * Builds the prompt sent to the model for the given mode.
+ *
+ * Every prompt asks for exactly `count` items and for a bare JSON array of
+ * `{ text, emoji }` objects, which is the shape `parseItems` expects.
+ *
+ * @param mode - Kind of content to request.
+ * @param ageMonths - Child's age in months, used to phrase the target age.
+ * @param count - Number of items to request.
+ * @returns The prompt text.
+ * @throws Error if `mode` is not one of the supported modes.
+ */
+function buildPrompt(mode: Mode, ageMonths: number, count: number): string {
+  const child = describeChild(ageMonths);
+
+  switch (mode) {
+    case "words":
+      return `Generate exactly ${count} age-appropriate single words for ${child} to repeat in a speech echo test. Mix easy and slightly challenging words. Use concrete nouns and simple words the child would know. Each word should have a relevant emoji. Return ONLY valid JSON array (no markdown, no code blocks): [{"text":"banana","emoji":"🍌"},...]`;
+    case "sentences":
+      return `Generate exactly ${count} short sentences (3-8 words each) appropriate for ${child} to repeat in a speech test. Use familiar objects and actions. Each sentence should have a relevant emoji. Return ONLY valid JSON array (no markdown, no code blocks): [{"text":"The cat is sleeping","emoji":"🐱"},...]`;
+    case "instructions":
+      return `Generate exactly ${count} simple audio instructions for ${child}. Each should ask them to do or say something simple and fun. Each instruction should have a relevant emoji. Return ONLY valid JSON array (no markdown, no code blocks): [{"text":"Clap your hands two times","emoji":"👏"},...]`;
+    default: {
+      // Compile-time exhaustiveness check; at runtime, fail loudly on bad input.
+      const unexpected: never = mode;
+      throw new Error(`Unsupported mode: ${String(unexpected)}`);
+    }
+  }
+}
+
+/**
+ * Extracts generated items from raw model output.
+ *
+ * The text is first parsed as JSON as-is. The outermost `[...]` span found in
+ * the text is then tried as well, which covers replies wrapped in prose, code
+ * fences, or an enclosing object. Every element is validated, not just the
+ * first: an entry is kept only if it is an object with a non-empty string
+ * `text`. A missing or non-string `emoji` is replaced with "🔤". Only `text`
+ * and `emoji` are copied, so unexpected model-supplied properties are dropped.
+ *
+ * @param raw - Text returned by the model.
+ * @returns The valid items, or `null` when no candidate yields any.
+ */
+function parseItems(raw: string): GeneratedItem[] | null {
+  const candidates: string[] = [raw];
+  const embedded = raw.match(/\[[\s\S]*\]/);
+  if (embedded && embedded[0] !== raw) {
+    candidates.push(embedded[0]);
+  }
+
+  for (const candidate of candidates) {
+    let parsed: unknown;
+    try {
+      parsed = JSON.parse(candidate);
+    } catch {
+      continue; // Not valid JSON; try the next candidate.
+    }
+    if (!Array.isArray(parsed)) continue;
+
+    const items: GeneratedItem[] = [];
+    for (const entry of parsed) {
+      if (typeof entry !== "object" || entry === null) continue;
+      const { text, emoji } = entry as { text?: unknown; emoji?: unknown };
+      if (typeof text !== "string" || text.trim() === "") continue;
+      items.push({
+        text: text.trim(),
+        emoji: typeof emoji === "string" && emoji !== "" ? emoji : "🔤",
+      });
+    }
+    if (items.length > 0) return items;
+  }
+  return null;
+}
+
+/* ------------------------------------------------------------------ */
+/*  POST handler                                                       */
+/* ------------------------------------------------------------------ */
+
+/**
+ * Coerces a JSON value to a finite number. Numbers and numeric strings are
+ * accepted; anything else (null, NaN, objects, blank strings) yields `fallback`.
+ */
+function toFiniteNumber(value: unknown, fallback: number): number {
+  if (typeof value === "number" && Number.isFinite(value)) return value;
+  if (typeof value === "string" && value.trim() !== "") {
+    const parsed = Number(value);
+    if (Number.isFinite(parsed)) return parsed;
+  }
+  return fallback;
+}
+
+/** Narrows an arbitrary JSON value to one of the supported generation modes. */
+function isMode(value: unknown): value is Mode {
+  return value === "words" || value === "sentences" || value === "instructions";
+}
+
+/**
+ * Handles POST /api/chat/generate-words.
+ *
+ * Reads `{ ageMonths, count, mode }` from the JSON body (defaults: 36, 6,
+ * "words"), clamps `count` to 1–10, and asks Bedrock for that many items with
+ * a 3-second timeout. If Bedrock fails, times out, or returns fewer valid
+ * items than requested, items are drawn from the curated fallback pools.
+ *
+ * @param request - Incoming request carrying the JSON body.
+ * @returns 200 `{ items, fallback }` on success; 400 `{ error }` for a
+ *   malformed body or an unrecognised mode; 500 `{ error }` for anything
+ *   unexpected.
+ */
+export async function POST(request: NextRequest) {
+  try {
+    // A malformed or non-object body is the client's error, not a server failure.
+    let body: unknown;
+    try {
+      body = await request.json();
+    } catch {
+      return NextResponse.json({ error: "Invalid JSON body" }, { status: 400 });
+    }
+    if (typeof body !== "object" || body === null || Array.isArray(body)) {
+      return NextResponse.json({ error: "Invalid JSON body" }, { status: 400 });
+    }
+
+    const fields = body as Partial<Record<keyof GenerateRequest, unknown>>;
+
+    const mode = fields.mode === undefined ? "words" : fields.mode;
+    if (!isMode(mode)) {
+      return NextResponse.json({ error: "Invalid mode" }, { status: 400 });
+    }
+
+    // Sanitise the numbers up front: a NaN count would otherwise survive the
+    // clamp and make the fallback return an empty list.
+    const ageMonths = Math.max(0, toFiniteNumber(fields.ageMonths, 36));
+    const count = Math.floor(toFiniteNumber(fields.count, 6));
+    const clampedCount = Math.max(1, Math.min(count, 10));
+
+    // Try Bedrock first
+    try {
+      const client = getBedrockClient();
+      const prompt = buildPrompt(mode, ageMonths, clampedCount);
+
+      const command = new InvokeModelCommand({
+        modelId: "amazon.nova-lite-v1:0",
+        contentType: "application/json",
+        accept: "application/json",
+        body: JSON.stringify({
+          messages: [{ role: "user", content: [{ text: prompt }] }],
+          inferenceConfig: { maxNewTokens: 500, temperature: 0.8 },
+        }),
+      });
+
+      const controller = new AbortController();
+      const timeout = setTimeout(() => controller.abort(), 3000);
+
+      try {
+        const response = await client.send(command, { abortSignal: controller.signal });
+        const responseBody = JSON.parse(new TextDecoder().decode(response.body));
+        const text = responseBody?.output?.message?.content?.[0]?.text;
+
+        if (typeof text === "string" && text) {
+          const items = parseItems(text);
+          if (items && items.length >= clampedCount) {
+            return NextResponse.json({
+              items: items.slice(0, clampedCount),
+              fallback: false,
+            });
+          }
+        }
+      } finally {
+        // Clear the timer on every path, including when send() rejects.
+        clearTimeout(timeout);
+      }
+    } catch (err) {
+      // Bedrock failed or timed out — best-effort by design, but leave a trace.
+      console.warn("generate-words: Bedrock generation failed, using fallback pool", err);
+    }
+
+    // Fallback
+    return NextResponse.json({
+      items: pickFallback(mode, ageMonths, clampedCount),
+      fallback: true,
+    });
+  } catch (err) {
+    return NextResponse.json(
+      { error: err instanceof Error ? err.message : "Unknown error" },
+      { status: 500 },
+    );
+  }
+}