From c995606c7fb02ed0a4a9a20358ad396ee1a66cf2 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Wed, 8 Apr 2026 17:36:44 -0500
Subject: [PATCH 01/32] MOTO v1.0.5: autonomy efficiency upgrade, title
 exploration, token tracking, and UI updates

---
 .cursor/rules/api-key-controls.mdc            |   30 +-
 .cursor/rules/json-prompt-design.mdc          |   73 +-
 .cursor/rules/latex-renderer.mdc              |   45 +-
 ...-aggregator-tool-design-specifications.mdc |    6 +-
 ...-and-part-2-cointeraction-architecture.mdc |    1 +
 ...t-2-compiler-tool-design-specification.mdc |   30 +-
 .../rules/part-3-autonomous-research-mode.mdc |  216 +-
 ...program-directory-and-file-definitions.mdc |   50 +-
 .../rules/rag-design-for-overall-program.mdc  |   45 +-
 .cursor/rules/workflow-runtime-updates.mdc    |   11 +
 Press to Launch MOTO.bat                      |    5 +-
 README.md                                     |   27 +-
 _moto_internal_launcher.ps1                   |   63 +-
 backend/aggregator/agents/submitter.py        |   10 +-
 backend/aggregator/core/context_allocator.py  |   65 +-
 backend/aggregator/core/coordinator.py        |   53 +-
 backend/aggregator/core/rag_manager.py        |  103 +-
 backend/aggregator/memory/shared_training.py  |   11 +-
 .../aggregator/prompts/submitter_prompts.py   |    2 +
 backend/api/main.py                           |    8 +-
 backend/api/routes/aggregator.py              |   31 +-
 backend/api/routes/autonomous.py              |  801 ++-
 backend/api/routes/boost.py                   |  110 +-
 backend/api/routes/compiler.py                |   56 +-
 backend/api/routes/openrouter.py              |   45 +-
 backend/api/routes/workflow.py                |    7 +
 .../final_answer/answer_format_selector.py    |    5 +
 .../agents/final_answer/certainty_assessor.py |   65 +-
 .../agents/final_answer/volume_organizer.py   |    5 +
 .../autonomous/agents/paper_title_selector.py |   59 +-
 backend/autonomous/agents/topic_selector.py   |   15 +-
 backend/autonomous/agents/topic_validator.py  |   48 +-
 .../autonomous/core/autonomous_coordinator.py | 1068 +++-
 .../autonomous/core/autonomous_rag_manager.py |   48 +-
 .../autonomous/memory/brainstorm_memory.py    |  166 +
 .../autonomous/memory/final_answer_memory.py  |    2 +-
 backend/autonomous/memory/paper_library.py    |  177 +
 .../autonomous/memory/paper_model_tracker.py  |   13 +-
 backend/autonomous/prompts/__init__.py        |    8 +-
 .../prompts/paper_continuation_prompts.py     |  300 +
 .../paper_title_exploration_prompts.py        |   87 +
 .../autonomous/prompts/paper_title_prompts.py |   15 +-
 .../prompts/topic_exploration_prompts.py      |   78 +
 backend/autonomous/prompts/topic_prompts.py   |   21 +-
 .../validation/paper_redundancy_checker.py    |    4 +
 backend/compiler/agents/critique_submitter.py |   18 +
 .../compiler/agents/high_context_submitter.py |  112 +-
 .../compiler/agents/high_param_submitter.py   |   31 +-
 backend/compiler/core/compiler_coordinator.py |  312 +-
 backend/compiler/core/compiler_rag_manager.py |   11 +-
 .../compiler/prompts/construction_prompts.py  |   75 +-
 backend/compiler/prompts/critique_prompts.py  |   10 +
 .../compiler/validation/compiler_validator.py |  226 +-
 backend/shared/api_client_manager.py          |  196 +-
 backend/shared/boost_manager.py               |    4 +
 backend/shared/config.py                      |    6 +-
 backend/shared/critique_prompts.py            |  156 +-
 backend/shared/models.py                      |   34 +-
 backend/shared/token_tracker.py               |   85 +
 frontend/package-lock.json                    |   16 +-
 frontend/package.json                         |    2 +-
 frontend/src/App.jsx                          | 1115 +++-
 frontend/src/components/BoostControlModal.css |   90 +-
 frontend/src/components/BoostControlModal.jsx |  189 +-
 frontend/src/components/BoostLogs.css         |   46 +-
 frontend/src/components/BoostLogs.jsx         |    2 +-
 .../CreditExhaustionNotificationStack.jsx     |  259 +
 .../components/CritiqueNotificationStack.jsx  |   24 +-
 .../HungConnectionNotificationStack.jsx       |  188 +
 frontend/src/components/LatexRenderer.css     |   42 +-
 frontend/src/components/LatexRenderer.jsx     |    4 +-
 .../src/components/OpenRouterApiKeyModal.jsx  |   61 +-
 .../OpenRouterPrivacyWarningModal.jsx         |   39 +-
 .../src/components/PaperCritiqueModal.jsx     |  422 +-
 .../components/StartupProviderSetupModal.jsx  |  163 +
 frontend/src/components/TextFileUploader.css  |   14 +-
 frontend/src/components/WorkflowPanel.css     |  275 +-
 frontend/src/components/WorkflowPanel.jsx     |  117 +-
 .../aggregator/AggregatorInterface.jsx        |   16 +-
 .../components/aggregator/AggregatorLogs.jsx  |   13 +-
 .../aggregator/AggregatorSettings.jsx         |  175 +-
 .../src/components/aggregator/LiveResults.jsx |    5 +-
 .../autonomous/ArchiveViewerModal.css         |  264 +
 .../autonomous/ArchiveViewerModal.jsx         |  197 +-
 .../autonomous/AutonomousResearch.css         |  125 +-
 .../AutonomousResearchInterface.jsx           |  107 +-
 .../autonomous/AutonomousResearchLogs.jsx     |   68 +-
 .../autonomous/AutonomousResearchSettings.jsx | 1308 ++--
 .../components/autonomous/BrainstormList.jsx  |    9 +-
 .../autonomous/FinalAnswerLibrary.css         |  156 +-
 .../autonomous/FinalAnswerLibrary.jsx         |  404 +-
 .../autonomous/LivePaperProgress.jsx          |    8 +-
 .../autonomous/LiveTier3Progress.jsx          |   42 +-
 .../components/autonomous/PaperLibrary.jsx    |    6 +-
 .../autonomous/Stage2PaperHistory.css         |   51 +
 .../autonomous/Stage2PaperHistory.jsx         |  534 ++
 frontend/src/components/autonomous/index.js   |    1 +
 .../components/compiler/CompilerInterface.jsx |   25 +-
 .../src/components/compiler/CompilerLogs.jsx  |   26 +-
 .../components/compiler/CompilerSettings.jsx  |  260 +-
 .../src/components/compiler/LivePaper.jsx     |   17 +-
 frontend/src/components/critique-modal.css    |  496 ++
 frontend/src/components/settings-common.css   |  827 +++
 frontend/src/index.css                        | 1039 ++--
 frontend/src/services/api.js                  |  101 +-
 frontend/src/utils/autonomousProfiles.js      |  424 ++
 frontend/src/utils/disclaimerHelper.js        |   67 +
 frontend/src/utils/downloadHelpers.js         |   14 +-
 frontend/src/utils/researchRunHistory.js      |  129 +
 package-lock.json                             |    4 +-
 package.json                                  |    2 +-
 random dev log.txt                            | 5266 -----------------
 requirements.txt                              |    4 +-
 113 files changed, 11546 insertions(+), 9076 deletions(-)
 create mode 100644 .cursor/rules/workflow-runtime-updates.mdc
 create mode 100644 backend/autonomous/prompts/paper_continuation_prompts.py
 create mode 100644 backend/autonomous/prompts/paper_title_exploration_prompts.py
 create mode 100644 backend/autonomous/prompts/topic_exploration_prompts.py
 create mode 100644 backend/shared/token_tracker.py
 create mode 100644 frontend/src/components/CreditExhaustionNotificationStack.jsx
 create mode 100644 frontend/src/components/HungConnectionNotificationStack.jsx
 create mode 100644 frontend/src/components/StartupProviderSetupModal.jsx
 create mode 100644 frontend/src/components/autonomous/ArchiveViewerModal.css
 create mode 100644 frontend/src/components/autonomous/Stage2PaperHistory.css
 create mode 100644 frontend/src/components/autonomous/Stage2PaperHistory.jsx
 create mode 100644 frontend/src/components/critique-modal.css
 create mode 100644 frontend/src/components/settings-common.css
 create mode 100644 frontend/src/utils/autonomousProfiles.js
 create mode 100644 frontend/src/utils/disclaimerHelper.js
 create mode 100644 frontend/src/utils/researchRunHistory.js
 delete mode 100644 random dev log.txt

diff --git a/.cursor/rules/api-key-controls.mdc b/.cursor/rules/api-key-controls.mdc
index f5e74dd..d247fc1 100644
--- a/.cursor/rules/api-key-controls.mdc
+++ b/.cursor/rules/api-key-controls.mdc
@@ -1,7 +1,6 @@
 ---
-alwaysApply: true
+alwaysApply: false
 ---
-
 # API Key Controls & Workflow Management System
 
 ## Overview
@@ -37,11 +36,12 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic
 - App Attribution Headers: `HTTP-Referer: https://intrafere.com/moto-autonomous-home-ai/`, `X-Title: MOTO Deep Research Harness`
 - Credit exhaustion detection: HTTP 402 OR error messages containing "credit", "insufficient", "balance", "quota", "key limit", "limit exceeded"
 - Raises `CreditExhaustionError` on exhaustion (no retries). Retries transient errors (max 3).
-- Temperature=0.0 default. Stop sequences on all requests: `\n}\n\n`, `\n]\n\n`, `\n}\n\n\n`, `\n]\n\n\n`
+- Temperature=0.0 default. No stop sequences (removed — caused premature truncation with certain models).
 
 #### APIClientManager (`backend/shared/api_client_manager.py`)
-- Central router for all API calls: boost check → role's OpenRouter (with permanent fallback) → LM Studio
+- Central router for all API calls: boost check → role's OpenRouter (with resettable fallback) → LM Studio
 - Tracks fallback state per role: `_role_fallback_state: Dict[str, str]`
+- `reset_openrouter_fallbacks()`: Restores every role that was originally configured for OpenRouter but has since fallen back to LM Studio. Called automatically when the API key is set, or manually via the reset endpoint.
 - Lazy initialization: OpenRouter client initializes from `rag_config.openrouter_api_key` when first needed
 
 **CRITICAL REQUIREMENT - Role Configuration:**
@@ -55,7 +55,7 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic
 
 **Counter Decrement:** `boost_next_count` decrements ONLY on successful boost API calls. Failed/exhausted calls do NOT decrement.
 
-**Permanent Fallback:** Once a role falls back to LM Studio due to credit exhaustion, it NEVER retries OpenRouter for that session. Each role has independent fallback state. If no fallback configured: raises RuntimeError.
+**Resettable Fallback:** When a role hits credit exhaustion, it falls back to LM Studio for subsequent calls. User can reset all fallen-back roles via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key (auto-resets). Each role has independent fallback state. If no fallback configured: raises RuntimeError.
 
 **Categories from role_id:**
 - `aggregator_submitter_*` → "Aggregator Submitters"
@@ -77,7 +77,7 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic
 Coordinators read actual agent `task_sequence` counters — no prediction. Task IDs exactly match what agents will generate.
 - Aggregator: `agg_sub{N}_{seq:03d}`, `agg_val_{seq:03d}`
 - Compiler: `comp_hc_{seq:03d}`, `comp_hp_{seq:03d}`, `comp_val_{seq:03d}`
-- Autonomous: `auto_ts_{seq:03d}`, `auto_tv_{seq:03d}`
+- Autonomous: `auto_te_{seq:03d}`, `auto_tev_{seq:03d}`, `auto_ts_{seq:03d}`, `auto_tv_{seq:03d}`
 
 ---
 
@@ -93,11 +93,13 @@ Predictions refresh: after initialization, each task completion, mode switches,
 
 ## WebSocket Events
 
-**Workflow:** `workflow_updated` (tasks+mode), `task_started` (task_id), `task_completed` (task_id+sequence)
+**Workflow:** `workflow_updated` (tasks+mode), `task_started` (task_id), `task_completed` (task_id+sequence), `token_usage_updated` (total_input, total_output, by_model, elapsed_seconds)
+
+**Boost:** `boost_enabled` (model_id, provider, context_window, max_output_tokens), `boost_disabled`, `task_boost_toggled` (task_id, boosted), `boost_next_count_updated` (count), `category_boost_toggled` (category, boosted), `boost_credits_exhausted` (task_id, message)
 
-**Boost:** `boost_enabled` (model_id, provider, context_window, max_output_tokens), `boost_disabled`, `task_boost_toggled` (task_id, boosted), `boost_next_count_set` (count), `category_boost_toggled` (category, boosted), `boost_credits_exhausted` (task_id, message)
+**Fallback:** `openrouter_fallback` (role_id, reason, message, fallback_model), `openrouter_fallback_failed` (role_id, reason, message), `openrouter_fallbacks_reset` (reset_roles, message)
 
-**Fallback:** `openrouter_fallback` (role_id, reason, message, fallback_model), `openrouter_fallback_failed` (role_id, reason, message)
+**Hung Connection:** `hung_connection_alert` (role_id, model, provider, elapsed_minutes, message) — fires after 15 minutes of no API response. Amber notification stack (bottom-left, offset from credit exhaustion stack). Auto-cleared on research stop and fallbacks reset.
 
 **Rate Limit:** `openrouter_rate_limit` (model, role_id, retry_after, message)
 
@@ -118,11 +120,12 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - `GET /api/boost/openrouter-models` — Fetch OpenRouter models (Bearer key header)
 - `GET /api/boost/model-providers?model_id=` — Providers for a model
 - `GET /api/boost/logs?limit=` — Recent boost logs
-- `POST /api/boost/logs/clear` — Clear logs
+- `POST /api/boost/clear-logs` — Clear logs
 
 ### OpenRouter (`backend/api/routes/openrouter.py`)
 - `GET /api/openrouter/lm-studio-availability` — LM Studio availability check
-- `POST /api/openrouter/set-api-key` — Set and validate global OpenRouter key
+- `POST /api/openrouter/set-api-key` — Set and validate global OpenRouter key (auto-resets exhaustion flags)
+- `POST /api/openrouter/reset-exhaustion` — Reset all credit exhaustion flags + role fallback states mid-session
 - `DELETE /api/openrouter/api-key` — Clear key
 - `GET /api/openrouter/api-key-status` — `{ has_key, enabled }`
 - `GET /api/openrouter/models` — Available models (also caches free models for rotation)
@@ -135,12 +138,13 @@ Predictions refresh: after initialization, each task completion, mode switches,
 ### Workflow (`backend/api/routes/workflow.py`)
 - `GET /api/workflow/predictions` — Next 20 predicted tasks
 - `GET /api/workflow/history?limit=` — Completed tasks
+- `GET /api/token-stats` — Cumulative token usage (total_input, total_output, by_model, elapsed_seconds)
 
 ---
 
 ## Error Handling
 
-**Credit Exhaustion:** HTTP 402 or keywords "credit"/"insufficient"/"balance"/"quota"/"key limit"/"limit exceeded" → `CreditExhaustionError` → permanent LM Studio fallback for that role (or RuntimeError if no fallback).
+**Credit Exhaustion:** HTTP 402 or keywords "credit"/"insufficient"/"balance"/"quota"/"key limit"/"limit exceeded" → `CreditExhaustionError` → LM Studio fallback for that role (or RuntimeError if no fallback). Fallback is resettable via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key.
 
 **Boost Exhaustion:** Falls back to primary for that task; boost stays enabled; counter NOT decremented.
 
@@ -170,7 +174,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - Aggregator submitters: per-submitter pause (others continue); validator loop pauses entire validator
 - Prevents infinite retry loops (the 2000+ attempt bug)
 
-**Account Exhaustion:** HTTP 402 on any `:free` model sets `_account_credits_exhausted` flag. All subsequent free model calls short-circuit immediately. Flag clears on next successful free model call.
+**Account Exhaustion:** HTTP 402 on any `:free` model sets `_account_credits_exhausted` flag. All subsequent free model calls short-circuit immediately. Flag clears on next successful free model call, or via `POST /api/openrouter/reset-exhaustion`, or automatically when the API key is re-set.
 
 **Error Classes:**
 - `FreeModelExhaustedError` — all options exhausted, contains `soonest_retry` timestamp
diff --git a/.cursor/rules/json-prompt-design.mdc b/.cursor/rules/json-prompt-design.mdc
index a1a7e5b..bae4719 100644
--- a/.cursor/rules/json-prompt-design.mdc
+++ b/.cursor/rules/json-prompt-design.mdc
@@ -1,5 +1,5 @@
 ---
-alwaysApply: true
+alwaysApply: false
 ---
 # Enhance AI Role Prompts with Complete Context Assembly
 
@@ -217,12 +217,14 @@ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified inte
 - `backend/compiler/prompts/outline_prompts.py`
 - `backend/compiler/prompts/review_prompts.py`
 - `backend/compiler/prompts/rigor_prompts.py`
+- `backend/compiler/prompts/critique_prompts.py`
 - `backend/compiler/validation/compiler_validator.py`
 - `backend/autonomous/prompts/topic_prompts.py`
 - `backend/autonomous/prompts/completion_prompts.py`
 - `backend/autonomous/prompts/paper_reference_prompts.py`
 - `backend/autonomous/prompts/paper_title_prompts.py`
 - `backend/autonomous/prompts/paper_redundancy_prompts.py`
+- `backend/autonomous/prompts/paper_continuation_prompts.py`
 - `backend/autonomous/prompts/final_answer_prompts.py`
 
 **Note:** The prompt structure examples in the sections below show the core task-specific content. The INTERNAL CONTENT WARNING block is ALWAYS inserted between the role description and the "YOUR TASK:" section in the actual code.
@@ -1347,6 +1349,28 @@ The coordinator tracks the current phase via `autonomous_section_phase`:
 **Autonomous Mode Phase Synchronization:**
 When the compiler runs in autonomous mode (Part 3), the autonomous coordinator polls `autonomous_section_phase` every 3 seconds and syncs it to the workflow state (`paper_phase` field). This ensures accurate crash recovery and prevents the bug where workflow state showed "outline" even though the compiler had progressed through body/conclusion/introduction phases.
 
+### Retroactive Brainstorm Operation (Optional, Autonomous Mode Only)
+
+During autonomous paper compilation, the construction JSON includes an optional `brainstorm_operation` field:
+
+```json
+{
+  ... (standard construction fields) ...,
+  "brainstorm_operation": {
+    "action": "edit | delete | add",
+    "submission_number": 5,
+    "new_content": "corrected or new content (empty for delete)",
+    "reasoning": "Independent justification"
+  }
+}
+```
+
+**Validation**: Brainstorm operations are validated by the compiler validator with brainstorm-only context. The validator never sees the paper operation when validating a brainstorm operation.
+
+**Independent Validity Principle**: Each operation must be justified on its own merits. Paper content must not depend on a brainstorm correction. Brainstorm corrections must not depend on paper content.
+
+**Models**: `BrainstormRetroactiveOperation` in `models.py`. Parsed in `high_context_submitter.py`. Handled in `compiler_coordinator._handle_brainstorm_retroactive_operation()`. Validated in `compiler_validator.validate_brainstorm_operation()`.
+
 ---
 
 ## 5. COMPILER-Submitter OUTLINE CREATION (PHASE 1: ITERATIVE REFINEMENT)
@@ -2064,7 +2088,7 @@ The rigor submitter uses a **2-step planning-then-execution process**:
 - Submitters provide exact text (`old_string`) to identify edit locations
 - The `old_string` is pre-validated to exist verbatim (exactly) in the document
 - The `old_string` is pre-validated to be unique (appear only once)
-- If exact match fails, system tries in order: Unicode normalization → whitespace normalization → backslash normalization (collapses `\\\\cmd` → `\\cmd`, handles over-escaping) → consecutive fuzzy matching (conservative last resort)
+- If exact match fails, system tries in order: Unicode normalization → whitespace normalization (multi-spaces) → all-whitespace normalization (collapses newlines/spaces/tabs to single space) → backslash normalization (collapses `\\\\cmd` → `\\cmd`, handles over-escaping) → consecutive fuzzy matching (conservative last resort)
 - If match fails or is ambiguous after all attempts, pre-validation rejects immediately with clear feedback (before LLM validation)
 - LLM validation then focuses on placement context and semantic appropriateness
 - Industry-standard approach used by Cursor, Claude Code, and similar tools
@@ -2094,7 +2118,7 @@ All compiler modes (construction, review, rigor, outline_update) use this schema
 
 
 ### Validation Rules
-- **REJECT** if `old_string` is not found after trying: exact match → Unicode normalization → whitespace normalization → backslash normalization → consecutive fuzzy matching
+- **REJECT** if `old_string` is not found after trying: exact match → Unicode normalization → whitespace normalization → all-whitespace normalization → backslash normalization → consecutive fuzzy matching
 - **REJECT** if `old_string` matches multiple locations (not unique)
 - **REJECT** if `operation` doesn't match the intent (e.g., using "replace" for new content)
 - Validator confirms content flows naturally at the edit location
@@ -2199,6 +2223,18 @@ Part 3 introduces autonomous topic selection, brainstorm-to-paper workflows, and
 
 ---
 
+### 0. TOPIC EXPLORATION (Pre-Selection Candidate Brainstorm)
+
+**File:** `backend/autonomous/prompts/topic_exploration_prompts.py`
+
+**Purpose:** Before topic selection, collect 5 validated candidate brainstorm questions using the full Part 1 aggregator infrastructure (parallel submitters, batch validation up to 3). Uses `build_exploration_user_prompt()` to frame the standard aggregator as a candidate question generator.
+
+**Architecture:** Reuses `AggregatorCoordinator` — no custom JSON schemas. Standard aggregator submitter/validator prompts handle generation and validation. The exploration user prompt provides the framing context (research goal, existing brainstorms/papers, diversity requirement).
+
+**Standard Aggregator JSON Schemas Apply** (from Part 1 submitter/validator prompts).
+
+---
+
 ### 1. TOPIC SELECTION SUBMITTER
 
 **File:** `backend/autonomous/prompts/topic_prompts.py`
@@ -2499,6 +2535,32 @@ No Removal:
 
 ### PART 3 PROMPT ASSEMBLY PATTERNS
 
+### 9. BRAINSTORM CONTINUATION DECISION
+
+**File:** `backend/autonomous/prompts/paper_continuation_prompts.py`
+
+**Function:** `get_continuation_decision_json_schema()`
+
+```
+REQUIRED JSON FORMAT:
+{
+  "decision": "write_another_paper | move_on",
+  "reasoning": "string - Detailed explanation of assessment"
+}
+
+FIELD REQUIREMENTS:
+- decision: MUST be either "write_another_paper" or "move_on"
+- reasoning: ALWAYS required
+```
+
+**Context**: User prompt + brainstorm topic + brainstorm DB + prior papers from this brainstorm (title/abstract/outline) + paper count ("N of 3 maximum"). Does NOT include cross-topic reference papers.
+
+**Validation**: Topic validator validates with `build_continuation_validation_prompt()` via `override_prompt` parameter.
+
+---
+
+### PART 3 PROMPT ASSEMBLY PATTERNS (continued)
+
 All Part 3 prompts follow similar assembly patterns to Part 1 and Part 2:
 
 ```python
@@ -2517,7 +2579,12 @@ All Part 3 prompts follow similar assembly patterns to Part 1 and Part 2:
 
 **Context Variations by Role:**
 
+**Topic Exploration (uses Part 1 Aggregator):**
+- Aggregator user prompt = `build_exploration_user_prompt()` containing research goal, existing brainstorms, completed papers, diversity framing
+- Standard aggregator submitter/validator prompts + context handling (shared training DB, rejection logs, RAG cycling)
+
 **Topic Selection Submitter:**
+- **5 validated candidate brainstorm questions** from topic exploration (direct injection)
 - All brainstorm topics with metadata
 - All completed papers with title + abstract + word count
 - Topic selection rejection history (last 5)
diff --git a/.cursor/rules/latex-renderer.mdc b/.cursor/rules/latex-renderer.mdc
index 650cc92..6fc03ba 100644
--- a/.cursor/rules/latex-renderer.mdc
+++ b/.cursor/rules/latex-renderer.mdc
@@ -1,7 +1,6 @@
 ---
-alwaysApply: true
+alwaysApply: false
 ---
-
 # LaTeX Renderer System
 
 ## 🔒 CRITICAL SECURITY REQUIREMENTS
@@ -66,7 +65,7 @@ Dual rendering: **Rendered LaTeX View** (KaTeX math, dark theme on screen, white
 <LatexRenderer
   content={string}       // Raw content to render
   className={string}     // Optional CSS class
-  showToggle={boolean}   // Show Rendered/Raw toggle (default: false)
+  showToggle={boolean}   // Show Rendered/Raw toggle (default: true)
   defaultRaw={boolean}   // Start in raw mode (default: false)
   showLatex={boolean}    // External view mode control (optional)
 />
@@ -121,26 +120,43 @@ Must execute in this exact order in `renderLatexToHtml()`:
 
 ## Component Integration
 
-| Component | Location | PDF | Toggle | Notes |
-|-----------|----------|-----|--------|-------|
-| LivePaper.jsx | compiler/ | ✅ | ✅ | Real-time paper viewing; auto-switches to raw >50K chars |
-| PaperLibrary.jsx | autonomous/ | ✅ | ✅ | Paper library cards |
-| FinalAnswerView.jsx | autonomous/ | ✅ | ✅ | Tier 3 final answer (defaults to raw for performance) |
-| FinalAnswerLibrary.jsx | autonomous/ | ✅ | ✅ | Final answer library (all sessions) |
-| LivePaperProgress.jsx | autonomous/ | ✅ | ✅ | Live Tier 2 paper in progress |
-| LiveTier3Progress.jsx | autonomous/ | ✅ | ✅ | Live Tier 3 paper in progress |
-| LiveResults.jsx | aggregator/ | ❌ | ✅ | Aggregator submissions (defaults to raw) |
-| BrainstormList.jsx | autonomous/ | ❌ | ✅ | Brainstorm content viewer |
+| Component | Location | PDF | Toggle | Disclaimer | Notes |
+|-----------|----------|-----|--------|------------|-------|
+| LivePaper.jsx | compiler/ | ✅ | ✅ | paper | Real-time paper viewing; auto-switches to raw >50K chars |
+| PaperLibrary.jsx | autonomous/ | ✅ | ✅ | baked-in | Paper library cards (backend embeds disclaimer at save) |
+| FinalAnswerView.jsx | autonomous/ | ✅ | ✅ | baked-in | Tier 3 final answer (defaults to raw for performance) |
+| FinalAnswerLibrary.jsx | autonomous/ | ✅ | ✅ | paper | Final answer library (all sessions) |
+| LivePaperProgress.jsx | autonomous/ | ✅ | ✅ | paper | Live Tier 2 paper in progress |
+| LiveTier3Progress.jsx | autonomous/ | ✅ | ✅ | paper | Live Tier 3 paper in progress |
+| LiveResults.jsx | aggregator/ | ❌ | ✅ | brainstorm | Aggregator submissions (defaults to raw) |
+| BrainstormList.jsx | autonomous/ | ❌ | ✅ | brainstorm | Brainstorm content viewer |
 
 ### PDF Download Usage
 
 ```javascript
 // Pass raw text content — backend handles rendering and PDF generation
-await downloadPDFViaBackend(rawContent, metadata, sanitizeFilename(title), outline);
+// disclaimerType ('paper'|'brainstorm'|null) auto-prepends disclaimer if content lacks one
+await downloadPDFViaBackend(rawContent, metadata, sanitizeFilename(title), outline, onStart, onComplete, onError, 'paper');
 ```
 
 ---
 
+## Disclaimer Injection (`frontend/src/utils/disclaimerHelper.js`)
+
+**Purpose:** Hallucination/AI-generated-content disclaimers are shown on every brainstorm and paper view and included in every download — but NEVER injected into the model's context window.
+
+**Approach:** Frontend-only. `prependDisclaimer(content, type)` prepends a disclaimer block unless one already exists (detects both the backend-embedded `AUTONOMOUS AI SOLUTION` header on completed papers and the frontend `DISCLAIMER` header).
+
+**Two variants:** `PAPER_DISCLAIMER` (for papers) and `BRAINSTORM_DISCLAIMER` (for brainstorm/aggregator databases).
+
+**Completed papers** (`PaperLibrary`, `FinalAnswerView`) already carry a richer backend-embedded disclaimer with model attribution; the `hasDisclaimer()` check prevents double-prepending.
+
+**Download helpers** (`downloadRawText`, `downloadPDFViaBackend`) accept an optional `disclaimerType` param that triggers the same `prependDisclaimer` logic before writing.
+
+**Critical invariant:** Backend brainstorm files and in-progress paper files remain disclaimer-free so models never waste context tokens on disclaimer text.
+
+---
+
 ## Paper Critique Modal (`PaperCritiqueModal.jsx`)
 
 Ratings: Novelty, Correctness, Impact (1-10 scale). Up to 10 history entries. Regeneration with custom prompt.
@@ -167,3 +183,4 @@ Ratings: Novelty, Correctness, Impact (1-10 scale). Up to 10 history entries. Re
 12. IntersectionObserver root margin MUST be ≥600px — prevents visible pop-in
 13. Debounce delay applies ONLY to rendered mode — raw mode updates instantly
 14. Chunk `key` MUST include content hash (`simpleHash`) — prevents React reusing stale DOM on content change
+15. Disclaimer MUST appear on all brainstorm/paper display and download paths — injected at frontend layer only, never stored in backend files consumed by models
diff --git a/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc b/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
index 098f082..e89f88e 100644
--- a/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
+++ b/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
@@ -56,7 +56,7 @@ No context carryover between prompts (only system-intended DB/submission transfe
 
 **RAG Offload Priority — Submitter:** Shared Training DB → Local Submitter DB → Rejection Log → User Upload Files
 
-**RAG Offload Priority — Validator:** Shared Training DB → User Upload Files → Submission under review (last resort)
+**RAG Offload Priority — Validator:** Shared Training DB → User Upload Files (submission under review is always direct injected)
 
 ## Role Selection
 
@@ -85,7 +85,9 @@ Every 7th acceptance (`total_acceptances % 7 == 0`, minimum 7 before first revie
 
 **Phase 1**: Validator reviews ALL accepted submissions, identifies AT MOST ONE for removal (redundant, contradicted, superseded, or provides no unique value).
 
-**Phase 2** (only if removal proposed): Validator self-validates its removal proposal. Conservative default: if uncertain, reject removal. If validated: execute removal + trigger RAG rechunk.
+**Phase 2** (only if removal proposed): Validator self-validates its removal proposal. Conservative default: if uncertain, reject removal. If validated: execute removal + full RAG rebuild (all shared-training sources are dropped and re-indexed from the post-removal file so deleted content is no longer retrievable).
+
+**Cleanup toggle**: `enable_cleanup_review` (default True) can be set to `False` when calling `Coordinator.initialize()` to disable cleanup for short-lived mini-brainstorm phases (topic exploration, title exploration).
 
 **Critical selection rule**: When multiple submissions redundant, remove the WEAKEST (least unique value). Never remove a more complete submission.
 
diff --git a/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc b/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
index c0eb38c..04a0207 100644
--- a/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
+++ b/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
@@ -70,6 +70,7 @@ The live-constructing compiler-written paper should be viewable in one tab and a
 - **Compiler defaults**: validator=25000, high-context=25000 (for outline_create/outline_update/construction/review), high-param=25000 (for rigor mode)
 - **GUI tooltips** provide recommended minimums: Submitter "25000+ for reasoning models", Validator "25000+", High-context "25000+ (outline needs 15K+)", High-param "25000+"
 - Settings are passed through API routes and stored in `rag_config` (aggregator) and `system_config` (compiler)
+- **CRITICAL**: `system_config.compiler_*` settings (context windows, max output tokens) are the single source of truth for all compiler modules. ANY code that creates a `CompilerCoordinator` MUST write its context/token settings to `system_config` BEFORE init. The manual `/api/compiler/start` route does this; autonomous mode (`autonomous_coordinator.py`) must do it explicitly before each `CompilerCoordinator()` creation.
 - Reasoning models (e.g., those with `<think>` tags or separate `reasoning` fields) may use significant tokens on internal reasoning before generating JSON output
 
 ## Other Notes
diff --git a/.cursor/rules/part-2-compiler-tool-design-specification.mdc b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
index a7ff80e..4559443 100644
--- a/.cursor/rules/part-2-compiler-tool-design-specification.mdc
+++ b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
@@ -167,6 +167,7 @@ Submission JSON: `operation`, `old_string` (exact, pre-validated), `new_string`.
 1. Exact match
 2. Unicode hyphen normalization (en-dash, em-dash variants)
 3. Whitespace normalization (2+ spaces → single space)
+3b. All-whitespace normalization (collapses newlines/spaces/tabs → single space)
 4. Backslash normalization (`\\mathbb` → `\mathbb`)
 5. Consecutive fuzzy matching: 85% consecutive chars + last 5% exact tail anchor + unique (≥20 char minimum)
 
@@ -196,16 +197,19 @@ Prevents models' fake placeholder text (e.g., "XI. Conclusion\n*placeholder*") f
 
 Per-role context windows (all user-configurable, default 131072):
 - Validator, High-Context Submitter, High-Parameter Submitter: 131072 tokens each
+- **Settings flow**: All compiler modules read from `system_config.compiler_*` at runtime. The caller that creates `CompilerCoordinator` MUST write settings to `system_config` before init (manual mode: `/api/compiler/start`; autonomous mode: `autonomous_coordinator.py` before `CompilerCoordinator()` creation).
 - Rigor mode dynamically adjusts RAG budget if outline + system prompts exceed available context
+- Construction mode (autonomous) dynamically adjusts the RAG budget when brainstorm content is present: `rag_budget = max(5000, max_allowed - outline_tokens - paper_tokens - brainstorm_tokens - 5000)`, where the trailing 5000 tokens are fixed overhead. Brainstorm is always direct-injected at full fidelity; RAG evidence scales to fit the remaining budget.
 
 **Context rules:** User prompt ALWAYS direct injected. Direct injection first; RAG only when doesn't fit. ~85% RAG retrieval, ~15% direct injections. Halt with error if user prompt exceeds context_window - minimum_RAG_allocation.
 
 **Prompt Size Validation** (all submitters before LLM call):
-- `outline_create`, `outline_update`, `rigor`: raises ValueError if exceeds
-- `construction`, `review`: returns None if exceeds
+- `outline_create`, `outline_update`, `rigor`, `construction`, `review`: raises ValueError if exceeds
 - `validator`: rejects submission if exceeds
 
-**Rigor Mode context**: no aggregator database; outline fully injected; paper content RAG-retrieved.
+**Rigor Mode context**: no aggregator database; outline fully injected; paper content RAG-retrieved. RAG excludes `compiler_outline.txt` (already direct-injected).
+
+**RAG source exclusion (anti-duplication)**: All compiler RAG calls pass `exclude_sources` to skip chunks from content already direct-injected. Construction excludes outline + paper + brainstorm sources; outline_update excludes outline + paper; rigor excludes outline. See `rag-design-for-overall-program.mdc` for full table.
 
 ---
 
@@ -215,6 +219,26 @@ Per-role context windows (all user-configurable, default 131072):
 
 ---
 
+## Retroactive Brainstorm Correction (Autonomous Mode Only)
+
+During paper compilation in autonomous mode (Part 3), the compiler submitter sees both the paper AND the source brainstorm database as a unified editable workspace. The submitter may optionally propose a brainstorm operation alongside its paper operation each turn.
+
+**Brainstorm operations**: `edit` (correct submission content), `delete` (remove submission), `add` (new insight discovered during synthesis).
+
+**Independent Validation Principle**: Paper and brainstorm operations are validated SEPARATELY. The validator sees ONLY the paper when validating paper edits, ONLY the brainstorm when validating brainstorm operations. Each must stand on its own merits. Neither can depend on the other for correctness.
+
+**Acceptance is independent**: Paper accepted + brainstorm rejected = valid state. Brainstorm accepted + paper rejected = valid state. No combination produces incoherence.
+
+**Brainstorm content**: Passed to construction prompts with full submission numbers. Submitter references entries by `#N` for edit/delete.
+
+**RAG refresh**: After accepted brainstorm modification, RAG is refreshed with updated brainstorm content so subsequent construction turns see corrected context.
+
+**Files**: `brainstorm_memory.py` (edit_submission, remove_submission, add_submission_retroactive), `compiler_validator.py` (validate_brainstorm_operation), `compiler_coordinator.py` (_handle_brainstorm_retroactive_operation), `construction_prompts.py` (brainstorm_operation JSON schema).
+
+**WebSocket events**: `brainstorm_retroactive_accepted`, `brainstorm_retroactive_rejected`.
+
+---
+
 ## Other Notes
 
 - JSON validation failure: reject submission, send reason to submitter's local failure feedback
diff --git a/.cursor/rules/part-3-autonomous-research-mode.mdc b/.cursor/rules/part-3-autonomous-research-mode.mdc
index c668b67..fb31b54 100644
--- a/.cursor/rules/part-3-autonomous-research-mode.mdc
+++ b/.cursor/rules/part-3-autonomous-research-mode.mdc
@@ -2,11 +2,11 @@
 alwaysApply: true
 ---
 
-# Part 3 - Autonomous Research Mode Design Specification
+# Part 3 (Adding an Autonomous-Controlling Tier in Hierarchy Over Part 1 and 2) - Autonomous Research Mode Design Specification
 
 ## Overview
 
-The Autonomous Research Mode is Part 3 of the MOTO Math Variant system. It is a self-directing two-tier research system that autonomously generates brainstorm topics, builds knowledge databases, and produces complete mathematical research papers based on a high-level research topic centered around the user prompt.
+The Autonomous Research Mode is Part 3 of the MOTO Math Variant system. It is a self-directing three-tier research system that autonomously generates brainstorm topics, builds knowledge databases, produces complete mathematical research papers, and can synthesize a final answer based on a high-level research topic centered around the user prompt.
 
 **Example User Prompt**: "Solve the Langlands Bridge problem" or "Advance understanding of the Riemann Hypothesis"
 
@@ -15,9 +15,10 @@ The Autonomous Research Mode is Part 3 of the MOTO Math Variant system. It is a
 - Part 2 (Compiler) requires user-directed paper compilation prompts
 - Part 3 (Autonomous Research) self-directs topic selection, brainstorming, and paper generation
 
-**Two-Tier Architecture**:
+**Three-Tier Architecture**:
 - **Tier 1**: Brainstorm aggregation databases (mathematical concept exploration)
 - **Tier 2**: Finished mathematical research papers (compiled from brainstorm databases)
+- **Tier 3**: Final answer synthesis (short-form answer or long-form volume from Tier 2 papers)
 
 ## Design Philosophy
 
@@ -29,7 +30,7 @@ The Autonomous Research Mode is Part 3 of the MOTO Math Variant system. It is a
 
 **Model Weight Exploration**: Completion review uses SPECIAL SELF-VALIDATION MODE because only the same model can assess whether its own weights have been exhausted for a given topic.
 
-**Internal Knowledge Only**: The autonomous system operates solely on the model's pre-trained mathematical knowledge, RAG context from prior work, and user prompt. No external data access.
+**External Verification Allowed**: The autonomous system may use the model's pre-trained mathematical knowledge, RAG context from prior work, user prompt, and external verification/search when the selected model/provider supports it. Internal AI-generated context remains non-authoritative and should be treated skeptically.
 
 ---
 
@@ -64,6 +65,7 @@ The autonomous coordinator USES actual Part 2 compiler infrastructure for paper
 - Extracts abstract from completed paper for metadata storage
 
 **Critical Implementation Details**:
+- **system_config propagation (REQUIRED)**: Before creating `CompilerCoordinator`, autonomous mode MUST write all compiler context/token settings to `system_config` (e.g., `system_config.compiler_high_context_context_window = self._high_context_context`). Compiler modules read from `system_config` at init — the manual `/api/compiler/start` route does this, but autonomous mode bypasses that route and must do it explicitly. Applies to both `_compile_paper_from_brainstorm()` and `_compile_tier3_paper()`.
 - Constrains section order: Body → Conclusion → Introduction → Abstract
 - Paper is considered complete when abstract is detected in paper content
 - Uses regex patterns to detect and extract abstract section
@@ -75,14 +77,55 @@ The autonomous coordinator USES actual Part 2 compiler infrastructure for paper
 ## Workflow Overview
 
 **Tier 1 → Tier 2 → Tier 3 Loop:**
-1. **Topic Selection** → Validator → Pre-Brainstorm Reference Selection (if papers exist)
+0. **Topic Exploration** — Mini-aggregation: collect 5 validated candidate brainstorm questions (submit→validate→accumulate loop with rejection feedback). Broadens exploration landscape before committing to a direction.
+1. **Topic Selection** (sees all 5 candidates + existing topics) → Validator → Pre-Brainstorm Reference Selection (if papers exist)
 2. **Brainstorm Aggregation** (1-10 submitters, 1 validator, pruning every 7, with reference papers)
 3. **Completion Review** every 10 acceptances (SPECIAL SELF-VALIDATION) → Continue or Write Paper
-4. If Write Paper: **Additional Reference Selection** → **Paper Title Selection** → **Paper Compilation** (Body→Conclusion→Introduction→Abstract)
+4. If Write Paper: **Additional Reference Selection** → **Paper Title Exploration** (5 candidates) → **Paper Title Selection** → **Paper Compilation** (Body→Conclusion→Introduction→Abstract)
 5. **Paper Complete** → Log to Tier 2, cache brainstorm
 6. **Paper Redundancy Review** every 3 papers
-7. **Tier 3 Final Answer** every 5 papers (Certainty→Format→Short-form or Long-form volume)
-8. Loop back to Topic Selection (or STOP if Tier 3 complete)
+7. **Brainstorm Continuation Decision** (if papers < 3): write another paper or move on. If writing another: new title → compilation with prior brainstorm papers as auto-refs → loop to step 5
+8. **Tier 3 Final Answer** every 5 papers (Certainty→Format→Short-form or Long-form volume)
+9. Loop back to Topic Selection (or STOP if Tier 3 complete)
+
+---
+
+## PHASE 0: Topic Exploration (Pre-Selection Candidate Brainstorm)
+
+### Purpose
+Before committing to a brainstorm direction, the system runs a mini-aggregation on the full Part 1 infrastructure that collects 5 validated candidate brainstorm questions. This broadens the exploration landscape using all configured submitters in parallel with batch validation.
+
+### Why This Exists (Top-p Exploration at Strategic Level)
+Without exploration, the topic selector samples from the model's highest-probability region — the most obvious topic. By forcing 5 distinct, validated candidate directions first, the system maps the exploration landscape before committing:
+- Breaks greedy single-sample selection
+- Validator enforces diversity (rejects redundant candidates)
+- Final selector sees the full landscape of options
+- Uses full Part 1 aggregator infrastructure (parallel submitters, batch validation up to 3)
+
+### Architecture
+- **Uses `AggregatorCoordinator`** from Part 1 — same parallel submitters + batch validator as normal brainstorms, but with **cleanup/pruning disabled** (`enable_cleanup_review=False`) since the target is only 5 candidates
+- **Prompts** (`backend/autonomous/prompts/topic_exploration_prompts.py`): `build_exploration_user_prompt()` frames the aggregation task for candidate question generation
+- **Temp DB**: `exploration_candidates.txt` in brainstorms directory (cleaned up after phase)
+- **Target**: 5 accepted candidates per exploration cycle
+- **Safety valve**: 15 consecutive rejections → proceed with whatever candidates have been collected
+
+### Workflow
+1. Aggregator starts with all configured submitters running in parallel
+2. Submitters generate candidate brainstorm questions as standard submissions
+3. Validator batch-validates (up to 3 at a time) checking quality, relevance, and DIVERSITY
+4. Accepted candidates accumulate in temp exploration database
+5. Coordinator monitors aggregator stats, stops at 5 acceptances
+6. Reads exploration DB, formats as candidate list for topic selector
+
+### WebSocket Events
+Standard aggregator events (`submission_accepted`, `submission_rejected`) flow through during exploration.
+Additionally: `topic_exploration_started`, `topic_exploration_progress`, `topic_exploration_complete`
+
+### Crash Recovery
+On resume, exploration restarts fresh (short phase, no state to preserve).
+
+### Every Brainstorm Starts This Way
+Topic exploration runs before EVERY new topic selection cycle — no exceptions.
 
 ---
 
@@ -96,6 +139,7 @@ The autonomous topic submitter decides what to work on next. It can:
 
 ### Topic Submitter Context
 The submitter receives:
+- **5 validated candidate brainstorm questions** from Topic Exploration phase (direct injected)
 - User's high-level research prompt (PRIMARY context, always direct injected)
 - List of all existing brainstorm topics with metadata:
   - Topic ID
@@ -261,16 +305,16 @@ The autonomous brainstorm aggregator inherits batch validation from Part 1 infra
 - **Validator processes up to 3 submissions at once**: Uses batch-specific prompts for 1, 2, or 3 submissions
 - **Independent assessment of each submission's value**: Each submission evaluated against existing database independently
 - **Intra-batch redundancy prevention**: If multiple submissions would be accepted but are redundant with each other, only the strongest is accepted
-- **Queue overflow handling**: If 10+ submissions queued, takes latest 3 and clears rest (older submissions were generated against outdated database state)
+- **Queue overflow handling**: If 10+ submissions queued, submitters are paused by the coordinator until queue drops below threshold
 - **Accelerated brainstorm exploration**: Batch validation increases throughput while maintaining quality through redundancy checks
 
 ### Key Differences from Part 1 Aggregator
 1. **Topic-Specific Database**: Writes to `data/auto_brainstorms/brainstorm_{topic_id}.txt` instead of `rag_shared_training.txt`
 2. **No User-Provided Topic Prompt**: Uses the AI-generated brainstorm topic prompt
 3. **Completion Tracking**: Tracks acceptance count (including removals) for completion review trigger
-4. **Hard Limit**: 80 accepted submissions (FORCE transition to paper writing, no completion review)
+4. **Hard Limit**: 30 accepted submissions (FORCE transition to paper writing, no completion review)
    - Purpose: Prevents runaway brainstorms from accumulating indefinitely
-   - Trigger: After each acceptance, check if count >= 80
+   - Trigger: After each acceptance, check if count >= 30
    - Behavior: Immediately transition to paper writing, skip completion review
    - WebSocket event: `brainstorm_hard_limit_reached`
 5. **Rejection Hard Limit**: 10 consecutive rejections (with minimum 5 acceptances) FORCE transition to paper writing
@@ -300,12 +344,12 @@ The autonomous brainstorm aggregator inherits batch validation from Part 1 infra
 ### Regular Trigger
 Runs every 10 accepted submissions (includes both new acceptances AND pruning removals), AFTER the pruner has had its chance to run.
 
-**Hard Limit Override**: If brainstorm reaches 80 accepted submissions, completion review is SKIPPED and paper writing is forced.
+**Hard Limit Override**: If brainstorm reaches 30 accepted submissions, completion review is SKIPPED and paper writing is forced.
 
 **Example trigger points**: 
 - Acceptances at 10, 20, 30, 40... trigger completion review
 - If prune removal happens at acceptance 9, the next acceptance (10th total) still triggers review
-- At 80 acceptances: Hard limit triggers, completion review skipped, paper writing forced
+- At 30 acceptances: Hard limit triggers, completion review skipped, paper writing forced
 
 ### Manual Paper Writing Trigger (User Override)
 
@@ -348,6 +392,7 @@ Runs every 10 accepted submissions (includes both new acceptances AND pruning re
 - Does NOT require self-validation (user decision is final)
 - Brainstorm is marked complete regardless of acceptance count
 - Subsequent paper compilation proceeds normally with all selected reference papers
+- **Race condition guard**: `_brainstorm_aggregation_loop()` checks `_manual_paper_writing_triggered` before calling `start()` on the aggregator (catches override during async init). The monitoring loop also stops the aggregator before returning on manual override.
 
 ### Purpose
 Assess whether the current brainstorm has been sufficiently explored relative to THIS MODEL'S internal knowledge (weights) and decide whether to continue brainstorming or begin writing a paper.
@@ -424,6 +469,30 @@ Same two-step browsing workflow as pre-brainstorm selection (expand request →
 
 **Final Reference List**: Already-selected papers + newly-selected papers (max 6 total)
 
+### Paper Title Exploration (Pre-Title Candidate Brainstorm)
+
+**Purpose**: Before committing to a paper title, the system collects 5 validated candidate titles using the Part 1 aggregator infrastructure. The final title selection then chooses from candidates, synthesizes them, or proposes a new title with justification.
+
+**Architecture**: Uses `AggregatorCoordinator` from Part 1 — same parallel submitters + batch validator, but with **cleanup/pruning disabled** (`enable_cleanup_review=False`) since the target is only 5 candidates.
+
+**Applies to EVERY paper creation**: Tier 2 papers (1/2/3 from brainstorm), Tier 3 short-form, Tier 3 gap/intro/conclusion chapters.
+
+**Workflow**:
+1. Aggregator starts with all configured submitters running in parallel
+2. Submitters generate candidate paper titles as standard submissions
+3. Validator checks quality, relevance, and DIVERSITY (rejects near-duplicates)
+4. Accepted candidates accumulate in temp title DB
+5. Coordinator stops at 5 acceptances (or 15 consecutive rejections safety valve)
+6. Reads title DB, formats as candidate list for final title selection
+
+**Temp DB**: `title_candidates_{topic_id}.txt` in brainstorms dir (cleaned up after phase)
+
+**WebSocket Events**: `paper_title_exploration_started`, `paper_title_exploration_progress`, `paper_title_exploration_complete`
+
+**Crash Recovery**: On resume, exploration restarts fresh (short phase, no state to preserve).
+
+**Prompts**: `paper_title_exploration_prompts.py` — `build_title_exploration_user_prompt()` frames the aggregation task for candidate title generation with context: user prompt, topic, brainstorm summary, existing papers, reference papers.
+
 ### Paper Title Selection
 
 **Context**:
@@ -432,8 +501,9 @@ Same two-step browsing workflow as pre-brainstorm selection (expand request →
 - Selected reference papers (if any, RAG)
 - ALL existing paper titles from THIS brainstorm topic (direct injection)
 - ALL existing paper abstracts from THIS brainstorm topic (if any, direct injection)
+- **5 validated candidate titles from Paper Title Exploration phase** (direct injection)
 
-**Purpose**: Choose a title for the paper that will be compiled from this brainstorm.
+**Purpose**: Choose a title for the paper that will be compiled from this brainstorm. The selector sees 5 pre-validated candidate titles and may select one, synthesize them into a new title, or propose a new title with justification.
 
 JSON schema defined in `json-prompt-design.mdc`. Fields: `paper_title`, `reasoning`.
 
@@ -462,6 +532,18 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `paper_title`, `reasoni
 
 Once paper title is selected and validated, paper compilation begins using the FULL Part 2 compiler workflow.
 
+### Retroactive Brainstorm Correction (Unified Workspace)
+
+During paper compilation, the compiler submitter sees both the paper AND the source brainstorm database simultaneously. On each construction turn, the submitter may optionally propose a brainstorm edit/delete/add alongside its paper operation.
+
+**Key design**: Submitter sees full workspace (paper + brainstorm). Validator sees ONLY the specific operation being validated (paper OR brainstorm, never both). Each operation must be independently justified.
+
+**Operations**: edit (correct entry), delete (remove entry), add (new insight). Each validated independently by the compiler validator with brainstorm-only context.
+
+**Independent acceptance**: Paper and brainstorm results are independent. Paper accepted + brainstorm rejected = valid. RAG refreshed after accepted brainstorm modifications.
+
+**Not available in manual Part 2 mode** — only during autonomous paper compilation where `_current_topic_id` is set.
+
 ### Compilation Workflow
 
 **Uses existing Part 2 (Compiler) infrastructure**:
@@ -523,11 +605,13 @@ The validator will REJECT any outline missing these required sections or with in
 **Skip Critique Phase (User Override)**:
 - **Purpose**: Allow users to manually skip the critique/rewrite phase and proceed directly to conclusion
 - **API Endpoint**: `POST /api/auto-research/skip-critique`
-- **Availability**: Only during Tier 2 paper writing when actively in critique phase
-- **Behavior**: Immediately ends critique phase, transitions to conclusion phase, broadcasts `critique_phase_skipped` with `reason: "user_override"`
-- **Cannot be undone**: Once executed, critique phase for current paper version is permanently skipped
-- **Frontend**: "Skip Critique & Continue" button appears in paper status banner during critique phase (requires confirmation)
-- **Error Conditions**: 400 if not running, 400 if not in Tier 2 paper writing, 400 if not in critique phase
+- **Availability**: Any time during Tier 2 paper writing
+- **Behavior**:
+  - If already in critique phase: immediately ends critique and transitions to conclusion
+  - If critique phase has not started yet: queues a pre-emptive skip and auto-skips when critique is reached
+- **Cannot be undone**: Once executed or queued, critique for the current paper version is bypassed
+- **Frontend**: The paper status banner supports both immediate skip and pre-emptive queued skip
+- **Error Conditions**: 400 if not running, 400 if not in Tier 2 paper writing
 
 **Outline Updates**: Outline can be updated at any time during the cycle (same as Part 2)
 
@@ -686,9 +770,24 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `should_remove` (bool),
    - Update metadata to mark as "archived"
    - Update statistics
 
-### Return to Topic Selection
+### Return to Topic Selection / Brainstorm Multi-Paper Continuation
+
+After paper completion and redundancy review, the system enters a **continuation decision loop** (max 3 papers per brainstorm):
+
+1. If `papers_from_brainstorm < 3`: Run continuation decision (submitter + topic validator)
+   - **write_another_paper**: New title selection + compilation (skip reference re-selection, auto-inject prior brainstorm papers)
+   - **move_on**: Proceed to Tier 3 check, then Topic Selection
+2. If 3 papers reached (hard limit): Skip decision, proceed to Tier 3 check
+
+**Continuation Decision Context**: User prompt + brainstorm topic + brainstorm DB + all prior papers (title/abstract/outline). Does NOT include cross-topic reference papers.
 
-After paper completion (and redundancy review if triggered), the workflow checks if **Tier 3 Final Answer** should trigger.
+**Prior Brainstorm Papers as References**: For paper 2/3, all prior papers from the same brainstorm are auto-loaded into compiler RAG as `is_user_file=True` (high priority). These are separate from the 6-paper cross-topic reference limit.
+
+**Reference Selection**: Runs ONCE per brainstorm cycle. Papers 2/3 reuse the same cross-topic references.
+
+**WebSocket Events**: `brainstorm_continuation_started`, `brainstorm_continuation_decided`, `brainstorm_paper_limit_reached`
+
+**Crash Recovery**: `brainstorm_paper_count` and `current_brainstorm_paper_ids` persisted in workflow state.
 
 ---
 
@@ -846,11 +945,15 @@ The system implements **two tiers of model tracking**:
 ================================================================================
 AUTONOMOUS AI SOLUTION
 
-Disclaimer: This content is for informational purposes only. This paper was
-autonomously generated with the novelty-seeking MOTO harness without peer review
-or user oversight beyond the original prompt. AI-generated content may contain
-fabricated or unverified claims presented with high confidence. All content
-should be viewed with extreme scrutiny and independently verified before use.
+Disclaimer: This content is provided for informational and experimental purposes
+only. This paper was autonomously generated with the novelty-seeking MOTO
+harness without peer review or user oversight beyond the original prompt. It
+may contain incorrect, incomplete, misleading, or fabricated claims presented
+with high confidence. Use of this content is at your own risk. You are solely
+responsible for reviewing and independently verifying any output before relying
+on it, and the developers, operators, and contributors are not responsible for
+errors, omissions, decisions made from this content, or any resulting loss,
+damage, cost, or liability.
 
 User's Research Prompt: [user's original prompt here]
 
@@ -939,11 +1042,15 @@ Tier 3 tracks all models used during final answer generation for author attribut
 ================================================================================
 AUTONOMOUS AI SOLUTION
 
-Disclaimer: This content is for informational purposes only. This paper was
-autonomously generated with the novelty-seeking MOTO harness without peer review
-or user oversight beyond the original prompt. AI-generated content may contain
-fabricated or unverified claims presented with high confidence. All content
-should be viewed with extreme scrutiny and independently verified before use.
+Disclaimer: This content is provided for informational and experimental purposes
+only. This paper was autonomously generated with the novelty-seeking MOTO
+harness without peer review or user oversight beyond the original prompt. It
+may contain incorrect, incomplete, misleading, or fabricated claims presented
+with high confidence. Use of this content is at your own risk. You are solely
+responsible for reviewing and independently verifying any output before relying
+on it, and the developers, operators, and contributors are not responsible for
+errors, omissions, decisions made from this content, or any resulting loss,
+damage, cost, or liability.
 
 User's Research Prompt: [user's original prompt here]
 
@@ -1053,7 +1160,7 @@ Returns: is_long_form, volume_title, outline_complete, current/total/completed c
 
 #### FinalAnswerView.jsx
 Main component for displaying Tier 3 status and content:
-- Status badge: "FINAL ANSWER IN PROGRESS" (yellow) or "FINAL ANSWER" (green)
+- Status badge: "FINAL ANSWER IN PROGRESS" uses the active Tier 3 accent state; completion uses the green success state
 - Certainty assessment display
 - Format selection display
 - Volume organization with chapter status (long form)
@@ -1273,7 +1380,7 @@ Main interface component:
 Brainstorm management component:
 - List of all brainstorm topics with status indicators
 - Expandable to show brainstorm database content
-- Status badges: In Progress (yellow), Complete (green)
+- Status badges: In Progress uses the active accent state; Complete uses the green success state
 - Submission counts per brainstorm
 - Papers generated from each brainstorm
 - **Delete button**: Removes brainstorm and all associated files
@@ -1367,7 +1474,7 @@ Real-time Tier 3 final answer display component (embedded in AutonomousResearchI
 
 ### FinalAnswerView.jsx
 Tier 3 Final Answer display component (separate tab for completed/overall final answer status):
-- Status badge: "FINAL ANSWER IN PROGRESS" (yellow) or "FINAL ANSWER ✓" (green)
+- Status badge: "FINAL ANSWER IN PROGRESS" uses the active Tier 3 accent state; "FINAL ANSWER ✓" uses the green success state
 - Certainty assessment summary display
 - Format selection indicator (Short Form / Long Form)
 - Volume organization outline with chapter status (for long form):
@@ -1382,7 +1489,7 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 
 **Tab Styling**:
 - Tab appears in "Final Answer" section of navigation
-- Yellow highlight when Tier 3 is active (in progress)
+- Active Tier 3 tab uses the in-progress highlight state with pulse animation
 - Green highlight with checkmark when complete
 
 
@@ -1413,16 +1520,17 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
   - Brainstorm database as primary source
 
 ### Running Modes
-- **Part 1, Part 2, Part 3 can run INDEPENDENTLY** (user chooses which mode)
-- **Part 1 and Part 2 can run SIMULTANEOUSLY** (as originally designed)
-- **Part 3 runs ALONE** (it internally uses Part 1 and Part 2 components but manages them autonomously)
-- User cannot manually start Part 1 or Part 2 while Part 3 is running (Part 3 controls them)
+- **Part 1, Part 2, and Part 3 remain user-selectable modes**
+- **Only ONE workflow mode may be active at a time** — Aggregator, Compiler, and Autonomous Research are now mutually exclusive at runtime
+- **Part 3 internally controls Part 1 and Part 2 components** during autonomous execution
+- Starting any mode while another mode is running must be blocked until the active mode is stopped
 
 ---
 
 ## Prerequisites
 
-- At least one LM Studio model must be available for each role
+- Either an OpenRouter API key or at least one LM Studio model must be available to begin
+- LM Studio is highly recommended even with OpenRouter enabled because local embeddings/RAG are free and faster
 - User must provide high-level research prompt
 - No dependency on prior Part 1 or Part 2 usage
 - Fresh start with empty brainstorm/paper libraries
@@ -1432,8 +1540,8 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 ## Error Handling
 
 ### JSON Parse Failure (Topic Selection)
-- Retry up to 3 times with same context
-- If persistent, log error and retry with refreshed context (include prior failure in context)
+- Retry indefinitely with rejection feedback (same as other agents)
+- Each retry includes prior failure context
 
 ### JSON Parse Failure (Brainstorm Aggregation)
 - Same as Part 1 Aggregator: reject submission, feedback to submitter
@@ -1470,10 +1578,16 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 - High-context submitter max tokens: 25000
 - High-parameter submitter max tokens: 25000
 - Completion review interval: 10 acceptances (includes removals)
-- Topic selection retry limit: 3
 - Max brainstorms in parallel: 1 (sequential brainstorm → paper cycle)
 - Max reference papers for context: 6
 
+### Token Tracking & Research Timer
+- `token_tracker` singleton resets and starts timer on `autonomous_coordinator.start()`, stops on stop/finally
+- Cumulative input/output tokens tracked per model from every successful LLM completion call (6 code paths in `api_client_manager`)
+- `token_usage_updated` WebSocket event broadcast after each tracked call; `GET /api/token-stats` for initial fetch
+- Displayed in WorkflowPanel sidebar (timer, totals, expandable per-model breakdown)
+- Also activated for standalone aggregator/compiler via API route start/stop
+
 ---
 
 ## Critical Invariants
@@ -1500,11 +1614,23 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 20. **Model tracking is ENABLED during Tier 3** - All API calls tracked for author attribution and model credits
 21. **Same model = single author** - Model used in multiple instances counts as ONE author entry, but all API calls tallied
 22. **Paper redundancy is DISABLED during Tier 3** - `_tier3_active` flag prevents redundancy checks from purging papers being used in the final volume
-23. **Brainstorm hard limit is 80 acceptances** - After 80 acceptances, paper writing is forced (no completion review)
+23. **Brainstorm hard limit is 30 acceptances** - After 30 acceptances, paper writing is forced (no completion review)
 24. **Maximum 1 completed rewrite per paper** - Rewrite counts as "completed" only after first successful body acceptance; prevents infinite loops from failed rewrite attempts
 25. **Partial revision option available** - Allows targeted edits without full body rewrite
 26. **Total rewrite is last resort** - Only for catastrophic issues that can't be fixed with targeted edits
 27. **Rejection hard limit is 10 consecutive rejections (with 5+ acceptances)** - Prevents infinite rejection loops
+28. **Retroactive brainstorm corrections during Tier 2 paper compilation** - Submitter sees unified paper+brainstorm workspace; operations validated independently by validator (paper-only context for paper ops, brainstorm-only context for brainstorm ops); each operation must stand alone without requiring the other for correctness
+29. **Max 3 papers per brainstorm** - hard limit, continuation decision skipped after 3rd paper
+30. **Prior brainstorm papers ALWAYS auto-included** for paper 2/3 as `is_user_file=True` in RAG, separate from 6-paper cross-topic reference limit
+31. **Reference selection runs ONCE per brainstorm cycle** - papers 2/3 reuse same cross-topic references
+32. **Topic validator validates continuation decisions** - not self-validation (strategic decision, not weight assessment)
+33. **Tier 3 checks after brainstorm cycle completes** (move_on or hard limit), not between papers
+34. **No brainstorm re-opening during continuation** - strictly write_another_paper or move_on
+35. **Topic exploration runs before EVERY topic selection** — Uses full Part 1 aggregator with all submitters in parallel and batch validation to collect 5 candidate questions. No exceptions.
+36. **Topic exploration uses standard aggregator (cleanup disabled)** — Same parallel submitters, batch validation (up to 3), queue management as normal brainstorms. Cleanup/pruning is disabled because the phase is capped at 5 candidates and the temp DB is deleted afterwards.
+37. **Paper title exploration runs before EVERY title selection** — Uses full Part 1 aggregator to collect 5 candidate titles before every paper creation (Tier 2 papers 1/2/3, Tier 3 short-form, Tier 3 gap/intro/conclusion chapters). No exceptions.
+38. **Title exploration uses standard aggregator (cleanup disabled)** — Same parallel submitters, batch validation, queue management. Cleanup/pruning is disabled because the phase is capped at 5 candidates and the temp DB is deleted afterwards.
+39. **Final title selection sees candidate titles** — The 6th selection can choose a candidate, synthesize, or propose new. Must justify divergence from all candidates.
 
 ---
 
@@ -1540,7 +1666,7 @@ Each role in autonomous research mode supports OpenRouter model selection with h
 **Fallback Behavior**:
 - If OpenRouter is selected and has a fallback configured: Automatically falls back to LM Studio on credit exhaustion
 - If no LM Studio available: OpenRouter-only operation (system works without LM Studio)
-- Fallback is per-role and permanent for the session (no retries after fallback)
+- Fallback is per-role and resettable via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key
 
 ## Other Notes
 
diff --git a/.cursor/rules/program-directory-and-file-definitions.mdc b/.cursor/rules/program-directory-and-file-definitions.mdc
index e93a590..4dea653 100644
--- a/.cursor/rules/program-directory-and-file-definitions.mdc
+++ b/.cursor/rules/program-directory-and-file-definitions.mdc
@@ -7,6 +7,9 @@ LM Studio and its pre-loaded models can be reached at "http://127.0.0.1:1234".
 
 ## Complete Project Directory Structure and File Descriptions
 project-root/
+├── .github/                            # GitHub community health files
+│   ├── ISSUE_TEMPLATE/                 # Public issue forms + security contact routing
+│   └── pull_request_template.md        # Default pull request template
 ├── backend/
 │   ├── shared/                          # SHARED RESOURCES
 │   │   ├── __init__.py                  # Package initialization
@@ -20,6 +23,7 @@ project-root/
 │   │   ├── workflow_predictor.py        # Predicts next 20 API calls (mode-specific algorithms)
 │   │   ├── free_model_manager.py        # Free model rotation/cooldown singleton (looping + auto-selector backup)
 │   │   ├── rag_lock.py                  # Global RAG operation lock (prevents Aggregator/Compiler collision)
+│   │   ├── token_tracker.py             # Cumulative input/output token tracker singleton with per-model breakdown and research timer
 │   │   ├── wolfram_alpha_client.py      # Wolfram Alpha API client
 │   │   ├── utils.py                     # Common utilities
 │   │   ├── json_parser.py               # JSON parsing with sanitization for LLM quirks
@@ -66,7 +70,8 @@ project-root/
 │   │   ├── agents/
 │   │   │   ├── __init__.py              # Package initialization
 │   │   │   ├── high_context_submitter.py # 3 modes: construction, outline, review
-│   │   │   └── high_param_submitter.py   # Rigor enhancement mode
+│   │   │   ├── high_param_submitter.py   # Rigor enhancement mode
+│   │   │   └── critique_submitter.py    # Critique phase submitter (peer review)
 │   │   ├── validation/
 │   │   │   ├── __init__.py              # Package initialization
 │   │   │   └── compiler_validator.py    # Validates coherence, rigor, placement
@@ -88,7 +93,7 @@ project-root/
 │   │   ├── __init__.py                  # Package initialization
 │   │   ├── core/
 │   │   │   ├── __init__.py              # Package initialization
-│   │   │   ├── autonomous_coordinator.py # Orchestrates two-tier workflow (brainstorm → paper)
+│   │   │   ├── autonomous_coordinator.py # Orchestrates the Tier 1 → Tier 2 → Tier 3 autonomous workflow
 │   │   │   └── autonomous_rag_manager.py # Autonomous-specific RAG wrapper
 │   │   ├── agents/
 │   │   │   ├── __init__.py              # Package initialization
@@ -108,17 +113,23 @@ project-root/
 │   │   ├── prompts/
 │   │   │   ├── __init__.py              # Package initialization
 │   │   │   ├── topic_prompts.py         # Topic selection & validation prompts
+│   │   │   ├── topic_exploration_prompts.py # Builds aggregator user prompt for topic exploration phase
 │   │   │   ├── completion_prompts.py    # Completion review & self-validation prompts
 │   │   │   ├── paper_reference_prompts.py # Reference selection prompts
+│   │   │   ├── paper_title_exploration_prompts.py # Builds aggregator user prompt for paper title exploration phase
 │   │   │   ├── paper_title_prompts.py   # Paper title selection prompts
 │   │   │   ├── paper_redundancy_prompts.py # Paper redundancy review prompts
+│   │   │   ├── paper_continuation_prompts.py # Brainstorm multi-paper continuation decision prompts
 │   │   │   └── final_answer_prompts.py  # TIER 3 - Final answer assessment/selection/volume prompts
 │   │   └── memory/
 │   │       ├── __init__.py              # Package initialization
-│   │       ├── brainstorm_memory.py     # Per-brainstorm database management
+│   │       ├── brainstorm_memory.py     # Per-brainstorm database management (includes retroactive edit/remove/add during paper compilation)
 │   │       ├── paper_library.py         # Paper library management (Tier 2)
 │   │       ├── research_metadata.py     # Research metadata (brainstorms + papers associations)
 │   │       ├── autonomous_rejection_logs.py # Topic selection & completion feedback logs
+│   │       ├── topic_exploration_memory.py # In-memory candidate DB for topic exploration phase
+│   │       ├── paper_model_tracker.py   # Per-paper model usage tracking and author attribution
+│   │       ├── autonomous_api_logger.py # Autonomous API call logger singleton
 │   │       ├── final_answer_memory.py   # TIER 3 - Final answer state & volume management
 │   │       └── session_manager.py       # Prompt-based session folder organization
 │   │
@@ -137,7 +148,7 @@ project-root/
 │   │       ├── boost.py                 # Boost API endpoints (enable/disable/toggle/status)
 │   │       ├── workflow.py              # Workflow API endpoints (predictions/history)
 │   │       ├── download.py              # PDF generation endpoint via Playwright (POST /api/download/pdf)
-│   │       ├── openrouter.py            # OpenRouter API endpoints (global key, models, providers, LM Studio availability, **GET /api/model-cache** for model ID caching)
+│   │       ├── openrouter.py            # OpenRouter API endpoints (global key, models, providers, LM Studio availability, **GET /api/model-cache** for model ID caching, **POST /api/openrouter/reset-exhaustion** to reset credit exhaustion mid-session)
 │   │       └── websocket.py             # WebSocket for real-time updates
 │   │
 │   ├── data/                            # Persistent data storage
@@ -205,6 +216,7 @@ project-root/
 │   │   │   │
 │   │   │   └── autonomous/              # AUTONOMOUS RESEARCH
 │   │   │       ├── AutonomousResearchInterface.jsx  # Main control: research prompt, start/stop, current tier
+│   │   │       ├── AutonomousResearch.css     # Autonomous research styles
 │   │   │       ├── BrainstormList.jsx       # List all brainstorm topics with status
 │   │   │       ├── PaperLibrary.jsx         # Grid view of completed papers (title + abstract)
 │   │   │       ├── AutonomousResearchSettings.jsx  # Model configs for all roles
@@ -213,16 +225,27 @@ project-root/
 │   │   │       ├── LiveTier3Progress.jsx    # Real-time Tier 3 final answer display (embedded in interface)
 │   │   │       ├── FinalAnswerView.jsx      # TIER 3 - Final answer tab (separate tab for completed answers)
 │   │   │       ├── FinalAnswerLibrary.jsx   # All sessions final answer library viewer
-│   │   │       └── ArchiveViewerModal.jsx   # Research lineage archive viewer (papers + brainstorms)
+│   │   │       ├── FinalAnswerLibrary.css   # Final answer library styles
+│   │   │       ├── ArchiveViewerModal.jsx   # Research lineage archive viewer (papers + brainstorms)
+│   │   │       └── ArchiveViewerModal.css   # Archive viewer styles
 │   │   │
+│   │   ├── StartupProviderSetupModal.jsx # Post-disclaimer startup chooser for OpenRouter vs LM Studio setup
 │   │   ├── OpenRouterApiKeyModal.jsx    # Modal for global OpenRouter API key configuration
 │   │   ├── PaperCritiqueModal.jsx       # Modal for displaying validator paper critiques (ratings, feedback, history)
 │   │   ├── CritiqueNotificationStack.jsx # Persistent popup notifications for high-scoring critiques (≥7.0 avg)
+│   │   ├── CreditExhaustionNotificationStack.jsx # Persistent red notifications for OpenRouter credit exhaustion with "Retry OpenRouter" reset button
+│   │   ├── HungConnectionNotificationStack.jsx # Persistent amber notifications for API calls exceeding 15 minutes (possible hung connections)
 │   │   ├── BoostLogs.jsx                # Boost API call log viewer
+│   │   ├── BoostLogs.css                # Boost logs styles
 │   │   ├── BoostControlModal.jsx        # Modal for boost configuration (next-X, category, per-task)
+│   │   ├── BoostControlModal.css        # Boost control modal styles
 │   │   ├── WorkflowPanel.jsx            # Workflow prediction panel (next 20 API calls display)
+│   │   ├── WorkflowPanel.css            # Workflow panel styles
 │   │   ├── TextFileUploader.jsx         # User file upload component
+│   │   ├── TextFileUploader.css         # File uploader styles
 │   │   ├── OpenRouterPrivacyWarningModal.jsx # Privacy policy error modal (OpenRouter data sharing)
+│   │   ├── settings-common.css          # Shared settings panel styles
+│   │   ├── critique-modal.css           # Paper critique modal styles
 │   │   │
 │   │   ├── services/
 │   │   │   ├── api.js                   # Backend API calls (includes openRouterAPI)
@@ -230,9 +253,11 @@ project-root/
 │   │   │
 │   │   ├── utils/
 │   │   │   ├── downloadHelpers.js       # PDF/raw download helpers (Playwright backend PDF)
-│   │   │   └── modelCache.js            # Frontend model cache utilities (display_name → api_id lookup)
+│   │   │   ├── modelCache.js            # Frontend model cache utilities (display_name → api_id lookup)
+│   │   │   ├── autonomousProfiles.js    # Shared autonomous recommended-profile definitions and persistence helpers
+│   │   │   └── disclaimerHelper.js      # Frontend-only disclaimer injection for brainstorm/paper views
 │   │   │
-│   │   ├── App.jsx                      # Main app with tab navigation
+│   │   ├── App.jsx                      # Main app shell with top-level mode switch (Autonomous ASI S.T.E.M. / Advanced Manual ASI S.T.E.M.) and tab navigation
 │   │   ├── index.css                    # Styles
 │   │   └── index.jsx                    # React entry point
 │   │
@@ -241,6 +266,7 @@ project-root/
 │
 ├── requirements.txt                     # Python dependencies
 ├── package.json                         # Root scripts
+├── SECURITY.md                          # Security policy and private vulnerability reporting
 ├── Press to Launch MOTO.bat             # The user's one-click program launcher.
 └── _moto_internal_launcher.ps1          # Internal PowerShell launcher (not for direct user use)
 
@@ -259,6 +285,7 @@ project-root/
 - `free_model_manager.py`: Free model rotation/cooldown singleton (looping, auto-selector `openrouter/free`, account exhaustion detection)
 - `wolfram_alpha_client.py`: Wolfram Alpha API client for rigor verification
 - `rag_lock.py`: Global RAG operation lock (prevents collision, retry logic for reads)
+- `token_tracker.py`: Cumulative input/output token tracker singleton with per-model breakdown and research timer. Reset on session start, timer start/stop tied to coordinator lifecycle. Stats broadcast via `token_usage_updated` WebSocket event after each successful LLM call.
 - `utils.py`: Token counting, text compression, file I/O
 - `json_parser.py`: JSON parsing with sanitization for LLM responses; sanitizes reasoning tokens, markdown blocks, control tokens, LaTeX escapes, control characters; **rejects truncated JSON** (raises ValueError with diagnostics) to prevent corrupted content from passing validation
 - `critique_memory.py`: Paper critique persistence (ratings, feedback, history, session-aware)
@@ -282,8 +309,8 @@ project-root/
 - Agents: `topic_selector.py`, `topic_validator.py`, `completion_reviewer.py`, `reference_selector.py`, `paper_title_selector.py`
 - Tier 3 Agents: `certainty_assessor.py`, `answer_format_selector.py`, `volume_organizer.py`
 - `paper_redundancy_checker.py`: Library quality maintenance (every 3 papers)
-- Prompts: `topic_prompts.py`, `completion_prompts.py`, `paper_reference_prompts.py`, `paper_title_prompts.py`, `paper_redundancy_prompts.py`, `final_answer_prompts.py`
-- Memory: `brainstorm_memory.py`, `paper_library.py`, `research_metadata.py`, `session_manager.py`, `autonomous_rejection_logs.py`, `final_answer_memory.py` (model tracking, archival)
+- Prompts: `topic_prompts.py`, `topic_exploration_prompts.py`, `completion_prompts.py`, `paper_reference_prompts.py`, `paper_title_exploration_prompts.py`, `paper_title_prompts.py`, `paper_redundancy_prompts.py`, `paper_continuation_prompts.py`, `final_answer_prompts.py`
+- Memory: `brainstorm_memory.py`, `paper_library.py`, `research_metadata.py`, `session_manager.py`, `autonomous_rejection_logs.py`, `topic_exploration_memory.py` (in-memory candidate DB), `paper_model_tracker.py` (per-paper model usage tracking and author attribution), `autonomous_api_logger.py` (API call logging singleton), `final_answer_memory.py` (model tracking, archival)
 
 ### API Routes
 
@@ -292,8 +319,9 @@ project-root/
 
 ### Frontend Components
 
+- `App.jsx`: Top-level GUI shell. Default mode is `Autonomous ASI S.T.E.M.` for Part 3 screens; `Advanced Manual ASI S.T.E.M.` contains the manual Part 1 Aggregator + Part 2 Compiler workspace. Shared utility controls (Boost, OpenRouter, WorkflowPanel) remain global.
 - **Aggregator**: `AggregatorInterface.jsx`, `AggregatorSettings.jsx`, `AggregatorLogs.jsx`, `LiveResults.jsx`
 - **Compiler**: `CompilerInterface.jsx`, `CompilerSettings.jsx`, `CompilerLogs.jsx`, `LivePaper.jsx`
 - **Autonomous**: `AutonomousResearchInterface.jsx`, `BrainstormList.jsx`, `PaperLibrary.jsx`, `AutonomousResearchSettings.jsx`, `AutonomousResearchLogs.jsx`, `LivePaperProgress.jsx`, `LiveTier3Progress.jsx`, `FinalAnswerView.jsx`, `FinalAnswerLibrary.jsx`, `ArchiveViewerModal.jsx`
-- **Shared**: `OpenRouterApiKeyModal.jsx`, `PaperCritiqueModal.jsx`, `CritiqueNotificationStack.jsx`, `BoostLogs.jsx`, `BoostControlModal.jsx`, `WorkflowPanel.jsx`, `TextFileUploader.jsx`, `OpenRouterPrivacyWarningModal.jsx`, `LatexRenderer.jsx` (dual view, KaTeX, theorem parsing), `LatexRenderer.css`
-- **Utils**: `downloadHelpers.js` (PDF/raw download), `modelCache.js` (display_name → api_id lookup), `api.js`, `websocket.js`
+- **Shared**: `StartupProviderSetupModal.jsx`, `OpenRouterApiKeyModal.jsx`, `PaperCritiqueModal.jsx`, `CritiqueNotificationStack.jsx`, `CreditExhaustionNotificationStack.jsx`, `HungConnectionNotificationStack.jsx`, `BoostLogs.jsx`, `BoostControlModal.jsx`, `WorkflowPanel.jsx`, `TextFileUploader.jsx`, `OpenRouterPrivacyWarningModal.jsx`, `LatexRenderer.jsx` (dual view, KaTeX, theorem parsing), `LatexRenderer.css`
+- **Utils**: `downloadHelpers.js` (PDF/raw download), `modelCache.js` (display_name → api_id lookup), `autonomousProfiles.js` (shared recommended-profile definitions + persistence helpers), `disclaimerHelper.js` (frontend-only disclaimer injection), `api.js`, `websocket.js`
diff --git a/.cursor/rules/rag-design-for-overall-program.mdc b/.cursor/rules/rag-design-for-overall-program.mdc
index f365deb..d3095b1 100644
--- a/.cursor/rules/rag-design-for-overall-program.mdc
+++ b/.cursor/rules/rag-design-for-overall-program.mdc
@@ -1,5 +1,5 @@
 ---
-alwaysApply: true
+alwaysApply: false
 ---
 ## Important Notes When Editing RAG Systems
 The RAG system in this program is very advanced, be certain that any changes you make to the RAG system are correct changes.
@@ -12,7 +12,7 @@ If an item is direct injected, its RAG counterpart must NOT also be included.
 
 **RAG Offload Priority — Submitter:** Shared Training DB → Local Submitter DB → Rejection Log → User Upload Files
 
-**RAG Offload Priority — Validator:** Shared Training DB → User Upload Files → Submission under review (last resort)
+**RAG Offload Priority — Validator:** Shared Training DB → User Upload Files (submission under review is always direct injected)
 
 ## Further RAG Specifications
 
@@ -62,7 +62,7 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Stage C — Reranking + MMR**: Blend vector (60%) + BM25 (40%); MMR λ=0.8 (80% relevance, 20% diversity); removes near-duplicates (similarity > 0.85); hard cap at context budget.
 
-**Stage D — Packing + Compression**: Assembles evidence with headers; priority: document → section → relevance. Compresses only if over budget (preserves entities, numbers, dates). Returns `ContextPack` with evidence tracking.
+**Stage D — Packing**: Assembles evidence with headers; priority: document → section → relevance. Packs chunks incrementally until budget is reached (no compression — disabled as unreliable). Skips chunks from `exclude_sources` (content already direct-injected in prompt). Returns `ContextPack` with evidence tracking.
 
 ---
 
@@ -70,7 +70,7 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **User Files (Permanent Cache)**: Pre-generates all 4 configs; NEVER evicted; supports submitter chunk size cycling.
 
-**Dynamic Files (Re-Chunked on Update)**: Shared training DB, rejection logs, outline, paper. Single config (current submitter cycle or validator constant). LRU eviction when > 10000 documents.
+**Dynamic Files (Re-Chunked on Update)**: Shared training DB, rejection logs, outline, paper. Single config (current submitter cycle or validator constant). LRU eviction when > 10000 documents. Per-size chunk cap: oldest non-permanent chunks trimmed when any bucket exceeds 10,000 chunks.
 
 ---
 
@@ -82,7 +82,7 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Re-Chunking Triggers:**
 
-*Aggregator* (immediate after each acceptance): Acquires global RAG lock → incrementally adds only new submission → releases lock. New chunks: `rag_shared_training_update_{chunk_size}`. Historical chunks accumulate (not removed). MAX_CHUNKS_PER_SIZE = 10,000.
+*Aggregator* (immediate after each acceptance): Acquires global RAG lock → incrementally adds only new submission → releases lock. New chunks: `rag_shared_training_update_{chunk_size}`. Historical chunks accumulate (not removed). `max_chunks_per_size = 10,000` enforced per bucket after each add; oldest non-permanent chunks trimmed on overflow.
 
 *Compiler* (every 10 aggregator acceptances): Monitors count every 30s → acquires global RAG lock → removes old chunks, re-adds entire file with all 4 configs → releases lock.
 
@@ -104,16 +104,26 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Overflow handling**: User prompt always direct injected; if exceeds `context_window - minimum_RAG_allocation`: HALT with error. Content too large: offload to RAG. Still doesn't fit: compress (NEVER truncate).
 
+**Source Exclusion (anti-duplication)**: `rag_manager.retrieve(exclude_sources=[...])` filters chunks from named sources during Stage D packing. Callers pass source names of content already direct-injected so RAG budget goes entirely to non-duplicated content.
+
+| Mode | Excluded Sources | Reason |
+|---|---|---|
+| Compiler construction | `compiler_outline.txt`, `compiler_paper.txt`, brainstorm source (when direct-injected) | All three always direct-injected in construction prompts |
+| Compiler outline_update | `compiler_outline.txt`, `compiler_paper.txt` | Both direct-injected in outline update prompts |
+| Compiler rigor | `compiler_outline.txt` | Outline always direct-injected; paper intentionally RAG'd (smaller context) |
+| Aggregator submitter/validator | Direct-injected user file names + direct-injected shared-training sources (current training file + `rag_shared_training_update_*`) | Prevents RAG returning chunks already in direct context when only some content is offloaded |
+| Aggregator cleanup review | Same as above, when full submissions DB is direct-injected | Prevents cleanup RAG evidence from repeating already-injected submissions |
+
 ---
 
 ## Memory Management
 
 **Cache limits:**
 - Query rewrite cache: 500 entries, 30-min TTL
-- Embedding cache: 500 entries, LRU eviction
 - BM25 cache: 1000 entries, 1-hour TTL
 - Context pack cache: 300 entries
 - Document LRU: removes oldest non-permanent document when > 10000 docs
+- Per-size chunk cap: 10,000 chunks per size bucket; oldest non-permanent trimmed on overflow; embeddings nulled before removal
 
 **Training data limits**: No shared DB size limit. Local rejections: max 5 per submitter. Observability: 1000 retrieval history, 50 gating events, 100 hard negatives.
 
@@ -143,6 +153,25 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 ---
 
+## Agents Intentionally Without RAG
+
+These agents use ONLY direct injection (no RAG fallback) by design. Each operates on compact metadata summaries where RAG is unnecessary. Documented in each file's module docstring.
+
+| Agent | Inputs | Why No RAG |
+|---|---|---|
+| Topic selector | Brainstorm metadata, paper titles/abstracts | Strategic "what to work on" decision — summaries suffice; abstracts truncated as overflow fallback |
+| Topic validator | Same as topic selector | Validates strategic decision, same compact metadata |
+| Paper title selector | Brainstorm summary, existing paper titles/abstracts | Title selection needs topic overview, not full content |
+| Paper redundancy checker | Paper titles/abstracts | Redundancy detected at abstract level, not full-content comparison |
+| Answer format selector | Certainty assessment, paper summaries | Short-form vs long-form is a structural decision, not content-deep |
+| Volume organizer | Paper summaries, certainty assessment, volume state | Chapter ordering uses paper-level metadata, not full content |
+| Compiler review mode | Outline + paper only | Evaluates paper on its own merits without external source bias |
+| Brainstorm continuation | Brainstorm summary, prior paper titles/abstracts | "Write another or move on" uses summary, not full DB |
+
+**Known oversight**: Certainty assessor Step 2 drops expanded papers when they don't fit instead of RAG'ing them. Should use RAG fallback like reference_selector does.
+
+---
+
 ## Critical Invariants
 
 1. User prompt and JSON context NEVER RAG'd — always direct injected (Parts 1, 2, 3)
@@ -156,3 +185,7 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 9. Contradiction check pre-acceptance
 10. Autonomous mode prompt validation before all LLM calls
 11. Read operations retry on HNSW index errors (3 attempts, 0.5s → 1s → 2s backoff)
+12. Document count tracks unique source names — repeated `add_text`/`add_document` with same source name does not inflate count
+13. Per-size chunk cap (`max_chunks_per_size`) enforced after every add — prevents unbounded in-memory embedding growth
+14. Agents that use only metadata summaries (topic selector, title selector, redundancy checker, etc.) intentionally skip RAG — see "Agents Intentionally Without RAG" table above
+15. If content is already direct-injected, it must NOT also appear in RAG retrieval results — no duplication
diff --git a/.cursor/rules/workflow-runtime-updates.mdc b/.cursor/rules/workflow-runtime-updates.mdc
new file mode 100644
index 0000000..116fcae
--- /dev/null
+++ b/.cursor/rules/workflow-runtime-updates.mdc
@@ -0,0 +1,11 @@
+---
+alwaysApply: true
+---
+
+## Workflow Runtime Updates
+
+- Aggregator, Compiler, and Autonomous Research are mutually exclusive runtime modes. Only one workflow mode may be active at a time, and starting any mode while another is running must be blocked.
+- This rule explicitly supersedes any older wording in `part-1-and-part-2-cointeraction-architecture.mdc` that describes Aggregator and Compiler as concurrently runnable.
+
+- Compiler critique skip and autonomous critique skip both support pre-emptive use during active paper-writing. If critique is already active, the skip happens immediately. If critique has not started yet, the skip is queued and auto-applies when critique is reached.
+- This rule explicitly supersedes any older wording in `part-2-compiler-tool-design-specification.mdc` that describes compiler critique skip as active-critique-only.
diff --git a/Press to Launch MOTO.bat b/Press to Launch MOTO.bat
index 77e2692..52710c8 100644
--- a/Press to Launch MOTO.bat	
+++ b/Press to Launch MOTO.bat	
@@ -1,5 +1,5 @@
 @echo off
-setlocal enabledelayedexpansion
+setlocal
 
 cls
 echo ================================================================
@@ -83,7 +83,8 @@ REM ================================================================
 echo [4/8] Installing Python dependencies...
 echo This may take a few minutes if this is your first time...
 echo.
-pip install -r requirements.txt
+python -m pip install --upgrade pip >nul 2>&1
+pip install --upgrade -r requirements.txt
 if errorlevel 1 (
     echo.
     echo ============================================================
diff --git a/README.md b/README.md
index 4ad799c..a737b0a 100644
--- a/README.md
+++ b/README.md
@@ -1,14 +1,24 @@
 # MOTO - S.T.E.M. Mathematics Variant
 # Autonomous AI/ASI Deep Research Harness
-**Version: 1.0.4**
+**Version: 1.0.5**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
 [![Node.js 16+](https://img.shields.io/badge/node-16+-green.svg)](https://nodejs.org/)
 
-**An autonomous AI or ASI research system that generates novel mathematical research papers through multi-agent aggregation and compilation. Useful for any discipline that has an interest in novel math: physicists, engineers, mathematicians, chemists, etc. This harness can easily be modified for other research topics such as general academic research, chat bots, niche research, robotics, or anything requiring useful creative output and general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention - if desired, research can be conducted for days or weeks without user input.**
+**A breakthrough in AI and automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers autonomously, powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration changes how we look at AI weights: a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and data extraction from nearly any combination of AI models. This is useful for any discipline with an interest in creative and novel solution generation for mathematics: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for other research topics such as general academic research, chat bots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
 
-The differentiator that allows us to call this early artificial superintelligence is the brainstorming mechanism when considered in context with how generative transformers (GPT LLMs) operate. Brainstorming may sound trivial; however, transformers predict what tokens will come next. If you provide the transformer with a bunch of previous ideas that it had, then it is more likely to produce something new that it hasn't said before. MOTO maintains and "cleans" or "purges" its brainstorm database as it runs. Once a later idea makes earlier ones redundant, the redundant idea is then removed from the database - this allows for a type of recursive improvement. Once brainstorming is complete, MOTO writes the research paper about its solution. This step then repeats, now the papers become a new "tier 2" brainstorm. Previous papers are referenced in future brainstorms and future papers. This set of tier 2 papers is another higher order brainstorm-like database, which also cleans/prunes itself of newly discovered incorrect or redundant papers just like the tier 1 short-hand idea brainstorm database does for each paper. A 3rd tier, slightly more complex mechanism exists for the final tier 3 answer generation that allows for the book-length volumes.
+### The Core Discovery: Top-P Exploration (Solution Basin Aggregation)
+
+MOTO is built on a [key insight](https://intrafere.com/structured-brainstorming-validated-feedback/) about how generative transformers operate: **transformers predict what tokens come next, so providing them with their own prior ideas enables deeper probing of the solution space**. This is called **solution basin aggregation** — each brainstorming pass explores a richer, more informed landscape, and the cross-recombination of "mined" knowledge compounds to create new insights that cannot be obtained from the model's training alone. Intrafere considers this the mechanism that produces [ASI-like results](https://intrafere.com/structured-brainstorming-validated-feedback/) in practice. MOTO essentially "mines" creativity from a transformer's knowledge set, and this compounding effect is what differentiates it from traditional single-pass AI.
+
+The brainstorming phase runs **multiple submitters in parallel**, each independently exploring the solution space, funneled into a **single bottleneck validator** — a completely separate model instance whose only job is to decide whether each submission genuinely advances the knowledge base. This architectural separation between creative exploration and critical evaluation mitigates the hallucination loops and drift that plague single-model autonomous agents. Every rejection carries specific feedback that steers the next round of exploration, so failure is never wasted. Iterative pruning continuously removes entries that become redundant as stronger ideas emerge, producing an ever-denser, self-refining knowledge base. [View the learning curve data](https://intrafere.com/motos-brainstorming-potential-data/) for empirical evidence of this approach.
+
+### How Research Compounds Across Tiers
+
+Once a brainstorm is sufficiently explored, MOTO writes a research paper from it. This step then repeats — papers become a new "Tier 2" brainstorm. Previous papers are referenced in future brainstorms and future papers. This set of Tier 2 papers is another higher-order brainstorm-like database, which also self-prunes newly discovered incorrect or redundant papers just like the Tier 1 short-hand idea brainstorm does. A third tier generates the final answer, capable of producing book-length volumes.
+
+MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final-answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its experimental mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models whose context limits exceed 131,000 tokens, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is an experimental system; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
 
 MOTO may produce many brilliant papers as it runs, these start-up papers are answers that rival traditional paid cloud deep research functions. As the user, observe MOTO as often or as little as you'd like - skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its experimental mode, a final answer beyond the growing collection of related papers. In this mode, we have found quality can vary - however that is because MOTO is capable of autonomously deciding if it should output a shortform answer, like traditional cloud deep research - or whether to collect existing pre-final answer papers and write a long-form academic volume. With models over 131,000 token context limits, the harness is easily capable of producing final volumes with over 40,000 words, and MOTO produces this book-length content autonomously. It should be noted that this long-form answer is often so detailed that for any AI critique it requires the system to fully direct-inject the paper content. Providing an attempt at a novel 40,000 academic volume to a cloud agent using RAG (summarization-like techniques) may provide mixed results. MOTO strives to direct inject all content where possible. The built in “critique” feature allows the user to direct inject the full 40,000+ word volume into nearly any AI model of their choice. If the system decides to do a long form answer it will collect any relevant papers it has written, take only the best and related ones, organize them into chapters, write any gap papers, write the conclusion, and then lastly write the introduction chapter. This reverse order, body first, conclusion second, then introduction portion(s) last is crucial to allow MOTO the ability to be creative as it write. 
The traditional introduction -> body -> conclusion writing style ensures we limit any non-Markovian constraints on the creative process. In other words, if the system wrote its introduction first, the body paragraphs are locked in and bound to the rules the introduction set. Writing the body section first gives the system greater freedom to discover as it writes as it is not bound by a detailed introduction. MOTO is an experimental system, the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
 
@@ -45,15 +55,20 @@ Before installation, you need:
    - **Load the LM Studio RAG agent [optional but HIGHLY recommended for much faster outputs/answers]**: Load the embedding model `nomic-ai/nomic-embed-text-v1.5` in your LM studio "Developer" tab (server tab) (search for "nomic-ai/nomic-embed-text-v1.5" to download it in the LM studio downloads center). Please note: you may need to enable "Power User" or "Developer" to see this developer tab - this server will let you load the amount and capacity of simultaneous models that your PC will suport. In this develop tab is where you load both your nomic-ai embedding agent and any optional local hosted agents you want to use in the program (I.e. GPT OSS 20b, DeepSeek 32B, etc). **If you do not not download LM studio and enable the Nomic agent the system will run much slower and cost a slightly more due to having to use the paid service OpenRouter for RAG calls.**
    - Start the local server (port 1234)
 4. **If using cloud AI - Get an OpenRouter API key**: Sign up at OpenRouter.ai and get a paid or free API key to use the most powerful cloud models available from your favorite providers. OpenRouter may also offer a certain amount of free API calls per day with your account key. When you download the MOTO deep research harness, you can see which models are free by checking the "show only free models" check box(es) in the MOTO app settings.
+5. **On first startup, pick your provider path**: After you acknowledge the disclaimer, MOTO will prompt you to either enter an OpenRouter key or confirm that LM Studio is running. If you save an OpenRouter key there, the recommended default autonomous profile is applied immediately so you can open Settings and see it already selected.
 
 ### Installation
 
 #### Windows (One-Click Launcher)
 
 1. Clone or download this repository
-2. Start LM Studio and load your models and "nomic-embed-text-v1.5" agent **and/or** enter OpenRouter API key
+2. Start LM Studio and load your models and "nomic-embed-text-v1.5" agent **and/or** have your OpenRouter API key ready
 3. **Double-click `Press to Launch MOTO.bat`**
-4. The launcher will:
+4. After acknowledging the disclaimer, choose one of the startup setup paths:
+   - Enter your OpenRouter API key
+   - Confirm that LM Studio is already running with a loaded model
+   - After either path, open Settings to keep the recommended profile or switch to your saved team profile or another default profile
+5. The launcher will:
    - Check all prerequisites
    - Install Python and Node.js dependencies automatically
    - Create necessary directories
@@ -338,6 +353,8 @@ All content generated by this system is for informational purposes only. Papers
 ## 🔗 Links
 
 - **Website**: https://intrafere.com
+- **Top-P Exploration (ASI Discovery)**: https://intrafere.com/structured-brainstorming-validated-feedback/
+- **Learning Curve Data**: https://intrafere.com/motos-brainstorming-potential-data/
 - **Program Info**: https://intrafere.com/moto-autonomous-home-ai/
 - **News & Updates**: https://intrafere.com/moto-news/
 - **Donate**: https://intrafere.com/donate/
diff --git a/_moto_internal_launcher.ps1 b/_moto_internal_launcher.ps1
index beb0146..8e21bba 100644
--- a/_moto_internal_launcher.ps1
+++ b/_moto_internal_launcher.ps1
@@ -28,7 +28,7 @@ try {
     }
 
     # Check for Python
-    Write-Host "[1/6] Checking Python installation..." -ForegroundColor Yellow
+    Write-Host "[1/8] Checking Python installation..." -ForegroundColor Yellow
     if (-not (Test-Command python)) {
         Write-Host ""
         Write-Host "============================================================" -ForegroundColor Red
@@ -46,7 +46,7 @@ try {
     Write-Host ""
 
     # Check for Node.js
-    Write-Host "[2/6] Checking Node.js installation..." -ForegroundColor Yellow
+    Write-Host "[2/8] Checking Node.js installation..." -ForegroundColor Yellow
     if (-not (Test-Command node)) {
         Write-Host ""
         Write-Host "============================================================" -ForegroundColor Red
@@ -63,8 +63,8 @@ try {
     Write-Host "npm: $npmVersion" -ForegroundColor Green
     Write-Host ""
 
-    # Create necessary directories
-    Write-Host "[3/6] Creating necessary directories..." -ForegroundColor Yellow
+    # Create necessary directories & clean ChromaDB
+    Write-Host "[3/8] Creating necessary directories..." -ForegroundColor Yellow
     $directories = @(
         "backend\data",
         "backend\data\user_uploads",
@@ -77,35 +77,38 @@ try {
         }
     }
     Write-Host "Directories ready!" -ForegroundColor Green
+    
+    # Clean ChromaDB on startup to prevent corruption issues
+    $chromaPath = "backend\data\chroma_db"
+    if (Test-Path $chromaPath) {
+        Write-Host "Cleaning ChromaDB database..." -ForegroundColor Yellow
+        Remove-Item -Path $chromaPath -Recurse -Force
+        Write-Host "ChromaDB cleaned!" -ForegroundColor Green
+    }
     Write-Host ""
 
-    # Check/Install Python dependencies
-    Write-Host "[4/6] Checking Python dependencies..." -ForegroundColor Yellow
-    $pipList = pip list 2>&1
-    if ($pipList -notmatch "fastapi") {
-        Write-Host "Installing Python dependencies..." -ForegroundColor Yellow
-        Write-Host "This may take a few minutes..." -ForegroundColor Yellow
+    # Install/Update Python dependencies
+    Write-Host "[4/8] Installing Python dependencies..." -ForegroundColor Yellow
+    Write-Host "Upgrading pip and checking packages..." -ForegroundColor Yellow
+    Write-Host ""
+    python -m pip install --upgrade pip 2>&1 | Out-Null
+    pip install --upgrade -r requirements.txt
+    if ($LASTEXITCODE -ne 0) {
         Write-Host ""
-        pip install -r requirements.txt
-        if ($LASTEXITCODE -ne 0) {
-            Write-Host ""
-            Write-Host "============================================================" -ForegroundColor Red
-            Write-Host "ERROR: Failed to install Python dependencies" -ForegroundColor Red
-            Write-Host "============================================================" -ForegroundColor Red
-            Write-Host ""
-            Write-Host "Please check:" -ForegroundColor Yellow
-            Write-Host "- Internet connection is working" -ForegroundColor Yellow
-            Write-Host "- You have permission to install packages" -ForegroundColor Yellow
-            Exit-WithPause -ExitCode 1
-        }
-        Write-Host "Python dependencies installed successfully" -ForegroundColor Green
-    } else {
-        Write-Host "Python dependencies already installed" -ForegroundColor Green
+        Write-Host "============================================================" -ForegroundColor Red
+        Write-Host "ERROR: Failed to install Python dependencies" -ForegroundColor Red
+        Write-Host "============================================================" -ForegroundColor Red
+        Write-Host ""
+        Write-Host "Please check:" -ForegroundColor Yellow
+        Write-Host "- Internet connection is working" -ForegroundColor Yellow
+        Write-Host "- You have permission to install packages" -ForegroundColor Yellow
+        Exit-WithPause -ExitCode 1
     }
+    Write-Host "Python dependencies up to date" -ForegroundColor Green
     Write-Host ""
 
     # Install Playwright Chromium browser (one-time ~150MB download for PDF generation)
-    Write-Host "[4b/6] Installing Playwright Chromium browser for PDF generation..." -ForegroundColor Yellow
+    Write-Host "[4b/8] Installing Playwright Chromium browser for PDF generation..." -ForegroundColor Yellow
     Write-Host "This is a one-time download (~150MB) and may take a few minutes..." -ForegroundColor Yellow
     Write-Host ""
     python -m playwright install chromium 2>&1
@@ -121,7 +124,7 @@ try {
     Write-Host ""
 
     # Check/Install Node.js dependencies
-    Write-Host "[5/6] Checking Node.js dependencies..." -ForegroundColor Yellow
+    Write-Host "[5/8] Checking Node.js dependencies..." -ForegroundColor Yellow
     if (-not (Test-Path "frontend")) {
         Write-Host ""
         Write-Host "============================================================" -ForegroundColor Red
@@ -160,7 +163,7 @@ try {
     Write-Host ""
 
     # Check for LM Studio (optional - OpenRouter is an alternative)
-    Write-Host "[6/6] Checking LM Studio..." -ForegroundColor Yellow
+    Write-Host "[6/8] Checking LM Studio..." -ForegroundColor Yellow
     Write-Host ""
     
     # Check if LM Studio is responding
@@ -194,7 +197,7 @@ try {
     Write-Host ""
 
     # Clean up any existing processes on ports 8000 and 5173
-    Write-Host "[7/7] Cleaning up existing processes on ports 8000 and 5173..." -ForegroundColor Yellow
+    Write-Host "[7/8] Cleaning up existing processes on ports 8000 and 5173..." -ForegroundColor Yellow
     Write-Host ""
     
     # Kill processes on port 8000
@@ -247,6 +250,8 @@ try {
     Write-Host ""
 
     # Start the system
+    Write-Host "[8/8] Starting services..." -ForegroundColor Yellow
+    Write-Host ""
     Write-Host "================================================================" -ForegroundColor Cyan
     Write-Host "  All checks passed! Starting system..." -ForegroundColor Cyan
     Write-Host "================================================================" -ForegroundColor Cyan
diff --git a/backend/aggregator/agents/submitter.py b/backend/aggregator/agents/submitter.py
index f72e613..de2e5b3 100644
--- a/backend/aggregator/agents/submitter.py
+++ b/backend/aggregator/agents/submitter.py
@@ -273,9 +273,17 @@ async def _generate_submission(self) -> Optional[Submission]:
                             self.task_tracking_callback("completed", task_id)
                         return None  # Return None instead of crashing
                         
+                except FreeModelExhaustedError:
+                    raise
+                except RuntimeError as e:
+                    if "credits exhausted" in str(e).lower():
+                        raise FreeModelExhaustedError(str(e), soonest_retry=None)
+                    logger.error(f"Submitter {self.submitter_id}: Unexpected error during completion: {e}")
+                    if self.task_tracking_callback:
+                        self.task_tracking_callback("completed", task_id)
+                    return None
                 except Exception as e:
                     logger.error(f"Submitter {self.submitter_id}: Unexpected error during completion: {e}")
-                    # Notify task completed (failed but still completed)
                     if self.task_tracking_callback:
                         self.task_tracking_callback("completed", task_id)
                     return None
diff --git a/backend/aggregator/core/context_allocator.py b/backend/aggregator/core/context_allocator.py
index 6e1952a..36d8178 100644
--- a/backend/aggregator/core/context_allocator.py
+++ b/backend/aggregator/core/context_allocator.py
@@ -4,6 +4,7 @@
 """
 from typing import Dict, List, Optional
 import logging
+from pathlib import Path
 
 from backend.shared.config import rag_config
 from backend.shared.models import ContextPack
@@ -45,6 +46,32 @@ def set_context_windows(self, submitter_context: int, validator_context: int,
         if validator_max_output is not None:
             self.validator_max_output_tokens = validator_max_output
         logger.info(f"Context windows updated - Submitter: {submitter_context}, Validator: {validator_context}")
+
+    def _get_shared_training_rag_sources(self) -> List[str]:
+        """
+        Get RAG source names that map to shared-training content.
+
+        Used to exclude shared-training chunks from RAG when the same
+        shared-training content is already direct-injected into the prompt.
+        """
+        sources: List[str] = []
+
+        # Current shared-training file source (manual mode: rag_shared_training.txt,
+        # autonomous mode: brainstorm_<topic_id>.txt)
+        try:
+            from backend.aggregator.memory.shared_training import shared_training_memory  # function-scope import; NOTE(review): presumably avoids a circular import - confirm
+            current_source = Path(shared_training_memory.file_path).name  # basename only; NOTE(review): assumes RAG chunks are tagged with the file's basename - confirm
+            if current_source:
+                sources.append(current_source)  # NOTE(review): the coordinator's cleanup rebuild also treats "<file>.tmp" as a shared-training source; confirm whether it must be excluded here too
+        except Exception as e:  # best-effort: on any failure the current file is simply left out of the list
+            logger.debug(f"Could not resolve shared-training source name for exclusion: {e}")
+
+        # Incremental re-RAG sources used by aggregator background updates
+        for chunk_size in rag_config.submitter_chunk_intervals:  # one update source name per configured chunk size
+            sources.append(f"rag_shared_training_update_{chunk_size}")
+
+        # De-dup while preserving insertion order
+        return list(dict.fromkeys(sources))
     
     async def allocate_submitter_context(
         self,
@@ -184,6 +211,15 @@ async def allocate_submitter_context(
         # Perform RAG retrieval ONLY if content was offloaded
         rag_context = None
         if any([needs_shared_training_rag, needs_local_training_rag, needs_rejection_log_rag, needs_user_files_rag]):
+            # Build exclusion list: sources that were direct-injected should not appear in RAG
+            exclude_sources = []
+            if not needs_shared_training_rag and shared_training_content:
+                exclude_sources.extend(self._get_shared_training_rag_sources())
+            if not needs_user_files_rag and user_files_content:
+                exclude_sources.extend(user_files_content.keys())
+            if exclude_sources:
+                exclude_sources = list(dict.fromkeys(exclude_sources))
+            
             # FIXED: Calculate RAG budget from REMAINING space after direct injection
             # This ensures we maximize context usage without exceeding limits
             direct_content_temp = "\n\n".join(direct_parts)
@@ -216,7 +252,8 @@ async def allocate_submitter_context(
             rag_context = await rag_manager.retrieve(
                 query=user_prompt,
                 chunk_size=chunk_size,  # Cycles: 256→512→768→1024
-                max_tokens=rag_max_tokens
+                max_tokens=rag_max_tokens,
+                exclude_sources=exclude_sources if exclude_sources else None
             )
             
             if rag_context and rag_context.text:
@@ -343,6 +380,15 @@ async def allocate_validator_context(
         # Perform RAG retrieval ONLY if content was offloaded
         rag_context = None
         if needs_shared_training_rag or needs_user_files_rag:
+            # Build exclusion list: sources that were direct-injected should not appear in RAG
+            exclude_sources = []
+            if not needs_shared_training_rag and shared_training_content:
+                exclude_sources.extend(self._get_shared_training_rag_sources())
+            if not needs_user_files_rag and user_files_content:
+                exclude_sources.extend(user_files_content.keys())
+            if exclude_sources:
+                exclude_sources = list(dict.fromkeys(exclude_sources))
+            
             # FIXED: Calculate RAG budget from REMAINING space after direct injection
             # This ensures we maximize context usage without exceeding limits
             direct_content_temp = "\n\n".join(direct_parts)
@@ -375,7 +421,8 @@ async def allocate_validator_context(
             rag_context = await rag_manager.retrieve(
                 query=user_prompt,
                 chunk_size=chunk_size,  # Always 512 for validator
-                max_tokens=rag_max_tokens
+                max_tokens=rag_max_tokens,
+                exclude_sources=exclude_sources if exclude_sources else None
             )
             
             if rag_context and rag_context.text:
@@ -503,6 +550,15 @@ async def allocate_cleanup_review_context(
         # Perform RAG retrieval if content was offloaded
         rag_context = None
         if needs_submissions_rag or needs_user_files_rag:
+            # Build exclusion list: sources that were direct-injected should not appear in RAG
+            exclude_sources = []
+            if not needs_submissions_rag and all_submissions_formatted:
+                exclude_sources.extend(self._get_shared_training_rag_sources())
+            if not needs_user_files_rag and user_files_content:
+                exclude_sources.extend(user_files_content.keys())
+            if exclude_sources:
+                exclude_sources = list(dict.fromkeys(exclude_sources))
+            
             # Calculate RAG budget from remaining space
             direct_content_temp = "\n\n".join(direct_parts)
             direct_content_tokens = count_tokens(direct_content_temp)
@@ -520,12 +576,11 @@ async def allocate_cleanup_review_context(
                 f"direct_content={direct_content_tokens}"
             )
             
-            # Use the user prompt as query for RAG - this will retrieve relevant submissions
-            # For cleanup, we want to find similar/redundant content
             rag_context = await rag_manager.retrieve(
                 query=user_prompt,
                 chunk_size=512,  # Use validator's standard chunk size
-                max_tokens=rag_max_tokens
+                max_tokens=rag_max_tokens,
+                exclude_sources=exclude_sources if exclude_sources else None
             )
             
             if rag_context and rag_context.text:
diff --git a/backend/aggregator/core/coordinator.py b/backend/aggregator/core/coordinator.py
index 3c640ab..3767c89 100644
--- a/backend/aggregator/core/coordinator.py
+++ b/backend/aggregator/core/coordinator.py
@@ -80,6 +80,9 @@ def __init__(self):
         
         # Submitter pause control (queue overflow prevention)
         self.should_pause_submitters = False  # Flag to pause submitters when queue >= 10
+        
+        # Cleanup review toggle (disabled for short-lived mini-brainstorm phases)
+        self.enable_cleanup_review = True
     
     async def _load_stats(self) -> None:
         """Load persisted stats from file."""
@@ -128,7 +131,8 @@ async def initialize(
         validator_max_tokens: Optional[int] = None,
         validator_provider: str = "lm_studio",
         validator_openrouter_provider: Optional[str] = None,
-        validator_lm_studio_fallback: Optional[str] = None
+        validator_lm_studio_fallback: Optional[str] = None,
+        enable_cleanup_review: bool = True
     ) -> None:
         """
         Initialize the coordinator with configuration.
@@ -147,6 +151,9 @@ async def initialize(
         """
         logger.info("Initializing coordinator...")
         
+        # Store cleanup review toggle
+        self.enable_cleanup_review = enable_cleanup_review
+        
         # Validate submitter count
         num_submitters = len(submitter_configs)
         if not (system_config.min_submitters <= num_submitters <= system_config.max_submitters):
@@ -793,7 +800,7 @@ async def _handle_acceptance(self, submission: Submission, result: ValidationRes
         await self._save_stats()
         
         # Trigger cleanup review every 7 acceptances
-        if self.total_acceptances % 7 == 0 and self.total_acceptances > 0:
+        if self.enable_cleanup_review and self.total_acceptances % 7 == 0 and self.total_acceptances > 0:
             await self._perform_cleanup_review()
     
     async def _handle_rejection(self, submission: Submission, result: ValidationResult) -> None:
@@ -938,7 +945,7 @@ async def _perform_cleanup_review(self) -> None:
             
             # Phase 4: Execute the removal
             logger.info(f"CLEANUP DEBUG: >>> PHASE 4: Executing removal of submission #{submission_number}...")
-            removal_success = await shared_training_memory.remove_submission(submission_number)
+            removal_success = await shared_training_memory.remove_submission(submission_number, trigger_rechunk=False)
             logger.info(f"CLEANUP DEBUG: <<< PHASE 4 Complete: removal_success={removal_success}")
             
             if removal_success:
@@ -956,6 +963,9 @@ async def _perform_cleanup_review(self) -> None:
                     "total_removals": self.removals_executed
                 })
                 
+                # Full RAG rebuild so deleted content is no longer retrievable
+                await self._rebuild_shared_training_rag_after_cleanup()
+                
                 # Log key event to persistent log
                 await event_log.add_event(
                     "cleanup_submission_removed",
@@ -1079,6 +1089,43 @@ async def _rechunk_training_data(self) -> None:
             # ALWAYS RELEASE LOCK
             rag_operation_lock.release()
     
+    async def _rebuild_shared_training_rag_after_cleanup(self) -> None:
+        """Full RAG rebuild of shared-training content after a cleanup removal.
+        
+        The normal incremental rechunk path is append-only and cannot remove
+        deleted content from RAG. After a prune we must drop all shared-training
+        RAG sources and re-add the current (post-removal) file so retrieval
+        results stay consistent with the live database.
+        """
+        current_path = Path(shared_training_memory.file_path)  # NOTE(review): no import hunk for Path is visible in this file's diff; confirm it is already imported
+        current_count = await shared_training_memory.get_insights_count()  # read before the lock is taken; NOTE(review): confirm the count cannot go stale before re-indexing
+        
+        await rag_operation_lock.acquire("Aggregator cleanup full re-rag")
+        try:
+            # Collect every source name that could contain shared-training chunks
+            candidate_sources = [current_path.name, current_path.with_suffix(".tmp").name]
+            for size in rag_config.submitter_chunk_intervals:
+                candidate_sources.append(f"rag_shared_training_update_{size}")
+            
+            for source in dict.fromkeys(candidate_sources):  # dict.fromkeys drops duplicate names while keeping order
+                if source in rag_manager.document_access_order:  # only remove sources the RAG manager currently tracks
+                    await rag_manager.remove_document(source)
+            
+            if current_count > 0 and current_path.exists():  # nothing to re-index when the store is empty or the file is missing
+                await rag_manager.add_document(
+                    str(current_path),
+                    chunk_sizes=rag_config.submitter_chunk_intervals,
+                    is_user_file=False,
+                )
+            
+            await shared_training_memory.mark_submissions_ragged(current_count)  # runs even when re-indexing was skipped above
+            logger.info(f"Cleanup full re-RAG complete: {current_count} live submissions re-indexed")
+        except Exception as e:
+            logger.error(f"Cleanup full re-RAG failed: {e}", exc_info=True)
+            raise  # propagate to the caller after logging; the lock is still released below
+        finally:
+            rag_operation_lock.release()
+    
     async def get_status(self) -> SystemStatus:
         """Get current system status."""
         queue_size = await queue_manager.size()
diff --git a/backend/aggregator/core/rag_manager.py b/backend/aggregator/core/rag_manager.py
index 766cd6f..156a046 100644
--- a/backend/aggregator/core/rag_manager.py
+++ b/backend/aggregator/core/rag_manager.py
@@ -91,10 +91,11 @@ async def add_document(
             for chunk_size, chunks in chunks_by_size.items():
                 await self._add_chunks(chunks, chunk_size)
             
-            # Track document
+            # Track document (only increment count for genuinely new sources)
             source_name = Path(file_path).name
-            self.document_count += 1
-            self.document_access_order[source_name] = time.time()  # LRU tracking
+            if source_name not in self.document_access_order:
+                self.document_count += 1
+            self.document_access_order[source_name] = time.time()
             if is_user_file:
                 self.permanent_documents.add(source_name)
             
@@ -102,6 +103,9 @@ async def add_document(
             if self.document_count > rag_config.max_documents:
                 await self._evict_lru_document()
             
+            # Enforce per-size chunk cap
+            await self._enforce_chunk_cap()
+            
             logger.info(f"Added document: {file_path}")
             
         except Exception as e:
@@ -137,9 +141,10 @@ async def add_text(
             for chunk_size, chunks in chunks_by_size.items():
                 await self._add_chunks(chunks, chunk_size)
             
-            # Track document
-            self.document_count += 1
-            self.document_access_order[source_name] = time.time()  # LRU tracking
+            # Track document (only increment count for genuinely new sources)
+            if source_name not in self.document_access_order:
+                self.document_count += 1
+            self.document_access_order[source_name] = time.time()
             if is_permanent:
                 self.permanent_documents.add(source_name)
             
@@ -147,6 +152,9 @@ async def add_text(
             if self.document_count > rag_config.max_documents:
                 await self._evict_lru_document()
             
+            # Enforce per-size chunk cap
+            await self._enforce_chunk_cap()
+            
             logger.info(f"Added text: {source_name}")
             
         except Exception as e:
@@ -157,7 +165,8 @@ async def retrieve(
         self,
         query: str,
         chunk_size: int = 512,
-        max_tokens: int = None
+        max_tokens: int = None,
+        exclude_sources: Optional[List[str]] = None
     ) -> ContextPack:
         """
         4-stage retrieval pipeline.
@@ -166,6 +175,7 @@ async def retrieve(
             query: Search query
             chunk_size: Chunk size to retrieve from
             max_tokens: Maximum tokens in result
+            exclude_sources: Source names to skip during packing (already direct-injected)
         
         Returns:
             ContextPack with retrieved context
@@ -189,7 +199,9 @@ async def retrieve(
         
         # Stage D: Packing + Compression
         logger.debug(f"RAG Stage 4/4: Packing and compression (max_tokens={max_tokens})")
-        context_pack = await self._pack_and_compress(ranked_chunks, query, max_tokens)
+        if exclude_sources:
+            logger.info(f"RAG Stage 4/4: Excluding sources already direct-injected: {exclude_sources}")
+        context_pack = await self._pack_and_compress(ranked_chunks, query, max_tokens, exclude_sources)
         logger.debug(f"RAG Stage 4/4 complete: Packed {len(context_pack.evidence)} evidence items, coverage={context_pack.coverage:.2f}")
         
         return context_pack
@@ -309,11 +321,9 @@ async def _vector_search(
         if not chunks:
             return []
         
+        query_embeddings = await api_client_manager.get_embeddings(queries)
         all_results = []
-        for query in queries:
-            # Get query embedding
-            query_embedding = await api_client_manager.get_embeddings([query])
-            
+        for query_embedding in query_embeddings:
             # Search with retry logic for transient HNSW errors during concurrent writes
             max_retries = 3
             retry_delay = 0.5  # Start with 500ms delay
@@ -322,7 +332,7 @@ async def _vector_search(
             for attempt in range(max_retries):
                 try:
                     results = collection.query(
-                        query_embeddings=query_embedding,
+                        query_embeddings=[query_embedding],
                         n_results=min(rag_config.hybrid_recall_top_k, len(chunks))
                     )
                     break  # Success - exit retry loop
@@ -480,13 +490,16 @@ async def _pack_and_compress(
         self,
         chunks: List[DocumentChunk],
         query: str,
-        max_tokens: int
+        max_tokens: int,
+        exclude_sources: Optional[List[str]] = None
     ) -> ContextPack:
         """
         Stage D: Pack chunks into ContextPack with strict token limit enforcement.
         
         CRITICAL: This function MUST NOT exceed max_tokens. We pack chunks incrementally
         until we hit the limit, then stop. Compression is NOT used because it's unreliable.
+        
+        Chunks from exclude_sources are skipped (already direct-injected in the prompt).
         """
         if not chunks:
             return ContextPack(
@@ -498,32 +511,43 @@ async def _pack_and_compress(
                 needs_more_context=True
             )
         
+        exclude_set = set(exclude_sources) if exclude_sources else set()
+        skipped_count = 0
+        
         # Assemble evidence INCREMENTALLY until we hit max_tokens
         evidence = []
         source_map = {}
         assembled_text = []
         current_tokens = 0
+        evidence_idx = 0
         
-        for idx, chunk in enumerate(chunks, start=1):
+        for chunk in chunks:
+            # Skip chunks from excluded sources (already direct-injected)
+            if chunk.source_file in exclude_set:
+                skipped_count += 1
+                continue
+            
+            evidence_idx += 1
+            
             # Format this chunk's evidence entry
-            chunk_entry = f"[Evidence {idx} from {chunk.source_file}]\n{chunk.text}\n"
+            chunk_entry = f"[Evidence {evidence_idx} from {chunk.source_file}]\n{chunk.text}\n"
             chunk_tokens = count_tokens(chunk_entry)
             
             # Check if adding this chunk would exceed limit
             if current_tokens + chunk_tokens > max_tokens:
                 # Stop here - we've hit the limit
-                logger.debug(f"RAG packing stopped at {idx-1}/{len(chunks)} chunks ({current_tokens} tokens, limit={max_tokens})")
+                logger.debug(f"RAG packing stopped at {evidence_idx-1} packed chunks ({current_tokens} tokens, limit={max_tokens})")
                 break
             
             # Add this chunk
             evidence_entry = {
-                "id": idx,
+                "id": evidence_idx,
                 "source": chunk.source_file,
                 "text": chunk.text,
                 "position": chunk.position
             }
             evidence.append(evidence_entry)
-            source_map[f"E{idx}"] = chunk.source_file
+            source_map[f"E{evidence_idx}"] = chunk.source_file
             assembled_text.append(chunk_entry)
             current_tokens += chunk_tokens
             
@@ -531,6 +555,9 @@ async def _pack_and_compress(
             if chunk.source_file in self.document_access_order:
                 self.document_access_order[chunk.source_file] = time.time()
         
+        if skipped_count > 0:
+            logger.info(f"RAG packing: Skipped {skipped_count} chunks from excluded sources (already direct-injected)")
+        
         full_text = "\n".join(assembled_text)
         token_count = current_tokens  # We already counted during packing
         
@@ -556,6 +583,38 @@ async def _pack_and_compress(
             needs_more_context=coverage < rag_config.coverage_threshold
         )
     
+    async def _enforce_chunk_cap(self) -> None:
+        """Evict non-permanent chunks, in list order, from every size bucket over max_chunks_per_size; permanent chunks are never evicted, so a bucket can stay over the cap."""
+        cap = rag_config.max_chunks_per_size
+        for chunk_size in rag_config.submitter_chunk_intervals:
+            chunks = self.chunks_by_size[chunk_size]
+            if len(chunks) <= cap:
+                continue
+
+            overflow = len(chunks) - cap
+            evict_ids = []
+            keep = []
+            removed = 0
+
+            for chunk in chunks:  # list order; presumably oldest first - confirm against how chunks are appended
+                if removed < overflow and not chunk.is_permanent:
+                    evict_ids.append(chunk.chunk_id)
+                    chunk.embedding = None
+                    removed += 1
+                else:
+                    keep.append(chunk)
+
+            if evict_ids:
+                collection = self.collections[chunk_size]
+                try:
+                    collection.delete(ids=evict_ids)
+                except Exception as e:  # best-effort: the in-memory trim below still happens if this delete fails
+                    logger.error(f"ChromaDB delete during chunk cap enforcement (size={chunk_size}): {e}")
+
+                self.chunks_by_size[chunk_size] = keep
+                self.bm25_index[chunk_size] = None  # invalidate BM25 for this bucket
+                logger.info(f"Chunk cap enforced for size={chunk_size}: removed {len(evict_ids)} oldest non-permanent chunks ({len(keep)} remaining)")
+
     async def _evict_lru_document(self) -> None:
         """Evict least recently used document (except permanent ones)."""
         # Find oldest non-permanent document
@@ -585,6 +644,8 @@ async def _evict_lru_document(self) -> None:
     
     async def remove_document(self, source_name: str) -> None:
         """Remove a document from all collections."""
+        was_tracked = source_name in self.document_access_order
+        
         for chunk_size in rag_config.submitter_chunk_intervals:
             # Remove from memory
             self.chunks_by_size[chunk_size] = [
@@ -602,7 +663,8 @@ async def remove_document(self, source_name: str) -> None:
             # Invalidate BM25
             self.bm25_index[chunk_size] = None
         
-        self.document_count -= 1
+        if was_tracked:
+            self.document_count = max(0, self.document_count - 1)
         
         # Clean up LRU tracking
         if source_name in self.document_access_order:
@@ -664,6 +726,7 @@ def clear_all_documents(self) -> None:
             # Reset counters
             self.document_count = 0
             self.permanent_documents.clear()
+            self.document_access_order.clear()
             
             if collection_errors:
                 logger.warning(f"RAG cleared with {len(collection_errors)} non-critical warnings: {'; '.join(collection_errors)}")
diff --git a/backend/aggregator/memory/shared_training.py b/backend/aggregator/memory/shared_training.py
index d3e5499..5460d66 100644
--- a/backend/aggregator/memory/shared_training.py
+++ b/backend/aggregator/memory/shared_training.py
@@ -94,8 +94,9 @@ async def reload_insights_from_current_path(self) -> None:
                                 default=0
                             )
                             self.submission_count = max_number
-                            # Set last_ragged to current count so new submissions start from here
-                            self.last_ragged_submission_count = self.submission_count
+                            # Use entry count (not max number) so post-prune gaps
+                            # don't cause the next acceptance to be skipped from RAG
+                            self.last_ragged_submission_count = len(self.insights)
                         else:
                             self.submission_count = 0
                 
@@ -263,7 +264,7 @@ async def get_submission_content(self, submission_number: int) -> Optional[str]:
                     return insight['content']
             return None
     
-    async def remove_submission(self, submission_number: int) -> bool:
+    async def remove_submission(self, submission_number: int, trigger_rechunk: bool = True) -> bool:
         """
         Remove a submission from the shared training database.
         
@@ -272,6 +273,8 @@ async def remove_submission(self, submission_number: int) -> bool:
         
         Args:
             submission_number: The submission number to remove
+            trigger_rechunk: Whether to fire the incremental rechunk callback.
+                Set False when the caller will do a full RAG rebuild instead.
             
         Returns:
             True if submission was found and removed, False otherwise
@@ -292,7 +295,7 @@ async def remove_submission(self, submission_number: int) -> bool:
                 await self._save()
                 
                 # Trigger re-chunking callback to update RAG
-                if self.rechunk_callback:
+                if trigger_rechunk and self.rechunk_callback:
                     try:
                         logger.info(f"Triggering re-chunking callback after removal of submission #{submission_number}")
                         await self.rechunk_callback()
diff --git a/backend/aggregator/prompts/submitter_prompts.py b/backend/aggregator/prompts/submitter_prompts.py
index 6a9f5bd..78ffd08 100644
--- a/backend/aggregator/prompts/submitter_prompts.py
+++ b/backend/aggregator/prompts/submitter_prompts.py
@@ -40,6 +40,8 @@ def get_submitter_system_prompt() -> str:
 YOUR TASK:
 Generate a novel mathematical insight that advances the user's goal.
 
+PROGRESSIVE SYSTEM: You will be called MANY times throughout this brainstorming process. Each call should produce ONE deep, well-developed mathematical insight. Do not try to cover everything at once — focus on thoroughly developing a single avenue per submission with full rigor. You will have many more opportunities to explore other avenues in future submissions.
+
 Focus on mathematical concepts, theorems, techniques, and proofs that may provide an avenue towards solving or understanding the mathematical problem in the prompt. Use all available resources including web search if available.
 
 WHAT MAKES A VALUABLE SUBMISSION - Consider:
diff --git a/backend/api/main.py b/backend/api/main.py
index 50469a5..4639098 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -77,6 +77,10 @@ async def lifespan(app: FastAPI):
     from backend.shared.boost_manager import boost_manager
     boost_manager.set_broadcast_callback(websocket.broadcast_event)
     
+    # Set API client manager broadcaster (token tracking, rate limits, fallbacks)
+    from backend.shared.api_client_manager import api_client_manager
+    api_client_manager.set_broadcast_callback(websocket.broadcast_event)
+    
     logger.info("ASI Aggregator System ready")
     
     yield
@@ -94,7 +98,7 @@ async def lifespan(app: FastAPI):
 app = FastAPI(
     title="ASI Aggregator System",
     description="AI-powered aggregator with RAG and multi-agent validation",
-    version="1.0.4",
+    version="1.0.5",
     lifespan=lifespan
 )
 
@@ -117,7 +121,7 @@ async def root():
     """Root endpoint."""
     return {
         "name": "ASI Aggregator System",
-        "version": "1.0.4",
+        "version": "1.0.5",
         "status": "running"
     }
 
diff --git a/backend/api/routes/aggregator.py b/backend/api/routes/aggregator.py
index 9aae65e..50715b9 100644
--- a/backend/api/routes/aggregator.py
+++ b/backend/api/routes/aggregator.py
@@ -2,7 +2,7 @@
 Aggregator API routes.
 """
 from fastapi import APIRouter, HTTPException, UploadFile, File
-from typing import List
+from typing import List, Optional
 import logging
 from pathlib import Path
 import aiofiles
@@ -10,19 +10,41 @@
 from backend.shared.models import AggregatorStartRequest, SystemStatus, ModelInfo
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.config import system_config, rag_config
+from backend.shared.token_tracker import token_tracker
 from backend.aggregator.core.coordinator import coordinator
 from backend.aggregator.core.context_allocator import context_allocator
 from backend.aggregator.memory.event_log import event_log
+from backend.compiler.core.compiler_coordinator import compiler_coordinator
+from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
 
 logger = logging.getLogger(__name__)
 
 router = APIRouter(prefix="/api/aggregator", tags=["aggregator"])
 
 
+def _get_start_conflict() -> Optional[str]:
+    """Return a user-facing conflict message if another workflow is active."""
+    if coordinator.is_running:
+        return "Aggregator is already running"
+
+    if compiler_coordinator.is_running:
+        return "Cannot start Aggregator while Compiler is running. Stop Compiler first."
+
+    autonomous_state = autonomous_coordinator.get_state()
+    if autonomous_state.is_running:
+        return "Cannot start Aggregator while Autonomous Research is running. Stop Autonomous Research first."
+
+    return None
+
+
 @router.post("/start")
 async def start_aggregator(request: AggregatorStartRequest):
     """Start the aggregator system."""
     try:
+        conflict = _get_start_conflict()
+        if conflict:
+            raise HTTPException(status_code=400, detail=conflict)
+
         # Validate submitter configs
         num_submitters = len(request.submitter_configs)
         if not (system_config.min_submitters <= num_submitters <= system_config.max_submitters):
@@ -50,10 +72,10 @@ async def start_aggregator(request: AggregatorStartRequest):
         # Log submitter configurations
         for config in request.submitter_configs:
             label = "(Main Submitter)" if config.submitter_id == 1 else ""
-        logger.info(
+            logger.info(
                 f"Submitter {config.submitter_id} {label}: model={config.model_id}, "
                 f"context={config.context_window}, max_tokens={config.max_output_tokens}"
-        )
+            )
         logger.info(
             f"Validator: model={request.validator_model}, "
             f"context={request.validator_context_size}, max_tokens={request.validator_max_output_tokens}"
@@ -74,6 +96,8 @@ async def start_aggregator(request: AggregatorStartRequest):
         )
         
         # Start coordinator
+        token_tracker.reset()
+        token_tracker.start_timer()
         await coordinator.start()
         
         return {
@@ -98,6 +122,7 @@ async def stop_aggregator():
     """Stop the aggregator system."""
     try:
         await coordinator.stop()
+        token_tracker.stop_timer()
         return {"status": "stopped", "message": "Aggregator system stopped"}
     except Exception as e:
         logger.error(f"Failed to stop aggregator: {e}")
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index 9f2a925..e101281 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -4,23 +4,380 @@
 """
 import asyncio
 import logging
-from typing import Optional
+import os
+from pathlib import Path
+from typing import Optional, Any, Dict
 from fastapi import APIRouter, HTTPException, BackgroundTasks
 
 from backend.shared.models import AutonomousResearchStartRequest, CritiqueRequest
 from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
-from backend.autonomous.memory.research_metadata import research_metadata
-from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
-from backend.autonomous.memory.paper_library import paper_library
+from backend.autonomous.memory.research_metadata import research_metadata, ResearchMetadata
+from backend.autonomous.memory.brainstorm_memory import brainstorm_memory, BrainstormMemory
+from backend.autonomous.memory.paper_library import paper_library, PaperLibrary
 from backend.autonomous.memory.final_answer_memory import final_answer_memory
 from backend.autonomous.memory.session_manager import session_manager
 from backend.autonomous.memory.autonomous_api_logger import autonomous_api_logger
+from backend.aggregator.core.coordinator import coordinator
+from backend.compiler.core.compiler_coordinator import compiler_coordinator
 
 logger = logging.getLogger(__name__)
 
 router = APIRouter(prefix="/api/auto-research", tags=["autonomous"])
 
 
+def _get_active_autonomous_session_id() -> str:
+    """Return the active autonomous session identifier, falling back to legacy mode."""
+    return session_manager.session_id if session_manager.is_session_active else "legacy"
+
+
+def _validate_history_session_id(session_id: str) -> None:
+    """Raise HTTP 400 for empty, traversal, separator-bearing or NUL-bearing session IDs before any filesystem path is built; "legacy" is always accepted."""
+    if not session_id:
+        raise HTTPException(status_code=400, detail="Session ID is required")
+
+    if session_id == "legacy":
+        return
+
+    if session_id in {".", ".."} or any(ch in session_id for ch in ("/", "\\", "\x00")):  # NUL can make Path.resolve() raise ValueError downstream
+        raise HTTPException(status_code=400, detail=f"Invalid session ID: {session_id}")
+
+
+def _get_start_conflict() -> Optional[str]:
+    """Return a user-facing conflict message if another workflow is active."""
+    autonomous_state = autonomous_coordinator.get_state()
+    if autonomous_state.is_running:
+        return "Autonomous research is already running"
+
+    if coordinator.is_running:
+        return "Cannot start Autonomous Research while Aggregator is running. Stop Aggregator first."
+
+    if compiler_coordinator.is_running:
+        return "Cannot start Autonomous Research while Compiler is running. Stop Compiler first."
+
+    return None
+
+
+def _resolve_history_session_paths(session_id: str) -> Dict[str, Path]:
+    """Resolve all session-specific paths needed for Stage 2 paper history operations."""
+    from backend.shared.config import system_config
+
+    _validate_history_session_id(session_id)
+
+    if session_id == "legacy":
+        paths = {
+            "papers_dir": Path(system_config.auto_papers_dir),
+            "brainstorms_dir": Path(system_config.auto_brainstorms_dir),
+            "metadata_path": Path(system_config.auto_research_metadata_file),
+            "stats_path": Path(system_config.auto_research_stats_file),
+            "workflow_state_path": Path(system_config.auto_workflow_state_file),
+        }
+    else:
+        sessions_root = Path(system_config.auto_sessions_base_dir).resolve()
+        session_root = (sessions_root / session_id).resolve()
+
+        if session_root.parent != sessions_root:
+            raise HTTPException(status_code=400, detail=f"Invalid session ID: {session_id}")
+
+        if not session_root.exists():
+            raise HTTPException(status_code=404, detail=f"Session not found: {session_id}")
+
+        paths = {
+            "papers_dir": session_root / "papers",
+            "brainstorms_dir": session_root / "brainstorms",
+            "metadata_path": session_root / "session_metadata.json",
+            "stats_path": session_root / "session_stats.json",
+            "workflow_state_path": session_root / "workflow_state.json",
+        }
+
+    if not paths["papers_dir"].exists():
+        raise HTTPException(
+            status_code=404,
+            detail=f"No Stage 2 papers directory found for session: {session_id}"
+        )
+
+    return paths
+
+
+def _build_scoped_paper_library(paths: Dict[str, Path]) -> PaperLibrary:
+    """Create a temporary PaperLibrary rooted at one legacy/session papers directory."""
+    scoped_library = PaperLibrary()
+    scoped_library._base_dir = paths["papers_dir"]
+    scoped_library._archive_dir = paths["papers_dir"] / "archive"
+    return scoped_library
+
+
+def _build_scoped_brainstorm_memory(paths: Dict[str, Path]) -> BrainstormMemory:
+    """Create a temporary BrainstormMemory rooted at one legacy/session brainstorms directory."""
+    scoped_memory = BrainstormMemory()
+    scoped_memory._base_dir = paths["brainstorms_dir"]
+    return scoped_memory
+
+
+async def _ensure_history_paper_is_visible(
+    scoped_paper_library: PaperLibrary,
+    *,
+    session_id: str,
+    paper_id: str,
+) -> Any:
+    """Ensure a history paper matches the completed/non-archived contract of the history UI."""
+    metadata = await scoped_paper_library.get_metadata(paper_id)
+    if not metadata or metadata.status != "complete":
+        raise HTTPException(
+            status_code=404,
+            detail=f"Paper not found in history: session={session_id}, paper={paper_id}"
+        )
+
+    if not await scoped_paper_library.is_paper_complete(paper_id):
+        raise HTTPException(
+            status_code=404,
+            detail=f"Paper is not available in history: session={session_id}, paper={paper_id}"
+        )
+
+    return metadata
+
+
+async def _build_scoped_research_metadata(paths: Dict[str, Path]) -> ResearchMetadata:
+    """Create a temporary ResearchMetadata instance rooted at one legacy/session metadata set."""
+    scoped_metadata = ResearchMetadata()
+    scoped_metadata._metadata_path = paths["metadata_path"]
+    scoped_metadata._stats_path = paths["stats_path"]
+    scoped_metadata._workflow_state_path = paths["workflow_state_path"]
+    await scoped_metadata.initialize()
+    return scoped_metadata
+
+
+def _resolve_validator_config(request: Optional[CritiqueRequest]) -> Dict[str, Any]:
+    """Resolve critique validator settings from the request or the active coordinator."""
+    validator_model = None
+    validator_context_window = None
+    validator_max_tokens = None
+    validator_provider = None
+    validator_openrouter_provider = None
+    custom_prompt = None
+
+    if request:
+        custom_prompt = request.custom_prompt
+        if request.validator_model:
+            validator_model = request.validator_model
+            validator_context_window = request.validator_context_window or 131072
+            validator_max_tokens = request.validator_max_tokens or 25000
+            validator_provider = request.validator_provider or "lm_studio"
+            validator_openrouter_provider = request.validator_openrouter_provider
+
+    if not validator_model:
+        coordinator_config = autonomous_coordinator.get_validator_config()
+        if coordinator_config:
+            validator_model = coordinator_config["validator_model"]
+            validator_context_window = coordinator_config["validator_context_window"]
+            validator_max_tokens = coordinator_config["validator_max_tokens"]
+            validator_provider = coordinator_config["validator_provider"]
+            validator_openrouter_provider = coordinator_config.get("validator_openrouter_provider")
+
+    if not validator_model:
+        raise HTTPException(
+            status_code=400,
+            detail="No validator model configured. Please configure a validator model in Autonomous Research Settings."
+        )
+
+    return {
+        "custom_prompt": custom_prompt,
+        "validator_model": validator_model,
+        "validator_context_window": validator_context_window,
+        "validator_max_tokens": validator_max_tokens,
+        "validator_provider": validator_provider,
+        "validator_openrouter_provider": validator_openrouter_provider,
+    }
+
+
+async def _generate_autonomous_paper_critique(
+    *,
+    paper_id: str,
+    paper_title: str,
+    content: str,
+    base_path: str,
+    request: Optional[CritiqueRequest] = None,
+) -> Dict[str, Any]:
+    """Generate and persist a critique for an autonomous Stage 2 paper."""
+    from backend.shared.critique_memory import save_critique
+    from backend.shared.critique_prompts import (
+        DEFAULT_CRITIQUE_PROMPT,
+        build_critique_prompt,
+        parse_critique_response,
+    )
+    from backend.shared.api_client_manager import api_client_manager
+    from backend.shared.models import ModelConfig, PaperCritique
+    from backend.shared.utils import count_tokens
+    from datetime import datetime
+    import uuid
+
+    config = _resolve_validator_config(request)
+    prompt_to_use = config["custom_prompt"] or DEFAULT_CRITIQUE_PROMPT
+    full_prompt = build_critique_prompt(content, paper_title, prompt_to_use)
+    prompt_tokens = count_tokens(full_prompt)
+
+    output_reserve = config["validator_max_tokens"]
+    safety_margin = int(config["validator_context_window"] * 0.1)
+    available_input = config["validator_context_window"] - output_reserve - safety_margin
+
+    if prompt_tokens > available_input:
+        excess_tokens = prompt_tokens - available_input
+        raise HTTPException(
+            status_code=400,
+            detail=(
+                f"Paper is too long for the validator's context window. "
+                f"The paper requires {prompt_tokens:,} tokens, but the validator can only accept {available_input:,} tokens "
+                f"(context window: {config['validator_context_window']:,}, output reserve: {output_reserve:,}, safety margin: {safety_margin:,}). "
+                f"The paper exceeds the limit by {excess_tokens:,} tokens. "
+                f"A complete and honest review requires direct context injection - please select a validator with a larger context window."
+            )
+        )
+
+    api_client_manager.configure_role(
+        "paper_critic",
+        ModelConfig(
+            provider=config["validator_provider"],
+            model_id=config["validator_model"],
+            openrouter_model_id=config["validator_model"] if config["validator_provider"] == "openrouter" else None,
+            openrouter_provider=config["validator_openrouter_provider"],
+            lm_studio_fallback_id=None,
+            context_window=config["validator_context_window"],
+            max_output_tokens=config["validator_max_tokens"],
+        )
+    )
+
+    logger.info(f"Requesting critique for paper {paper_id} from validator model {config['validator_model']}")
+
+    response = await api_client_manager.generate_completion(
+        task_id=f"paper_critique_{paper_id}_{datetime.now().strftime('%Y%m%d_%H%M%S')}",
+        role_id="paper_critic",
+        model=config["validator_model"],
+        messages=[{"role": "user", "content": full_prompt}],
+        max_tokens=config["validator_max_tokens"],
+        temperature=0.0,
+    )
+
+    response_content = ""
+    if response.get("choices"):
+        message = response["choices"][0].get("message", {})
+        response_content = message.get("content") or message.get("reasoning") or ""
+
+    if not response_content:
+        raise HTTPException(status_code=500, detail="Empty response from validator model")
+
+    critique_data = parse_critique_response(response_content)
+    critique = PaperCritique(
+        critique_id=str(uuid.uuid4()),
+        model_id=config["validator_model"],
+        provider=config["validator_provider"],
+        host_provider=config["validator_openrouter_provider"],
+        date=datetime.now(),
+        prompt_used=prompt_to_use,
+        novelty_rating=critique_data.get("novelty_rating", 0),
+        novelty_feedback=critique_data.get("novelty_feedback", ""),
+        correctness_rating=critique_data.get("correctness_rating", 0),
+        correctness_feedback=critique_data.get("correctness_feedback", ""),
+        impact_rating=critique_data.get("impact_rating", 0),
+        impact_feedback=critique_data.get("impact_feedback", ""),
+        full_critique=critique_data.get("full_critique", ""),
+    )
+
+    saved_critique = await save_critique("autonomous_paper", critique, paper_id, base_path)
+    return {
+        "success": True,
+        "critique": saved_critique.model_dump(),
+        "paper_id": paper_id,
+        "paper_title": paper_title,
+    }
+
+
+async def _get_autonomous_paper_critiques_response(
+    *,
+    paper_id: str,
+    paper_title: str,
+    base_path: str,
+) -> Dict[str, Any]:
+    """Load critique history for an autonomous Stage 2 paper."""
+    from backend.shared.critique_memory import get_critiques
+
+    critiques = await get_critiques("autonomous_paper", paper_id, base_path)
+    return {
+        "success": True,
+        "paper_id": paper_id,
+        "paper_title": paper_title,
+        "critiques": [critique.model_dump() for critique in critiques],
+        "count": len(critiques),
+    }
+
+
+async def _delete_autonomous_paper_from_scope(
+    *,
+    session_id: str,
+    scoped_paper_library: PaperLibrary,
+    scoped_brainstorm_memory: BrainstormMemory,
+    scoped_research_metadata: ResearchMetadata,
+    paper_id: str,
+) -> Dict[str, Any]:
+    """Delete a Stage 2 paper and clean its related metadata/critique state."""
+    from backend.shared.critique_memory import clear_critiques
+
+    state = autonomous_coordinator.get_state()
+    active_session_id = _get_active_autonomous_session_id()
+    if (
+        state.is_running
+        and state.current_tier == "tier2_paper_writing"
+        and autonomous_coordinator._current_paper_id == paper_id
+        and active_session_id == session_id
+    ):
+        raise HTTPException(
+            status_code=400,
+            detail="Cannot delete active paper while it's being compiled. Stop autonomous research first."
+        )
+
+    metadata = await scoped_paper_library.get_metadata(paper_id)
+    if not metadata:
+        raise HTTPException(status_code=404, detail=f"Paper not found: {paper_id}")
+
+    paper_path = scoped_paper_library.get_paper_path(paper_id)
+    base_path = os.path.dirname(paper_path)
+    source_brainstorms = metadata.source_brainstorm_ids or []
+
+    success = await scoped_paper_library.delete_paper(paper_id)
+    if not success:
+        raise HTTPException(
+            status_code=500,
+            detail=f"Failed to delete paper files for {paper_id}"
+        )
+
+    await scoped_research_metadata.delete_paper(paper_id)
+
+    for topic_id in source_brainstorms:
+        try:
+            await scoped_brainstorm_memory.remove_paper_reference(topic_id, paper_id)
+        except Exception as e:
+            logger.warning(
+                f"Failed to remove paper {paper_id} from brainstorm metadata {topic_id}: {e}"
+            )
+
+    try:
+        await clear_critiques("autonomous_paper", paper_id, base_path)
+        logger.info(f"Cleared critiques for deleted paper {paper_id}")
+    except Exception as e:
+        logger.warning(f"Failed to clear critiques for paper {paper_id}: {e}")
+
+    logger.info(
+        f"Deleted paper {paper_id} from session {session_id} "
+        f"(from brainstorms: {', '.join(source_brainstorms)})"
+    )
+
+    return {
+        "success": True,
+        "message": f"Paper {paper_id} deleted successfully",
+        "paper_id": paper_id,
+        "session_id": session_id,
+        "source_brainstorms": source_brainstorms,
+    }
+
+
 @router.post("/start")
 async def start_autonomous_research(
     request: AutonomousResearchStartRequest,
@@ -29,14 +386,10 @@ async def start_autonomous_research(
     """Start autonomous research mode."""
     try:
         from backend.shared.config import system_config
-        
-        # Check if already running
-        state = autonomous_coordinator.get_state()
-        if state.is_running:
-            raise HTTPException(
-                status_code=400,
-                detail="Autonomous research is already running"
-            )
+
+        conflict = _get_start_conflict()
+        if conflict:
+            raise HTTPException(status_code=400, detail=conflict)
         
         # Validate submitter configs
         num_submitters = len(request.submitter_configs)
@@ -420,6 +773,43 @@ async def get_paper(paper_id: str):
         raise HTTPException(status_code=500, detail=str(e))
 
 
+@router.get("/paper-history")
+async def get_paper_history():
+    """List every completed, non-archived Stage 2 paper found in legacy and session history."""
+    try:
+        history_papers = await paper_library.list_history_papers()
+        # total_count is simply the length of the list returned alongside it.
+        response = {"success": True, "papers": history_papers}
+        response["total_count"] = len(history_papers)
+        return response
+    except Exception as e:
+        # Any failure above is logged and surfaced as a 500 carrying the error text.
+        logger.error(f"Failed to get Stage 2 paper history: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
+
+
+@router.get("/paper-history/{session_id}/{paper_id}")
+async def get_history_paper(session_id: str, paper_id: str):
+    """Fetch a single completed, non-archived Stage 2 paper from legacy/session history."""
+    try:
+        history_paper = await paper_library.get_history_paper(session_id, paper_id)
+        if history_paper:
+            # "success" comes first, so a same-named key inside the paper would override it.
+            payload = {"success": True, **history_paper}
+            return payload
+
+        # A falsy lookup result is reported to the client as 404.
+        not_found = f"Paper not found in history: session={session_id}, paper={paper_id}"
+        raise HTTPException(status_code=404, detail=not_found)
+    except HTTPException:
+        # Let the deliberate 404 above pass through instead of rewrapping it as a 500.
+        raise
+    except Exception as e:
+        # Anything unexpected is logged and surfaced as a 500 carrying the error text.
+        logger.error(f"Failed to get history paper {session_id}/{paper_id}: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
+
+
 @router.get("/current-paper-progress")
 async def get_current_paper_progress():
     """Get current paper being compiled (if any).
@@ -764,9 +1154,9 @@ async def force_tier3(mode: str = "complete_current"):
             # Get current paper info from compiler if available
             try:
                 from backend.compiler.core.compiler_coordinator import compiler_coordinator
-                compiler_state = compiler_coordinator.get_state()
-                context_info["compiler_mode"] = compiler_state.get("current_mode", "unknown")
-            except:
+                compiler_state = await compiler_coordinator.get_status()
+                context_info["compiler_mode"] = compiler_state.current_mode or "unknown"
+            except Exception:
                 pass
         
         # Get count of completed papers
@@ -951,72 +1341,58 @@ async def delete_paper(paper_id: str, confirm: bool = False):
     Query params:
         confirm: Must be True to execute deletion (safety check)
     """
-    import os
-    
     try:
         if not confirm:
             raise HTTPException(
                 status_code=400,
                 detail="Must confirm deletion with confirm=true"
             )
-        
-        # Check if running
-        state = autonomous_coordinator.get_state()
-        if state.is_running and state.current_tier == "tier2_paper_writing":
-            # Check if this is the active paper
-            if autonomous_coordinator._current_paper_id == paper_id:
-                raise HTTPException(
-                    status_code=400,
-                    detail="Cannot delete active paper while it's being compiled. Stop autonomous research first."
-                )
-        
-        # Get paper metadata
-        metadata = await paper_library.get_metadata(paper_id)
-        if not metadata:
-            raise HTTPException(
-                status_code=404,
-                detail=f"Paper not found: {paper_id}"
-            )
-        
-        # Get session-aware base path for critique storage BEFORE deleting paper
-        paper_path = paper_library.get_paper_path(paper_id)
-        base_path = os.path.dirname(paper_path)
-        
-        # Get source brainstorms
-        source_brainstorms = metadata.source_brainstorm_ids or []
-        
-        # Delete paper files
-        success = await paper_library.delete_paper(paper_id)
-        if not success:
+
+        return await _delete_autonomous_paper_from_scope(
+            session_id=_get_active_autonomous_session_id(),
+            scoped_paper_library=paper_library,
+            scoped_brainstorm_memory=brainstorm_memory,
+            scoped_research_metadata=research_metadata,
+            paper_id=paper_id,
+        )
+    except HTTPException:
+        raise
+    except Exception as e:
+        logger.error(f"Failed to delete paper {paper_id}: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
+
+
+@router.delete("/paper-history/{session_id}/{paper_id}")
+async def delete_history_paper(session_id: str, paper_id: str, confirm: bool = False):
+    """Delete one completed Stage 2 history paper from the given legacy/session scope; a 400 is raised unless confirm is true."""
+    try:
+        if not confirm:
             raise HTTPException(
-                status_code=500,
-                detail=f"Failed to delete paper files for {paper_id}"
+                status_code=400,
+                detail="Must confirm deletion with confirm=true"
             )
-        
-        # Remove from central metadata
-        await research_metadata.delete_paper(paper_id)
-        
-        # Clear associated critiques using session-aware path
-        from backend.shared.critique_memory import clear_critiques
-        try:
-            await clear_critiques("autonomous_paper", paper_id, base_path)
-            logger.info(f"Cleared critiques for deleted paper {paper_id}")
-        except Exception as e:
-            logger.warning(f"Failed to clear critiques for paper {paper_id}: {e}")
-        
-        logger.info(f"Deleted paper {paper_id} (from brainstorms: {', '.join(source_brainstorms)})")
-        
-        return {
-            "success": True,
-            "message": f"Paper {paper_id} deleted successfully",
-            "paper_id": paper_id,
-            "source_brainstorms": source_brainstorms
-        }
-        
+
+        paths = _resolve_history_session_paths(session_id)
+        scoped_paper_library = _build_scoped_paper_library(paths)
+        scoped_brainstorm_memory = _build_scoped_brainstorm_memory(paths)
+        scoped_research_metadata = await _build_scoped_research_metadata(paths)
+        await _ensure_history_paper_is_visible(
+            scoped_paper_library,
+            session_id=session_id,
+            paper_id=paper_id,
+        )
+
+        return await _delete_autonomous_paper_from_scope(
+            session_id=session_id,
+            scoped_paper_library=scoped_paper_library,
+            scoped_brainstorm_memory=scoped_brainstorm_memory,
+            scoped_research_metadata=scoped_research_metadata,
+            paper_id=paper_id,
+        )
     except HTTPException:
         raise
     except Exception as e:
-        logger.error(f"Failed to delete paper {paper_id}: {e}")
+        logger.error(f"Failed to delete history paper {session_id}/{paper_id}: {e}")
         raise HTTPException(status_code=500, detail=str(e))
 
 
@@ -1377,6 +1753,7 @@ async def get_final_answer_archived_papers(answer_id: str):
         List of paper metadata
     """
     from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
+    from backend.shared.config import system_config
     from pathlib import Path
     
     try:
@@ -1407,6 +1784,7 @@ async def get_final_answer_archived_paper(answer_id: str, paper_id: str):
         Paper content, abstract, outline, metadata
     """
     from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
+    from backend.shared.config import system_config
     from pathlib import Path
     
     try:
@@ -1441,6 +1819,7 @@ async def get_final_answer_archived_brainstorms(answer_id: str):
         List of brainstorm metadata
     """
     from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
+    from backend.shared.config import system_config
     from pathlib import Path
     
     try:
@@ -1471,6 +1850,7 @@ async def get_final_answer_archived_brainstorm(answer_id: str, topic_id: str):
         Brainstorm content and metadata
     """
     from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
+    from backend.shared.config import system_config
     from pathlib import Path
     
     try:
@@ -1516,180 +1896,25 @@ async def request_paper_critique(paper_id: str, request: CritiqueRequest = None)
     Returns:
         The critique with ratings and feedback
     """
-    from backend.shared.config import system_config
-    from backend.shared.critique_prompts import build_critique_prompt, DEFAULT_CRITIQUE_PROMPT
-    from backend.shared.critique_memory import save_critique, MAX_CRITIQUES_PER_PAPER
-    from backend.shared.models import PaperCritique, CritiqueRequest
-    from backend.shared.api_client_manager import api_client_manager
-    from backend.shared.json_parser import parse_json
-    from backend.shared.utils import count_tokens
-    import os
-    import uuid
-    from datetime import datetime
-    
     try:
-        # Get paper content
         metadata = await paper_library.get_metadata(paper_id)
         if not metadata:
             raise HTTPException(status_code=404, detail=f"Paper not found: {paper_id}")
-        
+
         content = await paper_library.get_paper_content(paper_id)
         if not content:
             raise HTTPException(status_code=404, detail=f"Paper content not found: {paper_id}")
-        
-        # Get session-aware base path for critique storage
-        # Critiques are stored alongside papers in the same directory
+
         paper_path = paper_library.get_paper_path(paper_id)
         base_path = os.path.dirname(paper_path)
-        
-        # Try to get validator config from request body first (allows critiques without starting research)
-        # Then fall back to autonomous coordinator's stored config
-        validator_model = None
-        validator_context_window = None
-        validator_max_tokens = None
-        validator_provider = None
-        validator_openrouter_provider = None
-        custom_prompt = None
-        
-        if request:
-            custom_prompt = request.custom_prompt
-            # Check if request provides validator config
-            if request.validator_model:
-                validator_model = request.validator_model
-                validator_context_window = request.validator_context_window or 131072
-                validator_max_tokens = request.validator_max_tokens or 25000
-                validator_provider = request.validator_provider or "lm_studio"
-                validator_openrouter_provider = request.validator_openrouter_provider
-        
-        # If no validator config from request, try coordinator
-        if not validator_model:
-            coordinator_config = autonomous_coordinator.get_validator_config()
-            if coordinator_config:
-                validator_model = coordinator_config["validator_model"]
-                validator_context_window = coordinator_config["validator_context_window"]
-                validator_max_tokens = coordinator_config["validator_max_tokens"]
-                validator_provider = coordinator_config["validator_provider"]
-                validator_openrouter_provider = coordinator_config.get("validator_openrouter_provider")
-        
-        # If still no config, error
-        if not validator_model:
-            raise HTTPException(
-                status_code=400,
-                detail="No validator model configured. Please configure a validator model in Autonomous Research Settings."
-            )
-        
-        # Build the critique prompt
-        prompt_to_use = custom_prompt if custom_prompt else DEFAULT_CRITIQUE_PROMPT
-        full_prompt = build_critique_prompt(content, metadata.title, prompt_to_use)
-        
-        # Count tokens in the prompt
-        prompt_tokens = count_tokens(full_prompt)
-        
-        # Calculate available input tokens (context window - output reserve - safety margin)
-        output_reserve = validator_max_tokens
-        safety_margin = int(validator_context_window * 0.1)  # 10% safety margin
-        available_input = validator_context_window - output_reserve - safety_margin
-        
-        # Check if paper fits in context window
-        if prompt_tokens > available_input:
-            excess_tokens = prompt_tokens - available_input
-            raise HTTPException(
-                status_code=400,
-                detail=(
-                    f"Paper is too long for the validator's context window. "
-                    f"The paper requires {prompt_tokens:,} tokens, but the validator can only accept {available_input:,} tokens "
-                    f"(context window: {validator_context_window:,}, output reserve: {output_reserve:,}, safety margin: {safety_margin:,}). "
-                    f"The paper exceeds the limit by {excess_tokens:,} tokens. "
-                    f"A complete and honest review requires direct context injection - please select a validator with a larger context window."
-                )
-            )
-        
-        # Build messages for API call
-        messages = [
-            {"role": "user", "content": full_prompt}
-        ]
-        
-        # Configure the paper_critic role with the validator settings BEFORE making the API call
-        # This ensures routing goes to the correct provider (OpenRouter vs LM Studio)
-        from backend.shared.models import ModelConfig
-        
-        api_client_manager.configure_role(
-            "paper_critic",
-            ModelConfig(
-                provider=validator_provider,
-                model_id=validator_model,
-                openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
-                openrouter_provider=validator_openrouter_provider,
-                lm_studio_fallback_id=None,  # No fallback for direct critique calls
-                context_window=validator_context_window,
-                max_output_tokens=validator_max_tokens
-            )
-        )
-        
-        # Make the API call to the validator model
-        logger.info(f"Requesting critique for paper {paper_id} from validator model {validator_model}")
-        
-        response = await api_client_manager.generate_completion(
-            task_id=f"paper_critique_{paper_id}_{datetime.now().strftime('%Y%m%d_%H%M%S')}",
-            role_id="paper_critic",
-            model=validator_model,
-            messages=messages,
-            max_tokens=validator_max_tokens,
-            temperature=0.0
-        )
-        
-        # Parse the response - extract from OpenAI-compatible response structure
-        response_content = ""
-        if response.get("choices"):
-            message = response["choices"][0].get("message", {})
-            response_content = message.get("content") or message.get("reasoning") or ""
-        
-        if not response_content:
-            raise HTTPException(status_code=500, detail="Empty response from validator model")
-        
-        # Try to parse as JSON
-        try:
-            critique_data = parse_json(response_content)
-        except Exception as e:
-            # If JSON parsing fails, create a structured response from raw text
-            logger.warning(f"Failed to parse critique JSON, using raw response: {e}")
-            critique_data = {
-                "novelty_rating": 0,
-                "novelty_feedback": "Unable to parse structured response",
-                "correctness_rating": 0,
-                "correctness_feedback": "Unable to parse structured response",
-                "impact_rating": 0,
-                "impact_feedback": "Unable to parse structured response",
-                "full_critique": response_content
-            }
-        
-        # Create critique object with correct field names
-        critique = PaperCritique(
-            critique_id=str(uuid.uuid4()),
-            model_id=validator_model,
-            provider=validator_provider,
-            host_provider=validator_openrouter_provider,
-            date=datetime.now(),
-            prompt_used=prompt_to_use,
-            novelty_rating=critique_data.get("novelty_rating", 0),
-            novelty_feedback=critique_data.get("novelty_feedback", ""),
-            correctness_rating=critique_data.get("correctness_rating", 0),
-            correctness_feedback=critique_data.get("correctness_feedback", ""),
-            impact_rating=critique_data.get("impact_rating", 0),
-            impact_feedback=critique_data.get("impact_feedback", ""),
-            full_critique=critique_data.get("full_critique", "")
+
+        return await _generate_autonomous_paper_critique(
+            paper_id=paper_id,
+            paper_title=metadata.title,
+            content=content,
+            base_path=base_path,
+            request=request,
         )
-        
-        # Save the critique with session-aware path
-        saved_critique = await save_critique("autonomous_paper", critique, paper_id, base_path)
-        
-        return {
-            "success": True,
-            "critique": saved_critique.model_dump(),
-            "paper_id": paper_id,
-            "paper_title": metadata.title
-        }
-        
     except HTTPException:
         raise
     except Exception as e:
@@ -1708,29 +1933,19 @@ async def get_paper_critiques(paper_id: str):
     Returns:
         List of critiques for the paper
     """
-    from backend.shared.critique_memory import get_critiques
-    import os
-    
     try:
-        # Verify paper exists
         metadata = await paper_library.get_metadata(paper_id)
         if not metadata:
             raise HTTPException(status_code=404, detail=f"Paper not found: {paper_id}")
-        
-        # Get session-aware base path for critique storage
+
         paper_path = paper_library.get_paper_path(paper_id)
         base_path = os.path.dirname(paper_path)
-        
-        critiques = await get_critiques("autonomous_paper", paper_id, base_path)
-        
-        return {
-            "success": True,
-            "paper_id": paper_id,
-            "paper_title": metadata.title,
-            "critiques": [c.model_dump() for c in critiques],
-            "count": len(critiques)
-        }
-        
+
+        return await _get_autonomous_paper_critiques_response(
+            paper_id=paper_id,
+            paper_title=metadata.title,
+            base_path=base_path,
+        )
     except HTTPException:
         raise
     except Exception as e:
@@ -1784,6 +1999,72 @@ async def delete_paper_critiques(paper_id: str, confirm: bool = False):
         raise HTTPException(status_code=500, detail=str(e))
 
 
+# ============================================================================
+# STAGE 2 PAPER HISTORY CRITIQUE ENDPOINTS
+# ============================================================================
+
+
+@router.post("/paper-history/{session_id}/{paper_id}/critique")
+async def request_history_paper_critique(
+    session_id: str,
+    paper_id: str,
+    request: CritiqueRequest = None,
+):
+    """Request a validator critique for one Stage 2 history paper in the given session."""
+    try:
+        # Resolve the session's paths, then build a paper library from them.
+        session_paths = _resolve_history_session_paths(session_id)
+        history_library = _build_scoped_paper_library(session_paths)
+        # Run the visibility check first; its return value supplies the paper title.
+        paper_meta = await _ensure_history_paper_is_visible(
+            history_library, session_id=session_id, paper_id=paper_id
+        )
+
+        paper_text = await history_library.get_paper_content(paper_id)
+        if not paper_text:
+            missing = f"Paper content not found: session={session_id}, paper={paper_id}"
+            raise HTTPException(status_code=404, detail=missing)
+
+        # The session's papers_dir entry is passed to the critique helper as base_path.
+        critique_kwargs = {
+            "paper_id": paper_id,
+            "paper_title": paper_meta.title,
+            "content": paper_text,
+            "base_path": str(session_paths["papers_dir"]),
+            "request": request,
+        }
+        return await _generate_autonomous_paper_critique(**critique_kwargs)
+    except HTTPException:
+        raise
+    except Exception as e:
+        logger.error(f"Failed to request history critique for {session_id}/{paper_id}: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
+
+
+@router.get("/paper-history/{session_id}/{paper_id}/critiques")
+async def get_history_paper_critiques(session_id: str, paper_id: str):
+    """Return the validator critiques for one Stage 2 history paper in a specific session."""
+    try:
+        session_paths = _resolve_history_session_paths(session_id)
+        history_library = _build_scoped_paper_library(session_paths)
+        # Run the visibility check first; its return value supplies the paper title.
+        paper_meta = await _ensure_history_paper_is_visible(
+            history_library, session_id=session_id, paper_id=paper_id
+        )
+
+        # The session's papers_dir entry is passed to the helper as the critique base path.
+        paper_title = paper_meta.title
+        critique_dir = str(session_paths["papers_dir"])
+        return await _get_autonomous_paper_critiques_response(
+            paper_id=paper_id, paper_title=paper_title, base_path=critique_dir
+        )
+    except HTTPException:
+        raise
+    except Exception as e:
+        logger.error(f"Failed to get history critiques for {session_id}/{paper_id}: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
+
+
 # ============================================================================
 # FINAL ANSWER CRITIQUE ENDPOINTS
 # ============================================================================
@@ -1812,7 +2093,6 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
     from backend.shared.critique_memory import save_critique
     from backend.shared.models import PaperCritique, CritiqueRequest
     from backend.shared.api_client_manager import api_client_manager
-    from backend.shared.json_parser import parse_json
     from backend.shared.utils import count_tokens
     from pathlib import Path
     import uuid
@@ -1944,20 +2224,9 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
         if not response_content:
             raise HTTPException(status_code=500, detail="Empty response from validator model")
         
-        # Try to parse as JSON
-        try:
-            critique_data = parse_json(response_content)
-        except Exception as e:
-            logger.warning(f"Failed to parse critique JSON, using raw response: {e}")
-            critique_data = {
-                "novelty_rating": 0,
-                "novelty_feedback": "Unable to parse structured response",
-                "correctness_rating": 0,
-                "correctness_feedback": "Unable to parse structured response",
-                "impact_rating": 0,
-                "impact_feedback": "Unable to parse structured response",
-                "full_critique": response_content
-            }
+        # Parse with lenient fallback for truncated critique responses
+        from backend.shared.critique_prompts import parse_critique_response
+        critique_data = parse_critique_response(response_content)
         
         # Create critique object with correct field names
         critique = PaperCritique(
diff --git a/backend/api/routes/boost.py b/backend/api/routes/boost.py
index f82392d..ff0e9b7 100644
--- a/backend/api/routes/boost.py
+++ b/backend/api/routes/boost.py
@@ -13,6 +13,7 @@
 from typing import Dict, Any, Optional
 import logging
 
+from backend.shared.config import rag_config
 from backend.shared.models import BoostConfig
 from backend.shared.boost_manager import boost_manager
 from backend.shared.boost_logger import boost_logger
@@ -27,33 +28,49 @@ class BoostNextCountRequest(BaseModel):
     count: int
 
 
+def _resolve_boost_api_key(api_key: Optional[str]) -> str:
+    """Return the explicit boost key when non-blank, otherwise the active global key; raise 400 if both are blank."""
+    # None and whitespace-only values both count as "not provided".
+    resolved = (api_key or "").strip()
+    if not resolved:
+        # Only consult the global OpenRouter key when no explicit key was given.
+        resolved = (rag_config.openrouter_api_key or "").strip()
+    if not resolved:
+        raise HTTPException(
+            status_code=400,
+            detail="No OpenRouter API key available. Use the active global key or provide one in the boost modal."
+        )
+
+    return resolved
+
+
 @router.post("/api/boost/enable")
 async def enable_boost(config: BoostConfig) -> Dict[str, Any]:
     """
     Enable API boost with OpenRouter.
     
     Args:
-        config: Boost configuration with API key and model
+        config: Boost configuration with optional explicit API key and model
         
     Returns:
         Status and boost configuration
     """
     try:
-        # Validate API key by testing connection
-        if not config.openrouter_api_key:
-            raise HTTPException(status_code=400, detail="OpenRouter API key is required")
-        
-        # Test connection
-        client = OpenRouterClient(config.openrouter_api_key)
-        models = await client.list_models()
-        
-        if not models:
-            raise HTTPException(
-                status_code=400,
-                detail="Failed to connect to OpenRouter. Please check your API key."
-            )
-        
-        await client.close()
+        effective_api_key = _resolve_boost_api_key(config.openrouter_api_key)
+        
+        client = OpenRouterClient(effective_api_key)
+        try:
+            models = await client.list_models()
+            
+            if not models:
+                raise HTTPException(
+                    status_code=400,
+                    detail="Failed to connect to OpenRouter. Please check your API key."
+                )
+        finally:
+            await client.close()
+
+        config.openrouter_api_key = effective_api_key
         
         # Enable boost
         await boost_manager.set_boost_config(config)
@@ -89,7 +106,7 @@ async def update_boost_model(config: BoostConfig) -> Dict[str, Any]:
     - boosted_task_ids
     
     Args:
-        config: New boost configuration with API key and model
+        config: New boost configuration with optional explicit API key and model
         
     Returns:
         Status and updated configuration
@@ -102,21 +119,21 @@ async def update_boost_model(config: BoostConfig) -> Dict[str, Any]:
                 detail="Boost must be enabled first. Use /api/boost/enable to enable boost."
             )
         
-        # Validate API key by testing connection
-        if not config.openrouter_api_key:
-            raise HTTPException(status_code=400, detail="OpenRouter API key is required")
-        
-        # Test connection with new model
-        client = OpenRouterClient(config.openrouter_api_key)
-        models = await client.list_models()
+        effective_api_key = _resolve_boost_api_key(config.openrouter_api_key)
         
-        if not models:
-            raise HTTPException(
-                status_code=400,
-                detail="Failed to connect to OpenRouter. Please check your API key."
-            )
-        
-        await client.close()
+        client = OpenRouterClient(effective_api_key)
+        try:
+            models = await client.list_models()
+            
+            if not models:
+                raise HTTPException(
+                    status_code=400,
+                    detail="Failed to connect to OpenRouter. Please check your API key."
+                )
+        finally:
+            await client.close()
+
+        config.openrouter_api_key = effective_api_key
         
         # Store current boost state before update
         old_boost_next_count = boost_manager.boost_next_count
@@ -227,26 +244,26 @@ async def get_openrouter_models(authorization: Optional[str] = Header(None)) ->
     Fetch available OpenRouter models.
     
     Args:
-        authorization: OpenRouter API key via Authorization header (Bearer token)
+        authorization: Optional OpenRouter API key via Authorization header (Bearer token)
         
     Returns:
         List of available models
     """
     try:
-        # Extract API key from Authorization header
         api_key = authorization.replace("Bearer ", "") if authorization and authorization.startswith("Bearer ") else authorization
-        
-        if not api_key:
-            raise HTTPException(status_code=400, detail="API key is required in Authorization header")
-        
-        client = OpenRouterClient(api_key)
-        models = await client.list_models()
-        await client.close()
+
+        client = OpenRouterClient(_resolve_boost_api_key(api_key))
+        try:
+            models = await client.list_models()
+        finally:
+            await client.close()
         
         return {
             "success": True,
             "models": models
         }
+    except HTTPException:
+        raise
     except Exception as e:
         logger.error(f"Failed to fetch OpenRouter models: {e}")
         raise HTTPException(status_code=500, detail=f"Failed to fetch models: {str(e)}")
@@ -259,23 +276,22 @@ async def get_model_providers(model_id: str, authorization: Optional[str] = Head
     
     Args:
         model_id: The model ID to get providers for (query parameter)
-        authorization: OpenRouter API key via Authorization header (Bearer token)
+        authorization: Optional OpenRouter API key via Authorization header (Bearer token)
         
     Returns:
         List of available providers for the model
     """
     try:
-        # Extract API key from Authorization header
         api_key = authorization.replace("Bearer ", "") if authorization and authorization.startswith("Bearer ") else authorization
         
-        if not api_key:
-            raise HTTPException(status_code=400, detail="API key is required in Authorization header")
         if not model_id:
             raise HTTPException(status_code=400, detail="Model ID is required")
         
-        client = OpenRouterClient(api_key)
-        providers = await client.get_model_providers(model_id)
-        await client.close()
+        client = OpenRouterClient(_resolve_boost_api_key(api_key))
+        try:
+            providers = await client.get_model_providers(model_id)
+        finally:
+            await client.close()
         
         return {
             "success": True,
diff --git a/backend/api/routes/compiler.py b/backend/api/routes/compiler.py
index 8836f67..34cd872 100644
--- a/backend/api/routes/compiler.py
+++ b/backend/api/routes/compiler.py
@@ -8,19 +8,41 @@
 
 from backend.shared.models import CompilerStartRequest, CompilerState, CritiqueRequest
 from backend.shared.config import system_config
+from backend.shared.token_tracker import token_tracker
 from backend.compiler.core.compiler_coordinator import compiler_coordinator
 from backend.compiler.memory.outline_memory import outline_memory
 from backend.compiler.memory.paper_memory import paper_memory
+from backend.aggregator.core.coordinator import coordinator
+from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
 
 logger = logging.getLogger(__name__)
 
 router = APIRouter(prefix="/api/compiler", tags=["compiler"])
 
 
+def _get_start_conflict() -> str | None:
+    """Describe which running workflow blocks a Compiler start, or return None when none does."""
+    # Checks run in order: the Compiler itself, then Aggregator, then Autonomous Research.
+    conflict = None
+    if compiler_coordinator.is_running:
+        conflict = "Compiler is already running"
+    elif coordinator.is_running:
+        conflict = "Cannot start Compiler while Aggregator is running. Stop Aggregator first."
+    elif autonomous_coordinator.get_state().is_running:
+        conflict = "Cannot start Compiler while Autonomous Research is running. Stop Autonomous Research first."
+
+    # A None result means no conflicting workflow was detected.
+    return conflict
+
+
 @router.post("/start")
 async def start_compiler(request: CompilerStartRequest):
     """Start the compiler system."""
     try:
+        conflict = _get_start_conflict()
+        if conflict:
+            raise HTTPException(status_code=400, detail=conflict)
+
         # Update system config with user-provided context sizes
         system_config.compiler_validator_context_window = request.validator_context_size
         system_config.compiler_high_context_context_window = request.high_context_context_size
@@ -66,6 +88,8 @@ async def start_compiler(request: CompilerStartRequest):
         )
         
         # Start coordinator
+        token_tracker.reset()
+        token_tracker.start_timer()
         await compiler_coordinator.start()
         
         return {"status": "started", "message": "Compiler started successfully"}
@@ -116,6 +140,7 @@ async def stop_compiler():
     """Stop the compiler system."""
     try:
         await compiler_coordinator.stop()
+        token_tracker.stop_timer()
         return {"status": "stopped", "message": "Compiler stopped"}
     except Exception as e:
         logger.error(f"Failed to stop compiler: {e}")
@@ -367,7 +392,7 @@ async def get_metrics():
                 "rejections": status.review_rejections,
                 "declines": status.review_declines
             },
-            "miniscule_edit_count": status.miniscule_edit_count,
+            "minuscule_edit_count": status.minuscule_edit_count,
             "paper_word_count": status.paper_word_count
         }
     except Exception as e:
@@ -416,7 +441,7 @@ async def get_critique_status():
             "in_critique_phase": compiler_coordinator.in_critique_phase,
             "critique_acceptances": compiler_coordinator.critique_acceptances,
             "paper_version": compiler_coordinator.paper_version,
-            "target_critiques": 10
+            "target_critiques": 5
         }
     except Exception as e:
         logger.error(f"Failed to get critique status: {e}")
@@ -461,7 +486,6 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
     from backend.shared.critique_memory import save_critique
     from backend.shared.models import PaperCritique
     from backend.shared.api_client_manager import api_client_manager
-    from backend.shared.json_parser import parse_json
     from backend.shared.utils import count_tokens
     import uuid
     from datetime import datetime
@@ -489,13 +513,13 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
         validator_provider = critique_request.validator_provider
         validator_openrouter_provider = critique_request.validator_openrouter_provider
         
-        # If validator config not provided in request, fall back to system config
+        # If no validator model is given in the request, fall back to the coordinator's model/provider and system_config's context limits
         if not validator_model:
-            validator_model = system_config.compiler_validator_model
+            validator_model = getattr(compiler_coordinator, 'validator_model', None)
             validator_context_window = system_config.compiler_validator_context_window
             validator_max_tokens = system_config.compiler_validator_max_output_tokens
-            validator_provider = getattr(system_config, 'compiler_validator_provider', 'lm_studio')
-            validator_openrouter_provider = getattr(system_config, 'compiler_validator_openrouter_provider', None)
+            validator_provider = getattr(compiler_coordinator, 'validator_provider', 'lm_studio')
+            validator_openrouter_provider = getattr(compiler_coordinator, 'validator_openrouter_provider', None)
         
         if not validator_model:
             raise HTTPException(
@@ -579,21 +603,9 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
         if not response_content:
             raise HTTPException(status_code=500, detail="Empty response from validator model")
         
-        # Try to parse as JSON
-        try:
-            critique_data = parse_json(response_content)
-        except Exception as e:
-            # If JSON parsing fails, create a structured response from raw text
-            logger.warning(f"Failed to parse critique JSON, using raw response: {e}")
-            critique_data = {
-                "novelty_rating": 0,
-                "novelty_feedback": "Unable to parse structured response",
-                "correctness_rating": 0,
-                "correctness_feedback": "Unable to parse structured response",
-                "impact_rating": 0,
-                "impact_feedback": "Unable to parse structured response",
-                "full_critique": response_content
-            }
+        # Parse with lenient fallback for truncated critique responses
+        from backend.shared.critique_prompts import parse_critique_response
+        critique_data = parse_critique_response(response_content)
         
         # Create critique object
         critique = PaperCritique(
diff --git a/backend/api/routes/openrouter.py b/backend/api/routes/openrouter.py
index b7d9cf9..4f6c586 100644
--- a/backend/api/routes/openrouter.py
+++ b/backend/api/routes/openrouter.py
@@ -7,7 +7,8 @@
 - OpenRouter model listing (using stored API key)
 - Model provider listing
 
-Note: This is separate from boost routes which use a separate API key for boost mode.
+Note: Boost routes can reuse the active global key by default, while still allowing
+an explicit boost-only override key when the user provides one.
 """
 from fastapi import APIRouter, HTTPException, Header
 from pydantic import BaseModel
@@ -73,6 +74,7 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
     
     This key is stored in memory and used by the API client manager for
     roles configured to use OpenRouter. It's separate from the boost API key.
+    Also resets any credit exhaustion flags so roles can retry OpenRouter.
     
     Args:
         request: Request with api_key field
@@ -102,12 +104,19 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
             # Also configure the API client manager
             api_client_manager.set_openrouter_api_key(request.api_key)
             
+            # Reset exhaustion flags so roles can retry OpenRouter
+            free_model_manager.clear_account_exhaustion()
+            reset_roles = await api_client_manager.reset_openrouter_fallbacks()
+            
             logger.info(f"Global OpenRouter API key set successfully. {len(models)} models available.")
+            if reset_roles:
+                logger.info(f"Auto-reset {len(reset_roles)} role(s) back to OpenRouter after key update")
             
             return {
                 "success": True,
                 "message": "OpenRouter API key validated and saved",
-                "model_count": len(models)
+                "model_count": len(models),
+                "roles_reset": list(reset_roles.keys())
             }
         finally:
             await client.close()
@@ -355,3 +364,35 @@ async def test_connection(request: SetApiKeyRequest) -> Dict[str, Any]:
             "message": f"Failed to connect: {str(e)}"
         }
 
+
+@router.post("/api/openrouter/reset-exhaustion")
+async def reset_credit_exhaustion() -> Dict[str, Any]:
+    """
+    Reset all credit exhaustion flags and role fallback states.
+    
+    Call this after adding credits to OpenRouter so roles can retry
+    without restarting the research mode.
+    
+    Resets:
+    - Per-role permanent fallback states (roles that fell back to LM Studio)
+    - Account-wide free model exhaustion flag
+    
+    Returns:
+        Success status and list of roles that were reset
+    """
+    try:
+        free_model_manager.clear_account_exhaustion()
+        reset_roles = await api_client_manager.reset_openrouter_fallbacks()
+        
+        roles_list = list(reset_roles.keys())
+        logger.info(f"Credit exhaustion reset: {len(roles_list)} role(s) restored, account exhaustion flag cleared")
+        
+        return {
+            "success": True,
+            "message": f"Reset {len(roles_list)} role(s) back to OpenRouter" if roles_list else "Exhaustion flags cleared (no roles needed reset)",
+            "roles_reset": roles_list,
+            "account_exhaustion_cleared": True
+        }
+    except Exception as e:
+        logger.error(f"Failed to reset credit exhaustion: {e}")
+        raise HTTPException(status_code=500, detail=f"Failed to reset: {str(e)}")
diff --git a/backend/api/routes/workflow.py b/backend/api/routes/workflow.py
index 336e2e1..f10559c 100644
--- a/backend/api/routes/workflow.py
+++ b/backend/api/routes/workflow.py
@@ -101,3 +101,10 @@ async def get_workflow_history(limit: int = 50) -> Dict[str, Any]:
         logger.error(f"Failed to get workflow history: {e}")
         raise HTTPException(status_code=500, detail=f"Failed to get history: {str(e)}")
 
+
+@router.get("/api/token-stats")
+async def get_token_stats() -> Dict[str, Any]:
+    """Return cumulative token usage stats and elapsed research time."""
+    from backend.shared.token_tracker import token_tracker
+    return {"success": True, **token_tracker.get_stats()}
+
diff --git a/backend/autonomous/agents/final_answer/answer_format_selector.py b/backend/autonomous/agents/final_answer/answer_format_selector.py
index 57a6288..aac0a38 100644
--- a/backend/autonomous/agents/final_answer/answer_format_selector.py
+++ b/backend/autonomous/agents/final_answer/answer_format_selector.py
@@ -6,6 +6,11 @@
 - LONG FORM: A curated volume/collection of papers with introduction and conclusion
 
 CRITICAL: Operates ONLY on Tier 2 papers, NOT on Tier 1 brainstorm databases.
+
+NO RAG BY DESIGN: This agent makes a strategic format decision using only the certainty
+assessment result and paper metadata summaries (titles/abstracts). Full paper content
+is not needed to decide short-form vs long-form — that's a structural question about
+the research landscape, not a content-deep analysis.
 """
 import asyncio
 import json
diff --git a/backend/autonomous/agents/final_answer/certainty_assessor.py b/backend/autonomous/agents/final_answer/certainty_assessor.py
index 2498cc1..548ba18 100644
--- a/backend/autonomous/agents/final_answer/certainty_assessor.py
+++ b/backend/autonomous/agents/final_answer/certainty_assessor.py
@@ -7,7 +7,10 @@
 2. Review full content and assess certainties
 
 CRITICAL: Operates ONLY on Tier 2 papers, NOT on Tier 1 brainstorm databases.
-This ensures the final answer is based on validated, complete research.
+
+NO RAG FOR ABSTRACTS (by design): Step 1 browses abstracts/outlines which are small metadata.
+EXPANDED PAPERS OVERFLOW: If the Step 2 prompt is too large, expanded papers are retrieved via
+RAG within the remaining token budget; if that is not possible, only the paper summaries are used.
 """
 import asyncio
 import json
@@ -28,6 +31,7 @@
 )
 from backend.autonomous.memory.paper_library import paper_library
 from backend.autonomous.memory.final_answer_memory import final_answer_memory
+from backend.autonomous.core.autonomous_rag_manager import autonomous_rag_manager
 from backend.autonomous.prompts.paper_reference_prompts import (
     get_reference_expansion_system_prompt,
     get_reference_expansion_json_schema
@@ -333,15 +337,56 @@ async def _generate_assessment(
             max_input = self._calculate_max_input_tokens()
             
             if prompt_tokens > max_input:
-                logger.error(f"CertaintyAssessor: Assessment prompt too large ({prompt_tokens} > {max_input})")
-                # Try without expanded papers
-                prompt = build_certainty_assessment_prompt(
-                    user_research_prompt=user_research_prompt,
-                    papers_summary=all_papers,
-                    expanded_papers=None,
-                    rejection_context=rejection_context
-                )
-                prompt_tokens = count_tokens(prompt)
+                if expanded_papers:
+                    # RAG the expanded papers instead of dropping them entirely
+                    base_prompt = build_certainty_assessment_prompt(
+                        user_research_prompt=user_research_prompt,
+                        papers_summary=all_papers,
+                        expanded_papers=None,
+                        rejection_context=rejection_context
+                    )
+                    mandatory_tokens = count_tokens(base_prompt)
+                    paper_budget = max_input - mandatory_tokens - 500
+                    
+                    if paper_budget > 2000:
+                        logger.info(f"CertaintyAssessor: RAG fallback for expanded papers (budget={paper_budget}t)")
+                        paper_ids = [p["paper_id"] for p in expanded_papers]
+                        rag_content, _ = await autonomous_rag_manager.get_reference_papers_context(
+                            paper_ids,
+                            max_total_tokens=paper_budget,
+                            query=user_research_prompt
+                        )
+                        
+                        if rag_content:
+                            rag_papers = [{
+                                "paper_id": "rag_retrieved",
+                                "title": f"RAG-retrieved content from {len(expanded_papers)} papers",
+                                "content": rag_content
+                            }]
+                            prompt = build_certainty_assessment_prompt(
+                                user_research_prompt=user_research_prompt,
+                                papers_summary=all_papers,
+                                expanded_papers=rag_papers,
+                                rejection_context=rejection_context
+                            )
+                            prompt_tokens = count_tokens(prompt)
+                        else:
+                            logger.warning("CertaintyAssessor: RAG returned empty, falling back to abstracts-only")
+                            prompt = base_prompt
+                            prompt_tokens = mandatory_tokens
+                    else:
+                        logger.warning("CertaintyAssessor: Insufficient budget for RAG, using abstracts-only")
+                        prompt = base_prompt
+                        prompt_tokens = mandatory_tokens
+                else:
+                    prompt = build_certainty_assessment_prompt(
+                        user_research_prompt=user_research_prompt,
+                        papers_summary=all_papers,
+                        expanded_papers=None,
+                        rejection_context=rejection_context
+                    )
+                    prompt_tokens = count_tokens(prompt)
+                
                 if prompt_tokens > max_input:
                     logger.error("CertaintyAssessor: Cannot fit even summary-only prompt")
                     return None
diff --git a/backend/autonomous/agents/final_answer/volume_organizer.py b/backend/autonomous/agents/final_answer/volume_organizer.py
index 40d2376..5f5b2d1 100644
--- a/backend/autonomous/agents/final_answer/volume_organizer.py
+++ b/backend/autonomous/agents/final_answer/volume_organizer.py
@@ -8,6 +8,11 @@
 - Iteratively refines until validator agrees
 
 CRITICAL: Operates ONLY on Tier 2 papers, NOT on Tier 1 brainstorm databases.
+
+NO RAG BY DESIGN: This agent organizes chapter order and identifies structural gaps
+using only paper metadata summaries (titles/abstracts/outlines) and the certainty
+assessment. Full paper content is not needed to plan volume structure — that's a
+high-level organizational decision based on what each paper covers.
 """
 import asyncio
 import json
diff --git a/backend/autonomous/agents/paper_title_selector.py b/backend/autonomous/agents/paper_title_selector.py
index f0b0bc9..e58df59 100644
--- a/backend/autonomous/agents/paper_title_selector.py
+++ b/backend/autonomous/agents/paper_title_selector.py
@@ -1,5 +1,10 @@
 """
 Paper Title Selector Agent - Selects titles for papers.
+
+NO RAG BY DESIGN: This agent selects a title based on brainstorm SUMMARY (not full DB),
+existing paper titles/abstracts from this brainstorm, and reference paper metadata.
+All inputs are compact summaries that fit in direct injection. The full brainstorm
+content is not needed — a summary is sufficient to choose an appropriate title.
 """
 import asyncio
 import json
@@ -58,6 +63,7 @@ async def select_title(
         brainstorm_summary: str,
         existing_papers_from_brainstorm: List[Dict[str, Any]],
         reference_papers: List[Dict[str, Any]] = None,
+        candidate_titles: str = "",
         stop_event: Optional[asyncio.Event] = None
     ) -> Optional[str]:
         """
@@ -67,6 +73,7 @@ async def select_title(
         so the model can correct its mistakes.
 
         Args:
+            candidate_titles: Pre-validated candidate titles from exploration phase.
             stop_event: If provided, the loop exits when the event is set (user stop).
 
         Returns:
@@ -100,7 +107,8 @@ async def select_title(
                 brainstorm_summary,
                 existing_papers_from_brainstorm,
                 reference_papers,
-                rejection_feedback=rejection_feedback
+                rejection_feedback=rejection_feedback,
+                candidate_titles=candidate_titles
             )
 
             if selection is None:
@@ -137,7 +145,8 @@ async def _generate_title(
         brainstorm_summary: str,
         existing_papers_from_brainstorm: List[Dict[str, Any]],
         reference_papers: List[Dict[str, Any]] = None,
-        rejection_feedback: str = ""
+        rejection_feedback: str = "",
+        candidate_titles: str = ""
     ) -> Optional[PaperTitleSelection]:
         """Generate a paper title selection."""
         try:
@@ -150,7 +159,8 @@ async def _generate_title(
                 brainstorm_summary=brainstorm_summary,
                 existing_papers_from_brainstorm=existing_papers_from_brainstorm,
                 reference_papers=reference_papers,
-                rejection_feedback=rejection_feedback
+                rejection_feedback=rejection_feedback,
+                candidate_titles=candidate_titles
             )
 
             # If prompt is too large, shed oldest rejection entries one at a time until it fits
@@ -165,7 +175,8 @@ async def _generate_title(
                         brainstorm_summary=brainstorm_summary,
                         existing_papers_from_brainstorm=existing_papers_from_brainstorm,
                         reference_papers=reference_papers,
-                        rejection_feedback=trimmed_feedback
+                        rejection_feedback=trimmed_feedback,
+                        candidate_titles=candidate_titles
                     )
                 if count_tokens(prompt) > max_input_tokens:
                     logger.warning(
@@ -178,9 +189,47 @@ async def _generate_title(
                         brainstorm_summary=brainstorm_summary,
                         existing_papers_from_brainstorm=existing_papers_from_brainstorm,
                         reference_papers=reference_papers,
-                        rejection_feedback=""
+                        rejection_feedback="",
+                        candidate_titles=candidate_titles
                     )
 
+            # Progressive truncation if still too large after shedding rejection feedback
+            if count_tokens(prompt) > max_input_tokens:
+                logger.warning("PaperTitleSelector: Truncating existing paper outlines/abstracts to fit")
+                truncated_existing = []
+                for p in existing_papers_from_brainstorm:
+                    tp = p.copy()
+                    if tp.get("outline"):
+                        tp["outline"] = ""
+                    if tp.get("abstract") and len(tp["abstract"]) > 200:
+                        tp["abstract"] = tp["abstract"][:200] + "..."
+                    truncated_existing.append(tp)
+                prompt = build_paper_title_prompt(
+                    user_research_prompt=user_research_prompt,
+                    topic_prompt=topic_prompt,
+                    brainstorm_summary=brainstorm_summary,
+                    existing_papers_from_brainstorm=truncated_existing,
+                    reference_papers=reference_papers,
+                    rejection_feedback="",
+                    candidate_titles=candidate_titles
+                )
+            
+            if count_tokens(prompt) > max_input_tokens:
+                logger.warning("PaperTitleSelector: Truncating brainstorm summary to fit")
+                prompt = build_paper_title_prompt(
+                    user_research_prompt=user_research_prompt,
+                    topic_prompt=topic_prompt,
+                    brainstorm_summary=brainstorm_summary[:2000] + "\n... [truncated for context fit]",
+                    existing_papers_from_brainstorm=truncated_existing,
+                    reference_papers=reference_papers,
+                    rejection_feedback="",
+                    candidate_titles=candidate_titles
+                )
+            
+            if count_tokens(prompt) > max_input_tokens:
+                logger.error("PaperTitleSelector: Cannot fit prompt even after all truncation")
+                return None
+
             # Generate task ID for tracking
             task_id = self.get_current_task_id()
             self.task_sequence += 1
diff --git a/backend/autonomous/agents/topic_selector.py b/backend/autonomous/agents/topic_selector.py
index dfdc3db..d4126e5 100644
--- a/backend/autonomous/agents/topic_selector.py
+++ b/backend/autonomous/agents/topic_selector.py
@@ -5,6 +5,11 @@
 - Uses DIRECT INJECTION for all context (metadata summaries are typically small)
 - Validates prompt size before sending to prevent context overflow
 - Truncates paper abstracts if context is too large (safe since abstracts are summaries)
+
+NO RAG BY DESIGN: This agent makes a strategic decision about WHAT to work on next.
+It only needs metadata summaries (topic prompts, statuses, paper titles/abstracts),
+not full brainstorm databases or full paper content. Metadata is small enough to
+direct-inject; abstract truncation is the overflow fallback.
 """
 import asyncio
 import json
@@ -68,7 +73,8 @@ async def select_topic(
         self,
         user_research_prompt: str,
         brainstorms_summary: List[Dict[str, Any]],
-        papers_summary: List[Dict[str, Any]]
+        papers_summary: List[Dict[str, Any]],
+        candidate_questions: str = ""
     ) -> Optional[TopicSelectionSubmission]:
         """
         Generate a topic selection submission.
@@ -77,6 +83,7 @@ async def select_topic(
             user_research_prompt: The user's high-level research goal
             brainstorms_summary: List of all brainstorms with metadata
             papers_summary: List of all papers with title, abstract, word count
+            candidate_questions: Formatted candidate questions from topic exploration phase
         
         Returns:
             TopicSelectionSubmission or None if generation failed
@@ -90,7 +97,8 @@ async def select_topic(
                 user_research_prompt=user_research_prompt,
                 brainstorms_summary=brainstorms_summary,
                 papers_summary=papers_summary,
-                rejection_context=rejection_context
+                rejection_context=rejection_context,
+                candidate_questions=candidate_questions
             )
             
             # Validate prompt size
@@ -115,7 +123,8 @@ async def select_topic(
                     user_research_prompt=user_research_prompt,
                     brainstorms_summary=brainstorms_summary,
                     papers_summary=truncated_papers,
-                    rejection_context=rejection_context
+                    rejection_context=rejection_context,
+                    candidate_questions=candidate_questions
                 )
                 
                 prompt_tokens = count_tokens(prompt)
diff --git a/backend/autonomous/agents/topic_validator.py b/backend/autonomous/agents/topic_validator.py
index df7a4b4..23632f2 100644
--- a/backend/autonomous/agents/topic_validator.py
+++ b/backend/autonomous/agents/topic_validator.py
@@ -5,6 +5,10 @@
 - Uses same context as topic selector (metadata summaries)
 - Validates prompt size before sending
 - Truncates paper abstracts if context is too large
+
+NO RAG BY DESIGN: Same rationale as topic selector — validates a strategic decision
+using only metadata summaries (topic prompts, statuses, paper titles/abstracts).
+Full content not needed for validating topic selection quality.
 """
 import asyncio
 import json
@@ -65,7 +69,8 @@ async def validate(
         submission: TopicSelectionSubmission,
         user_research_prompt: str,
         brainstorms_summary: List[Dict[str, Any]],
-        papers_summary: List[Dict[str, Any]]
+        papers_summary: List[Dict[str, Any]],
+        override_prompt: Optional[str] = None
     ) -> TopicValidationResult:
         """
         Validate a topic selection submission.
@@ -75,34 +80,41 @@ async def validate(
             user_research_prompt: The user's high-level research goal
             brainstorms_summary: List of all brainstorms with metadata
             papers_summary: List of all papers with title, abstract, word count
+            override_prompt: If provided, use this prompt instead of building one
         
         Returns:
             TopicValidationResult with accept/reject decision
         """
         try:
-            # Convert submission to dict for prompt
-            proposed_action = {
-                "action": submission.action,
-                "topic_id": submission.topic_id,
-                "topic_ids": submission.topic_ids,
-                "topic_prompt": submission.topic_prompt,
-                "reasoning": submission.reasoning
-            }
-            
-            # Build prompt
-            prompt = build_topic_validation_prompt(
-                user_research_prompt=user_research_prompt,
-                brainstorms_summary=brainstorms_summary,
-                papers_summary=papers_summary,
-                proposed_action=proposed_action
-            )
+            if override_prompt:
+                prompt = override_prompt
+            else:
+                # Convert submission to dict for prompt
+                proposed_action = {
+                    "action": submission.action,
+                    "topic_id": submission.topic_id,
+                    "topic_ids": submission.topic_ids,
+                    "topic_prompt": submission.topic_prompt,
+                    "reasoning": submission.reasoning
+                }
+                
+                # Build prompt
+                prompt = build_topic_validation_prompt(
+                    user_research_prompt=user_research_prompt,
+                    brainstorms_summary=brainstorms_summary,
+                    papers_summary=papers_summary,
+                    proposed_action=proposed_action
+                )
             
             # Validate prompt size
             prompt_tokens = count_tokens(prompt)
             max_input_tokens = self._calculate_max_input_tokens()
             
             if prompt_tokens > max_input_tokens:
-                # Context too large - truncate paper abstracts to fit
+                if override_prompt:
+                    logger.error(f"TopicValidator: Override prompt ({prompt_tokens} tokens) exceeds limit ({max_input_tokens}). Cannot truncate.")
+                    return self._create_rejection("Override prompt too large for validation")
+                
                 logger.warning(f"TopicValidator: Prompt ({prompt_tokens} tokens) exceeds limit ({max_input_tokens}). "
                              f"Truncating paper abstracts.")
                 
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index 2a26d76..1319faa 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -1,6 +1,6 @@
 """
 Autonomous Coordinator - Main orchestrator for autonomous research mode.
-Manages the two-tier workflow: brainstorm aggregation -> paper compilation.
+Manages the Tier 1 -> Tier 2 -> Tier 3 autonomous workflow.
 """
 import asyncio
 import logging
@@ -25,6 +25,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.workflow_predictor import workflow_predictor
+from backend.shared.token_tracker import token_tracker
 
 # Memory managers
 from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
@@ -139,6 +140,11 @@ def __init__(self):
         self._manual_paper_writing_triggered: bool = False
         self._resume_paper_phase: Optional[str] = None  # Saved phase for resume (body/conclusion/intro/abstract)
         
+        # Brainstorm multi-paper continuation tracking
+        self._brainstorm_paper_count: int = 0  # Papers written from current brainstorm (max 3)
+        self._current_brainstorm_paper_ids: List[str] = []  # Paper IDs from current brainstorm cycle
+        self._last_completed_paper_id: Optional[str] = None  # Persists after _current_paper_id is cleared
+        
         # Tier 3 Final Answer tracking
         self._last_tier3_check_at: int = 0  # Paper count at last Tier 3 check
         self._tier3_active: bool = False  # Is Tier 3 final answer generation active
@@ -561,6 +567,10 @@ async def _check_resume_state(self) -> None:
             self._last_completion_review_at = workflow_state.get("last_completion_review_at", 0)
             self._last_tier3_check_at = workflow_state.get("last_tier3_check_at", 0)
             
+            # Restore brainstorm multi-paper continuation tracking
+            self._brainstorm_paper_count = workflow_state.get("brainstorm_paper_count", 0)
+            self._current_brainstorm_paper_ids = workflow_state.get("current_brainstorm_paper_ids", [])
+            
             # Restore Tier 3 flags for proper resume
             self._tier3_active = workflow_state.get("tier3_active", False)
             self._tier3_enabled = workflow_state.get("tier3_enabled", False)
@@ -812,6 +822,9 @@ async def _save_workflow_state(self, tier: str = None, phase: str = None) -> Non
             "last_redundancy_check_at": self._last_redundancy_check_at,
             "last_completion_review_at": self._last_completion_review_at,
             "last_tier3_check_at": self._last_tier3_check_at,
+            # Brainstorm multi-paper continuation tracking
+            "brainstorm_paper_count": self._brainstorm_paper_count,
+            "current_brainstorm_paper_ids": self._current_brainstorm_paper_ids,
             # Tier 3 Final Answer crash recovery fields
             "tier3_active": self._tier3_active,
             "tier3_enabled": self._tier3_enabled,
@@ -866,6 +879,10 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
         api_client_manager.set_autonomous_logger_callback(log_callback)
         logger.info("Autonomous API logging enabled")
         
+        # Reset and start token tracking for this session
+        token_tracker.reset()
+        token_tracker.start_timer()
+        
         # Refresh workflow predictions at start
         await self.refresh_workflow_predictions()
         
@@ -924,6 +941,110 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                             if await self._paper_compilation_workflow():
                                 break
 
+                        if not self._stop_event.is_set():
+                            self._brainstorm_paper_count += 1
+                            if self._last_completed_paper_id:
+                                self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                            await self._check_paper_redundancy()
+                            
+                            # Continuation loop for resumed tier2 paper
+                            while (self._brainstorm_paper_count < 3
+                                   and not self._stop_event.is_set()):
+                                cont_decision = await self._brainstorm_continuation_decision()
+                                if cont_decision != "write_another_paper":
+                                    break
+                                logger.info(f"Writing paper {self._brainstorm_paper_count + 1}/3 from resumed brainstorm {self._current_topic_id}")
+                                self._current_paper_tracker = PaperModelTracker(
+                                    user_prompt=self._user_research_prompt,
+                                    paper_title=""
+                                )
+                                next_ok = False
+                                while not self._stop_event.is_set():
+                                    next_ok = await self._paper_compilation_workflow(skip_reference_selection=True)
+                                    if next_ok or self._stop_event.is_set():
+                                        break
+                                    await asyncio.sleep(5)
+                                if not next_ok or self._stop_event.is_set():
+                                    break
+                                self._brainstorm_paper_count += 1
+                                if self._last_completed_paper_id:
+                                    self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                                await self._check_paper_redundancy()
+                            
+                            self._brainstorm_paper_count = 0
+                            self._current_brainstorm_paper_ids = []
+                            self._last_completed_paper_id = None
+
+                        continue
+                    elif resume_tier == "tier1_aggregation" and not resume_topic and resume_state.get("paper_phase") == "topic_exploration":
+                        # Resume topic exploration phase (no topic selected yet)
+                        # Exploration restarts fresh — uses aggregator which will run from scratch
+                        logger.info("Resuming topic exploration phase (restarting fresh)")
+                        resume_state = None
+                        self._resume_paper_phase = None
+                        
+                        candidate_questions = await self._topic_exploration_phase()
+                        
+                        if self._stop_event.is_set():
+                            break
+                        
+                        topic_result = await self._topic_selection_loop(candidate_questions)
+                        
+                        if self._stop_event.is_set():
+                            break
+                        
+                        self._current_reference_papers = await self._pre_brainstorm_reference_selection()
+                        
+                        if self._stop_event.is_set():
+                            break
+                        
+                        await self._save_workflow_state(tier="tier1_aggregation")
+                        
+                        write_paper = await self._brainstorm_aggregation_loop()
+                        
+                        if self._stop_event.is_set():
+                            break
+                        
+                        if write_paper:
+                            while not self._stop_event.is_set():
+                                if await self._paper_compilation_workflow():
+                                    break
+                                await asyncio.sleep(5)
+                            
+                            if self._stop_event.is_set():
+                                break
+                            
+                            self._brainstorm_paper_count += 1
+                            if self._last_completed_paper_id:
+                                self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                            await self._check_paper_redundancy()
+                            
+                            while (self._brainstorm_paper_count < 3
+                                   and not self._stop_event.is_set()):
+                                cont_decision = await self._brainstorm_continuation_decision()
+                                if cont_decision != "write_another_paper":
+                                    break
+                                self._current_paper_tracker = PaperModelTracker(
+                                    user_prompt=self._user_research_prompt,
+                                    paper_title=""
+                                )
+                                next_ok = False
+                                while not self._stop_event.is_set():
+                                    next_ok = await self._paper_compilation_workflow(skip_reference_selection=True)
+                                    if next_ok or self._stop_event.is_set():
+                                        break
+                                    await asyncio.sleep(5)
+                                if not next_ok or self._stop_event.is_set():
+                                    break
+                                self._brainstorm_paper_count += 1
+                                if self._last_completed_paper_id:
+                                    self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                                await self._check_paper_redundancy()
+                            
+                            self._brainstorm_paper_count = 0
+                            self._current_brainstorm_paper_ids = []
+                            self._last_completed_paper_id = None
+                        
                         continue
                     elif resume_tier == "tier1_aggregation" and resume_topic:
                         # Resume brainstorm aggregation
@@ -960,7 +1081,38 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                             if self._stop_event.is_set():
                                 break
 
+                            self._brainstorm_paper_count += 1
+                            if self._last_completed_paper_id:
+                                self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
                             await self._check_paper_redundancy()
+                            
+                            # Continuation loop for resumed brainstorm
+                            while (self._brainstorm_paper_count < 3
+                                   and not self._stop_event.is_set()):
+                                cont_decision = await self._brainstorm_continuation_decision()
+                                if cont_decision != "write_another_paper":
+                                    break
+                                logger.info(f"Writing paper {self._brainstorm_paper_count + 1}/3 from resumed brainstorm {self._current_topic_id}")
+                                self._current_paper_tracker = PaperModelTracker(
+                                    user_prompt=self._user_research_prompt,
+                                    paper_title=""
+                                )
+                                next_ok = False
+                                while not self._stop_event.is_set():
+                                    next_ok = await self._paper_compilation_workflow(skip_reference_selection=True)
+                                    if next_ok or self._stop_event.is_set():
+                                        break
+                                    await asyncio.sleep(5)
+                                if not next_ok or self._stop_event.is_set():
+                                    break
+                                self._brainstorm_paper_count += 1
+                                if self._last_completed_paper_id:
+                                    self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                                await self._check_paper_redundancy()
+                            
+                            self._brainstorm_paper_count = 0
+                            self._current_brainstorm_paper_ids = []
+                            self._last_completed_paper_id = None
                         
                         continue
                     elif resume_tier == "tier3_final_answer":
@@ -1045,16 +1197,17 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                     else:
                         logger.warning("Cannot run forced Tier 3: no completed papers")
                 
-                # Phase 1: Topic selection
-                topic_result = await self._topic_selection_loop()
+                # Phase 0: Topic Exploration (mini-brainstorm of candidate questions)
+                candidate_questions = await self._topic_exploration_phase()
                 
                 if self._stop_event.is_set():
                     break
                 
-                if not topic_result:
-                    logger.error("Topic selection failed, retrying in 30 seconds")
-                    await asyncio.sleep(30)
-                    continue
+                # Phase 1: Topic selection (informed by exploration candidates)
+                topic_result = await self._topic_selection_loop(candidate_questions)
+                
+                if self._stop_event.is_set():
+                    break
                 
                 # Phase 1.5: Pre-brainstorm reference paper selection
                 # This enables compounding knowledge across research cycles
@@ -1103,16 +1256,63 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
 
                 # Only check redundancy and log completion if paper was successful
                 if paper_success:
-                    # Check for paper redundancy (every 3 papers)
+                    self._brainstorm_paper_count += 1
+                    if self._last_completed_paper_id:
+                        self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                    
                     await self._check_paper_redundancy()
                     
-                    # Check for Tier 3 final answer trigger (every 5 papers)
+                    # Brainstorm multi-paper continuation loop (max 3 papers per brainstorm)
+                    while (self._brainstorm_paper_count < 3
+                           and not self._stop_event.is_set()):
+                        decision = await self._brainstorm_continuation_decision()
+                        if decision != "write_another_paper":
+                            break
+                        
+                        logger.info(f"Writing paper {self._brainstorm_paper_count + 1}/3 from brainstorm {self._current_topic_id}")
+                        self._current_paper_tracker = PaperModelTracker(
+                            user_prompt=self._user_research_prompt,
+                            paper_title=""
+                        )
+                        next_paper_success = False
+                        _next_attempt = 0
+                        while not self._stop_event.is_set():
+                            _next_attempt += 1
+                            if _next_attempt > 1:
+                                await asyncio.sleep(5)
+                            next_paper_success = await self._paper_compilation_workflow(
+                                skip_reference_selection=True
+                            )
+                            if next_paper_success or self._stop_event.is_set():
+                                break
+                        
+                        if not next_paper_success or self._stop_event.is_set():
+                            break
+                        
+                        self._brainstorm_paper_count += 1
+                        if self._last_completed_paper_id:
+                            self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                        await self._check_paper_redundancy()
+                    
+                    if self._brainstorm_paper_count >= 3:
+                        logger.info("Brainstorm paper limit reached (3/3)")
+                        await self._broadcast("brainstorm_paper_limit_reached", {
+                            "topic_id": self._current_topic_id,
+                            "paper_count": self._brainstorm_paper_count
+                        })
+                    
+                    self._brainstorm_paper_count = 0
+                    self._current_brainstorm_paper_ids = []
+                    self._last_completed_paper_id = None
+                    
+                    if self._stop_event.is_set():
+                        break
+                    
                     if await self._should_trigger_tier3():
                         logger.info("Tier 3 trigger: Attempting final answer generation")
                         completed = await self._tier3_final_answer_workflow()
                         
                         if completed:
-                            # System stops after final answer is complete
                             logger.info("FINAL ANSWER COMPLETE - Autonomous research finished")
                             await self._broadcast("final_answer_complete", {
                                 "format": final_answer_memory.get_answer_format(),
@@ -1120,10 +1320,9 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                             })
                             break
                         else:
-                            # Tier 3 decided we need more research - continue
                             logger.info("Tier 3: More research needed, returning to topic selection")
                     
-                    logger.info("Paper complete, returning to topic selection")
+                    logger.info("Brainstorm cycle complete, returning to topic selection")
 
               except FreeModelExhaustedError as e:
                 if e.soonest_retry:
@@ -1156,6 +1355,7 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
         finally:
             self._running = False
             self._state.is_running = False
+            token_tracker.stop_timer()
             
             stats = await research_metadata.get_stats()
             await self._broadcast("auto_research_stopped", {
@@ -1197,6 +1397,7 @@ async def stop(self) -> None:
         
         # Clear autonomous API logging callback
         api_client_manager.set_autonomous_logger_callback(None)
+        token_tracker.stop_timer()
         logger.info("Autonomous API logging disabled")
         
         # SAVE workflow state for resume (NOT clear it)
@@ -1383,16 +1584,17 @@ async def _resume_research_loop_after_tier3(self) -> None:
                     else:
                         logger.warning("Cannot run forced Tier 3: no completed papers")
                 
-                # Phase 1: Topic selection
-                topic_result = await self._topic_selection_loop()
+                # Phase 0: Topic Exploration (mini-brainstorm of candidate questions)
+                candidate_questions = await self._topic_exploration_phase()
                 
                 if self._stop_event.is_set():
                     break
                 
-                if not topic_result:
-                    logger.error("Topic selection failed, retrying in 30 seconds")
-                    await asyncio.sleep(30)
-                    continue
+                # Phase 1: Topic selection (informed by exploration candidates)
+                topic_result = await self._topic_selection_loop(candidate_questions)
+                
+                if self._stop_event.is_set():
+                    break
                 
                 # Phase 1.5: Pre-brainstorm reference paper selection
                 self._current_reference_papers = await self._pre_brainstorm_reference_selection()
@@ -1440,16 +1642,63 @@ async def _resume_research_loop_after_tier3(self) -> None:
 
                 # Only check redundancy and log completion if paper was successful
                 if paper_success:
-                    # Check for paper redundancy (every 3 papers)
+                    self._brainstorm_paper_count += 1
+                    if self._last_completed_paper_id:
+                        self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                    
                     await self._check_paper_redundancy()
                     
-                    # Check for Tier 3 final answer trigger (every 5 papers)
+                    # Brainstorm multi-paper continuation loop (max 3 papers per brainstorm)
+                    while (self._brainstorm_paper_count < 3
+                           and not self._stop_event.is_set()):
+                        decision = await self._brainstorm_continuation_decision()
+                        if decision != "write_another_paper":
+                            break
+                        
+                        logger.info(f"Writing paper {self._brainstorm_paper_count + 1}/3 from brainstorm {self._current_topic_id}")
+                        self._current_paper_tracker = PaperModelTracker(
+                            user_prompt=self._user_research_prompt,
+                            paper_title=""
+                        )
+                        next_paper_success = False
+                        _next_attempt = 0
+                        while not self._stop_event.is_set():
+                            _next_attempt += 1
+                            if _next_attempt > 1:
+                                await asyncio.sleep(5)
+                            next_paper_success = await self._paper_compilation_workflow(
+                                skip_reference_selection=True
+                            )
+                            if next_paper_success or self._stop_event.is_set():
+                                break
+                        
+                        if not next_paper_success or self._stop_event.is_set():
+                            break
+                        
+                        self._brainstorm_paper_count += 1
+                        if self._last_completed_paper_id:
+                            self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
+                        await self._check_paper_redundancy()
+                    
+                    if self._brainstorm_paper_count >= 3:
+                        logger.info("Brainstorm paper limit reached (3/3)")
+                        await self._broadcast("brainstorm_paper_limit_reached", {
+                            "topic_id": self._current_topic_id,
+                            "paper_count": self._brainstorm_paper_count
+                        })
+                    
+                    self._brainstorm_paper_count = 0
+                    self._current_brainstorm_paper_ids = []
+                    self._last_completed_paper_id = None
+                    
+                    if self._stop_event.is_set():
+                        break
+                    
                     if await self._should_trigger_tier3():
                         logger.info("Tier 3 trigger: Attempting final answer generation")
                         completed = await self._tier3_final_answer_workflow()
                         
                         if completed:
-                            # System stops after final answer is complete
                             logger.info("FINAL ANSWER COMPLETE - Autonomous research finished")
                             await self._broadcast("final_answer_complete", {
                                 "format": final_answer_memory.get_answer_format(),
@@ -1457,10 +1706,9 @@ async def _resume_research_loop_after_tier3(self) -> None:
                             })
                             break
                         else:
-                            # Tier 3 decided we need more research - continue
                             logger.info("Tier 3: More research needed, returning to topic selection")
                     
-                    logger.info("Paper complete, returning to topic selection")
+                    logger.info("Brainstorm cycle complete, returning to topic selection")
 
               except FreeModelExhaustedError as e:
                 if e.soonest_retry:
@@ -1492,6 +1740,7 @@ async def _resume_research_loop_after_tier3(self) -> None:
         finally:
             self._running = False
             self._state.is_running = False
+            token_tracker.stop_timer()
             
             shared_training_memory.insights.clear()
             shared_training_memory.submission_count = 0
@@ -1546,42 +1795,224 @@ async def skip_critique_phase(self) -> bool:
         
         return await self._paper_compiler.skip_critique_phase()
     
+    # ========================================================================
+    # PHASE 0: TOPIC EXPLORATION (Pre-Selection Candidate Brainstorm)
+    # ========================================================================
+    
+    async def _topic_exploration_phase(self) -> str:
+        """
+        Run a temporary AggregatorCoordinator to collect candidate brainstorm questions.
+        Polls every 2s until TARGET_CANDIDATES are accepted, MAX_CONSECUTIVE_REJECTIONS is hit, or the run stops.
+        Shared training memory is pointed at a temp file for the run; the original paths are always restored.
+        
+        Returns:
+            Formatted candidate text for the topic selector ("" on error or no candidates). Re-raises FreeModelExhaustedError.
+        """
+        api_client_manager.set_autonomous_phase("topic_exploration")
+        self._state.current_tier = "tier1_aggregation"
+        
+        TARGET_CANDIDATES = 5
+        MAX_CONSECUTIVE_REJECTIONS = 15
+        
+        await self._broadcast("topic_exploration_started", {
+            "target": TARGET_CANDIDATES,
+            "resumed_count": 0
+        })
+        
+        logger.info(f"Starting topic exploration phase (target: {TARGET_CANDIDATES} candidates)")
+        
+        # Build the exploration user prompt for the aggregator
+        from backend.autonomous.prompts.topic_exploration_prompts import build_exploration_user_prompt
+        
+        brainstorms_summary = await autonomous_rag_manager.get_all_brainstorms_summary()
+        papers_summary = await autonomous_rag_manager.get_all_papers_summary()
+        
+        exploration_prompt = build_exploration_user_prompt(
+            user_research_prompt=self._user_research_prompt,
+            brainstorms_summary=brainstorms_summary,
+            papers_summary=papers_summary
+        )
+        
+        # Create a temp exploration database file in the brainstorms directory
+        exploration_db_path = brainstorm_memory._base_dir / "exploration_candidates.txt"
+        exploration_db_path.parent.mkdir(parents=True, exist_ok=True)
+        
+        # Clear any stale exploration DB
+        if exploration_db_path.exists():
+            exploration_db_path.unlink()
+        
+        # Remember the real shared-training paths so `finally` can always restore them
+        original_shared_path = system_config.shared_training_file
+        original_memory_path = shared_training_memory.file_path
+        exploration_aggregator = None
+        
+        try:
+            # Override inside `try`: if the reload raises, `finally` still restores the paths
+            system_config.shared_training_file = str(exploration_db_path)
+            shared_training_memory.file_path = exploration_db_path
+            await shared_training_memory.reload_insights_from_current_path()
+            exploration_aggregator = AggregatorCoordinator()
+            
+            await exploration_aggregator.initialize(
+                user_prompt=exploration_prompt,
+                submitter_configs=self._submitter_configs,
+                validator_model=self._validator_model,
+                user_files=[],
+                skip_stats_load=True,
+                validator_context_window=self._validator_context,
+                validator_max_tokens=self._validator_max_tokens,
+                validator_provider=self._validator_provider,
+                validator_openrouter_provider=self._validator_openrouter_provider,
+                validator_lm_studio_fallback=self._validator_lm_studio_fallback,
+                enable_cleanup_review=False
+            )
+            
+            # Set WebSocket broadcaster so aggregator events flow through
+            if self._broadcast_callback:
+                exploration_aggregator.websocket_broadcaster = self._broadcast_callback
+            
+            # Start the aggregator (parallel submitters + batch validator)
+            await exploration_aggregator.start()
+            logger.info("Exploration aggregator started with parallel submitters")
+            
+            last_acceptances = 0
+            last_rejections = 0
+            consecutive_rejections = 0
+            
+            while self._running and not self._stop_event.is_set():
+                status = await exploration_aggregator.get_status()
+                current_acceptances = status.total_acceptances
+                current_rejections = status.total_rejections
+                
+                # Track new acceptances (any acceptance resets the rejection streak)
+                if current_acceptances > last_acceptances:
+                    consecutive_rejections = 0
+                    last_acceptances = current_acceptances
+                    
+                    await self._broadcast("topic_exploration_progress", {
+                        "accepted": current_acceptances,
+                        "target": TARGET_CANDIDATES,
+                        "total_attempts": current_acceptances + current_rejections
+                    })
+                    
+                    await self._save_workflow_state(
+                        tier="tier1_aggregation",
+                        phase="topic_exploration"
+                    )
+                    
+                    logger.info(f"TopicExploration: {current_acceptances}/{TARGET_CANDIDATES} candidates accepted")
+                    
+                    if current_acceptances >= TARGET_CANDIDATES:
+                        logger.info(f"TopicExploration: Target of {TARGET_CANDIDATES} candidates reached")
+                        break
+                
+                # Track consecutive rejections for safety valve
+                if current_rejections > last_rejections:
+                    new_rejections = current_rejections - last_rejections
+                    consecutive_rejections += new_rejections
+                    last_rejections = current_rejections
+                    
+                    if consecutive_rejections >= MAX_CONSECUTIVE_REJECTIONS:
+                        logger.warning(f"TopicExploration: {consecutive_rejections} consecutive rejections - proceeding with {current_acceptances} candidates")
+                        break
+                
+                await asyncio.sleep(2)
+            
+            # Stop the exploration aggregator
+            await exploration_aggregator.stop()
+            
+            # Read accepted candidates from the exploration database
+            candidates_text = ""
+            if exploration_db_path.exists():
+                async with aiofiles.open(exploration_db_path, 'r', encoding='utf-8') as f:
+                    raw_content = await f.read()
+                
+                if raw_content.strip():
+                    # Entries are taken to be blank-line separated; number each one for the topic selector
+                    entries = [e.strip() for e in raw_content.split("\n\n") if e.strip()]
+                    lines = [
+                        "ACCEPTED CANDIDATE BRAINSTORM QUESTIONS:",
+                        "=" * 60
+                    ]
+                    for i, entry in enumerate(entries, 1):
+                        lines.append(f"\nCandidate #{i}:")
+                        lines.append(f"  {entry}")
+                        lines.append("-" * 40)
+                    candidates_text = "\n".join(lines)
+            
+            await self._broadcast("topic_exploration_complete", {
+                "accepted_count": last_acceptances,
+                "total_attempts": last_acceptances + last_rejections
+            })
+            
+            logger.info(f"Topic exploration complete: {last_acceptances} candidates accepted")
+            
+            return candidates_text
+            
+        except FreeModelExhaustedError:
+            # Best-effort stop, then propagate so the caller's FreeModelExhaustedError handler runs
+            if exploration_aggregator:
+                try:
+                    await exploration_aggregator.stop()
+                except Exception as stop_err:
+                    logger.warning(f"Topic exploration: aggregator stop failed during cleanup: {stop_err}")
+            raise
+        except Exception as e:
+            logger.error(f"Topic exploration phase error: {e}")
+            if exploration_aggregator:
+                try:
+                    await exploration_aggregator.stop()
+                except Exception as stop_err:
+                    logger.warning(f"Topic exploration: aggregator stop failed during cleanup: {stop_err}")
+            return ""
+        finally:
+            # Restore original shared training path
+            system_config.shared_training_file = original_shared_path
+            shared_training_memory.file_path = original_memory_path
+            
+            # Clear in-memory data to prevent cross-contamination
+            async with shared_training_memory._lock:
+                shared_training_memory.insights.clear()
+                shared_training_memory.submission_count = 0
+                shared_training_memory.last_ragged_submission_count = 0
+            logger.info("Exploration: Restored shared_training_memory state")
+            
+            # Clean up exploration database file
+            if exploration_db_path.exists():
+                try:
+                    exploration_db_path.unlink()
+                except Exception as cleanup_err:
+                    logger.warning(f"Topic exploration: could not remove temp candidates file: {cleanup_err}")
+    
     # ========================================================================
     # PHASE 1: TOPIC SELECTION
     # ========================================================================
     
-    async def _topic_selection_loop(self) -> Optional[str]:
+    async def _topic_selection_loop(self, candidate_questions: str = "") -> Optional[str]:
         """
-        Topic selection with validation.
+        Topic selection with validation. Retries indefinitely with rejection
+        feedback until a topic is accepted or stop event is set.
         
         Returns:
-            topic_id if successful, None if failed
+            topic_id if successful, None only if stopped
         """
-        # Set tier state immediately when entering topic selection
-        # This ensures force_tier3 can reliably detect we're in the Tier 1 phase
-        # (Previously, state remained "idle" until aggregation loop started, causing race conditions)
         self._state.current_tier = "tier1_aggregation"
         
-        # Set phase for API logging
         api_client_manager.set_autonomous_phase("topic_selection")
         
-        max_attempts = system_config.autonomous_topic_selection_retry_limit
-        
-        for attempt in range(max_attempts):
-            if self._stop_event.is_set():
-                return None
-            
-            logger.info(f"Topic selection attempt {attempt + 1}/{max_attempts}")
+        attempt = 0
+        while not self._stop_event.is_set():
+            attempt += 1
+            logger.info(f"Topic selection attempt {attempt}")
             
-            # Get context
             brainstorms_summary = await autonomous_rag_manager.get_all_brainstorms_summary()
             papers_summary = await autonomous_rag_manager.get_all_papers_summary()
             
-            # Generate topic selection
             submission = await self._topic_selector.select_topic(
                 user_research_prompt=self._user_research_prompt,
                 brainstorms_summary=brainstorms_summary,
-                papers_summary=papers_summary
+                papers_summary=papers_summary,
+                candidate_questions=candidate_questions
             )
             
             if submission is None:
@@ -1589,7 +2020,6 @@ async def _topic_selection_loop(self) -> Optional[str]:
                 await asyncio.sleep(5)
                 continue
             
-            # Validate
             validation = await self._topic_validator.validate(
                 submission=submission,
                 user_research_prompt=self._user_research_prompt,
@@ -1598,12 +2028,10 @@ async def _topic_selection_loop(self) -> Optional[str]:
             )
             
             if validation.decision == "accept":
-                # Check if we should stop before creating new topic
                 if self._stop_event.is_set():
                     logger.info("Topic selection cancelled - stop event set after validation")
                     return None
                 
-                # Execute topic selection
                 topic_id = await self._execute_topic_selection(submission)
                 
                 if topic_id:
@@ -1614,7 +2042,6 @@ async def _topic_selection_loop(self) -> Optional[str]:
                     })
                     return topic_id
             else:
-                # Handle rejection
                 await self._topic_selector.handle_rejection(submission, validation.reasoning)
                 await research_metadata.increment_stat("topic_selection_rejections")
                 
@@ -1624,7 +2051,6 @@ async def _topic_selection_loop(self) -> Optional[str]:
                 
                 logger.info(f"Topic selection rejected: {validation.reasoning[:100]}...")
         
-        logger.error(f"Topic selection failed after {max_attempts} attempts")
         return None
     
     async def _execute_topic_selection(
@@ -1698,6 +2124,148 @@ async def _execute_topic_selection(
             logger.error(f"Error executing topic selection: {e}")
             return None
     
+    async def _brainstorm_continuation_decision(self) -> str:
+        """
+        Decide whether to write another paper from the current brainstorm or move on.
+        Uses topic selector model for submission and topic validator for validation.
+
+        NO RAG BY DESIGN: This is a strategic decision using only brainstorm SUMMARY
+        (not full DB) and prior paper titles/abstracts/outlines from this brainstorm.
+        Full brainstorm content is not needed to decide "write another or move on" —
+        the summary + completed paper metadata is sufficient context.
+
+        Loops until the validator accepts a proposal or the stop event is set; each
+        rejection's reasoning is passed into the next proposal prompt.
+
+        Returns:
+            "write_another_paper" or "move_on" ("move_on" if stopped before acceptance)
+
+        Raises:
+            FreeModelExhaustedError: propagated unchanged from the proposal/validation step.
+        """
+        from backend.shared.json_parser import parse_json
+        from backend.autonomous.prompts.paper_continuation_prompts import (
+            build_continuation_decision_prompt,
+            build_continuation_validation_prompt
+        )
+
+        api_client_manager.set_autonomous_phase("brainstorm_continuation")
+        await self._broadcast("brainstorm_continuation_started", {
+            "topic_id": self._current_topic_id,
+            "papers_written": self._brainstorm_paper_count
+        })
+
+        metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
+        topic_prompt = metadata.topic_prompt if metadata else ""
+        brainstorm_summary = await autonomous_rag_manager.get_brainstorm_summary(
+            self._current_topic_id
+        )
+
+        # Per prior paper: title, abstract, and outline text ("" when no outline file exists).
+        papers_from_brainstorm = await research_metadata.get_papers_by_brainstorm(
+            self._current_topic_id
+        )
+        papers_context = []
+        for p in papers_from_brainstorm:
+            paper_id = p.get("paper_id")
+            outline_text = ""
+            if paper_id:
+                outline_path = paper_library.get_outline_path(paper_id)
+                if os.path.exists(outline_path):
+                    async with aiofiles.open(outline_path, "r", encoding="utf-8") as f:
+                        outline_text = await f.read()
+            papers_context.append({
+                "title": p.get("title", "N/A"),
+                "abstract": p.get("abstract", "N/A"),
+                "outline": outline_text
+            })
+
+        attempt = 0
+        rejection_context = ""
+        while not self._stop_event.is_set():
+            attempt += 1
+            logger.info(f"Brainstorm continuation decision attempt {attempt}")
+
+            prompt = build_continuation_decision_prompt(
+                user_research_prompt=self._user_research_prompt,
+                topic_prompt=topic_prompt,
+                brainstorm_summary=brainstorm_summary,
+                papers_from_brainstorm=papers_context,
+                papers_written_count=self._brainstorm_paper_count,
+                rejection_context=rejection_context
+            )
+
+            task_id = f"auto_cd_{self._topic_selector.task_sequence:03d}"
+            self._topic_selector.task_sequence += 1
+            if self._topic_selector.task_tracking_callback:
+                self._topic_selector.task_tracking_callback("started", task_id)
+
+            try:
+                response = await api_client_manager.generate_completion(
+                    task_id=task_id,
+                    role_id="autonomous_topic_selector",
+                    model=self._topic_selector.model_id,
+                    messages=[{"role": "user", "content": prompt}],
+                    temperature=0.0,
+                    max_tokens=self._topic_selector.max_output_tokens
+                )
+
+                # The model call has returned, so close the task tracker entry before
+                # parsing; a parse failure must not leave the task marked as started.
+                if self._topic_selector.task_tracking_callback:
+                    self._topic_selector.task_tracking_callback("completed", task_id)
+
+                # Fall back to the message's "reasoning" field when "content" is empty.
+                msg = response.get("choices", [{}])[0].get("message", {})
+                content = msg.get("content") or msg.get("reasoning") or ""
+                result = parse_json(content)
+                if not isinstance(result, dict):
+                    raise ValueError("Continuation decision response is not a JSON object")
+                decision = result.get("decision", "move_on")
+                # A null or non-string "reasoning" would break the slicing further down.
+                reasoning = str(result.get("reasoning") or "")
+                if decision not in ("write_another_paper", "move_on"):
+                    logger.warning(f"Invalid continuation decision: {decision}, defaulting to move_on")
+                    decision = "move_on"
+                proposed = {"decision": decision, "reasoning": reasoning}
+                validation = await self._topic_validator.validate(
+                    submission=TopicSelectionSubmission(
+                        action="new_topic",
+                        topic_prompt=f"[CONTINUATION DECISION: {decision}]",
+                        reasoning=reasoning[:200]
+                    ),
+                    user_research_prompt=self._user_research_prompt,
+                    brainstorms_summary=await autonomous_rag_manager.get_all_brainstorms_summary(),
+                    papers_summary=await autonomous_rag_manager.get_all_papers_summary(),
+                    override_prompt=build_continuation_validation_prompt(
+                        user_research_prompt=self._user_research_prompt,
+                        topic_prompt=topic_prompt,
+                        brainstorm_summary=brainstorm_summary,
+                        papers_from_brainstorm=papers_context,
+                        papers_written_count=self._brainstorm_paper_count,
+                        proposed_decision=proposed
+                    )
+                )
+
+                if validation.decision == "accept":
+                    logger.info(f"Brainstorm continuation decision accepted: {decision}")
+                    await self._broadcast("brainstorm_continuation_decided", {
+                        "topic_id": self._current_topic_id,
+                        "decision": decision,
+                        "paper_count": self._brainstorm_paper_count,
+                        "reasoning": reasoning[:300]
+                    })
+                    return decision
+                rejection_context = validation.reasoning
+                logger.info(f"Continuation decision rejected: {validation.reasoning[:100]}...")
+            except FreeModelExhaustedError:
+                raise
+            except Exception as e:
+                logger.error(f"Error in continuation decision attempt {attempt}: {e}")
+                await asyncio.sleep(3)
+
+        return "move_on"
+
     async def _pre_brainstorm_reference_selection(self) -> List[str]:
         """
         Select reference papers BEFORE brainstorming begins.
@@ -1895,6 +2463,13 @@ async def paper_model_tracking_callback(model_id: str) -> None:
             if self._broadcast_callback:
                 self._brainstorm_aggregator.websocket_broadcaster = self._broadcast_callback
             
+            # Check if manual override was triggered during initialization
+            # (force_paper_writing() can fire while RAG ingestion is in progress)
+            if self._manual_paper_writing_triggered:
+                logger.info("Manual override detected during initialization - skipping aggregator start")
+                self._manual_paper_writing_triggered = False
+                return True
+            
             # Start aggregator
             await self._brainstorm_aggregator.start()
             logger.info(f"Aggregator started for brainstorm {self._current_topic_id}")
@@ -1937,6 +2512,11 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                 # Track cleanup removals for status display
                 if current_cleanup_removals != self._cleanup_removals:
                     self._cleanup_removals = current_cleanup_removals
+                    # Update brainstorm metadata with live count (accounts for prune)
+                    await brainstorm_memory.update_metadata(
+                        self._current_topic_id,
+                        submission_count=status.shared_training_size
+                    )
                 
                 # Track new acceptances/rejections
                 if current_acceptances > last_acceptances:
@@ -1948,10 +2528,10 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                     # Increment total submissions accepted stat for acceptance rate calculation
                     await research_metadata.increment_stat("total_submissions_accepted", new_acceptances)
                     
-                    # Update brainstorm metadata
+                    # Update brainstorm metadata with live count (accounts for prune)
                     await brainstorm_memory.update_metadata(
                         self._current_topic_id,
-                        submission_count=current_acceptances
+                        submission_count=status.shared_training_size
                     )
                     
                     # NOTE: Don't broadcast here - the aggregator already broadcasts 
@@ -1964,15 +2544,15 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                     if current_acceptances % 5 == 0:
                         await self._save_workflow_state(tier="tier1_aggregation")
                     
-                    # Check for hard limit of 80 acceptances (FORCE paper writing, skip completion review)
-                    if self._acceptance_count >= 80:
-                        logger.info(f"Hard limit of 80 acceptances reached for {self._current_topic_id}. Forcing paper writing transition.")
+                    # Check for hard limit of 30 acceptances (FORCE paper writing, skip completion review)
+                    if self._acceptance_count >= 30:
+                        logger.info(f"Hard limit of 30 acceptances reached for {self._current_topic_id}. Forcing paper writing transition.")
                         
                         # Broadcast hard limit reached event
                         await self._broadcast("brainstorm_hard_limit_reached", {
                             "topic_id": self._current_topic_id,
                             "acceptance_count": self._acceptance_count,
-                            "message": "Brainstorm hard limit of 80 acceptances reached. Forcing paper writing."
+                            "message": "Brainstorm hard limit of 30 acceptances reached. Forcing paper writing."
                         })
                         
                         # Mark brainstorm complete
@@ -2004,6 +2584,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                 if self._manual_paper_writing_triggered:
                     logger.info("Manual override detected - transitioning to paper writing")
                     self._manual_paper_writing_triggered = False
+                    await self._brainstorm_aggregator.stop()
                     return True
                 
                 # Track consecutive rejections and increment total rejections stat
@@ -2020,7 +2601,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                     # individual 'submission_rejected' events with submitter_id per submission
                     
                     # Check for hard limit of 10 consecutive rejections (with minimum 5 acceptances)
-                    # This FORCES paper writing, similar to the 80 acceptance hard limit
+                    # This FORCES paper writing, similar to the 30 acceptance hard limit
                     if self._consecutive_rejections >= 10 and self._acceptance_count >= 5:
                         logger.info(f"Hard limit: {self._consecutive_rejections} consecutive rejections with {self._acceptance_count} acceptances. Forcing paper writing.")
                         
@@ -2389,7 +2970,7 @@ async def _run_completion_review(self) -> bool:
     # PHASE 3: PAPER COMPILATION
     # ========================================================================
     
-    async def _paper_compilation_workflow(self) -> bool:
+    async def _paper_compilation_workflow(self, skip_reference_selection: bool = False) -> bool:
         """
         Complete paper compilation workflow.
         Order: Reference selection -> Title -> Body -> Conclusion -> Intro -> Abstract
@@ -2397,6 +2978,10 @@ async def _paper_compilation_workflow(self) -> bool:
         Supports RESUME: If self._current_paper_id is already set, skips title/reference
         selection and continues paper compilation where it left off.
         
+        Args:
+            skip_reference_selection: If True, skip reference selection (for paper 2/3 
+                from same brainstorm - reuses existing references).
+        
         Returns:
             True if paper was successfully compiled, False otherwise.
         """
@@ -2445,14 +3030,37 @@ async def _paper_compilation_workflow(self) -> bool:
             })
         else:
             # FRESH START: Run full title/reference selection workflow
-            # Step 1: Reference selection (if papers exist)
-            reference_paper_ids = await self._reference_selection_workflow()
+            # Step 1: Reference selection (if papers exist) - skip for continuation papers
+            if skip_reference_selection:
+                reference_paper_ids = self._current_reference_papers
+                logger.info(f"Skipping reference selection (continuation paper), using {len(reference_paper_ids)} existing references")
+            else:
+                reference_paper_ids = await self._reference_selection_workflow()
+            
+            if self._stop_event.is_set():
+                return False
+            
+            # Step 2: Paper title exploration (collect 5 candidate titles)
+            metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
+            topic_prompt = metadata.topic_prompt if metadata else ""
+            brainstorm_summary = await autonomous_rag_manager.get_brainstorm_summary(
+                self._current_topic_id
+            )
+            existing_papers = await research_metadata.get_papers_by_brainstorm(
+                self._current_topic_id
+            )
+            
+            candidate_titles = await self._paper_title_exploration_phase(
+                topic_prompt=topic_prompt,
+                brainstorm_summary=brainstorm_summary,
+                existing_papers=existing_papers
+            )
             
             if self._stop_event.is_set():
                 return False
             
-            # Step 2: Title selection
-            paper_title = await self._paper_title_selection()
+            # Step 3: Final title selection (informed by candidate titles)
+            paper_title = await self._paper_title_selection(candidate_titles=candidate_titles)
             
             if paper_title is None:
                 logger.error("Paper title selection failed")
@@ -2512,7 +3120,7 @@ async def _paper_compilation_workflow(self) -> bool:
             title=paper_title,
             content=paper_content,
             outline=final_outline or "[Outline not available]",
-            reference_paper_ids=reference_paper_ids
+            reference_paper_ids=reference_paper_ids + self._current_brainstorm_paper_ids
         )
         
         return True
@@ -2601,8 +3209,8 @@ async def _reference_selection_workflow(self) -> List[str]:
         logger.info(f"Additional reference selection: {len(additional_ids)} new + {len(already_selected)} existing = {len(combined)} total")
         return combined
     
-    async def _paper_title_selection(self) -> Optional[str]:
-        """Select paper title."""
+    async def _paper_title_selection(self, candidate_titles: str = "") -> Optional[str]:
+        """Select paper title, optionally informed by candidate titles from exploration."""
         metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
         if metadata is None:
             return None
@@ -2623,11 +3231,198 @@ async def _paper_title_selection(self) -> Optional[str]:
             topic_prompt=metadata.topic_prompt,
             brainstorm_summary=brainstorm_summary,
             existing_papers_from_brainstorm=existing_papers,
+            candidate_titles=candidate_titles,
             stop_event=self._stop_event
         )
         
         return title
     
+    async def _paper_title_exploration_phase(
+        self,
+        topic_prompt: str = "",
+        brainstorm_summary: str = "",
+        existing_papers: Optional[list] = None,
+        reference_papers: Optional[list] = None
+    ) -> str:
+        """
+        Paper title exploration phase using the full Part 1 aggregator infrastructure.
+        Collects 5 validated candidate titles (fewer after 15 consecutive rejections).
+        Modeled on _topic_exploration_phase().
+
+        While the phase runs, system_config.shared_training_file and
+        shared_training_memory.file_path point at a temporary title-candidates file.
+        On every exit both are restored, the in-memory insights are cleared, and the
+        temporary file is deleted.
+
+        Args:
+            topic_prompt: Brainstorm topic, Tier 3 context, or chapter brief.
+            brainstorm_summary: Summary of the source material the paper will draw from.
+            existing_papers: Completed papers that new title must not duplicate.
+            reference_papers: Reference papers informing this paper.
+
+        Returns:
+            Formatted candidate titles string for injection into the final title
+            selection prompt; "" when no candidate file content exists or on error.
+
+        Raises:
+            FreeModelExhaustedError: re-raised after the aggregator has been stopped.
+        """
+        api_client_manager.set_autonomous_phase("paper_title_exploration")
+
+        TARGET_CANDIDATES = 5
+        MAX_CONSECUTIVE_REJECTIONS = 15
+
+        await self._broadcast("paper_title_exploration_started", {
+            "target": TARGET_CANDIDATES,
+            "resumed_count": 0
+        })
+        logger.info(f"Starting paper title exploration phase (target: {TARGET_CANDIDATES} candidates)")
+
+        # Build the exploration user prompt for the aggregator
+        from backend.autonomous.prompts.paper_title_exploration_prompts import build_title_exploration_user_prompt
+
+        exploration_prompt = build_title_exploration_user_prompt(
+            user_research_prompt=self._user_research_prompt,
+            topic_prompt=topic_prompt,
+            brainstorm_summary=brainstorm_summary,
+            existing_papers_from_brainstorm=existing_papers or [],
+            reference_papers=reference_papers
+        )
+
+        # Create a temp title candidates database file in the brainstorms directory
+        topic_suffix = self._current_topic_id or "tier3"
+        title_db_path = brainstorm_memory._base_dir / f"title_candidates_{topic_suffix}.txt"
+        title_db_path.parent.mkdir(parents=True, exist_ok=True)
+
+        # Clear any stale title candidates DB
+        if title_db_path.exists():
+            title_db_path.unlink()
+
+        # Capture the real paths first; the override itself happens inside the try
+        # block so that a failure while switching over still restores them.
+        original_shared_path = system_config.shared_training_file
+        original_memory_path = shared_training_memory.file_path
+        exploration_aggregator = None
+
+        try:
+            # Override shared training memory path for title exploration
+            system_config.shared_training_file = str(title_db_path)
+            shared_training_memory.file_path = title_db_path
+            await shared_training_memory.reload_insights_from_current_path()
+
+            exploration_aggregator = AggregatorCoordinator()
+            await exploration_aggregator.initialize(
+                user_prompt=exploration_prompt,
+                submitter_configs=self._submitter_configs,
+                validator_model=self._validator_model,
+                user_files=[],
+                skip_stats_load=True,
+                validator_context_window=self._validator_context,
+                validator_max_tokens=self._validator_max_tokens,
+                validator_provider=self._validator_provider,
+                validator_openrouter_provider=self._validator_openrouter_provider,
+                validator_lm_studio_fallback=self._validator_lm_studio_fallback,
+                enable_cleanup_review=False
+            )
+
+            if self._broadcast_callback:
+                exploration_aggregator.websocket_broadcaster = self._broadcast_callback
+
+            await exploration_aggregator.start()
+            logger.info("Title exploration aggregator started with parallel submitters")
+
+            last_acceptances = 0
+            last_rejections = 0
+            consecutive_rejections = 0
+
+            while self._running and not self._stop_event.is_set():
+                status = await exploration_aggregator.get_status()
+                current_acceptances = status.total_acceptances
+                current_rejections = status.total_rejections
+
+                if current_acceptances > last_acceptances:
+                    consecutive_rejections = 0
+                    last_acceptances = current_acceptances
+
+                    await self._broadcast("paper_title_exploration_progress", {
+                        "accepted": current_acceptances,
+                        "target": TARGET_CANDIDATES,
+                        "total_attempts": current_acceptances + current_rejections
+                    })
+
+                    await self._save_workflow_state(tier=self._state.current_tier, phase="paper_title_exploration")
+
+                    logger.info(f"TitleExploration: {current_acceptances}/{TARGET_CANDIDATES} candidates accepted")
+
+                    if current_acceptances >= TARGET_CANDIDATES:
+                        logger.info(f"TitleExploration: Target of {TARGET_CANDIDATES} candidates reached")
+                        break
+
+                if current_rejections > last_rejections:
+                    new_rejections = current_rejections - last_rejections
+                    consecutive_rejections += new_rejections
+                    last_rejections = current_rejections
+
+                    if consecutive_rejections >= MAX_CONSECUTIVE_REJECTIONS:
+                        logger.warning(f"TitleExploration: {consecutive_rejections} consecutive rejections - proceeding with {current_acceptances} candidates")
+                        break
+
+                await asyncio.sleep(2)
+
+            await exploration_aggregator.stop()
+            exploration_aggregator = None  # stopped cleanly; nothing left for the finally block
+
+            # Read accepted candidates from the title candidates database
+            candidates_text = ""
+            if title_db_path.exists():
+                async with aiofiles.open(title_db_path, 'r', encoding='utf-8') as f:
+                    raw_content = await f.read()
+
+                if raw_content.strip():
+                    entries = [e.strip() for e in raw_content.split("\n\n") if e.strip()]
+                    lines = ["VALIDATED CANDIDATE TITLES:", "=" * 60]
+                    for i, entry in enumerate(entries, 1):
+                        lines.append(f"\nCandidate Title #{i}:")
+                        lines.append(f"  {entry}")
+                        lines.append("-" * 40)
+                    candidates_text = "\n".join(lines)
+
+            await self._broadcast("paper_title_exploration_complete", {
+                "accepted_count": last_acceptances,
+                "total_attempts": last_acceptances + last_rejections
+            })
+
+            logger.info(f"Paper title exploration complete: {last_acceptances} candidates accepted")
+            return candidates_text
+        except FreeModelExhaustedError:
+            raise
+        except Exception as e:
+            logger.error(f"Paper title exploration phase error: {e}")
+            return ""
+        finally:
+            # Best-effort stop for every exit that skipped the normal stop above
+            # (errors and cancellation); a stop failure must not mask the real error.
+            if exploration_aggregator is not None:
+                try:
+                    await exploration_aggregator.stop()
+                except Exception as stop_error:
+                    logger.warning(f"TitleExploration: aggregator stop failed: {stop_error}")
+
+            system_config.shared_training_file = original_shared_path
+            shared_training_memory.file_path = original_memory_path
+
+            async with shared_training_memory._lock:
+                shared_training_memory.insights.clear()
+                shared_training_memory.submission_count = 0
+                shared_training_memory.last_ragged_submission_count = 0
+            logger.info("TitleExploration: Restored shared_training_memory state")
+
+            if title_db_path.exists():
+                try:
+                    title_db_path.unlink()
+                except Exception as unlink_error:
+                    logger.warning(f"TitleExploration: could not delete {title_db_path}: {unlink_error}")
+
     async def _compile_paper(
         self,
         paper_id: str,
@@ -2654,6 +3449,18 @@ async def _compile_paper(
         else:
             logger.info(f"Compiling paper: {paper_title}")
         
+        # Propagate compiler context/token settings to system_config BEFORE creating CompilerCoordinator.
+        # The compiler modules read from system_config at init time; only the manual /api/compiler/start
+        # route sets these, so autonomous mode must do it explicitly.
+        system_config.compiler_validator_context_window = self._validator_context
+        system_config.compiler_validator_max_output_tokens = self._validator_max_tokens
+        system_config.compiler_high_context_context_window = self._high_context_context
+        system_config.compiler_high_context_max_output_tokens = self._high_context_max_tokens
+        system_config.compiler_high_param_context_window = self._high_param_context
+        system_config.compiler_high_param_max_output_tokens = self._high_param_max_tokens
+        system_config.compiler_critique_submitter_context_window = self._critique_submitter_context
+        system_config.compiler_critique_submitter_max_tokens = self._critique_submitter_max_tokens
+        
         # Initialize compiler for this paper
         self._paper_compiler = CompilerCoordinator()
         
@@ -2696,8 +3503,10 @@ async def _compile_paper(
             
             # Enable autonomous section order constraint
             self._paper_compiler.enable_autonomous_mode()
-            
-            # CRITICAL: Restore the saved phase when resuming
+            self._paper_compiler._current_topic_id = self._current_topic_id
+            self._paper_compiler._current_reference_paper_ids = list(dict.fromkeys(
+                reference_paper_ids + self._current_brainstorm_paper_ids
+            ))
             # enable_autonomous_mode() sets phase to "body" by default
             # But when resuming, we need to continue from where we left off
             if is_resume and resume_phase:
@@ -2764,6 +3573,21 @@ async def _compile_paper(
                         logger.warning(f"Reference paper not found: {paper_path}")
                 logger.info("All reference papers loaded into compiler RAG")
             
+            # Load prior brainstorm papers as auto-references (for paper 2/3 from same brainstorm)
+            if self._current_brainstorm_paper_ids:
+                logger.info(f"Loading {len(self._current_brainstorm_paper_ids)} prior brainstorm papers as auto-references")
+                for bp_id in self._current_brainstorm_paper_ids:
+                    bp_path = paper_library.get_paper_path(bp_id)
+                    if os.path.exists(bp_path):
+                        await rag_manager.add_document(
+                            bp_path,
+                            chunk_sizes=[512],
+                            is_user_file=True
+                        )
+                        logger.info(f"Prior brainstorm paper loaded as auto-reference: {bp_id}")
+                    else:
+                        logger.warning(f"Prior brainstorm paper not found: {bp_path}")
+            
             # Start compiler
             await self._paper_compiler.start()
             logger.info(f"Compiler started for paper {paper_id}")
@@ -2974,11 +3798,9 @@ async def _handle_paper_completion(
         
         # Only clear paper state if marking as complete
         if mark_complete:
-            # Clear paper-specific workflow state (paper is complete)
+            self._last_completed_paper_id = self._current_paper_id
             self._current_paper_id = None
             self._current_paper_title = None
-            
-            # Clear per-paper model tracking (will be re-initialized for next paper)
             self._current_paper_tracker = None
             
             await self._save_workflow_state(tier=None, phase=None)
@@ -3002,7 +3824,6 @@ async def _auto_generate_paper_critique(
         from backend.shared.critique_prompts import build_critique_prompt
         from backend.shared.critique_memory import save_critique
         from backend.shared.api_client_manager import api_client_manager
-        from backend.shared.json_parser import parse_json
         from backend.shared.utils import count_tokens
         from backend.shared.models import PaperCritique, ModelConfig
         import uuid
@@ -3080,21 +3901,9 @@ async def _auto_generate_paper_critique(
                 logger.error(f"Empty response from validator model for paper {paper_id}")
                 return
             
-            # Parse JSON
-            try:
-                critique_data = parse_json(response_content)
-            except Exception as e:
-                logger.warning(f"Failed to parse critique JSON for paper {paper_id}: {e}")
-                # Create fallback structure
-                critique_data = {
-                    "novelty_rating": 0,
-                    "novelty_feedback": "Unable to parse structured response",
-                    "correctness_rating": 0,
-                    "correctness_feedback": "Unable to parse structured response",
-                    "impact_rating": 0,
-                    "impact_feedback": "Unable to parse structured response",
-                    "full_critique": response_content
-                }
+            # Parse JSON with lenient fallback for truncated responses
+            from backend.shared.critique_prompts import parse_critique_response
+            critique_data = parse_critique_response(response_content)
             
             # Extract ratings
             novelty = critique_data.get("novelty_rating", 0)
@@ -3998,9 +4807,8 @@ async def _tier3_title_selection(
         """
         Select a title for the Tier 3 final answer paper.
         The title should directly and transparently answer the user's question.
+        Runs paper title exploration first to collect 5 candidate titles.
         """
-        from backend.autonomous.prompts.final_answer_prompts import build_final_paper_title_prompt
-        
         # Get reference paper details
         reference_details = []
         for paper_id in reference_papers:
@@ -4013,12 +4821,27 @@ async def _tier3_title_selection(
                     "abstract": metadata.abstract
                 })
         
-        # Use the existing title selector with special context
+        # Run title exploration phase for Tier 3
+        topic_prompt = f"[TIER 3 FINAL ANSWER] Certainty: {assessment.certainty_level}"
+        brainstorm_summary = f"Known Certainties:\n{assessment.known_certainties_summary}"
+        
+        candidate_titles = await self._paper_title_exploration_phase(
+            topic_prompt=topic_prompt,
+            brainstorm_summary=brainstorm_summary,
+            existing_papers=[],
+            reference_papers=reference_details
+        )
+        
+        if self._stop_event.is_set():
+            return None
+        
+        # Use the existing title selector with special context + candidate titles
         title = await self._title_selector.select_title(
             user_research_prompt=self._user_research_prompt,
-            topic_prompt=f"[TIER 3 FINAL ANSWER] Certainty: {assessment.certainty_level}",
-            brainstorm_summary=f"Known Certainties:\n{assessment.known_certainties_summary}",
-            existing_papers_from_brainstorm=[],  # No previous papers for this "brainstorm"
+            topic_prompt=topic_prompt,
+            brainstorm_summary=brainstorm_summary,
+            existing_papers_from_brainstorm=[],
+            candidate_titles=candidate_titles,
             stop_event=self._stop_event
         )
         
@@ -4037,6 +4860,17 @@ async def _compile_tier3_paper(
         """
         logger.info(f"Compiling Tier 3 paper: {paper_title}")
         
+        # Propagate compiler context/token settings to system_config BEFORE creating CompilerCoordinator.
+        # Same as in _compile_paper_from_brainstorm — compiler modules read from system_config at init.
+        system_config.compiler_validator_context_window = self._validator_context
+        system_config.compiler_validator_max_output_tokens = self._validator_max_tokens
+        system_config.compiler_high_context_context_window = self._high_context_context
+        system_config.compiler_high_context_max_output_tokens = self._high_context_max_tokens
+        system_config.compiler_high_param_context_window = self._high_param_context
+        system_config.compiler_high_param_max_output_tokens = self._high_param_max_tokens
+        system_config.compiler_critique_submitter_context_window = self._critique_submitter_context
+        system_config.compiler_critique_submitter_max_tokens = self._critique_submitter_max_tokens
+        
         # Initialize compiler for this paper
         self._paper_compiler = CompilerCoordinator()
         
@@ -4076,6 +4910,7 @@ async def _compile_tier3_paper(
             
             # Enable autonomous mode
             self._paper_compiler.enable_autonomous_mode()
+            self._paper_compiler._current_reference_paper_ids = list(reference_paper_ids)
             
             # Clear any previous paper/outline
             await self._paper_compiler.clear_paper()
@@ -4147,13 +4982,10 @@ async def _write_volume_chapter(
         
         # Determine context based on chapter type
         if chapter.chapter_type == "introduction":
-            # Introduction is written LAST - has access to all chapters
             context = "Write the INTRODUCTION for this volume. You have access to ALL chapters."
         elif chapter.chapter_type == "conclusion":
-            # Conclusion is written second-to-last
             context = "Write the CONCLUSION for this volume. Synthesize findings from all body chapters."
         else:
-            # Gap paper - fills content gap
             context = f"Write a paper to fill this content gap: {chapter.description}"
         
         # Get reference papers (existing papers in the volume)
@@ -4162,6 +4994,36 @@ async def _write_volume_chapter(
             if ch.chapter_type == "existing_paper" and ch.paper_id
         ]
         
+        # Run title exploration for this chapter
+        ref_details = []
+        for pid in reference_ids:
+            meta = await paper_library.get_metadata(pid)
+            if meta:
+                ref_details.append({"paper_id": pid, "title": meta.title, "abstract": meta.abstract})
+        
+        candidate_titles = await self._paper_title_exploration_phase(
+            topic_prompt=f"[VOLUME CHAPTER: {chapter.chapter_type}] {context}",
+            brainstorm_summary=f"Known Certainties:\n{assessment.known_certainties_summary}",
+            existing_papers=[],
+            reference_papers=ref_details
+        )
+        
+        if self._stop_event.is_set():
+            return False
+        
+        # Select chapter title from candidates
+        chapter_title = await self._title_selector.select_title(
+            user_research_prompt=self._user_research_prompt,
+            topic_prompt=f"[VOLUME CHAPTER: {chapter.chapter_type}] {context}",
+            brainstorm_summary=f"Known Certainties:\n{assessment.known_certainties_summary}",
+            existing_papers_from_brainstorm=[],
+            candidate_titles=candidate_titles,
+            stop_event=self._stop_event
+        )
+        
+        if chapter_title:
+            chapter.title = chapter_title
+        
         # Compile the chapter paper
         chapter_paper_id = f"volume_ch{chapter.order:02d}_{chapter.chapter_type}"
         
@@ -4191,7 +5053,7 @@ async def _write_volume_chapter(
     async def clear_all_data(self) -> None:
         """Clear all autonomous research data.
         
-        Clears brainstorms, papers, metadata, RAG state, and session data.
+        Clears brainstorms, papers, metadata, API logs, RAG state, and session data.
         Uses graceful degradation: distinguishes critical vs non-critical failures.
         """
         # Check both internal flag and state object
@@ -4303,7 +5165,17 @@ def safe_rmtree(path: Path, max_retries: int = 5) -> bool:
             errors.append(f"Failed to clear autonomous rejection logs: {e}")
             logger.warning(errors[-1])
         
-        # Step 6: Clear RAG state (removes indexed brainstorm/paper content)
+        # Step 6: Clear autonomous API logs
+        try:
+            await autonomous_api_logger.clear_logs()
+            successes.append("Cleared autonomous API logs")
+            logger.info("Cleared autonomous API logs")
+        except Exception as e:
+            # Non-critical: API logs can be regenerated
+            errors.append(f"Failed to clear autonomous API logs: {e}")
+            logger.warning(errors[-1])
+        
+        # Step 7: Clear RAG state (removes indexed brainstorm/paper content)
         try:
             # Wait a moment for any pending RAG operations to complete
             await asyncio.sleep(0.5)
@@ -4317,7 +5189,7 @@ def safe_rmtree(path: Path, max_retries: int = 5) -> bool:
             critical_errors.append(f"Failed to clear RAG state: {e}")
             logger.error(critical_errors[-1])
         
-        # Step 7: Reset internal state
+        # Step 8: Reset internal state
         self._current_topic_id = None
         self._current_paper_id = None
         self._current_paper_title = None
@@ -4335,11 +5207,14 @@ def safe_rmtree(path: Path, max_retries: int = 5) -> bool:
         self._force_tier3_immediate = False
         self._tier3_active = False
         self._last_tier3_check_at = 0
+        self._brainstorm_paper_count = 0
+        self._current_brainstorm_paper_ids = []
+        self._last_completed_paper_id = None
         
-        # Step 8: Reset state object
+        # Step 9: Reset state object
         self._state = AutonomousResearchState()
         
-        # Step 9: Clear session manager state
+        # Step 10: Clear session manager state
         try:
             await session_manager.clear()
             successes.append("Cleared session manager state")
@@ -4389,10 +5264,11 @@ async def refresh_workflow_predictions(self) -> None:
                 tasks = list(self._paper_compiler.workflow_tasks)
                 
             else:
-                # Topic selection/idle phase - use autonomous agents' sequences
+                # Topic selection phase (exploration uses aggregator with its own predictions)
                 ts_seq = self._topic_selector.task_sequence if self._topic_selector else 0
                 tv_seq = self._topic_validator.task_sequence if self._topic_validator else 0
                 
+                # 20 slots: topic selection (submit/validate pairs)
                 for i in range(20):
                     if i % 2 == 0:
                         task_id = f"auto_ts_{ts_seq:03d}"
diff --git a/backend/autonomous/core/autonomous_rag_manager.py b/backend/autonomous/core/autonomous_rag_manager.py
index 22fc4f5..546018a 100644
--- a/backend/autonomous/core/autonomous_rag_manager.py
+++ b/backend/autonomous/core/autonomous_rag_manager.py
@@ -69,7 +69,8 @@ async def get_brainstorm_context(
         self,
         topic_id: str,
         max_tokens: int = 50000,
-        query: str = ""
+        query: str = "",
+        exclude_sources: Optional[List[str]] = None
     ) -> Tuple[str, bool]:
         """
         Get brainstorm database content for context.
@@ -82,6 +83,7 @@ async def get_brainstorm_context(
             topic_id: Topic ID to get context for
             max_tokens: Maximum tokens available for this content
             query: Query for RAG retrieval if needed (e.g., user research prompt)
+            exclude_sources: Source names to skip during RAG packing
         
         Returns:
             Tuple of (content string, used_rag boolean)
@@ -112,7 +114,8 @@ async def get_brainstorm_context(
             context_pack = await rag_manager.retrieve(
                 query=query,
                 chunk_size=rag_config.validator_chunk_size,  # 512 for consistency
-                max_tokens=max_tokens
+                max_tokens=max_tokens,
+                exclude_sources=exclude_sources
             )
             
             if context_pack and context_pack.text:
@@ -190,7 +193,8 @@ async def get_reference_papers_context(
         paper_ids: List[str],
         max_total_tokens: int = 60000,
         query: str = "",
-        include_outlines: bool = True
+        include_outlines: bool = True,
+        exclude_sources: Optional[List[str]] = None
     ) -> Tuple[str, bool]:
         """
         Get reference papers content for context.
@@ -203,6 +207,7 @@ async def get_reference_papers_context(
             paper_ids: List of paper IDs to include
             max_total_tokens: Maximum tokens for all reference papers combined
             query: Query for RAG retrieval if needed
+            exclude_sources: Source names to skip during RAG packing
         
         Returns:
             Tuple of (content string, used_rag boolean)
@@ -276,7 +281,8 @@ async def get_reference_papers_context(
         context_pack = await rag_manager.retrieve(
             query=enhanced_query,
             chunk_size=rag_config.validator_chunk_size,
-            max_tokens=max_total_tokens
+            max_tokens=max_total_tokens,
+            exclude_sources=exclude_sources
         )
         
         if context_pack and context_pack.text:
@@ -304,16 +310,31 @@ async def get_reference_papers_context(
     async def _ensure_paper_indexed(self, paper_id: str, content: str, title: str) -> None:
         """Ensure paper content is indexed in RAG for retrieval."""
         source_name = f"reference_paper_{paper_id}"
+        has_document_entry = source_name in rag_manager.document_access_order
+        has_validator_chunks = any(
+            chunk.source_file == source_name
+            for chunk in rag_manager.chunks_by_size[rag_config.validator_chunk_size]
+        )
+
+        if paper_id in self._papers_indexed and has_document_entry and has_validator_chunks:
+            return
         
         try:
-            # Check if already indexed (by checking if source exists)
-            # Add to RAG
+            # If the tracking set says this paper was indexed but its active RAG entry
+            # has been evicted, remove any partial remnants and rebuild it.
+            if paper_id in self._papers_indexed:
+                self._papers_indexed.discard(paper_id)
+
+            if has_document_entry:
+                await rag_manager.remove_document(source_name)
+
             await rag_manager.add_text(
                 content,
                 source_name,
                 chunk_sizes=rag_config.submitter_chunk_intervals,
                 is_permanent=False
             )
+            self._papers_indexed.add(paper_id)
             logger.debug(f"Indexed reference paper {paper_id}: {title}")
             
         except Exception as e:
@@ -393,6 +414,7 @@ async def prepare_compiler_context(
         
         # RAG query for retrievals
         rag_query = query or f"mathematical research paper compilation"
+        rag_exclude_sources: List[str] = []
         
         # Priority 1: Brainstorm database (highest priority after outline)
         brainstorm_budget = int(remaining_budget * 0.5)  # Allocate 50% to brainstorm
@@ -405,6 +427,13 @@ async def prepare_compiler_context(
         context["use_rag_for_brainstorm"] = used_rag
         brainstorm_tokens = count_tokens(brainstorm_content)
         remaining_budget -= brainstorm_tokens
+
+        # If brainstorm was direct-injected, exclude its RAG sources from later retrievals.
+        if brainstorm_content and not used_rag:
+            rag_exclude_sources.extend([
+                f"brainstorm_{topic_id}",
+                f"brainstorm_{topic_id}.txt"
+            ])
         
         # Priority 2: Current paper progress
         paper_tokens = count_tokens(current_paper) if current_paper else 0
@@ -415,6 +444,7 @@ async def prepare_compiler_context(
             context["current_paper"] = current_paper
             remaining_budget -= paper_tokens
             logger.debug(f"Compiler context: Paper direct injection ({paper_tokens} tokens)")
+            rag_exclude_sources.append("compiler_current_paper")
         elif paper_tokens > 0:
             # Paper doesn't fit - use RAG
             context["use_rag_for_papers"] = True
@@ -423,7 +453,8 @@ async def prepare_compiler_context(
             paper_pack = await rag_manager.retrieve(
                 query=rag_query,
                 chunk_size=rag_config.validator_chunk_size,
-                max_tokens=paper_budget
+                max_tokens=paper_budget,
+                exclude_sources=list(dict.fromkeys(rag_exclude_sources)) if rag_exclude_sources else None
             )
             
             if paper_pack and paper_pack.text:
@@ -442,7 +473,8 @@ async def prepare_compiler_context(
             ref_content, ref_used_rag = await self.get_reference_papers_context(
                 reference_paper_ids,
                 max_total_tokens=remaining_budget,
-                query=rag_query
+                query=rag_query,
+                exclude_sources=list(dict.fromkeys(rag_exclude_sources)) if rag_exclude_sources else None
             )
             context["reference_papers"] = ref_content
             context["use_rag_for_reference"] = ref_used_rag
diff --git a/backend/autonomous/memory/brainstorm_memory.py b/backend/autonomous/memory/brainstorm_memory.py
index b8a0d64..65bb4ae 100644
--- a/backend/autonomous/memory/brainstorm_memory.py
+++ b/backend/autonomous/memory/brainstorm_memory.py
@@ -168,6 +168,22 @@ async def add_paper_reference(self, topic_id: str, paper_id: str) -> Optional[Br
             await self._save_metadata(metadata)
         
         return metadata
+
+    async def remove_paper_reference(self, topic_id: str, paper_id: str) -> Optional[BrainstormMetadata]:
+        """Drop ``paper_id`` from a brainstorm's ``papers_generated`` list.
+
+        Every occurrence of the ID is removed and the metadata is saved only
+        when the ID was present. Returns the metadata (changed or not), or
+        ``None`` when ``get_metadata`` finds nothing for ``topic_id``.
+        """
+        record = await self.get_metadata(topic_id)
+        if record is None:
+            return None
+
+        if paper_id in record.papers_generated:
+            record.papers_generated = [pid for pid in record.papers_generated if pid != paper_id]
+            await self._save_metadata(record)
+        return record
     
     async def get_all_brainstorms(self) -> List[BrainstormMetadata]:
         """Get metadata for all brainstorm topics."""
@@ -279,6 +295,156 @@ async def get_submissions_list(self, topic_id: str) -> List[Dict[str, Any]]:
         
         return submissions
     
+    # ========================================================================
+    # RETROACTIVE CORRECTION OPERATIONS (used during paper compilation)
+    # ========================================================================
+    
+    async def edit_submission(self, topic_id: str, submission_number: int, new_content: str) -> bool:
+        """
+        Replace the content of one accepted submission in a brainstorm database.
+
+        The first entry numbered ``submission_number`` keeps its number, takes
+        ``new_content`` and is re-stamped with the current time; the whole file
+        is then rewritten. Returns True on success, and False when the database
+        file or the submission is missing or any step raises (errors are logged).
+        """
+        async with self._lock:
+            db_path = self._get_database_path(topic_id)
+            if not db_path.exists():
+                logger.error(f"Brainstorm database not found for edit: {topic_id}")
+                return False
+
+            try:
+                entries = await self._parse_submissions_unlocked(db_path)
+                # Only the first entry carrying the requested number is edited.
+                target = next((e for e in entries if e['number'] == submission_number), None)
+                if target is None:
+                    logger.warning(f"Submission #{submission_number} not found in brainstorm {topic_id}")
+                    return False
+
+                target['content'] = new_content
+                target['timestamp'] = datetime.now().isoformat()
+                await self._write_submissions_unlocked(db_path, entries)
+                logger.info(f"Retroactive edit: submission #{submission_number} in brainstorm {topic_id}")
+                return True
+            except Exception as exc:
+                logger.error(f"Failed to edit submission #{submission_number} in {topic_id}: {exc}")
+                return False
+    
+    async def remove_submission(self, topic_id: str, submission_number: int) -> bool:
+        """
+        Delete every entry numbered ``submission_number`` from a brainstorm database.
+
+        Surviving entries keep their numbers. When metadata exists for the topic,
+        its submission count and last-activity time are refreshed. Returns True
+        on success, and False when the database file or the submission is
+        missing or any step raises (errors are logged).
+        """
+        async with self._lock:
+            db_path = self._get_database_path(topic_id)
+            if not db_path.exists():
+                logger.error(f"Brainstorm database not found for removal: {topic_id}")
+                return False
+
+            try:
+                existing = await self._parse_submissions_unlocked(db_path)
+                kept = [entry for entry in existing if entry['number'] != submission_number]
+                if len(kept) == len(existing):
+                    logger.warning(f"Submission #{submission_number} not found in brainstorm {topic_id}")
+                    return False
+
+                await self._write_submissions_unlocked(db_path, kept)
+                metadata = await self.get_metadata(topic_id)
+                if metadata:
+                    metadata.submission_count = len(kept)
+                    metadata.last_activity = datetime.now()
+                    await self._save_metadata(metadata)
+                logger.info(f"Retroactive removal: submission #{submission_number} from brainstorm {topic_id}")
+                return True
+            except Exception as exc:
+                logger.error(f"Failed to remove submission #{submission_number} from {topic_id}: {exc}")
+                return False
+    
+    async def add_submission_retroactive(self, topic_id: str, content: str) -> Optional[int]:
+        """
+        Append a submission that was discovered during paper compilation.
+
+        The entry is numbered one above the highest number currently in the
+        database (1 when it is empty) and stamped with the current time. When
+        metadata exists for the topic, its submission count and last-activity
+        time are refreshed. Returns the new number, or None when the database
+        file is missing or any step raises (errors are logged).
+        """
+        async with self._lock:
+            db_path = self._get_database_path(topic_id)
+            if not db_path.exists():
+                logger.error(f"Brainstorm database not found for retroactive add: {topic_id}")
+                return None
+
+            try:
+                entries = await self._parse_submissions_unlocked(db_path)
+                # Continue numbering after the highest number present; an empty file starts at 1.
+                new_number = 1 + max((entry['number'] for entry in entries), default=0)
+                stamp = datetime.now().isoformat()
+                entries.append({'number': new_number, 'timestamp': stamp, 'content': content})
+                await self._write_submissions_unlocked(db_path, entries)
+
+                metadata = await self.get_metadata(topic_id)
+                if metadata:
+                    metadata.submission_count = len(entries)
+                    metadata.last_activity = datetime.now()
+                    await self._save_metadata(metadata)
+
+                logger.info(f"Retroactive add: submission #{new_number} to brainstorm {topic_id}")
+                return new_number
+            except Exception as exc:
+                logger.error(f"Failed to retroactively add submission to {topic_id}: {exc}")
+                return None
+    
+    async def _parse_submissions_unlocked(self, db_path: Path) -> List[Dict[str, Any]]:
+        """Read a brainstorm database file into submission dicts. Caller must hold lock.
+
+        Each dict has 'number' (int), 'timestamp' (str) and 'content' (str).
+        """
+        import re
+        async with aiofiles.open(db_path, 'r', encoding='utf-8') as f:
+            raw_text = await f.read()
+
+        if not raw_text.strip():
+            return []
+
+        # A header piece is expected to be followed by its body piece, both cut on 80-'=' rules.
+        # NOTE(review): a body that itself contains an 80-'=' run is cut at that run;
+        # only the piece directly after the header is kept as content.
+        pieces = raw_text.split("=" * 80)
+        parsed = []
+        for index, piece in enumerate(pieces):
+            if "SUBMISSION #" not in piece:
+                continue
+            first_line = piece.strip().split("\n")[0]
+            header = re.search(r'SUBMISSION #(\d+) \| Accepted: (.+)', first_line)
+            if header is None:
+                continue
+            parsed.append({
+                'number': int(header.group(1)),
+                'timestamp': header.group(2).strip(),
+                'content': pieces[index + 1].strip() if index + 1 < len(pieces) else "",
+            })
+        return parsed
+    
+    async def _write_submissions_unlocked(self, db_path: Path, submissions: List[Dict[str, Any]]) -> None:
+        """Overwrite a brainstorm database file with the given submissions. Caller must hold lock."""
+        rule = '=' * 80
+
+        # Each block: rule, header line, rule, blank line, content; blocks are joined with two newlines.
+        blocks = [
+            f"{rule}\nSUBMISSION #{entry['number']} | Accepted: {entry['timestamp']}\n{rule}\n\n{entry['content']}\n"
+            for entry in submissions
+        ]
+        serialized = '\n\n'.join(blocks)
+        async with aiofiles.open(db_path, 'w', encoding='utf-8') as f:
+            await f.write(serialized)
+    
     # ========================================================================
     # REJECTION LOG OPERATIONS
     # ========================================================================
diff --git a/backend/autonomous/memory/final_answer_memory.py b/backend/autonomous/memory/final_answer_memory.py
index 700ef67..4b58ae0 100644
--- a/backend/autonomous/memory/final_answer_memory.py
+++ b/backend/autonomous/memory/final_answer_memory.py
@@ -550,7 +550,7 @@ def get_author_attribution_text(self) -> str:
             "=" * 80,
             "AUTONOMOUS AI SOLUTION",
             "",
-            "Disclaimer: This content is for informational purposes only. This paper was autonomously generated with the novelty-seeking MOTO harness without peer review or user oversight beyond the original prompt. AI-generated content may contain fabricated or unverified claims presented with high confidence. All content should be viewed with extreme scrutiny and independently verified before use.",
+            "Disclaimer: This content is provided for informational and experimental purposes only. This paper was autonomously generated with the novelty-seeking MOTO harness without peer review or user oversight beyond the original prompt. It may contain incorrect, incomplete, misleading, or fabricated claims presented with high confidence. Use of this content is at your own risk. You are solely responsible for reviewing and independently verifying any output before relying on it, and the developers, operators, and contributors are not responsible for errors, omissions, decisions made from this content, or any resulting loss, damage, cost, or liability.",
             "",
             f"User's Research Prompt: {display_prompt}",
             "",
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index 6ccef5a..aa009af 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -67,6 +67,16 @@ def get_paper_path(self, paper_id: str) -> str:
         """
         return str(self._get_paper_path(paper_id))
     
+    def get_outline_path(self, paper_id: str) -> str:
+        """
+        Return the outline file location for ``paper_id`` as a string.
+
+        Public wrapper around ``_get_outline_path``; the location itself is
+        decided entirely by that helper.
+        """
+        outline_path = self._get_outline_path(paper_id)
+        return str(outline_path)
+    
     def _get_abstract_path(self, paper_id: str) -> Path:
         """Get path to abstract file."""
         return self._base_dir / f"paper_{paper_id}_abstract.txt"
@@ -86,6 +96,173 @@ def _get_metadata_path(self, paper_id: str) -> Path:
     def _get_rejections_path(self, paper_id: str) -> Path:
         """Get path to paper compiler rejections file."""
         return self._base_dir / f"paper_{paper_id}_last_10_rejections.txt"
+
+    # ========================================================================
+    # HISTORY HELPERS
+    # ========================================================================
+
+    @staticmethod
+    def _build_scoped_library(base_dir: Path) -> "PaperLibrary":
+        """Return a fresh PaperLibrary whose base and archive dirs are re-pointed at ``base_dir``."""
+        library = PaperLibrary()
+        archive_dir = base_dir / "archive"
+        library._base_dir, library._archive_dir = base_dir, archive_dir
+        return library
+
+    def get_history_papers_dir(self, session_id: str) -> Optional[Path]:
+        """Map a history session id to its papers directory; None when invalid or missing."""
+        if session_id == "legacy":
+            legacy_dir = Path(system_config.auto_papers_dir)
+            return legacy_dir if legacy_dir.exists() else None
+        if not session_id or session_id in {".", ".."}:
+            return None
+        if "/" in session_id or "\\" in session_id:
+            return None
+        # The resolved session folder must be a direct child of the sessions root.
+        root = Path(system_config.auto_sessions_base_dir).resolve()
+        candidate = (root / session_id).resolve()
+        if candidate.parent != root:
+            return None
+        papers_dir = candidate / "papers"
+        return papers_dir if papers_dir.exists() else None
+
+    async def _get_history_user_prompt(self, session_id: str) -> str:
+        """Return the stored research prompt for a history session, or a placeholder string."""
+        is_legacy = session_id == "legacy"
+        default_prompt = "Legacy research session" if is_legacy else "Unknown research question"
+        if is_legacy:
+            metadata_path = Path(system_config.auto_research_metadata_file)
+        else:
+            metadata_path = Path(system_config.auto_sessions_base_dir) / session_id / "session_metadata.json"
+
+        if not metadata_path.exists():
+            return default_prompt
+
+        try:
+            async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
+                metadata = json.loads(await f.read())
+            for key in ("user_prompt", "user_research_prompt"):
+                stored = metadata.get(key)
+                if stored:
+                    return stored
+            return default_prompt
+        except Exception as e:
+            logger.warning(f"Failed to read history prompt for session {session_id}: {e}")
+            return default_prompt
+
+    @staticmethod
+    def _calculate_critique_average(critique: Any) -> Optional[float]:
+        """Mean of the novelty/correctness/impact ratings rounded to 1 decimal; None if falsy."""
+        if not critique:
+            return None
+
+        ratings_total = critique.novelty_rating + critique.correctness_rating
+        ratings_total = ratings_total + critique.impact_rating
+        mean_rating = ratings_total / 3.0
+        return round(mean_rating, 1)
+
+    async def _list_history_papers_from_directory(self, papers_dir: Path, session_id: str) -> List[Dict[str, Any]]:
+        """Return one history dict per paper under ``papers_dir`` whose status is "complete"."""
+        from backend.shared.critique_memory import get_latest_critique
+
+        library = self._build_scoped_library(papers_dir)
+        prompt_text = await self._get_history_user_prompt(session_id)
+        all_metadata = await library.get_all_papers(validate_completeness=True)
+
+        entries = []
+        for meta in all_metadata:
+            # Anything not marked "complete" is left out of the listing.
+            if meta.status != "complete":
+                continue
+            critique = await get_latest_critique(
+                paper_type="autonomous_paper",
+                paper_id=meta.paper_id,
+                base_path=str(papers_dir)
+            )
+            entry = {
+                "history_id": f"{session_id}:{meta.paper_id}",
+                "session_id": session_id,
+                "paper_id": meta.paper_id,
+                "title": meta.title,
+                "abstract": meta.abstract,
+                "word_count": meta.word_count,
+                "source_brainstorm_ids": meta.source_brainstorm_ids,
+                "referenced_papers": meta.referenced_papers,
+                "status": meta.status,
+                "created_at": meta.created_at.isoformat() if meta.created_at else None,
+                "model_usage": meta.model_usage,
+                "user_prompt": prompt_text,
+                "critique_avg": self._calculate_critique_average(critique),
+            }
+            entries.append(entry)
+
+        return entries
+
+    async def list_history_papers(self) -> List[Dict[str, Any]]:
+        """Gather history entries from the legacy folder and each session folder, newest first."""
+        collected: List[Dict[str, Any]] = []
+
+        legacy_dir = Path(system_config.auto_papers_dir)
+        if legacy_dir.exists():
+            collected.extend(await self._list_history_papers_from_directory(legacy_dir, "legacy"))
+
+        sessions_root = Path(system_config.auto_sessions_base_dir)
+        session_dirs = []
+        if sessions_root.exists():
+            session_dirs = [entry for entry in sessions_root.iterdir() if entry.is_dir()]
+            session_dirs.sort(reverse=True)
+
+        for session_dir in session_dirs:
+            papers_dir = session_dir / "papers"
+            if papers_dir.exists():
+                found = await self._list_history_papers_from_directory(papers_dir, session_dir.name)
+                collected.extend(found)
+
+        # Sort on the ISO timestamp string; a missing timestamp compares as "".
+        collected.sort(key=lambda item: item.get("created_at") or "", reverse=True)
+        return collected
+
+    async def get_history_paper(self, session_id: str, paper_id: str) -> Optional[Dict[str, Any]]:
+        """Return the full history dict (with content and outline) for one complete paper, else None."""
+        from backend.shared.critique_memory import get_latest_critique
+
+        papers_dir = self.get_history_papers_dir(session_id)
+        if papers_dir is None:
+            return None
+        library = self._build_scoped_library(papers_dir)
+
+        meta = await library.get_metadata(paper_id)
+        if meta is None:
+            return None
+        if meta.status != "complete" or not await library.is_paper_complete(paper_id):
+            return None
+
+        content = await library.get_paper_content(paper_id)
+        outline = await library.get_outline(paper_id)
+        critique = await get_latest_critique(
+            paper_type="autonomous_paper",
+            paper_id=paper_id,
+            base_path=str(papers_dir)
+        )
+        prompt_text = await self._get_history_user_prompt(session_id)
+
+        return {
+            "history_id": f"{session_id}:{paper_id}",
+            "session_id": session_id,
+            "paper_id": meta.paper_id,
+            "title": meta.title,
+            "abstract": meta.abstract,
+            "word_count": meta.word_count,
+            "source_brainstorm_ids": meta.source_brainstorm_ids,
+            "referenced_papers": meta.referenced_papers,
+            "status": meta.status,
+            "created_at": meta.created_at.isoformat() if meta.created_at else None,
+            "model_usage": meta.model_usage,
+            "user_prompt": prompt_text,
+            "critique_avg": self._calculate_critique_average(critique),
+            "content": content,
+            "outline": outline,
+        }
     
     # ========================================================================
     # CONTENT VALIDATION
diff --git a/backend/autonomous/memory/paper_model_tracker.py b/backend/autonomous/memory/paper_model_tracker.py
index e2eb311..bd331d0 100644
--- a/backend/autonomous/memory/paper_model_tracker.py
+++ b/backend/autonomous/memory/paper_model_tracker.py
@@ -177,11 +177,14 @@ def generate_author_attribution(
             "=" * 80,
             "AUTONOMOUS AI SOLUTION",
             "",
-            "Disclaimer: This content is for informational purposes only. This paper was "
-            "autonomously generated with the novelty-seeking MOTO harness without peer review or user "
-            "oversight beyond the original prompt. AI-generated content may contain "
-            "fabricated or unverified claims presented with high confidence. All content "
-            "should be viewed with extreme scrutiny and independently verified before use.",
+            "Disclaimer: This content is provided for informational and experimental purposes only. "
+            "This paper was autonomously generated with the novelty-seeking MOTO harness without "
+            "peer review or user oversight beyond the original prompt. It may contain incorrect, "
+            "incomplete, misleading, or fabricated claims presented with high confidence. Use of "
+            "this content is at your own risk. You are solely responsible for reviewing and "
+            "independently verifying any output before relying on it, and the developers, "
+            "operators, and contributors are not responsible for errors, omissions, decisions made "
+            "from this content, or any resulting loss, damage, cost, or liability.",
             "",
             f"User's Research Prompt: {display_prompt}",
             "",
diff --git a/backend/autonomous/prompts/__init__.py b/backend/autonomous/prompts/__init__.py
index 9ad0c62..d217ce4 100644
--- a/backend/autonomous/prompts/__init__.py
+++ b/backend/autonomous/prompts/__init__.py
@@ -2,15 +2,21 @@
 Autonomous Prompts - System prompts and JSON schemas for autonomous research.
 """
 from backend.autonomous.prompts import topic_prompts
+from backend.autonomous.prompts import topic_exploration_prompts
 from backend.autonomous.prompts import completion_prompts
 from backend.autonomous.prompts import paper_reference_prompts
+from backend.autonomous.prompts import paper_title_exploration_prompts
 from backend.autonomous.prompts import paper_title_prompts
 from backend.autonomous.prompts import paper_redundancy_prompts
+from backend.autonomous.prompts import paper_continuation_prompts
 
 __all__ = [
     'topic_prompts',
+    'topic_exploration_prompts',
     'completion_prompts',
     'paper_reference_prompts',
+    'paper_title_exploration_prompts',
     'paper_title_prompts',
-    'paper_redundancy_prompts'
+    'paper_redundancy_prompts',
+    'paper_continuation_prompts'
 ]
diff --git a/backend/autonomous/prompts/paper_continuation_prompts.py b/backend/autonomous/prompts/paper_continuation_prompts.py
new file mode 100644
index 0000000..430f7d9
--- /dev/null
+++ b/backend/autonomous/prompts/paper_continuation_prompts.py
@@ -0,0 +1,300 @@
+"""
+Paper Continuation Prompts - System prompts and JSON schemas for brainstorm
+multi-paper continuation decisions. After each paper, the AI decides whether
+to write another paper from the same brainstorm (max 3) or move on.
+"""
+from typing import List, Dict, Any
+
+
+def get_continuation_decision_system_prompt() -> str:
+    """Return the static system prompt that asks the model to pick WRITE_ANOTHER_PAPER or MOVE_ON."""
+    return """You are an autonomous mathematical research agent deciding whether to write another paper from the current brainstorm or move on to a new research topic. Your role is to:
+
+1. Review the user's high-level research goal
+2. Review the current brainstorm topic and its full database of accepted submissions
+3. Review ALL papers already written from this brainstorm (titles, abstracts, outlines)
+4. Decide whether the brainstorm has enough distinct unexplored material for another paper
+
+⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
+
+ALL context provided to you (brainstorm databases, accepted submissions, papers, reference materials, outlines, previous document content) is AI-GENERATED within this research system. This content has NOT been peer-reviewed, published, or verified by external sources.
+
+YOU MUST TREAT ALL PROVIDED CONTEXT WITH EXTREME SKEPTICISM:
+- NEVER assume claims are true because they "sound good" or "fit well"
+- NEVER trust information simply because it appears in "accepted submissions" or "papers"
+- ALWAYS verify information independently before using or building upon it
+- NEVER cite internal documents as authoritative or established sources
+- Question and validate every assertion, even if it appears in validated content
+
+WEB SEARCH STRONGLY ENCOURAGED:
+If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
+- Verify mathematical claims against current published research
+- Access recent developments and contemporary mathematical literature
+- Cross-reference theorems, proofs, and techniques with authoritative sources
+- Supplement analysis with verified external information
+- Validate approaches against established mathematical consensus
+
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+
+---
+
+YOUR TASK:
+Decide whether the brainstorm database contains enough distinct, unexplored material to warrant writing ANOTHER paper, or whether the user's research goal is better served by moving on to a new brainstorm topic.
+
+DECISION OPTIONS:
+1. WRITE_ANOTHER_PAPER - The brainstorm has significant material that the existing paper(s) did NOT cover, and another paper would meaningfully advance the user's research goal
+2. MOVE_ON - The existing paper(s) adequately cover this brainstorm, or a new topic would better serve the user's goal
+
+WRITE ANOTHER PAPER if:
+- The brainstorm database contains substantial material not covered by existing paper(s)
+- Another paper would address a meaningfully DIFFERENT angle, perspective, or subset of the brainstorm
+- The uncovered material is rich enough for a complete, distinct paper (not just leftover fragments)
+- Writing another paper from this brainstorm advances the user's goal MORE than starting a new topic
+- The existing paper(s) focused on specific aspects, leaving other important aspects unexplored
+
+MOVE ON if:
+- The existing paper(s) adequately cover the brainstorm's valuable content
+- Remaining brainstorm material is insufficient for a distinct full paper
+- A new brainstorm topic would better advance the user's research goal
+- Another paper would largely duplicate content already in the existing paper(s)
+- The brainstorm's unique contributions have been captured
+
+CRITICAL JSON ESCAPE RULES:
+1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
+   - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
+2. Quotes: Escape double quotes inside strings as \\"
+3. Newlines/Tabs: Use \\n for newlines (NOT \\\\n), \\t for tabs (NOT \\\\t)
+4. LaTeX notation: If your content contains mathematical expressions like \\Delta, \\tau, etc.,
+   you MUST escape the backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]"
+
+Output your decision ONLY as JSON in the required format."""
+
+
+def get_continuation_decision_json_schema() -> str:
+    """Return the decider's JSON format text (decision + reasoning fields) with two examples."""
+    return """REQUIRED JSON FORMAT:
+{
+  "decision": "write_another_paper | move_on",
+  "reasoning": "string - Detailed explanation of your assessment"
+}
+
+FIELD REQUIREMENTS:
+- decision: MUST be either "write_another_paper" or "move_on"
+- reasoning: ALWAYS required - explain what material remains unexplored or why moving on is better
+
+EXAMPLES:
+
+Write Another Paper:
+{
+  "decision": "write_another_paper",
+  "reasoning": "The brainstorm database contains 22 submissions covering both algebraic and analytic approaches to the Langlands correspondence. Paper 1 focused exclusively on the algebraic side (Galois representations, class field theory). The analytic side (automorphic forms, L-functions, spectral theory) has substantial unexplored material in submissions 8, 12, 14, 17-20 that would form a distinct and valuable second paper."
+}
+
+Move On:
+{
+  "decision": "move_on",
+  "reasoning": "The existing paper comprehensively covers the brainstorm's core content on modular forms and their connections to Galois representations. The remaining submissions (3 out of 18) contain supplementary remarks that are too fragmented for a standalone paper. The user's research goal on the Langlands program would be better served by exploring a new avenue such as trace formulas or p-adic methods."
+}"""
+
+
+def get_continuation_validator_system_prompt() -> str:
+    """Return the static system prompt for the validator that accepts or rejects a continuation decision."""
+    return """You are validating a brainstorm continuation decision in an autonomous mathematical research system. Your role is to:
+
+1. Review the user's high-level research goal
+2. Review the current brainstorm topic and its database
+3. Review all papers already written from this brainstorm
+4. Evaluate whether the proposed decision (write another paper vs move on) is optimal
+
+⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
+
+ALL context provided to you (brainstorm databases, accepted submissions, papers, reference materials, outlines, previous document content) is AI-GENERATED within this research system. This content has NOT been peer-reviewed, published, or verified by external sources.
+
+YOU MUST TREAT ALL PROVIDED CONTEXT WITH EXTREME SKEPTICISM:
+- NEVER assume claims are true because they "sound good" or "fit well"
+- NEVER trust information simply because it appears in "accepted submissions" or "papers"
+- ALWAYS verify information independently before using or building upon it
+- NEVER cite internal documents as authoritative or established sources
+- Question and validate every assertion, even if it appears in validated content
+
+WEB SEARCH STRONGLY ENCOURAGED:
+If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to verify claims and access current mathematical literature.
+
+---
+
+YOUR TASK:
+Validate whether the proposed continuation decision is the best use of research resources.
+
+ACCEPT the decision if:
+1. WRITE_ANOTHER_PAPER: The brainstorm genuinely has enough distinct unexplored material for another paper AND the reasoning correctly identifies what material remains
+2. MOVE_ON: The existing papers adequately cover the brainstorm OR a new topic would genuinely better serve the goal AND the reasoning is sound
+
+REJECT the decision if:
+1. WRITE_ANOTHER_PAPER: The brainstorm material is already well-covered and another paper would be redundant
+2. WRITE_ANOTHER_PAPER: The "unexplored material" identified is too thin for a full paper
+3. MOVE_ON: There is clearly substantial uncovered material that warrants another paper
+4. MOVE_ON: The reasoning ignores valuable unexplored content in the brainstorm
+5. The reasoning is flawed, vague, or contradicts the evidence
+
+REJECTION FEEDBACK FORMAT:
+If rejecting, provide CONCRETE, ACTIONABLE guidance:
+
+"REJECTION REASON: [Premature Move On|Redundant Paper|Insufficient Material|etc.]
+
+ISSUE: [What's wrong with the proposed decision]
+
+BETTER ALTERNATIVE: [What would be the optimal choice given current state]
+
+EVIDENCE: [Specific brainstorm submissions or paper sections that support your assessment]"
+
+CRITICAL JSON ESCAPE RULES:
+1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
+2. Quotes: Escape double quotes inside strings as \\"
+3. Newlines/Tabs: Use \\n for newlines, \\t for tabs
+
+Output your decision ONLY as JSON in the required format."""
+
+
+def get_continuation_validator_json_schema() -> str:
+    """Return the validator's JSON format text (accept/reject + reasoning) with two examples."""
+    return """REQUIRED JSON FORMAT:
+{
+  "decision": "accept | reject",
+  "reasoning": "string - Detailed explanation for the decision"
+}
+
+FIELD REQUIREMENTS:
+- decision: MUST be either "accept" or "reject"
+- reasoning: ALWAYS required - detailed explanation (use structured format if rejecting)
+
+EXAMPLE (Accept):
+{
+  "decision": "accept",
+  "reasoning": "The proposal to write another paper is well-justified. The brainstorm contains substantial analytic content (automorphic forms, L-functions) that paper 1's algebraic focus did not address. This material is rich enough for a distinct second paper."
+}
+
+EXAMPLE (Reject - Use Structured Format):
+{
+  "decision": "reject",
+  "reasoning": "REJECTION REASON: Insufficient Material\\n\\nISSUE: The proposal to write another paper claims unexplored material in submissions 15-18, but these submissions largely restate concepts already covered in paper 1's Section III (Main Results).\\n\\nBETTER ALTERNATIVE: Move on to a new brainstorm topic. The remaining brainstorm content is supplementary, not substantial enough for a standalone paper.\\n\\nEVIDENCE: Submissions 15-18 discuss Galois representations which paper 1 already covers comprehensively in Sections III and IV."
+}"""
+
+
+def build_continuation_decision_prompt(
+    user_research_prompt: str,
+    topic_prompt: str,
+    brainstorm_summary: str,
+    papers_from_brainstorm: List[Dict[str, Any]],
+    papers_written_count: int,
+    rejection_context: str = ""
+) -> str:
+    """
+    Assemble the prompt that asks the model for a continuation decision.
+    
+    Args:
+        user_research_prompt: Text placed under "USER RESEARCH GOAL"
+        topic_prompt: Text placed under "BRAINSTORM TOPIC"
+        brainstorm_summary: Text placed under "BRAINSTORM DATABASE"
+        papers_from_brainstorm: Dicts read for 'title', 'abstract' and optional 'outline'
+        papers_written_count: Number shown in the "N of 3 maximum" line
+        rejection_context: Prior rejection feedback; its section is omitted when empty
+    
+    Returns:
+        All sections concatenated into a single string
+    """
+    separator = "\n---\n"
+    sections = [
+        get_continuation_decision_system_prompt(),
+        separator,
+        get_continuation_decision_json_schema(),
+        separator,
+        f"USER RESEARCH GOAL:\n{user_research_prompt}",
+        separator,
+        f"BRAINSTORM TOPIC:\n{topic_prompt}",
+        separator,
+        f"PAPERS WRITTEN FROM THIS BRAINSTORM: {papers_written_count} of 3 maximum\n",
+    ]
+
+    if not papers_from_brainstorm:
+        sections.append("\nEXISTING PAPERS FROM THIS BRAINSTORM: None\n---\n")
+    else:
+        sections.append("\nEXISTING PAPERS FROM THIS BRAINSTORM:\n")
+        for index, paper in enumerate(papers_from_brainstorm, 1):
+            sections.append(f"\n--- Paper {index} ---")
+            sections.append(f"\nTitle: {paper.get('title', 'N/A')}")
+            sections.append(f"\nAbstract: {paper.get('abstract', 'N/A')}")
+            outline = paper.get('outline')
+            if outline:
+                sections.append(f"\nOutline:\n{outline}")
+        sections.append(separator)
+
+    sections.append(f"BRAINSTORM DATABASE (all accepted submissions):\n{brainstorm_summary}")
+    sections.append(separator)
+
+    if rejection_context:
+        sections.append(f"IMPORTANT - YOUR PREVIOUS DECISION WAS REJECTED:\n{rejection_context}\n---\n")
+    sections.append("Now decide whether to write another paper or move on, and provide your decision as JSON:")
+
+    return "".join(sections)
+
+
+def build_continuation_validation_prompt(
+    user_research_prompt: str,
+    topic_prompt: str,
+    brainstorm_summary: str,
+    papers_from_brainstorm: List[Dict[str, Any]],
+    papers_written_count: int,
+    proposed_decision: Dict[str, Any]
+) -> str:
+    """
+    Build the complete continuation validation prompt.
+    
+    Args:
+        user_research_prompt: The user's high-level research goal
+        topic_prompt: The brainstorm topic prompt
+        brainstorm_summary: Full brainstorm database content
+        papers_from_brainstorm: Dicts with title, abstract (cut at 500 chars), optional outline
+        papers_written_count: Number of papers already written from this brainstorm
+        proposed_decision: Dict whose 'decision' and 'reasoning' values are being validated
+    
+    Returns:
+        Complete prompt string
+    """
+    parts = [
+        get_continuation_validator_system_prompt(),
+        "\n---\n",
+        get_continuation_validator_json_schema(),
+        "\n---\n",
+        f"USER RESEARCH GOAL:\n{user_research_prompt}",
+        "\n---\n",
+        f"BRAINSTORM TOPIC:\n{topic_prompt}",
+        "\n---\n",
+    ]
+    parts.append(f"PAPERS WRITTEN FROM THIS BRAINSTORM: {papers_written_count} of 3 maximum\n")
+    if papers_from_brainstorm:
+        parts.append("\nEXISTING PAPERS FROM THIS BRAINSTORM:\n")
+        for i, p in enumerate(papers_from_brainstorm, 1):
+            # Fall back to "N/A" for missing/None/empty abstracts; add "..." only when truncated.
+            abstract = p.get('abstract') or 'N/A'
+            if isinstance(abstract, str) and len(abstract) > 500:
+                abstract = abstract[:500] + "..."
+            parts.append(f"\n--- Paper {i} ---")
+            parts.append(f"\nTitle: {p.get('title', 'N/A')}")
+            parts.append(f"\nAbstract: {abstract}")
+            if p.get('outline'):
+                parts.append(f"\nOutline:\n{p.get('outline')}")
+        parts.append("\n---\n")
+    else:
+        parts.append("\nEXISTING PAPERS FROM THIS BRAINSTORM: None\n---\n")
+
+    parts.append(f"BRAINSTORM DATABASE (all accepted submissions):\n{brainstorm_summary}")
+    parts.append("\n---\n")
+    parts.append("PROPOSED CONTINUATION DECISION:\n")
+    parts.append(f"Decision: {proposed_decision.get('decision', 'Unknown')}")
+    parts.append(f"\nReasoning: {proposed_decision.get('reasoning', 'N/A')}")
+    parts.append("\n---\n")
+    parts.append("Validate this continuation decision and provide your decision as JSON:")
+
+    return "".join(parts)
diff --git a/backend/autonomous/prompts/paper_title_exploration_prompts.py b/backend/autonomous/prompts/paper_title_exploration_prompts.py
new file mode 100644
index 0000000..9193ec0
--- /dev/null
+++ b/backend/autonomous/prompts/paper_title_exploration_prompts.py
@@ -0,0 +1,87 @@
+"""
+Paper Title Exploration Prompts - Builds the aggregator-compatible user prompt for
+the paper title exploration phase that collects 5 validated candidate titles
+before final title selection.
+
+The exploration phase reuses the full Part 1 aggregator infrastructure (parallel
+submitters, batch validation up to 3, queue management) by framing the task as
+a standard aggregation with a specially crafted user prompt.
+"""
+from typing import List, Dict, Any, Optional
+
+
+def build_title_exploration_user_prompt(
+    user_research_prompt: str,
+    topic_prompt: str,
+    brainstorm_summary: str,
+    existing_papers_from_brainstorm: List[Dict[str, Any]],
+    reference_papers: Optional[List[Dict[str, Any]]] = None
+) -> str:
+    """
+    Compose the newline-joined user prompt for the paper title exploration phase.
+
+    The text opens with fixed instructions (one candidate title per submission,
+    quality and diversity expectations), followed by the caller-supplied goal,
+    topic and summary, then the related-paper and reference-paper listings.
+
+    Args:
+        user_research_prompt: Text placed under "USER RESEARCH GOAL"
+        topic_prompt: Text placed under "PAPER CONTEXT / SOURCE TOPIC"
+        brainstorm_summary: Text placed under "SOURCE MATERIAL SUMMARY"
+        existing_papers_from_brainstorm: Dicts listed by paper_id/title; abstracts cut at 300 chars
+        reference_papers: Optional dicts listed the same way; abstracts cut at 220 chars
+    """
+    parts = [
+        "=== PAPER TITLE EXPLORATION PHASE ===\n",
+        "You are in a PAPER TITLE EXPLORATION phase. You are NOT writing the paper itself.\n",
+        "Instead, your task is to propose ONE CANDIDATE PAPER TITLE per submission.",
+        "The system will collect 5 validated candidate titles before a later final",
+        "selection chooses the actual title.\n",
+        "Each submission should contain:",
+        "- One candidate paper title",
+        "- Brief reasoning for why the title is strong, accurate, and distinct\n",
+        "The validator will check QUALITY and DIVERSITY:",
+        "- Weak, vague, or generic titles will be rejected",
+        "- Titles too similar to already-accepted candidates will be rejected",
+        "- Titles too similar to already-completed related papers should be rejected",
+        "- The goal is to map multiple plausible title directions before committing\n",
+        "WHAT MAKES A GOOD CANDIDATE TITLE:",
+        "- Accurately captures the paper's likely mathematical content",
+        "- Specific enough to communicate the core focus",
+        "- Professional and suitable for a mathematical research paper",
+        "- Distinct from already-accepted candidate titles",
+        "- Distinct from related completed papers listed below",
+        "- If this is a final-answer or chapter paper, the title should match that role directly\n",
+        "DIVERSITY IS PARAMOUNT:",
+        "Do not submit near-duplicates, minor rephrasings, or cosmetic variants.",
+        "Propose genuinely different title framings, emphases, or structural approaches.\n",
+        "FORMAT YOUR SUBMISSION AS:",
+        "State the candidate title clearly, then explain why it is valuable and",
+        "how it differs from existing accepted candidates or related papers.\n",
+        f"USER RESEARCH GOAL:\n{user_research_prompt}\n",
+        f"PAPER CONTEXT / SOURCE TOPIC:\n{topic_prompt}\n",
+        f"SOURCE MATERIAL SUMMARY:\n{brainstorm_summary}\n",
+    ]
+
+    def clip(text, limit):
+        if isinstance(text, str) and len(text) > limit:
+            return text[:limit] + "..."
+        return text
+
+    if not existing_papers_from_brainstorm:
+        parts.append("\nEXISTING RELATED PAPERS: None")
+    else:
+        parts.append("\nEXISTING RELATED PAPERS (do not duplicate these title directions):")
+        for related in existing_papers_from_brainstorm:
+            summary = clip(related.get("abstract", "N/A"), 300)
+            parts.append(f"  - {related.get('paper_id', 'N/A')}: \"{related.get('title', 'N/A')}\"")
+            parts.append(f"    Abstract: {summary}")
+
+    if reference_papers:
+        parts.append("\nREFERENCE PAPERS INFORMING THIS TITLE:")
+        for reference in reference_papers:
+            summary = clip(reference.get("abstract", "N/A"), 220)
+            parts.append(f"  - {reference.get('paper_id', 'N/A')}: \"{reference.get('title', 'N/A')}\"")
+            parts.append(f"    Abstract: {summary}")
+
+    return "\n".join(parts)
diff --git a/backend/autonomous/prompts/paper_title_prompts.py b/backend/autonomous/prompts/paper_title_prompts.py
index c10a001..9f8b2d2 100644
--- a/backend/autonomous/prompts/paper_title_prompts.py
+++ b/backend/autonomous/prompts/paper_title_prompts.py
@@ -187,7 +187,8 @@ def build_paper_title_prompt(
     brainstorm_summary: str,
     existing_papers_from_brainstorm: List[Dict[str, Any]],
     reference_papers: List[Dict[str, Any]] = None,
-    rejection_feedback: str = ""
+    rejection_feedback: str = "",
+    candidate_titles: str = ""
 ) -> str:
     """
     Build the paper title selection prompt.
@@ -199,6 +200,7 @@ def build_paper_title_prompt(
         existing_papers_from_brainstorm: Papers already created from this brainstorm
         reference_papers: Selected reference papers (if any)
         rejection_feedback: Accumulated rejection reasons from previous attempts (if any)
+        candidate_titles: Pre-validated candidate titles from exploration phase (if any)
     
     Returns:
         Complete prompt string
@@ -233,6 +235,17 @@ def build_paper_title_prompt(
             parts.append(f"\n- {p.get('title', 'N/A')}")
         parts.append("\n---\n")
     
+    # Inject validated candidate titles from exploration phase
+    if candidate_titles:
+        parts.append(
+            "PRE-VALIDATED CANDIDATE TITLES (from exploration phase):\n"
+            "The following candidate titles have been validated by the system. You may:\n"
+            "- Select one of these candidates directly\n"
+            "- Synthesize or improve upon a candidate\n"
+            "- Propose a NEW title if clearly better — but you MUST justify why it is superior\n\n"
+            f"{candidate_titles}\n---\n"
+        )
+    
     # Inject rejection feedback so the model learns from previous failed attempts
     if rejection_feedback:
         parts.append(
diff --git a/backend/autonomous/prompts/topic_exploration_prompts.py b/backend/autonomous/prompts/topic_exploration_prompts.py
new file mode 100644
index 0000000..f367fe6
--- /dev/null
+++ b/backend/autonomous/prompts/topic_exploration_prompts.py
@@ -0,0 +1,87 @@
+"""
+Topic Exploration Prompts - Builds the aggregator-compatible user prompt for the
+topic exploration phase that collects 5 validated candidate brainstorm questions
+before topic selection.
+
+The exploration phase reuses the full Part 1 aggregator infrastructure (parallel
+submitters, batch validation up to 3, queue management) by framing the task as
+a standard aggregation with a specially crafted user prompt.
+"""
+from typing import List, Dict, Any
+
+
+def build_exploration_user_prompt(
+    user_research_prompt: str,
+    brainstorms_summary: List[Dict[str, Any]],
+    papers_summary: List[Dict[str, Any]]
+) -> str:
+    """
+    Build the user prompt passed to the aggregator for topic exploration.
+
+    This prompt frames the aggregation task so that submitters generate candidate
+    brainstorm questions and the validator checks quality + diversity. The standard
+    aggregator submitter/validator system prompts handle the rest.
+
+    Args:
+        user_research_prompt: User's high-level research goal
+        brainstorms_summary: All existing brainstorms with metadata. Each entry is
+            read with .get() for topic_id, topic_prompt, status, submission_count
+            and papers_generated; missing keys fall back to placeholder values.
+        papers_summary: All completed papers with title/abstract. Each entry is
+            read with .get() for paper_id, title and abstract.
+
+    Returns:
+        Complete prompt string: the static exploration instructions, the research
+        goal, then the existing-brainstorm and completed-paper listings.
+    """
+    parts = []
+
+    parts.append("=== TOPIC EXPLORATION PHASE ===\n")
+    parts.append("You are in a TOPIC EXPLORATION phase. You are NOT solving a mathematical problem directly.")
+    parts.append("Instead, your task is to propose CANDIDATE BRAINSTORM QUESTIONS — specific mathematical")
+    parts.append("avenues worth exploring for the research goal below.\n")
+    parts.append("Each submission should contain ONE candidate brainstorm question and reasoning for why")
+    parts.append("it is a valuable, distinct direction. The validator will check quality and DIVERSITY —")
+    parts.append("candidates that overlap with already-accepted ones will be REJECTED.\n")
+    parts.append("WHAT MAKES A GOOD CANDIDATE QUESTION:")
+    parts.append("- Specific enough to guide focused mathematical exploration (not vague)")
+    parts.append("- Novel relative to already-accepted candidates and existing brainstorms")
+    parts.append("- Relevant to the research goal below")
+    parts.append("- Opens a DISTINCT mathematical direction not already represented")
+    parts.append("- Grounded in established mathematical concepts")
+    parts.append("- Actionable — a brainstorm session could produce meaningful insights from it\n")
+    parts.append("DIVERSITY IS PARAMOUNT:")
+    parts.append("Your candidate MUST be SUBSTANTIVELY DIFFERENT from already-accepted candidates.")
+    parts.append("The goal is to map the exploration landscape BROADLY before committing to a direction.")
+    parts.append("Do not propose variations of existing candidates — propose genuinely different avenues.\n")
+    parts.append("FORMAT YOUR SUBMISSION AS:")
+    parts.append("State the candidate brainstorm question clearly, then explain why it is valuable and")
+    parts.append("distinct from any existing candidates.\n")
+
+    parts.append(f"RESEARCH GOAL:\n{user_research_prompt}\n")
+
+    # Existing brainstorms
+    if brainstorms_summary:
+        parts.append("\nEXISTING BRAINSTORM TOPICS (already explored or in progress):")
+        for b in brainstorms_summary:
+            parts.append(f"  - {b.get('topic_id', 'N/A')}: {b.get('topic_prompt', 'N/A')} "
+                        f"(status: {b.get('status', 'N/A')}, submissions: {b.get('submission_count', 0)}, "
+                        f"papers: {b.get('papers_generated', 0)})")
+    else:
+        parts.append("\nEXISTING BRAINSTORM TOPICS: None yet")
+
+    # Existing papers
+    if papers_summary:
+        parts.append("\nCOMPLETED PAPERS:")
+        for p in papers_summary:
+            abstract = p.get('abstract', 'N/A')
+            # Only truncate real strings: the .get() default covers a missing key,
+            # but a stored None/non-string abstract would make len() raise TypeError.
+            if isinstance(abstract, str) and len(abstract) > 300:
+                abstract = abstract[:300] + "..."
+            parts.append(f"  - {p.get('paper_id', 'N/A')}: \"{p.get('title', 'N/A')}\"")
+            parts.append(f"    Abstract: {abstract}")
+    else:
+        parts.append("\nCOMPLETED PAPERS: None yet")
+
+    return "\n".join(parts)
diff --git a/backend/autonomous/prompts/topic_prompts.py b/backend/autonomous/prompts/topic_prompts.py
index 9b31989..69b3223 100644
--- a/backend/autonomous/prompts/topic_prompts.py
+++ b/backend/autonomous/prompts/topic_prompts.py
@@ -227,7 +227,8 @@ def build_topic_selection_prompt(
     user_research_prompt: str,
     brainstorms_summary: List[Dict[str, Any]],
     papers_summary: List[Dict[str, Any]],
-    rejection_context: str = ""
+    rejection_context: str = "",
+    candidate_questions: str = ""
 ) -> str:
     """
     Build the complete topic selection prompt with context.
@@ -237,6 +238,7 @@ def build_topic_selection_prompt(
         brainstorms_summary: List of all brainstorms with metadata
         papers_summary: List of all papers with title, abstract, word count
         rejection_context: Formatted previous rejection feedback
+        candidate_questions: Formatted candidate questions from topic exploration phase
     
     Returns:
         Complete prompt string
@@ -250,6 +252,23 @@ def build_topic_selection_prompt(
         "\n---\n"
     ]
     
+    # Add candidate questions from topic exploration (if available)
+    if candidate_questions:
+        parts.append(f"""TOPIC EXPLORATION RESULTS:
+The following candidate brainstorm questions were brainstormed and validated for quality
+and diversity BEFORE this topic selection. Use them to make an informed strategic decision.
+
+You may:
+- Select one of these candidates directly as your topic (action: new_topic, topic_prompt: the candidate question)
+- Combine or synthesize multiple candidates into a stronger question
+- Continue an existing brainstorm if the candidates reveal it is worth continuing
+- Combine existing brainstorms if the candidates reveal connections
+- Propose something entirely new if the candidates missed a critical avenue
+
+{candidate_questions}
+""")
+        parts.append("\n---\n")
+    
     # Add brainstorms summary
     if brainstorms_summary:
         parts.append("EXISTING BRAINSTORM TOPICS:\n")
diff --git a/backend/autonomous/validation/paper_redundancy_checker.py b/backend/autonomous/validation/paper_redundancy_checker.py
index d95987c..408294f 100644
--- a/backend/autonomous/validation/paper_redundancy_checker.py
+++ b/backend/autonomous/validation/paper_redundancy_checker.py
@@ -1,6 +1,10 @@
 """
 Paper Redundancy Checker - Reviews paper library for redundancy.
 Runs every 3 completed papers to maintain library quality.
+
+NO RAG BY DESIGN: Redundancy is assessed at the abstract/title level — comparing
+high-level paper topics to find overlap. Full paper content is not needed to detect
+whether two papers cover the same ground. All inputs are compact metadata summaries.
 """
 import asyncio
 import json
diff --git a/backend/compiler/agents/critique_submitter.py b/backend/compiler/agents/critique_submitter.py
index 3435cbb..45b74f0 100644
--- a/backend/compiler/agents/critique_submitter.py
+++ b/backend/compiler/agents/critique_submitter.py
@@ -217,6 +217,11 @@ async def submit_critique(
             
         except FreeModelExhaustedError:
             raise
+        except RuntimeError as e:
+            if "credits exhausted" in str(e).lower():
+                raise
+            logger.error(f"Error generating critique: {e}", exc_info=True)
+            return None
         except Exception as e:
             logger.error(f"Error generating critique: {e}", exc_info=True)
             return None
@@ -353,6 +358,11 @@ async def submit_rewrite_decision(
             
         except FreeModelExhaustedError:
             raise
+        except RuntimeError as e:
+            if "credits exhausted" in str(e).lower():
+                raise
+            logger.error(f"Error generating rewrite decision: {e}", exc_info=True)
+            return None
         except Exception as e:
             logger.error(f"Error generating rewrite decision: {e}", exc_info=True)
             return None
@@ -365,6 +375,7 @@ async def submit_iterative_edit(
         current_outline: str,
         critique_feedback: str,
         edits_applied: List[Dict],
+        reference_papers: Optional[str] = None,
         accumulated_history: Optional[str] = None
     ) -> Optional[Dict]:
         """
@@ -380,6 +391,7 @@ async def submit_iterative_edit(
             current_outline: Paper outline
             critique_feedback: All accepted critiques from this revision cycle
             edits_applied: List of edits already applied in this iteration
+            reference_papers: Optional reference paper content
             accumulated_history: Optional accumulated critique history from previous failed versions
             
         Returns:
@@ -401,6 +413,7 @@ async def submit_iterative_edit(
                 current_outline=current_outline,
                 critique_feedback=critique_feedback,
                 edits_applied=edits_applied,
+                reference_papers=reference_papers,
                 accumulated_critique_history=accumulated_history or ""
             )
             
@@ -488,6 +501,11 @@ async def submit_iterative_edit(
             
         except FreeModelExhaustedError:
             raise
+        except RuntimeError as e:
+            if "credits exhausted" in str(e).lower():
+                raise
+            logger.error(f"Error generating iterative edit: {e}", exc_info=True)
+            return None
         except Exception as e:
             logger.error(f"Error generating iterative edit: {e}", exc_info=True)
             return None
diff --git a/backend/compiler/agents/high_context_submitter.py b/backend/compiler/agents/high_context_submitter.py
index 9f4c1b6..b7c5f10 100644
--- a/backend/compiler/agents/high_context_submitter.py
+++ b/backend/compiler/agents/high_context_submitter.py
@@ -293,12 +293,12 @@ async def submit_outline_update(self) -> Optional[CompilerSubmission]:
             logger.info(f"Paper stripped: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers removed)")
             
             # Retrieve aggregator database evidence
+            # Exclude outline and paper (both direct-injected in outline_update mode)
             logger.info("Retrieving aggregator database evidence via RAG...")
-            # Use just the user prompt - the outline is direct-injected anyway
-            # Truncating to 500 chars loses important context
             context_pack = await compiler_rag_manager.retrieve_for_mode(
                 query=self.user_prompt,
-                mode="outline_update"
+                mode="outline_update",
+                exclude_sources=["compiler_outline.txt", "compiler_paper.txt"]
             )
             logger.info(f"RAG retrieval complete: {len(context_pack.text)} chars retrieved")
             
@@ -424,7 +424,9 @@ async def submit_construction(
         section_phase: Optional[str] = None,
         rejection_feedback: Optional[str] = None,
         critique_feedback: Optional[str] = None,
-        pre_critique_paper: Optional[str] = None
+        pre_critique_paper: Optional[str] = None,
+        brainstorm_content: Optional[str] = None,
+        brainstorm_source_name: Optional[str] = None
     ) -> Optional[CompilerSubmission]:
         """
         Submit next paper construction portion.
@@ -436,6 +438,8 @@ async def submit_construction(
             rejection_feedback: Feedback from a previous rejection to guide the model (e.g., "Introduction not found in document")
             critique_feedback: Accepted critique feedback from peer review (for body rewrites only)
             pre_critique_paper: Paper state before critique phase (for body rewrites - shows what failed)
+            brainstorm_content: Full brainstorm database with submission numbers (for retroactive corrections)
+            brainstorm_source_name: RAG source name for brainstorm (e.g., "brainstorm_abc123.txt") to exclude from retrieval
         
         Returns:
             CompilerSubmission for construction
@@ -456,7 +460,32 @@ async def submit_construction(
             paper_for_llm = _strip_paper_markers_for_llm(current_paper)
             logger.info(f"Paper stripped: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers removed)")
             
+            # Calculate RAG budget accounting for brainstorm content (prevents context overflow)
+            max_allowed_tokens = rag_config.get_available_input_tokens(
+                system_config.compiler_high_context_context_window,
+                system_config.compiler_high_context_max_output_tokens
+            )
+            outline_tokens = count_tokens(current_outline)
+            paper_tokens = count_tokens(paper_for_llm) if paper_for_llm else 0
+            brainstorm_tokens = count_tokens(brainstorm_content) if brainstorm_content else 0
+            system_overhead = 5000  # system prompt, JSON schema, headers, separators, rejection history
+            
+            reserved_tokens = outline_tokens + paper_tokens + brainstorm_tokens + system_overhead
+            rag_budget = max(5000, max_allowed_tokens - reserved_tokens)
+            
+            if brainstorm_content and brainstorm_tokens > 0:
+                logger.info(
+                    f"Context budget: max={max_allowed_tokens}, outline={outline_tokens}, "
+                    f"paper={paper_tokens}, brainstorm={brainstorm_tokens}, overhead={system_overhead}, "
+                    f"rag_budget={rag_budget}"
+                )
+            
             # Retrieve aggregator database evidence
+            # Exclude sources already direct-injected to prevent token waste
+            exclude_sources = ["compiler_outline.txt", "compiler_paper.txt"]
+            if brainstorm_source_name:
+                exclude_sources.append(brainstorm_source_name)
+            
             logger.info("Retrieving aggregator database evidence via RAG...")
             query = self.user_prompt
             if not is_first_portion and paper_for_llm:
@@ -465,7 +494,9 @@ async def submit_construction(
             
             context_pack = await compiler_rag_manager.retrieve_for_mode(
                 query=query,
-                mode="construction"
+                mode="construction",
+                max_tokens=rag_budget,
+                exclude_sources=exclude_sources
             )
             logger.info(f"RAG retrieval complete: {len(context_pack.text)} chars retrieved")
             
@@ -481,7 +512,8 @@ async def submit_construction(
                     is_first_portion=is_first_portion,
                     rejection_feedback=rejection_feedback,
                     critique_feedback=critique_feedback,
-                    pre_critique_paper=pre_critique_paper
+                    pre_critique_paper=pre_critique_paper,
+                    brainstorm_content=brainstorm_content
                 )
             elif section_phase == "conclusion":
                 prompt = await build_conclusion_construction_prompt(
@@ -489,7 +521,8 @@ async def submit_construction(
                     current_outline=current_outline,
                     current_paper=paper_for_llm,
                     rag_evidence=context_pack.text,
-                    rejection_feedback=rejection_feedback
+                    rejection_feedback=rejection_feedback,
+                    brainstorm_content=brainstorm_content
                 )
             elif section_phase == "introduction":
                 prompt = await build_introduction_construction_prompt(
@@ -497,7 +530,8 @@ async def submit_construction(
                     current_outline=current_outline,
                     current_paper=paper_for_llm,
                     rag_evidence=context_pack.text,
-                    rejection_feedback=rejection_feedback
+                    rejection_feedback=rejection_feedback,
+                    brainstorm_content=brainstorm_content
                 )
             elif section_phase == "abstract":
                 prompt = await build_abstract_construction_prompt(
@@ -505,7 +539,8 @@ async def submit_construction(
                     current_outline=current_outline,
                     current_paper=paper_for_llm,
                     rag_evidence=context_pack.text,
-                    rejection_feedback=rejection_feedback
+                    rejection_feedback=rejection_feedback,
+                    brainstorm_content=brainstorm_content
                 )
             else:
                 # Fallback to generic prompt for backward compatibility
@@ -522,16 +557,18 @@ async def submit_construction(
                 )
             logger.info(f"Prompt built: {len(prompt)} chars")
             
-            # Validate prompt size
+            # Validate prompt size (max_allowed_tokens already calculated above for RAG budget)
             actual_prompt_tokens = count_tokens(prompt)
-            max_allowed_tokens = rag_config.get_available_input_tokens(system_config.compiler_high_context_context_window, system_config.compiler_high_context_max_output_tokens)
             
             if actual_prompt_tokens > max_allowed_tokens:
                 logger.error(
                     f"construction: Assembled prompt ({actual_prompt_tokens} tokens) exceeds context window "
                     f"({max_allowed_tokens} tokens after safety margin). This indicates a context allocation bug."
                 )
-                return None  # Return None to skip this submission
+                raise ValueError(
+                    f"construction: Prompt too large ({actual_prompt_tokens} tokens > {max_allowed_tokens} max). "
+                    f"Brainstorm={brainstorm_tokens} tokens, outline={outline_tokens}, paper={paper_tokens}, overhead={system_overhead}."
+                )
             
             logger.debug(f"construction prompt: {actual_prompt_tokens} tokens (max: {max_allowed_tokens})")
             
@@ -647,6 +684,21 @@ async def submit_construction(
                 metadata={"coverage": context_pack.coverage, "is_first": is_first_portion, "phase": section_phase}
             )
             
+            # Parse optional brainstorm retroactive operation
+            brainstorm_op_data = data.get("brainstorm_operation")
+            if brainstorm_op_data and isinstance(brainstorm_op_data, dict):
+                try:
+                    from backend.shared.models import BrainstormRetroactiveOperation
+                    submission.brainstorm_operation = BrainstormRetroactiveOperation(
+                        action=brainstorm_op_data.get("action", ""),
+                        submission_number=brainstorm_op_data.get("submission_number"),
+                        new_content=brainstorm_op_data.get("new_content", ""),
+                        reasoning=brainstorm_op_data.get("reasoning", "")
+                    )
+                    logger.info(f"Brainstorm retroactive operation parsed: {submission.brainstorm_operation.action}")
+                except Exception as e:
+                    logger.warning(f"Failed to parse brainstorm_operation, ignoring: {e}")
+            
             # Notify task completed successfully
             if self.task_tracking_callback:
                 self.task_tracking_callback("completed", task_id)
@@ -656,9 +708,17 @@ async def submit_construction(
             
         except FreeModelExhaustedError:
             raise
+        except ValueError:
+            raise
+        except RuntimeError as e:
+            if "credits exhausted" in str(e).lower():
+                raise
+            logger.error(f"Failed to generate construction submission: {e}", exc_info=True)
+            if self.task_tracking_callback and 'task_id' in dir():
+                self.task_tracking_callback("completed", task_id)
+            return None
         except Exception as e:
             logger.error(f"Failed to generate construction submission: {e}", exc_info=True)
-            # Notify task completed (failed but still completed)
             if self.task_tracking_callback and 'task_id' in dir():
                 self.task_tracking_callback("completed", task_id)
             return None
@@ -666,7 +726,11 @@ async def submit_construction(
     async def submit_review(self) -> Optional[CompilerSubmission]:
         """
         Submit paper review (or no-op if no edit needed).
-        Note: Aggregator DB is NOT in context for this mode.
+        
+        NO RAG BY DESIGN: Review mode evaluates the paper on its own merits —
+        checking for errors, coherence issues, and improvements against the outline.
+        No aggregator DB, brainstorm, or reference papers in context. The reviewer
+        must judge the paper as a standalone document without external source bias.
         
         Returns:
             CompilerSubmission if edit needed, None otherwise
@@ -703,7 +767,7 @@ async def submit_review(self) -> Optional[CompilerSubmission]:
                     f"review: Assembled prompt ({actual_prompt_tokens} tokens) exceeds context window "
                     f"({max_allowed_tokens} tokens after safety margin). This indicates a context allocation bug."
                 )
-                return None  # Return None to skip this submission
+                raise ValueError(f"review: Prompt too large ({actual_prompt_tokens} tokens > {max_allowed_tokens} max)")
             
             logger.debug(f"review prompt: {actual_prompt_tokens} tokens (max: {max_allowed_tokens})")
             
@@ -765,8 +829,8 @@ async def submit_review(self) -> Optional[CompilerSubmission]:
                 logger.info("Paper review: no edit needed")
                 return None
             
-            # Check if this is a miniscule edit
-            is_miniscule = "miniscule" in data.get("reasoning", "").lower() or "minor" in data.get("reasoning", "").lower()
+            # Check if this is a minuscule edit
+            is_minuscule = "minuscule" in data.get("reasoning", "").lower() or "minor" in data.get("reasoning", "").lower()
             
             # Create submission
             # Use new_string as content for logging
@@ -780,21 +844,29 @@ async def submit_review(self) -> Optional[CompilerSubmission]:
                 old_string=_normalize_string_field(data.get("old_string", "")),
                 new_string=new_string_content,  # Already normalized above
                 reasoning=data.get("reasoning", ""),
-                metadata={"is_miniscule": is_miniscule}
+                metadata={"is_minuscule": is_minuscule}
             )
             
             # Notify task completed successfully
             if self.task_tracking_callback:
                 self.task_tracking_callback("completed", task_id)
             
-            logger.info(f"Review submission generated: {submission.submission_id} (miniscule={is_miniscule})")
+            logger.info(f"Review submission generated: {submission.submission_id} (minuscule={is_minuscule})")
             return submission
             
         except FreeModelExhaustedError:
             raise
+        except ValueError:
+            raise
+        except RuntimeError as e:
+            if "credits exhausted" in str(e).lower():
+                raise
+            logger.error(f"Failed to generate review submission: {e}", exc_info=True)
+            if self.task_tracking_callback and 'task_id' in dir():
+                self.task_tracking_callback("completed", task_id)
+            return None
         except Exception as e:
             logger.error(f"Failed to generate review submission: {e}", exc_info=True)
-            # Notify task completed (failed but still completed)
             if self.task_tracking_callback and 'task_id' in dir():
                 self.task_tracking_callback("completed", task_id)
             return None  # Don't crash workflow on review failure
diff --git a/backend/compiler/agents/high_param_submitter.py b/backend/compiler/agents/high_param_submitter.py
index efaa03e..2d9b630 100644
--- a/backend/compiler/agents/high_param_submitter.py
+++ b/backend/compiler/agents/high_param_submitter.py
@@ -169,11 +169,14 @@ async def _step1_planning(self) -> Optional[dict]:
         )
         
         # Try initial RAG retrieval - may overflow if outline + system prompts are large
+        # Exclude outline (always direct-injected in rigor mode)
+        rigor_exclude = ["compiler_outline.txt"]
         try:
             logger.info("Step 1: Retrieving relevant paper sections via RAG...")
             context_pack = await compiler_rag_manager.retrieve_for_mode(
                 query=self.user_prompt + " " + current_paper[-1000:],
-                mode="rigor"
+                mode="rigor",
+                exclude_sources=rigor_exclude
             )
             logger.info(f"Step 1: RAG retrieval complete - {len(context_pack.text)} chars")
             
@@ -217,7 +220,8 @@ async def _step1_planning(self) -> Optional[dict]:
             context_pack = await compiler_rag_manager.retrieve_for_mode(
                 query=self.user_prompt + " " + current_paper[-1000:],
                 mode="rigor",
-                max_tokens=remaining_budget
+                max_tokens=remaining_budget,
+                exclude_sources=rigor_exclude
             )
             
             prompt = await build_rigor_planning_prompt(
@@ -272,6 +276,13 @@ async def _step1_planning(self) -> Optional[dict]:
             
             return data
             
+        except RuntimeError as e:
+            if "credits exhausted" in str(e).lower():
+                raise
+            logger.error(f"Step 1: JSON parse failed - {e}")
+            if self.task_tracking_callback:
+                self.task_tracking_callback("completed", task_id)
+            return None
         except Exception as e:
             logger.error(f"Step 1: JSON parse failed - {e}")
             if self.task_tracking_callback:
@@ -308,11 +319,14 @@ async def _step2_standard_execution(
             )
             
             # Try RAG retrieval
+            # Exclude outline (always direct-injected in rigor mode)
+            rigor_exclude = ["compiler_outline.txt"]
             try:
                 logger.info("Step 2: Retrieving paper sections via RAG...")
                 context_pack = await compiler_rag_manager.retrieve_for_mode(
                     query=self.user_prompt + " " + current_paper[-1000:],
-                    mode="rigor"
+                    mode="rigor",
+                    exclude_sources=rigor_exclude
                 )
                 
                 # Build execution prompt
@@ -357,7 +371,8 @@ async def _step2_standard_execution(
                 context_pack = await compiler_rag_manager.retrieve_for_mode(
                     query=self.user_prompt + " " + current_paper[-1000:],
                     mode="rigor",
-                    max_tokens=remaining_budget
+                    max_tokens=remaining_budget,
+                    exclude_sources=rigor_exclude
                 )
                 
                 prompt = await build_rigor_execution_prompt(
@@ -502,11 +517,14 @@ async def _step2_wolfram_execution(
             )
             
             # Try RAG retrieval
+            # Exclude outline (always direct-injected in rigor mode)
+            rigor_exclude = ["compiler_outline.txt"]
             try:
                 logger.info("Step 2 (Wolfram): Retrieving paper sections via RAG...")
                 context_pack = await compiler_rag_manager.retrieve_for_mode(
                     query=self.user_prompt + " " + current_paper[-1000:],
-                    mode="rigor"
+                    mode="rigor",
+                    exclude_sources=rigor_exclude
                 )
                 
                 # Build Wolfram execution prompt
@@ -553,7 +571,8 @@ async def _step2_wolfram_execution(
                 context_pack = await compiler_rag_manager.retrieve_for_mode(
                     query=self.user_prompt + " " + current_paper[-1000:],
                     mode="rigor",
-                    max_tokens=remaining_budget
+                    max_tokens=remaining_budget,
+                    exclude_sources=rigor_exclude
                 )
                 
                 prompt = await build_rigor_wolfram_execution_prompt(
diff --git a/backend/compiler/core/compiler_coordinator.py b/backend/compiler/core/compiler_coordinator.py
index 01ebf66..6224e27 100644
--- a/backend/compiler/core/compiler_coordinator.py
+++ b/backend/compiler/core/compiler_coordinator.py
@@ -18,6 +18,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.json_parser import parse_json
+from backend.shared.utils import count_tokens
 from backend.compiler.agents.high_context_submitter import HighContextSubmitter
 from backend.compiler.agents.high_param_submitter import HighParamSubmitter
 from backend.compiler.agents.critique_submitter import CritiqueSubmitterAgent
@@ -70,7 +71,7 @@ def __init__(self):
         self.review_acceptances = 0
         self.review_rejections = 0
         self.review_declines = 0
-        self.miniscule_edit_count = 0
+        self.minuscule_edit_count = 0
         
         # Workflow state
         self.construction_cycle_count = 0
@@ -79,6 +80,8 @@ def __init__(self):
         # Autonomous mode (for Part 3 integration)
         self.autonomous_mode = False
         self.autonomous_section_phase = None  # "body", "conclusion", "introduction", "abstract"
+        self._current_topic_id = None  # Set by autonomous coordinator for retroactive brainstorm corrections
+        self._current_reference_paper_ids: List[str] = []  # Autonomous/Tier 3 references preserved for critique and rewrite context
         
         # Critique phase state (post-body peer review)
         self.critique_submitter = None  # CritiqueSubmitterAgent instance
@@ -207,7 +210,7 @@ async def initialize(
         self.review_acceptances = 0
         self.review_rejections = 0
         self.review_declines = 0
-        self.miniscule_edit_count = 0
+        self.minuscule_edit_count = 0
         self.construction_cycle_count = 0
         self.rigor_cycle_active = False
         self.aggregator_acceptances_last_rag = 0
@@ -957,10 +960,24 @@ async def _initial_paper_loop(self) -> None:
             
             try:
                 section_phase = self.autonomous_section_phase if self.autonomous_mode else None
+                
+                # Load brainstorm content for first construction too
+                first_brainstorm_content = None
+                first_brainstorm_source = None
+                if self.autonomous_mode and self._current_topic_id:
+                    try:
+                        from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
+                        first_brainstorm_content = await brainstorm_memory.get_database_content(self._current_topic_id)
+                        first_brainstorm_source = f"brainstorm_{self._current_topic_id}.txt"
+                    except Exception:
+                        pass
+                
                 submission = await self.high_context_submitter.submit_construction(
                     is_first_portion=True,
                     section_phase=section_phase,
-                    rejection_feedback=rejection_feedback  # Pass rejection feedback for retry
+                    rejection_feedback=rejection_feedback,
+                    brainstorm_content=first_brainstorm_content,
+                    brainstorm_source_name=first_brainstorm_source
                 )
                 
                 if submission is None:
@@ -981,6 +998,23 @@ async def _initial_paper_loop(self) -> None:
                     
             except FreeModelExhaustedError:
                 raise
+            except ValueError as e:
+                logger.error(f"Construction context overflow in initial loop (attempt {attempt}): {e}")
+                await self._broadcast("compiler_rejection", {
+                    "mode": "construction",
+                    "reasoning": f"Context overflow: {e}"
+                })
+                await compiler_rejection_log.add_rejection(
+                    CompilerValidationResult(
+                        submission_id=str(uuid.uuid4()),
+                        decision="reject",
+                        reasoning=str(e),
+                        summary=str(e)[:750],
+                        validation_stage="internal_error"
+                    ), "construction", ""
+                )
+                await asyncio.sleep(backoff_time)
+                continue
             except Exception as e:
                 logger.error(f"Construction submission failed with error (attempt {attempt}): {e}")
                 await self._broadcast("compiler_retry", {
@@ -1154,13 +1188,48 @@ async def _submit_and_validate_construction(self, rejection_feedback: Optional[s
             pre_critique_paper_for_construction = self.pre_critique_paper
             logger.info("Body construction with critique context (rewrite mode)")
         
-        submission = await self.high_context_submitter.submit_construction(
-            is_first_portion=False,
-            section_phase=section_phase,
-            rejection_feedback=rejection_feedback,
-            critique_feedback=critique_feedback_for_construction,
-            pre_critique_paper=pre_critique_paper_for_construction
-        )
+        # Load brainstorm content for retroactive corrections (autonomous mode only)
+        brainstorm_content_for_submitter = None
+        brainstorm_source_for_submitter = None
+        if self.autonomous_mode and self._current_topic_id:
+            try:
+                from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
+                brainstorm_content_for_submitter = await brainstorm_memory.get_database_content(self._current_topic_id)
+                brainstorm_source_for_submitter = f"brainstorm_{self._current_topic_id}.txt"
+                if brainstorm_content_for_submitter:
+                    logger.info(f"Loaded brainstorm content for retroactive corrections: {len(brainstorm_content_for_submitter)} chars")
+            except Exception as e:
+                logger.warning(f"Failed to load brainstorm for retroactive corrections: {e}")
+        
+        submission = None
+        try:
+            submission = await self.high_context_submitter.submit_construction(
+                is_first_portion=False,
+                section_phase=section_phase,
+                rejection_feedback=rejection_feedback,
+                critique_feedback=critique_feedback_for_construction,
+                pre_critique_paper=pre_critique_paper_for_construction,
+                brainstorm_content=brainstorm_content_for_submitter,
+                brainstorm_source_name=brainstorm_source_for_submitter
+            )
+        except ValueError as e:
+            logger.error(f"Construction context overflow: {e}")
+            self.construction_rejections += 1
+            overflow_reason = f"Context overflow: {e}"
+            await compiler_rejection_log.add_rejection(
+                CompilerValidationResult(
+                    submission_id=str(uuid.uuid4()),
+                    decision="reject",
+                    reasoning=overflow_reason,
+                    summary=overflow_reason[:750],
+                    validation_stage="internal_error"
+                ), "construction", ""
+            )
+            await self._broadcast("compiler_rejection", {
+                "mode": "construction",
+                "reasoning": overflow_reason
+            })
+            return False, overflow_reason
         
         if submission is None:
             logger.info("Construction not needed - paper is complete")
@@ -1492,7 +1561,8 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                     return True, None
             
             logger.info(f"Construction accepted ({word_count} words)")
-            return True, None
+            paper_accepted = True
+            paper_rejection_reason = None
         else:
             self.construction_rejections += 1
             
@@ -1505,7 +1575,88 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
             })
             
             logger.info("Construction rejected")
-            return False, result.reasoning
+            paper_accepted = False
+            paper_rejection_reason = result.reasoning
+        
+        # ================================================================
+        # RETROACTIVE BRAINSTORM OPERATION (independent from paper result)
+        # ================================================================
+        if submission.brainstorm_operation and self.autonomous_mode and hasattr(self, '_current_topic_id') and self._current_topic_id:
+            await self._handle_brainstorm_retroactive_operation(submission.brainstorm_operation)
+        
+        return paper_accepted, paper_rejection_reason
+    
+    async def _handle_brainstorm_retroactive_operation(self, brainstorm_op) -> None:
+        """
+        Validate a retroactive brainstorm operation (edit/delete/add) against the current
+        brainstorm content, independently from the paper operation, and apply it if accepted
+        (then refresh RAG). Errors during validation/apply are logged with traceback, not raised.
+        """
+        from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
+
+        topic_id = self._current_topic_id
+        logger.info(f"Processing retroactive brainstorm {brainstorm_op.action} for topic {topic_id}")
+
+        try:
+            brainstorm_content = await brainstorm_memory.get_database_content(topic_id)
+            if not brainstorm_content:
+                logger.warning(f"Brainstorm {topic_id} is empty, skipping retroactive operation")
+                return
+            # The validator receives only the operation and the current brainstorm text.
+            result = await self.validator.validate_brainstorm_operation(
+                brainstorm_op, brainstorm_content
+            )
+
+            if result.decision == "accept":
+                success = False
+                action = brainstorm_op.action
+                if action == "edit":
+                    success = await brainstorm_memory.edit_submission(
+                        topic_id, brainstorm_op.submission_number, brainstorm_op.new_content
+                    )
+                elif action == "delete":
+                    success = await brainstorm_memory.remove_submission(
+                        topic_id, brainstorm_op.submission_number
+                    )
+                elif action == "add":
+                    new_num = await brainstorm_memory.add_submission_retroactive(
+                        topic_id, brainstorm_op.new_content
+                    )
+                    success = new_num is not None
+                else:
+                    logger.error(f"Unsupported retroactive brainstorm action: {action!r}")
+
+                if success:
+                    logger.info(f"Retroactive brainstorm {action} accepted and applied for topic {topic_id}")
+                    # Refresh RAG. NOTE(review): confirm add_document replaces stale chunks for this path.
+                    try:
+                        db_path = brainstorm_memory.get_database_path(topic_id)
+                        from backend.aggregator.core.rag_manager import rag_manager
+                        await rag_manager.add_document(
+                            db_path,
+                            chunk_sizes=[512],
+                            is_user_file=True
+                        )
+                        logger.info("RAG refreshed with updated brainstorm content")
+                    except Exception as e:
+                        logger.error(f"Failed to refresh RAG after brainstorm {action}: {e}", exc_info=True)
+                    # Broadcast even if the RAG refresh failed: the brainstorm change itself was applied.
+                    await self._broadcast("brainstorm_retroactive_accepted", {
+                        "action": action,
+                        "topic_id": topic_id,
+                        "submission_number": brainstorm_op.submission_number,
+                    })
+                else:
+                    logger.error(f"Retroactive brainstorm {action} was validated but failed to apply")
+            else:
+                logger.info(f"Retroactive brainstorm {brainstorm_op.action} rejected: {result.reasoning[:200]}")
+                await self._broadcast("brainstorm_retroactive_rejected", {
+                    "action": brainstorm_op.action,
+                    "topic_id": topic_id,
+                    "reasoning": result.reasoning[:500],
+                })
+        except Exception as e:
+            logger.error(f"Error handling retroactive brainstorm operation: {e}", exc_info=True)
     
     async def _submit_and_validate_outline_update(self) -> bool:
         """Submit and validate outline update. Returns True if accepted."""
@@ -1617,7 +1768,18 @@ async def _submit_and_validate_review(self) -> bool:
         """Submit and validate review. Returns True if accepted."""
         self.current_mode = "review"
         
-        submission = await self.high_context_submitter.submit_review()
+        submission = None
+        try:
+            submission = await self.high_context_submitter.submit_review()
+        except ValueError as e:
+            logger.error(f"Review context overflow: {e}")
+            self.review_declines += 1
+            await compiler_rejection_log.add_decline("review", f"Context overflow: {e}")
+            await self._broadcast("compiler_decline", {
+                "mode": "review",
+                "reasoning": f"Context overflow: {e}"
+            })
+            return False
         
         if submission is None:
             logger.info("No review edit needed")
@@ -1633,9 +1795,9 @@ async def _submit_and_validate_review(self) -> bool:
         
         self.total_submissions += 1
         
-        # Check for miniscule edit
-        if submission.metadata.get("is_miniscule", False):
-            self.miniscule_edit_count += 1
+        # Check for minuscule edit
+        if submission.metadata.get("is_minuscule", False):
+            self.minuscule_edit_count += 1
         
         await self._broadcast("compiler_submission", {
             "mode": "review",
@@ -2254,6 +2416,87 @@ async def _start_critique_phase(self) -> None:
         
         # Start critique aggregation loop
         await self._run_critique_aggregation()
+
+    async def _get_reference_papers_context_for_critique(
+        self,
+        current_outline: str = "",
+        current_body: str = "",
+        aggregator_db: str = "",
+        critique_feedback: str = "",
+        pre_critique_paper: str = "",
+        accumulated_history: str = ""
+    ) -> Optional[str]:
+        """
+        Prepare reference-paper context for critique/rewrite prompts in autonomous mode, so the
+        selected reference papers are not dropped once the critique phase begins. The text args
+        are token-counted to size the budget; all but aggregator_db and accumulated_history also
+        form the retrieval query. Returns None when disabled, over budget, empty, or on error.
+        """
+        if not self.autonomous_mode or not self._current_reference_paper_ids:
+            return None
+        # Best-effort from here on: any exception is logged as a warning and yields None.
+        try:
+            from backend.autonomous.core.autonomous_rag_manager import autonomous_rag_manager
+            from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
+            # Input-token budget is derived from the critique submitter's window/max-token settings.
+            max_input_tokens = rag_config.get_available_input_tokens(
+                system_config.compiler_critique_submitter_context_window,
+                system_config.compiler_critique_submitter_max_tokens
+            )
+            # Measure the non-empty texts: user prompt, title, and everything the caller passed in.
+            direct_injected_context = "\n\n".join(
+                part for part in [
+                    self.user_prompt or "",
+                    self.paper_title or "",
+                    current_outline or "",
+                    current_body or "",
+                    aggregator_db or "",
+                    critique_feedback or "",
+                    pre_critique_paper or "",
+                    accumulated_history or "",
+                ]
+                if part
+            )
+            direct_tokens = count_tokens(direct_injected_context)
+
+            # Reserve headroom for system prompt, JSON schema, rejection memory,
+            # and the static prompt framing around reference content.
+            reference_budget = min(16000, max_input_tokens - direct_tokens - 10000)
+            if reference_budget <= 0:
+                logger.warning(
+                    "Skipping critique reference context due to prompt budget "
+                    f"(direct={direct_tokens}, max_input={max_input_tokens})"
+                )
+                return None
+            # Source names handed to retrieval as exclude_sources (outline, paper, brainstorm file).
+            exclude_sources = ["compiler_outline.txt", "compiler_paper.txt"]
+            if self._current_topic_id:
+                brainstorm_db_path = brainstorm_memory.get_database_path(self._current_topic_id)
+                exclude_sources.append(Path(brainstorm_db_path).name)  # NOTE(review): needs a module-level pathlib.Path import - confirm
+            # The query reuses the same texts minus aggregator_db and accumulated_history.
+            query = "\n\n".join(
+                part for part in [
+                    self.user_prompt or "",
+                    self.paper_title or "",
+                    current_outline or "",
+                    current_body or "",
+                    critique_feedback or "",
+                    pre_critique_paper or "",
+                ]
+                if part
+            )
+
+            reference_context, _ = await autonomous_rag_manager.get_reference_papers_context(
+                self._current_reference_paper_ids,
+                max_total_tokens=reference_budget,
+                query=query,
+                exclude_sources=exclude_sources
+            )
+            # An empty/falsy context is reported to the caller as None.
+            return reference_context or None
+        except Exception as e:
+            logger.warning(f"Failed to prepare critique reference context: {e}")
+            return None
     
     async def _run_critique_aggregation(self) -> None:
         """
@@ -2307,11 +2550,17 @@ async def _run_critique_aggregation(self) -> None:
                 # Get existing critiques
                 existing_critiques = await critique_memory.get_all_critiques()
                 
-                # Get reference papers if available
-                reference_papers = None  # TODO: Load if applicable
-                
                 # Format accumulated critique history from previous failed versions
                 accumulated_history = self._format_accumulated_critique_history()
+
+                # Keep autonomous reference papers available during critique/rewrite.
+                reference_papers = await self._get_reference_papers_context_for_critique(
+                    current_outline=current_outline,
+                    current_body=current_body,
+                    aggregator_db=aggregator_db,
+                    critique_feedback=existing_critiques,
+                    accumulated_history=accumulated_history
+                )
                 
                 # Generate critique submission
                 submission = await self.critique_submitter.submit_critique(
@@ -2614,10 +2863,17 @@ async def _trigger_rewrite_decision(self) -> None:
                 # Get context (aggregator DB, reference papers, etc.)
                 from backend.aggregator.memory.shared_training import shared_training_memory
                 aggregator_db = await shared_training_memory.get_all_content()
-                reference_papers = None  # TODO: Load if applicable
-                
                 # Format accumulated critique history from previous failed versions
                 accumulated_history = self._format_accumulated_critique_history()
+
+                reference_papers = await self._get_reference_papers_context_for_critique(
+                    current_outline=current_outline,
+                    current_body=current_body,
+                    aggregator_db=aggregator_db,
+                    critique_feedback=critique_feedback,
+                    pre_critique_paper=self.pre_critique_paper or "",
+                    accumulated_history=accumulated_history
+                )
                 
                 # Critique submitter makes decision
                 logger.info("Critique submitter generating rewrite decision...")
@@ -2841,6 +3097,14 @@ async def _execute_partial_revision(
         
         # Get current outline
         current_outline = await outline_memory.get_outline()
+
+        reference_papers = await self._get_reference_papers_context_for_critique(
+            current_outline=current_outline,
+            current_body=self.pre_critique_paper or "",
+            critique_feedback=critique_feedback,
+            pre_critique_paper=self.pre_critique_paper or "",
+            accumulated_history=accumulated_history or ""
+        )
         
         # ITERATIVE EDIT LOOP
         MAX_EDITS = 20  # Safety limit to prevent infinite loops
@@ -2867,6 +3131,7 @@ async def _execute_partial_revision(
                     current_outline=current_outline,
                     critique_feedback=critique_feedback,
                     edits_applied=edits_applied,
+                    reference_papers=reference_papers,
                     accumulated_history=accumulated_history
                 )
                 
@@ -3357,7 +3622,7 @@ async def get_status(self) -> CompilerState:
             review_acceptances=self.review_acceptances,
             review_rejections=self.review_rejections,
             review_declines=self.review_declines,
-            miniscule_edit_count=self.miniscule_edit_count,
+            minuscule_edit_count=self.minuscule_edit_count,
             in_critique_phase=self.in_critique_phase,
             critique_acceptances=self.critique_acceptances,
             paper_version=self.paper_version,
@@ -3431,7 +3696,7 @@ async def clear_paper(self) -> None:
         self.review_acceptances = 0
         self.review_rejections = 0
         self.review_declines = 0
-        self.miniscule_edit_count = 0
+        self.minuscule_edit_count = 0
         self.construction_cycle_count = 0
         self.rigor_cycle_active = False
         
@@ -3439,6 +3704,7 @@ async def clear_paper(self) -> None:
         if self.autonomous_mode:
             self.autonomous_section_phase = "body"  # Reset to body phase
             logger.info("Reset autonomous section phase to body")
+        self._current_reference_paper_ids = []
         
         # Reset critique phase state
         self.in_critique_phase = False
diff --git a/backend/compiler/core/compiler_rag_manager.py b/backend/compiler/core/compiler_rag_manager.py
index 4a29559..c7b2532 100644
--- a/backend/compiler/core/compiler_rag_manager.py
+++ b/backend/compiler/core/compiler_rag_manager.py
@@ -4,7 +4,7 @@
 Default context window: 4096 tokens (user-configurable via settings).
 """
 import logging
-from typing import Optional
+from typing import Optional, List
 from pathlib import Path
 
 from backend.shared.config import system_config, rag_config
@@ -229,7 +229,8 @@ async def retrieve_for_mode(
         self,
         query: str,
         mode: str,
-        max_tokens: Optional[int] = None
+        max_tokens: Optional[int] = None,
+        exclude_sources: Optional[List[str]] = None
     ) -> ContextPack:
         """
         Retrieve context optimized for specific compiler mode.
@@ -238,6 +239,7 @@ async def retrieve_for_mode(
             query: Search query
             mode: Compiler mode (construction, outline, review, rigor)
             max_tokens: Override max tokens (defaults to available_tokens)
+            exclude_sources: Source names to skip (already direct-injected in prompt)
         
         Returns:
             ContextPack with retrieved context
@@ -245,6 +247,8 @@ async def retrieve_for_mode(
         import time
         
         logger.info(f"Starting RAG retrieval for mode={mode}, query_length={len(query)}")
+        if exclude_sources:
+            logger.info(f"Excluding direct-injected sources: {exclude_sources}")
         start_time = time.time()
         
         try:
@@ -257,7 +261,8 @@ async def retrieve_for_mode(
             context_pack = await rag_manager.retrieve(
                 query=query,
                 chunk_size=chunk_size,
-                max_tokens=max_tokens
+                max_tokens=max_tokens,
+                exclude_sources=exclude_sources
             )
             
             elapsed = time.time() - start_time
diff --git a/backend/compiler/prompts/construction_prompts.py b/backend/compiler/prompts/construction_prompts.py
index 2fd0e46..2c279da 100644
--- a/backend/compiler/prompts/construction_prompts.py
+++ b/backend/compiler/prompts/construction_prompts.py
@@ -89,6 +89,8 @@ def get_body_construction_system_prompt() -> str:
 3. Write the NEXT body section that follows the outline
 4. Set section_complete=true ONLY when ALL body sections from the outline are written
 
+PROGRESSIVE SYSTEM: You will be called repeatedly — once per body section. Focus on writing ONE complete, rigorous section per turn rather than rushing through multiple sections. Write what you can do thoroughly and correctly this turn; you will be called again for the next section.
+
 WHAT COUNTS AS BODY SECTIONS:
 - Definitions and Preliminaries
 - Main Results / Theorems
@@ -856,6 +858,36 @@ def get_construction_json_schema() -> str:
   "new_string": "",
   "reasoning": "The abstract is complete. The paper is finished."
 }
+
+OPTIONAL - RETROACTIVE BRAINSTORM OPERATION (Autonomous Mode Only):
+
+During paper writing, you see the FULL brainstorm database alongside the paper. If you identify
+an error, redundancy, or missing insight in the brainstorm, you may OPTIONALLY include a
+brainstorm_operation field. This is validated INDEPENDENTLY from your paper operation.
+
+CRITICAL INDEPENDENT VALIDITY PRINCIPLE:
+- Your paper edit must be correct even if the brainstorm operation is rejected
+- Your brainstorm operation must be justified even if the paper edit is rejected
+- NEVER write paper content that depends on a simultaneous brainstorm correction for correctness
+- NEVER propose a brainstorm correction that is only justified by what you're writing in the paper
+
+Add this OPTIONAL field to your JSON response:
+{
+  ... (all standard fields above) ...,
+  "brainstorm_operation": {
+    "action": "edit | delete | add",
+    "submission_number": 5,
+    "new_content": "corrected or new content (empty for delete)",
+    "reasoning": "Independent justification - must stand alone without referencing paper edit"
+  }
+}
+
+brainstorm_operation actions:
+- "edit": Correct submission #N with new_content (submission_number required)
+- "delete": Remove submission #N from brainstorm (submission_number required, new_content empty)
+- "add": Add a new insight to the brainstorm (submission_number not needed)
+
+If no brainstorm correction is needed (most turns), simply omit the brainstorm_operation field.
 """
 
 
@@ -872,7 +904,8 @@ async def build_construction_prompt(
     section_phase: Optional[str] = None,
     rejection_feedback: Optional[str] = None,
     critique_feedback: Optional[str] = None,
-    pre_critique_paper: Optional[str] = None
+    pre_critique_paper: Optional[str] = None,
+    brainstorm_content: Optional[str] = None
 ) -> str:
     """
     Build complete prompt for construction mode.
@@ -887,6 +920,7 @@ async def build_construction_prompt(
         rejection_feedback: Feedback from a previous rejection to guide the model
         critique_feedback: Accepted critique feedback from peer review (for rewrites)
         pre_critique_paper: Paper state before critique phase (for rewrites - shows what failed)
+        brainstorm_content: Full brainstorm database with submission numbers (for retroactive corrections, autonomous mode)
     
     Returns:
         Complete prompt string
@@ -985,6 +1019,11 @@ async def build_construction_prompt(
         parts.append("TASK: Write the NEXT logical portion following the section order (body → conclusion → intro → abstract).")
     
     parts.append("\n---\n")
+    
+    if brainstorm_content:
+        parts.append(f"BRAINSTORM DATABASE (editable - you may propose corrections via brainstorm_operation):\n{brainstorm_content}")
+        parts.append("\n---\n")
+    
     parts.append(f"AGGREGATOR DATABASE EVIDENCE:\n{rag_evidence}")
     parts.append("\n---\n")
     parts.append("Now generate your submission as JSON (remember to set section_complete appropriately):")
@@ -1001,7 +1040,8 @@ async def build_phase_construction_prompt(
     is_first_in_phase: bool = False,
     rejection_feedback: Optional[str] = None,
     critique_feedback: Optional[str] = None,
-    pre_critique_paper: Optional[str] = None
+    pre_critique_paper: Optional[str] = None,
+    brainstorm_content: Optional[str] = None
 ) -> str:
     """
     Build prompt for a specific construction phase.
@@ -1018,6 +1058,7 @@ async def build_phase_construction_prompt(
         rejection_feedback: Feedback from a previous rejection to guide the model
         critique_feedback: Accepted critique feedback from peer review (for rewrites)
         pre_critique_paper: Paper state before critique phase (for rewrites)
+        brainstorm_content: Full brainstorm database with submission numbers (autonomous mode)
     
     Returns:
         Complete prompt string
@@ -1031,7 +1072,8 @@ async def build_phase_construction_prompt(
         section_phase=phase,
         rejection_feedback=rejection_feedback,
         critique_feedback=critique_feedback,
-        pre_critique_paper=pre_critique_paper
+        pre_critique_paper=pre_critique_paper,
+        brainstorm_content=brainstorm_content
     )
 
 
@@ -1047,7 +1089,8 @@ async def build_body_construction_prompt(
     is_first_portion: bool = False,
     rejection_feedback: Optional[str] = None,
     critique_feedback: Optional[str] = None,
-    pre_critique_paper: Optional[str] = None
+    pre_critique_paper: Optional[str] = None,
+    brainstorm_content: Optional[str] = None
 ) -> str:
     """
     Build prompt for BODY section construction phase.
@@ -1061,6 +1104,7 @@ async def build_body_construction_prompt(
         rejection_feedback: Feedback from a previous rejection to guide the model
         critique_feedback: Accepted critique feedback from peer review (for rewrites only)
         pre_critique_paper: Paper state before critique phase (for rewrites - shows what failed)
+        brainstorm_content: Full brainstorm database with submission numbers (autonomous mode)
     """
     return await build_phase_construction_prompt(
         user_prompt=user_prompt,
@@ -1071,7 +1115,8 @@ async def build_body_construction_prompt(
         is_first_in_phase=is_first_portion,
         rejection_feedback=rejection_feedback,
         critique_feedback=critique_feedback,
-        pre_critique_paper=pre_critique_paper
+        pre_critique_paper=pre_critique_paper,
+        brainstorm_content=brainstorm_content
     )
 
 
@@ -1080,7 +1125,8 @@ async def build_conclusion_construction_prompt(
     current_outline: str,
     current_paper: str,
     rag_evidence: str,
-    rejection_feedback: Optional[str] = None
+    rejection_feedback: Optional[str] = None,
+    brainstorm_content: Optional[str] = None
 ) -> str:
     """Build prompt for CONCLUSION section construction phase."""
     return await build_phase_construction_prompt(
@@ -1090,7 +1136,8 @@ async def build_conclusion_construction_prompt(
         rag_evidence=rag_evidence,
         phase="conclusion",
         is_first_in_phase=True,
-        rejection_feedback=rejection_feedback
+        rejection_feedback=rejection_feedback,
+        brainstorm_content=brainstorm_content
     )
 
 
@@ -1099,7 +1146,8 @@ async def build_introduction_construction_prompt(
     current_outline: str,
     current_paper: str,
     rag_evidence: str,
-    rejection_feedback: Optional[str] = None
+    rejection_feedback: Optional[str] = None,
+    brainstorm_content: Optional[str] = None
 ) -> str:
     """Build prompt for INTRODUCTION section construction phase."""
     return await build_phase_construction_prompt(
@@ -1109,7 +1157,8 @@ async def build_introduction_construction_prompt(
         rag_evidence=rag_evidence,
         phase="introduction",
         is_first_in_phase=True,
-        rejection_feedback=rejection_feedback
+        rejection_feedback=rejection_feedback,
+        brainstorm_content=brainstorm_content
     )
 
 
@@ -1118,7 +1167,8 @@ async def build_abstract_construction_prompt(
     current_outline: str,
     current_paper: str,
     rag_evidence: str,
-    rejection_feedback: Optional[str] = None
+    rejection_feedback: Optional[str] = None,
+    brainstorm_content: Optional[str] = None
 ) -> str:
     """Build prompt for ABSTRACT section construction phase."""
     return await build_phase_construction_prompt(
@@ -1128,5 +1178,6 @@ async def build_abstract_construction_prompt(
         rag_evidence=rag_evidence,
         phase="abstract",
         is_first_in_phase=True,
-        rejection_feedback=rejection_feedback
-    )
+        rejection_feedback=rejection_feedback,
+        brainstorm_content=brainstorm_content
+    )
\ No newline at end of file
diff --git a/backend/compiler/prompts/critique_prompts.py b/backend/compiler/prompts/critique_prompts.py
index 3e38373..b2ebbf8 100644
--- a/backend/compiler/prompts/critique_prompts.py
+++ b/backend/compiler/prompts/critique_prompts.py
@@ -53,6 +53,8 @@ def get_critique_submitter_system_prompt() -> str:
 YOUR TASK:
 Assess whether the body section needs substantive critique. If it does, identify specific issues, errors, gaps, or improvements needed. If it doesn't (academically acceptable), decline to critique.
 
+PROGRESSIVE SYSTEM: You will be called multiple times (up to 5 total attempts). Focus on identifying ONE specific, well-substantiated critique per turn. Do not try to list every issue at once — address the most important issue thoroughly this turn, and you will have further opportunities to raise additional issues.
+
 WHAT TO CRITIQUE - Focus on:
 - Mathematical errors or unsound reasoning
 - Missing proofs or incomplete arguments  
@@ -872,6 +874,7 @@ def build_iterative_edit_prompt(
     current_outline: str,
     critique_feedback: str,
     edits_applied: List[Dict],
+    reference_papers: Optional[str] = None,
     accumulated_critique_history: str = ""
 ) -> str:
     """
@@ -884,6 +887,7 @@ def build_iterative_edit_prompt(
         current_outline: The paper outline
         critique_feedback: All accepted critiques from this revision cycle
         edits_applied: List of edits already applied in this iteration
+        reference_papers: Optional reference paper content
         accumulated_critique_history: Critiques from previous failed versions (if any)
         
     Returns:
@@ -915,6 +919,12 @@ def build_iterative_edit_prompt(
         f"CURRENT PAPER (after {len(edits_applied)} edit(s) applied):\n{current_paper}",
         "\n---\n",
     ])
+
+    if reference_papers:
+        parts.extend([
+            f"REFERENCE PAPERS:\n{reference_papers}",
+            "\n---\n",
+        ])
     
     # Show edits already applied
     if edits_applied:
diff --git a/backend/compiler/validation/compiler_validator.py b/backend/compiler/validation/compiler_validator.py
index 9715f1a..ac68edf 100644
--- a/backend/compiler/validation/compiler_validator.py
+++ b/backend/compiler/validation/compiler_validator.py
@@ -122,6 +122,21 @@ def normalize_whitespace(text: str) -> str:
     return re.sub(r'  +', ' ', text)
 
 
+def normalize_all_whitespace(text: str) -> str:
+    """
+    Replace every run of whitespace (spaces, tabs, newlines) with one space.
+
+    Fallback for when space-only normalization misses: a model may emit a
+    paragraph break ('\\n\\n') where the document holds a single space, or
+    the reverse. Falsy input (None or '') is handed back unchanged.
+    """
+    import re
+
+    if text:
+        return re.sub(r'\s+', ' ', text)
+    return text
+
+
 def normalize_backslashes_for_matching(text: str) -> str:
     """
     Collapse runs of 2+ consecutive backslashes to a single backslash for comparison.
@@ -191,12 +206,31 @@ def find_with_normalized_hyphens(needle: str, haystack: str) -> Tuple[int, str]:
             logger.debug(f"   Whitespace normalization matched: '{needle[:50]}...' found as '{actual_text[:50]}...'")
             return (match.start(), actual_text)
 
+    # Try full whitespace normalization (3b layer - handles newline vs space mismatches)
+    # Models may output \n\n where the document has a single space, or vice versa.
+    # Collapses ALL whitespace runs (spaces, newlines, tabs) to a single space.
+    aws_needle = normalize_all_whitespace(normalized_needle)
+    aws_haystack = normalize_all_whitespace(normalized_haystack)
+
+    aws_pos = aws_haystack.find(aws_needle)
+    if aws_pos >= 0:
+        import re
+        escaped = re.escape(aws_needle)
+        flexible_pattern = escaped.replace(r'\ ', r'\s+')
+
+        match = re.search(flexible_pattern, haystack)
+        if match:
+            actual_text = match.group(0)
+            logger.info(f"ALL_WHITESPACE_NORMALIZED_MATCH: Found at pos {match.start()}")
+            logger.debug(f"   All-whitespace normalization matched: '{needle[:50]}...' found as '{actual_text[:50]}...'")
+            return (match.start(), actual_text)
+
     # Try backslash normalization (4th layer - handles model over-escaping quirks)
     # e.g., model writes \\\\mathbb in JSON -> \\mathbb after json.loads, but document has \mathbb
-    bs_needle = normalize_backslashes_for_matching(ws_needle)
-    bs_haystack = normalize_backslashes_for_matching(ws_haystack)
+    bs_needle = normalize_backslashes_for_matching(aws_needle)
+    bs_haystack = normalize_backslashes_for_matching(aws_haystack)
 
-    if bs_needle != ws_needle:  # Only attempt if backslash normalization actually changed the needle
+    if bs_needle != aws_needle:  # Only attempt if backslash normalization actually changed the needle
         bs_pos = bs_haystack.find(bs_needle)
         if bs_pos >= 0:
             # Convert normalized needle to a regex that allows 1+ backslashes wherever
@@ -228,8 +262,9 @@ def find_with_normalized_hyphens(needle: str, haystack: str) -> Tuple[int, str]:
 
     # === DEEP DIAGNOSTICS FOR COMPLETE FAILURE ===
     logger.warning(f"MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:")
-    logger.warning(f"   Needle (first 200 chars): {repr(needle[:200])}")
-    logger.warning(f"   Needle (last 200 chars): {repr(needle[-200:])}")
+    logger.warning(f"   Needle FULL:\n{needle}")
+    logger.warning(f"   Needle (first 200 chars repr): {repr(needle[:200])}")
+    logger.warning(f"   Needle (last 200 chars repr): {repr(needle[-200:])}")
     logger.warning(f"   Haystack (first 200 chars): {repr(haystack[:200])}")
     logger.warning(f"   Haystack (last 200 chars): {repr(haystack[-200:])}")
     
@@ -526,6 +561,7 @@ def _pre_validate_exact_string_match(
         logger.info(f"PRE_VALIDATE_START: mode={submission.mode}, operation={submission.operation}")
         if submission.old_string:
             logger.info(f"   old_string preview: {repr(submission.old_string[:100])}{'...' if len(submission.old_string) > 100 else ''}")
+            logger.debug(f"   old_string full: {repr(submission.old_string)}")
             logger.debug(f"   old_string diagnostics: {_diagnostic_char_info(submission.old_string)}")
         
         # Determine which document to check against based on mode
@@ -636,6 +672,7 @@ def _pre_validate_exact_string_match(
                 if outline_confusion:
                     # Provide targeted feedback for outline vs paper confusion
                     logger.warning(f"Pre-validation failed: old_string found in OUTLINE but not in PAPER (outline confusion)")
+                    logger.warning(f"FULL old_string that failed to match paper:\n{submission.old_string}")
                     return CompilerValidationResult(
                         submission_id=submission.submission_id,
                         decision="reject",
@@ -665,6 +702,7 @@ def _pre_validate_exact_string_match(
                     fix_suggestion = f"\n\nNo similar text found. Verify the old_string matches something in the current {document_name} exactly."
                 
                 logger.warning(f"Pre-validation failed: old_string not found in {document_name}")
+                logger.warning(f"FULL old_string that failed to match:\n{submission.old_string}")
                 return CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
@@ -692,6 +730,7 @@ def _pre_validate_exact_string_match(
         match_count = normalized_doc.count(normalized_old)
         if match_count > 1:
             logger.warning(f"Pre-validation failed: old_string appears {match_count} times in {document_name} (not unique)")
+            logger.warning(f"FULL old_string that matched multiple times:\n{submission.old_string}")
             return CompilerValidationResult(
                 submission_id=submission.submission_id,
                 decision="reject",
@@ -1020,6 +1059,183 @@ async def validate_submission(
                 validation_stage="internal_error"
             )
     
+    async def validate_brainstorm_operation(
+        self,
+        brainstorm_op: "BrainstormRetroactiveOperation",
+        brainstorm_content: str
+    ) -> CompilerValidationResult:
+        """
+        Validate a retroactive brainstorm operation independently.
+
+        The validator sees ONLY the brainstorm database and the proposed operation.
+        It never sees the paper operation that may accompany this brainstorm operation.
+        Each operation must be justified on its own merits.
+
+        Returns "accept" only when the model explicitly accepts (case-insensitive); an
+        oversized prompt or any failure other than FreeModelExhaustedError (re-raised)
+        is reported as a reject with validation_stage "internal_error".
+        """
+        logger.info(f"Validating brainstorm retroactive operation: {brainstorm_op.action}")
+
+        prompt = self._build_brainstorm_validation_prompt(brainstorm_op, brainstorm_content)
+        actual_prompt_tokens = count_tokens(prompt)
+        from backend.shared.config import system_config, rag_config
+        max_allowed_tokens = rag_config.get_available_input_tokens(
+            system_config.compiler_validator_context_window,
+            system_config.compiler_validator_max_output_tokens
+        )
+
+        if actual_prompt_tokens > max_allowed_tokens:
+            logger.error(f"Brainstorm validation prompt too large: {actual_prompt_tokens} > {max_allowed_tokens}")
+            return CompilerValidationResult(
+                submission_id=str(uuid.uuid4()),
+                decision="reject",
+                reasoning=f"Internal error: Brainstorm validation prompt too large ({actual_prompt_tokens} tokens)",
+                summary="Internal context overflow error",
+                json_valid=False,
+                validation_stage="internal_error"
+            )
+
+        task_id = self.get_current_task_id()
+        self.task_sequence += 1
+        if self.task_tracking_callback:
+            self.task_tracking_callback("started", task_id)
+
+        try:
+            response = await api_client_manager.generate_completion(
+                task_id=task_id,
+                role_id=self.role_id,
+                model=self.model_name,
+                messages=[{"role": "user", "content": prompt}],
+                temperature=0.0,
+                max_tokens=system_config.compiler_validator_max_output_tokens
+            )
+            message = response["choices"][0]["message"]
+            llm_output = message.get("content") or message.get("reasoning") or ""
+            validation_data = await self._parse_json_with_retry(llm_output, prompt, "", 0)
+
+            # Tolerate "Accept"/padded/null fields; anything but an explicit accept is a reject.
+            decision = str(validation_data.get("decision") or "reject").strip().lower()
+            if decision != "accept":
+                decision = "reject"
+            reasoning = str(validation_data.get("reasoning") or "No reasoning provided")
+
+            result = CompilerValidationResult(
+                submission_id=str(uuid.uuid4()),
+                decision=decision,
+                reasoning=reasoning,
+                summary=reasoning[:750],
+                json_valid=True,
+                validation_stage="llm_validation"
+            )
+
+            if self.task_tracking_callback:
+                self.task_tracking_callback("completed", task_id)
+            logger.info(f"Brainstorm operation validation: {decision}")
+            return result
+        except FreeModelExhaustedError:
+            raise
+        except Exception as e:
+            logger.error(f"Brainstorm operation validation failed: {e}")
+            if self.task_tracking_callback:
+                self.task_tracking_callback("completed", task_id)
+            return CompilerValidationResult(
+                submission_id=str(uuid.uuid4()),
+                decision="reject",
+                reasoning=f"Validation error: {str(e)}",
+                summary=f"Validation error: {str(e)}"[:750],
+                json_valid=False,
+                validation_stage="internal_error"
+            )
+    
+    def _build_brainstorm_validation_prompt(
+        self,
+        brainstorm_op: "BrainstormRetroactiveOperation",
+        brainstorm_content: str
+    ) -> str:
+        """Build the validator prompt: criteria for the op's action, the database text, then the proposal."""
+        action = brainstorm_op.action
+        # Shared preamble; assumes action is a str (it calls .upper()) — confirm against the model.
+        system_prompt = f"""You are validating a retroactive correction to a brainstorm knowledge database. This correction was proposed during paper compilation by a submitter who identified an issue in the source material.
+
+You see ONLY the brainstorm database and the proposed operation. You do NOT see the paper or any paper edits. Your decision must be based solely on whether this operation improves the brainstorm database.
+
+OPERATION TYPE: {action.upper()}
+
+"""
+        if action == "delete":
+            system_prompt += """VALIDATION CRITERIA (DELETE):
+A brainstorm submission should be REMOVED if it:
+1. Contains mathematical errors or logically unsound reasoning
+2. Is redundant with other submissions (content fully covered elsewhere)
+3. Contradicts established mathematical principles evident in other submissions
+4. Was marginally useful but provides no unique value given the current database state
+
+KEEP the submission if:
+1. It provides ANY unique information not covered elsewhere
+2. There is ANY doubt about whether it's truly harmful or redundant
+3. It offers a different perspective even if related to other content
+
+CONSERVATIVE DEFAULT: When in doubt, reject the removal (keep the submission).
+"""
+        elif action == "edit":
+            system_prompt += """VALIDATION CRITERIA (EDIT):
+A brainstorm submission edit should be ACCEPTED if:
+1. The corrected version fixes a genuine mathematical error
+2. The corrected version is more accurate than the original
+3. The correction improves the submission's value to the knowledge pool
+4. The correction is mathematically sound and well-justified
+
+REJECT the edit if:
+1. The original was not actually wrong
+2. The edit introduces new errors or reduces quality
+3. The reasoning for correction is weak or unconvincing
+4. The edit is a stylistic preference rather than a substantive correction
+
+CONSERVATIVE DEFAULT: When in doubt, reject the edit (keep the original).
+"""
+        elif action == "add":
+            system_prompt += """VALIDATION CRITERIA (ADD):
+A new brainstorm submission should be ACCEPTED if:
+1. It adds genuinely new mathematical insight not already in the database
+2. It connects existing concepts in novel ways
+3. It provides concrete methods, theorems, proofs, or techniques
+4. It is grounded in established mathematical principles
+
+REJECT the addition if:
+1. It is redundant with existing submissions
+2. It contains trivial or commonly known information already present
+3. It contains unsupported claims or logical fallacies
+4. It is too vague or generic to be actionable
+"""
+        # No else branch: any other action gets no criteria here and no proposal section below.
+        system_prompt += """
+Output your decision ONLY as JSON:
+{
+  "decision": "accept" or "reject",
+  "reasoning": "Detailed explanation of your decision"
+}
+"""
+        # Order: instructions, database, proposal, final cue — joined with newlines on return.
+        parts = [system_prompt, "\n---\n"]
+        parts.append(f"BRAINSTORM DATABASE:\n{brainstorm_content}")
+        parts.append("\n---\n")
+        
+        if action == "delete":
+            parts.append(f"PROPOSED REMOVAL: Submission #{brainstorm_op.submission_number}")
+            parts.append(f"\nREASONING: {brainstorm_op.reasoning}")
+        elif action == "edit":
+            parts.append(f"PROPOSED EDIT: Submission #{brainstorm_op.submission_number}")
+            parts.append(f"\nNEW CONTENT:\n{brainstorm_op.new_content}")
+            parts.append(f"\nREASONING: {brainstorm_op.reasoning}")
+        elif action == "add":
+            parts.append(f"PROPOSED NEW SUBMISSION:\n{brainstorm_op.new_content}")
+            parts.append(f"\nREASONING: {brainstorm_op.reasoning}")
+        
+        parts.append("\n---\nNow validate this brainstorm operation as JSON:")
+        
+        return "\n".join(parts)
+    
     def _strip_placeholder_text(self, text: str) -> str:
         """
         Strip any placeholder markers from text.
diff --git a/backend/shared/api_client_manager.py b/backend/shared/api_client_manager.py
index baba4a7..018eef4 100644
--- a/backend/shared/api_client_manager.py
+++ b/backend/shared/api_client_manager.py
@@ -22,8 +22,10 @@
 )
 from backend.shared.boost_manager import boost_manager
 from backend.shared.boost_logger import boost_logger
+from backend.shared.config import rag_config
 from backend.shared.free_model_manager import free_model_manager
 from backend.shared.models import ModelConfig
+from backend.shared.token_tracker import token_tracker
 
 logger = logging.getLogger(__name__)
 
@@ -62,6 +64,9 @@ def __init__(self):
         # Current autonomous phase (set by autonomous coordinator)
         self._current_autonomous_phase: str = "unknown"
         
+        # Track roles that have already broadcast fallback_failed (prevent GUI log spam)
+        self._fallback_failed_notified: set = set()
+        
         # Lock for thread-safe state updates
         self._state_lock = asyncio.Lock()
     
@@ -74,6 +79,43 @@ async def _broadcast(self, event: str, data: Dict[str, Any] = None) -> None:
         if self._broadcast_callback:
             await self._broadcast_callback(event, data or {})
     
+    async def _with_hung_connection_watchdog(
+        self, coro, role_id: str, model: str, provider: str, timeout_seconds: int = 900
+    ):
+        """
+        Await ``coro`` while a watchdog task waits ``timeout_seconds`` (default 15 min).
+
+        At the deadline it logs a warning and broadcasts ``hung_connection_alert``; ``coro`` is
+        never cancelled and its result/exception passes through (alert failures are only logged).
+        """
+        async def _watchdog():
+            await asyncio.sleep(timeout_seconds)
+            minutes = timeout_seconds // 60
+            logger.warning(
+                f"API call for role '{role_id}' using {model} via {provider} "
+                f"has been running for {minutes}+ minutes — possible hung connection"
+            )
+            message = (
+                f"API call to {model} via {provider} has been running for {minutes}+ minutes. "
+                f"The connection may be hung. Consider stopping and trying a different host/provider."
+            )
+            payload = {"role_id": role_id, "model": model, "provider": provider,
+                       "elapsed_minutes": minutes, "message": message}
+            try:
+                await self._broadcast("hung_connection_alert", payload)
+            except Exception:  # else it would re-raise from the finally below and mask coro's outcome
+                logger.exception("Failed to broadcast hung_connection_alert")
+
+        watchdog_task = asyncio.create_task(_watchdog())
+        try:
+            return await coro
+        finally:
+            watchdog_task.cancel()
+            try:
+                await watchdog_task
+            except asyncio.CancelledError:
+                pass
+
     def set_model_tracking_callback(self, callback: Optional[Callable]) -> None:
         """
         Set callback for model usage tracking during Tier 3 final answer generation.
@@ -248,17 +290,29 @@ async def generate_completion(
             start_time = time.time()
             
             try:
+                boost_api_key = (
+                    boost_manager.boost_config.openrouter_api_key or
+                    rag_config.openrouter_api_key
+                )
+                if not boost_api_key:
+                    raise RuntimeError("Boost requested but no OpenRouter API key is available")
+
                 # Create temporary client with boost API key
-                boost_client = OpenRouterClient(boost_manager.boost_config.openrouter_api_key)
+                boost_client = OpenRouterClient(boost_api_key)
                 boost_provider = boost_manager.boost_config.boost_provider
                 try:
-                    result = await boost_client.generate_completion(
+                    result = await self._with_hung_connection_watchdog(
+                        boost_client.generate_completion(
+                            model=boost_model,
+                            messages=messages,
+                            temperature=temperature,
+                            max_tokens=max_tokens or boost_manager.boost_config.boost_max_output_tokens,
+                            response_format=response_format,
+                            provider=boost_provider
+                        ),
+                        role_id=role_id,
                         model=boost_model,
-                        messages=messages,
-                        temperature=temperature,
-                        max_tokens=max_tokens or boost_manager.boost_config.boost_max_output_tokens,
-                        response_format=response_format,
-                        provider=boost_provider
+                        provider=boost_provider or "OpenRouter"
                     )
                     
                     # Calculate duration
@@ -272,6 +326,11 @@ async def generate_completion(
                         response_content = message.get("content") or message.get("reasoning") or ""
                     if result.get("usage"):
                         tokens_used = result["usage"].get("total_tokens")
+                        _pt = result["usage"].get("prompt_tokens")
+                        _ct = result["usage"].get("completion_tokens")
+                        if _pt is not None and _ct is not None:
+                            token_tracker.track(boost_model, _pt, _ct)
+                            await self._broadcast("token_usage_updated", token_tracker.get_stats())
                     
                     # Log the boost call
                     await boost_logger.log_boost_call(
@@ -554,13 +613,18 @@ async def generate_completion(
                 
                 try:
                     logger.debug(f"Role {role_id} using OpenRouter: {openrouter_model}{provider_info}")
-                    result = await self._openrouter_client.generate_completion(
+                    result = await self._with_hung_connection_watchdog(
+                        self._openrouter_client.generate_completion(
+                            model=openrouter_model,
+                            messages=messages,
+                            temperature=temperature,
+                            max_tokens=max_tokens or role_config.max_output_tokens,
+                            response_format=response_format,
+                            provider=openrouter_provider
+                        ),
+                        role_id=role_id,
                         model=openrouter_model,
-                        messages=messages,
-                        temperature=temperature,
-                        max_tokens=max_tokens or role_config.max_output_tokens,
-                        response_format=response_format,
-                        provider=openrouter_provider  # Pass specific provider if configured
+                        provider=openrouter_provider or "OpenRouter"
                     )
                     
                     # Calculate duration and extract response
@@ -572,6 +636,11 @@ async def generate_completion(
                         response_content = message.get("content") or message.get("reasoning") or ""
                     if result.get("usage"):
                         tokens_used = result["usage"].get("total_tokens")
+                        _pt = result["usage"].get("prompt_tokens")
+                        _ct = result["usage"].get("completion_tokens")
+                        if _pt is not None and _ct is not None:
+                            token_tracker.track(openrouter_model, _pt, _ct)
+                            await self._broadcast("token_usage_updated", token_tracker.get_stats())
                     
                     # Log to autonomous API logger if callback set
                     if self._autonomous_logger_callback:
@@ -752,11 +821,13 @@ async def generate_completion(
                             f"fallback model in settings."
                         )
                         logger.error(error_msg)
-                        await self._broadcast("openrouter_fallback_failed", {
-                            "role_id": role_id,
-                            "reason": "no_fallback_configured",
-                            "message": error_msg
-                        })
+                        if role_id not in self._fallback_failed_notified:
+                            self._fallback_failed_notified.add(role_id)
+                            await self._broadcast("openrouter_fallback_failed", {
+                                "role_id": role_id,
+                                "reason": "no_fallback_configured",
+                                "message": error_msg
+                            })
                         raise RuntimeError(error_msg)
                     
                     # Fallback IS configured - use it
@@ -822,13 +893,18 @@ async def generate_completion(
         start_time = time.time()
         
         try:
-            result = await lm_studio_client.generate_completion(
+            result = await self._with_hung_connection_watchdog(
+                lm_studio_client.generate_completion(
+                    model=model,
+                    messages=messages,
+                    temperature=temperature,
+                    max_tokens=max_tokens,
+                    response_format=response_format,
+                    **kwargs
+                ),
+                role_id=role_id,
                 model=model,
-                messages=messages,
-                temperature=temperature,
-                max_tokens=max_tokens,
-                response_format=response_format,
-                **kwargs
+                provider="LM Studio"
             )
             
             # Calculate duration and extract response
@@ -840,6 +916,11 @@ async def generate_completion(
                 response_content = message.get("content") or message.get("reasoning") or ""
             if result.get("usage"):
                 tokens_used = result["usage"].get("total_tokens")
+                _pt = result["usage"].get("prompt_tokens")
+                _ct = result["usage"].get("completion_tokens")
+                if _pt is not None and _ct is not None:
+                    token_tracker.track(model, _pt, _ct)
+                    await self._broadcast("token_usage_updated", token_tracker.get_stats())
             
             # Log to autonomous API logger if callback set
             if self._autonomous_logger_callback:
@@ -921,14 +1002,25 @@ async def _try_free_model_rotation(
                     "reason": "rate_limit",
                 })
                 try:
-                    result = await self._openrouter_client.generate_completion(
+                    result = await self._with_hung_connection_watchdog(
+                        self._openrouter_client.generate_completion(
+                            model=alt_model,
+                            messages=messages,
+                            temperature=temperature,
+                            max_tokens=max_tokens,
+                            response_format=response_format,
+                        ),
+                        role_id=role_id,
                         model=alt_model,
-                        messages=messages,
-                        temperature=temperature,
-                        max_tokens=max_tokens,
-                        response_format=response_format,
+                        provider="OpenRouter (free rotation)"
                     )
                     await self._track_model_usage(alt_model)
+                    if result.get("usage"):
+                        _pt = result["usage"].get("prompt_tokens")
+                        _ct = result["usage"].get("completion_tokens")
+                        if _pt is not None and _ct is not None:
+                            token_tracker.track(alt_model, _pt, _ct)
+                            await self._broadcast("token_usage_updated", token_tracker.get_stats())
                     if free_model_manager.is_account_exhausted():
                         free_model_manager.clear_account_exhaustion()
                     return result
@@ -948,14 +1040,25 @@ async def _try_free_model_rotation(
                 "original_model": original_model,
             })
             try:
-                result = await self._openrouter_client.generate_completion(
+                result = await self._with_hung_connection_watchdog(
+                    self._openrouter_client.generate_completion(
+                        model=auto_model,
+                        messages=messages,
+                        temperature=temperature,
+                        max_tokens=max_tokens,
+                        response_format=response_format,
+                    ),
+                    role_id=role_id,
                     model=auto_model,
-                    messages=messages,
-                    temperature=temperature,
-                    max_tokens=max_tokens,
-                    response_format=response_format,
+                    provider="OpenRouter (auto-selector)"
                 )
                 await self._track_model_usage(auto_model)
+                if result.get("usage"):
+                    _pt = result["usage"].get("prompt_tokens")
+                    _ct = result["usage"].get("completion_tokens")
+                    if _pt is not None and _ct is not None:
+                        token_tracker.track(auto_model, _pt, _ct)
+                        await self._broadcast("token_usage_updated", token_tracker.get_stats())
                 if free_model_manager.is_account_exhausted():
                     free_model_manager.clear_account_exhaustion()
                 return result
@@ -985,6 +1088,31 @@ def get_all_fallback_states(self) -> Dict[str, str]:
         """
         return self._role_fallback_state.copy()
     
+    async def reset_openrouter_fallbacks(self) -> Dict[str, str]:
+        """
+        Return OpenRouter-configured roles that fell back to LM Studio to 'openrouter'.
+
+        Lets a user who has added credits retry OpenRouter without restarting.
+
+        Returns:
+            Mapping of each reset role_id to its new state (empty if none changed).
+        """
+        restored: Dict[str, str] = {}
+        async with self._state_lock:
+            for role_id, config in self._role_model_configs.items():
+                if config.provider != "openrouter":
+                    continue
+                if self._role_fallback_state.get(role_id) != "lm_studio":
+                    continue
+                self._role_fallback_state[role_id] = restored[role_id] = "openrouter"
+                logger.info(f"Reset role '{role_id}' back to OpenRouter (was fallen back to LM Studio)")
+        if not restored:
+            return restored
+        self._fallback_failed_notified.difference_update(restored)  # re-arm the one-time failure notice
+        summary = f"Reset {len(restored)} role(s) back to OpenRouter"
+        await self._broadcast("openrouter_fallbacks_reset", {"reset_roles": list(restored), "message": summary})
+        return restored
+    
     async def get_embeddings(self, texts: List[str], model: str = None) -> List[List[float]]:
         """
         Get embeddings, routing to LM Studio first, then OpenRouter fallback.
diff --git a/backend/shared/boost_manager.py b/backend/shared/boost_manager.py
index f79438a..4417933 100644
--- a/backend/shared/boost_manager.py
+++ b/backend/shared/boost_manager.py
@@ -35,6 +35,8 @@
     "comp_hp": "High-Param Submitter",
     "comp_val": "Compiler Validator",
     # Autonomous
+    "auto_te": "Topic Explorer",
+    "auto_tev": "Topic Explorer Validator",
     "auto_ts": "Topic Selector",
     "auto_tv": "Topic Validator",
     "auto_cr": "Completion Reviewer",
@@ -340,6 +342,8 @@ def get_available_categories(self, mode: str = "all") -> List[Dict[str, str]]:
         
         if mode in ("autonomous", "all"):
             categories.extend([
+                {"id": "auto_te", "label": "Topic Explore", "group": "Autonomous"},
+                {"id": "auto_tev", "label": "Topic Explore Val", "group": "Autonomous"},
                 {"id": "auto_ts", "label": "Topic Sel", "group": "Autonomous"},
                 {"id": "auto_tv", "label": "Topic Val", "group": "Autonomous"},
                 {"id": "auto_cr", "label": "Completion", "group": "Autonomous"},
diff --git a/backend/shared/config.py b/backend/shared/config.py
index 441ceb5..c07c4e4 100644
--- a/backend/shared/config.py
+++ b/backend/shared/config.py
@@ -34,6 +34,7 @@ class RAGConfig(BaseSettings):
     
     # Memory limits
     max_documents: int = 10000  # For RAG document cache; user files never evicted; high for infinite runtime
+    max_chunks_per_size: int = 10000  # Per-size chunk cap; oldest non-permanent trimmed when exceeded
     max_shared_training_insights: int = 999999  # Effectively unlimited for infinite runtime
     max_local_rejections: int = 5  # Per rules: "last 5 rejections"
     
@@ -57,8 +58,8 @@ class RAGConfig(BaseSettings):
     embedding_model: str = "text-embedding-nomic-embed-text-v1.5"
     
     # OpenRouter API (Global Configuration)
-    # This is the global API key used for per-role OpenRouter model selection
-    # Separate from boost API key which is stored in BoostConfig
+    # This is the default OpenRouter API key used for per-role model selection.
+    # API Boost can also reuse it unless the boost modal supplies an override key.
     openrouter_api_key: Optional[str] = None
     openrouter_enabled: bool = False  # True when API key is set and validated
     
@@ -151,7 +152,6 @@ class SystemConfig(BaseSettings):
     autonomous_completion_review_interval: int = 10  # Every 10 acceptances
     autonomous_paper_redundancy_interval: int = 3  # Every 3 completed papers
     autonomous_max_reference_papers: int = 6  # Max papers for reference context
-    autonomous_topic_selection_retry_limit: int = 3
     
     # Wolfram Alpha integration (optional)
     wolfram_alpha_enabled: bool = False
diff --git a/backend/shared/critique_prompts.py b/backend/shared/critique_prompts.py
index af09e9c..fd5a7e8 100644
--- a/backend/shared/critique_prompts.py
+++ b/backend/shared/critique_prompts.py
@@ -2,8 +2,14 @@
 Paper Critique Prompts Module.
 
 Contains the default critique prompt and helper functions for building
-critique requests to the validator model.
+critique requests to the validator model. Also provides lenient parsing
+for critique responses that may be truncated by max_tokens limits.
 """
+import json
+import re
+import logging
+
+logger = logging.getLogger(__name__)
 
 # Default critique prompt that can be customized by users
 DEFAULT_CRITIQUE_PROMPT = """You are an expert academic reviewer providing an honest, thorough critique of a research paper.
@@ -85,3 +91,151 @@ def get_default_critique_prompt() -> str:
     """
     return DEFAULT_CRITIQUE_PROMPT
 
+
+def parse_critique_response(response_content: str) -> dict:
+    """
+    Parse a critique LLM response with lenient fallback for truncated JSON.
+    
+    Critique responses are especially prone to truncation because reasoning models
+    burn tokens on internal thinking before the JSON, and the full_critique field
+    (the last and longest field) often gets cut off right before the closing '}'.
+    
+    Strategy:
+    1. Try strict parse_json() first
+    2. If truncated, try repairing by appending closing characters
+    3. If still fails, extract ratings and feedback via regex
+    
+    Args:
+        response_content: Raw text of the critique model's reply
+    Returns:
+        Parsed critique dict with all expected fields
+    """
+    from backend.shared.json_parser import parse_json, sanitize_json_response
+
+    # Step 1: Try strict parsing
+    try:
+        return parse_json(response_content)
+    except Exception as strict_err:
+        logger.info(f"Strict critique parse failed ({strict_err}), attempting truncation repair")
+
+    # Step 2: Repair truncated JSON (typically out of tokens before the closing '}')
+    try:
+        sanitized = sanitize_json_response(response_content)
+    except Exception:
+        # Expected on truncation (ValueError); repair from the raw content instead
+        sanitized = _strip_to_json(response_content)
+
+    repaired = _try_repair_json(sanitized)
+    if repaired is not None:
+        logger.info("Critique JSON repaired after truncation - recovered all fields")
+        return repaired
+
+    # Step 3: Regex extraction fallback
+    logger.warning("Critique JSON repair failed, falling back to regex extraction")
+    return _regex_extract_critique(response_content)
+
+
+def _strip_to_json(raw: str) -> str:
+    """Strip thinking tokens, markdown, and prefixes to get to the JSON content.
+
+    Returns the cleaned text starting at its first '{'; text without any '{'
+    is returned cleaned but otherwise whole.
+    """
+    text = raw.strip()
+
+    # Remove complete <think>...</think> spans first, then any unpaired tags
+    text = re.sub(r'<think>.*?</think>', '', text, flags=re.DOTALL | re.IGNORECASE).strip()
+    for stray_tag in (r'</think\s*>', r'<think\s*>'):
+        text = re.sub(stray_tag, '', text, flags=re.IGNORECASE).strip()
+
+    # Unwrap a leading markdown fence, but only if a closing ``` line is found
+    if text.startswith('```'):
+        rows = text.split('\n')
+        fence_end = -1
+        if len(rows) > 2:
+            fence_end = next((i for i in range(1, len(rows)) if rows[i].strip() == '```'), -1)
+        if fence_end > 0:
+            text = '\n'.join(rows[1:fence_end]).strip()
+
+    # Drop whatever precedes the first '{'
+    first_brace = text.find('{')
+    if first_brace > 0:
+        return text[first_brace:]
+    return text
+
+
+def _try_repair_json(content: str):
+    """
+    Attempt to repair truncated critique JSON by appending missing closing characters.
+    Only repairs simple truncation (missing '}', or string cut off mid-value).
+
+    Returns the parsed dict when a candidate loads and has a truthy
+    "novelty_rating"; returns None when no repair works.
+    """
+    if not content or '{' not in content:
+        return None
+
+    def load_candidate(candidate: str):
+        # A repair only counts if it yields a dict carrying a novelty rating
+        try:
+            result = json.loads(candidate)
+        except ValueError:  # json.JSONDecodeError is a ValueError subclass
+            return None
+        return result if isinstance(result, dict) and result.get("novelty_rating") else None
+
+    # Try progressively more aggressive repairs:
+    #   '}'      missing only closing brace
+    #   '"}'     string value ended, missing quote + brace
+    #   '..."}'  truncated mid-word in last string value
+    stripped = content.rstrip()
+    for suffix in ('}', '"}', '..."}'):
+        repaired = load_candidate(stripped + suffix)
+        if repaired is not None:
+            return repaired
+
+    # More aggressive: close the object right after a complete string value.
+    # Whitespace around the comma is allowed so pretty-printed JSON ('",\n  "')
+    # is handled as well as compact '","'; boundaries are tried from the end.
+    for boundary in reversed(list(re.finditer(r'"\s*,\s*"', content))):
+        repaired = load_candidate(content[:boundary.start() + 1] + '}')
+        if repaired is not None:
+            return repaired
+    return None
+
+
+def _regex_extract_critique(raw: str) -> dict:
+    """
+    Last-resort extraction of critique fields from raw text via regex.
+    Ratings appear early in the JSON and are almost always present even in
+    heavily truncated responses.
+
+    Returns a dict with novelty/correctness/impact "*_rating" ints (0 when
+    missing or outside 1-10), the matching "*_feedback" strings, and
+    "full_critique" (the whole raw text when that field cannot be matched).
+    """
+    def extract_rating(field: str) -> int:
+        m = re.search(rf'"{field}"\s*:\s*(\d+)', raw)
+        val = int(m.group(1)) if m else 0
+        return val if 1 <= val <= 10 else 0
+
+    def extract_string(field: str) -> str:
+        m = re.search(rf'"{field}"\s*:\s*"((?:[^"\\]|\\.)*)"', raw, re.DOTALL)
+        if not m:
+            return ""
+        try:
+            # Decode JSON escapes (\n, \", \uXXXX) so the text matches what a real parse yields
+            return json.loads(f'"{m.group(1)}"', strict=False)
+        except ValueError:
+            return m.group(1)  # Not valid JSON string content: keep it verbatim
+
+    ratings = {name: extract_rating(f"{name}_rating") for name in ("novelty", "correctness", "impact")}
+    result = {}
+    for name, rating in ratings.items():  # Insertion order keeps rating/feedback pairs grouped
+        result[f"{name}_rating"] = rating
+        placeholder = "Unable to parse structured response" if rating == 0 else ""
+        result[f"{name}_feedback"] = extract_string(f"{name}_feedback") or placeholder
+    result["full_critique"] = extract_string("full_critique") or raw
+    recovered = sum(1 for rating in ratings.values() if rating > 0)
+    logger.info(f"Regex extraction recovered {recovered}/3 ratings: N={ratings['novelty']}, C={ratings['correctness']}, I={ratings['impact']}")
+    return result
+
diff --git a/backend/shared/models.py b/backend/shared/models.py
index a617630..830e483 100644
--- a/backend/shared/models.py
+++ b/backend/shared/models.py
@@ -184,6 +184,10 @@ class CompilerSubmission(BaseModel):
     
     For outline_create mode, uses full_content operation where content is the complete outline.
     For other modes, content stores the submission for logging while old_string/new_string specify the edit.
+    
+    Retroactive brainstorm operations (optional, autonomous mode only):
+    - brainstorm_operation: Optional operation on the source brainstorm database.
+      Validated independently from paper operations. Each must stand on its own merits.
     """
     submission_id: str
     mode: Literal["outline_create", "outline_update", "construction", "review", "rigor"]
@@ -201,10 +205,31 @@ class CompilerSubmission(BaseModel):
     needs_edit: Optional[bool] = None  # For review mode: False = no edit needed
     needs_enhancement: Optional[bool] = None  # For rigor mode: False = no enhancement needed
     needs_update: Optional[bool] = None  # For outline_update mode: False = no update needed
+    
+    # Retroactive brainstorm correction (optional, autonomous paper writing only)
+    brainstorm_operation: Optional["BrainstormRetroactiveOperation"] = None
+    
     timestamp: datetime = Field(default_factory=datetime.now)
     metadata: Dict[str, Any] = Field(default_factory=dict)
 
 
+class BrainstormRetroactiveOperation(BaseModel):
+    """Optional retroactive operation on the source brainstorm database.
+    
+    Proposed by the compiler submitter during paper writing and validated
+    independently from the paper operation. The validator sees ONLY the
+    brainstorm context when validating this, never the paper operation.
+    Each operation must be independently justified.
+    """
+    action: Literal["edit", "delete", "add"]
+    submission_number: Optional[int] = None  # Expected for edit/delete, None for add; not enforced by this model
+    new_content: str = ""  # Expected for edit/add, empty for delete; not enforced by this model
+    reasoning: str  # Independent justification (must not depend on paper operation); no default, so always required
+
+
+CompilerSubmission.model_rebuild()
+
+
 class CompilerValidationResult(BaseModel):
     """Result of validation by compiler validator."""
     submission_id: str
@@ -238,7 +263,7 @@ class CompilerState(BaseModel):
     review_acceptances: int = 0
     review_rejections: int = 0
     review_declines: int = 0
-    miniscule_edit_count: int = 0
+    minuscule_edit_count: int = 0
     in_critique_phase: bool = False
     critique_acceptances: int = 0
     paper_version: int = 1
@@ -326,9 +351,16 @@ class TopicValidationResult(BaseModel):
     """Result of topic validation."""
     decision: Literal["accept", "reject"]
     reasoning: str
+    summary: str = ""  # Rejection feedback (max 750 chars)
     timestamp: datetime = Field(default_factory=datetime.now)
 
 
+class BrainstormContinuationDecision(BaseModel):
+    """Decision on whether to write another paper from the same brainstorm or move on."""
+    decision: Literal["write_another_paper", "move_on"]  # Restricted to these two literal values
+    reasoning: str  # No default, so always required
+
+
 class CompletionReviewResult(BaseModel):
     """Result of brainstorm completion review."""
     decision: Literal["continue_brainstorm", "write_paper"]
diff --git a/backend/shared/token_tracker.py b/backend/shared/token_tracker.py
new file mode 100644
index 0000000..4505d9f
--- /dev/null
+++ b/backend/shared/token_tracker.py
@@ -0,0 +1,85 @@
+"""
+Token Tracker - Tracks cumulative input/output token usage across the session,
+with per-model breakdown and a research timer.
+"""
+import logging
+import time
+from typing import Dict, Any, Optional
+
+logger = logging.getLogger(__name__)
+
+
+class TokenTracker:
+    """
+    Singleton that accumulates prompt_tokens and completion_tokens
+    from every successful LLM completion call, broken down by model.
+    Also provides a pausable elapsed-time research timer (monotonic clock).
+    """
+    _instance = None
+
+    def __new__(cls):
+        if cls._instance is None:
+            cls._instance = super().__new__(cls)
+            cls._instance._initialized = False
+        return cls._instance
+
+    def __init__(self):
+        if self._initialized:
+            return  # __init__ runs on every TokenTracker() call; keep existing counters
+        self._initialized = True
+        self._total_input = 0
+        self._total_output = 0
+        self._by_model: Dict[str, Dict[str, int]] = {}
+        self._start_time: Optional[float] = None  # time.monotonic() reading while running
+        self._stopped_elapsed: float = 0.0
+        logger.info("TokenTracker initialized")
+
+    def track(self, model_id: str, prompt_tokens: int, completion_tokens: int) -> None:
+        """Record token usage for one successful API call (None counts as 0)."""
+        prompt_tokens, completion_tokens = prompt_tokens or 0, completion_tokens or 0
+        self._total_input += prompt_tokens
+        self._total_output += completion_tokens
+        per_model = self._by_model.setdefault(model_id, {"input": 0, "output": 0})
+        per_model["input"] += prompt_tokens
+        per_model["output"] += completion_tokens
+
+    def start_timer(self) -> None:
+        """Start (or resume) the research timer; no-op if already running."""
+        if self._start_time is None:
+            self._start_time = time.monotonic()  # unaffected by system clock changes
+            logger.info("TokenTracker timer started")
+
+    def stop_timer(self) -> None:
+        """Pause the timer, preserving elapsed time so it can be resumed."""
+        if self._start_time is not None:
+            self._stopped_elapsed += time.monotonic() - self._start_time
+            self._start_time = None
+            logger.info(f"TokenTracker timer stopped (elapsed: {self._stopped_elapsed:.1f}s)")
+
+    def get_elapsed_seconds(self) -> float:
+        """Return total elapsed seconds (running + previously stopped segments)."""
+        elapsed = self._stopped_elapsed
+        if self._start_time is not None:
+            elapsed += time.monotonic() - self._start_time
+        return elapsed
+
+    def get_stats(self) -> Dict[str, Any]:
+        """Return a snapshot of cumulative stats; per-model dicts are copies."""
+        return {
+            "total_input": self._total_input,
+            "total_output": self._total_output,
+            "by_model": {model: dict(counts) for model, counts in self._by_model.items()},
+            "elapsed_seconds": round(self.get_elapsed_seconds(), 1),
+        }
+
+    def reset(self) -> None:
+        """Clear all counters and timer for a new session."""
+        self._total_input = 0
+        self._total_output = 0
+        self._by_model.clear()
+        self._start_time = None
+        self._stopped_elapsed = 0.0
+        logger.info("TokenTracker reset")
+
+
+token_tracker = TokenTracker()
diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index 65a00b4..f90b2df 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.4",
+  "version": "1.0.5",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "asi-aggregator-frontend",
-      "version": "1.0.4",
+      "version": "1.0.5",
       "license": "MIT",
       "dependencies": {
         "dompurify": "^3.2.4",
@@ -1163,9 +1163,9 @@
       "license": "ISC"
     },
     "node_modules/picomatch": {
-      "version": "4.0.3",
-      "resolved": "https://registry.npmjs.org/picomatch/-/picomatch-4.0.3.tgz",
-      "integrity": "sha512-5gTmgEY/sqK6gFXLIsQNH19lWb4ebPDLA4SdLP7dsWkIXHWlG66oPuVvXSGFPppYZz8ZDZq0dYYrbHfBCVUb1Q==",
+      "version": "4.0.4",
+      "resolved": "https://registry.npmjs.org/picomatch/-/picomatch-4.0.4.tgz",
+      "integrity": "sha512-QP88BAKvMam/3NxH6vj2o21R6MjxZUAd6nlwAS/pnGvN9IVLocLHxGYIzFhg6fUQ+5th6P4dv4eW9jX3DSIj7A==",
       "dev": true,
       "license": "MIT",
       "engines": {
@@ -1362,9 +1362,9 @@
       }
     },
     "node_modules/vite": {
-      "version": "7.3.0",
-      "resolved": "https://registry.npmjs.org/vite/-/vite-7.3.0.tgz",
-      "integrity": "sha512-dZwN5L1VlUBewiP6H9s2+B3e3Jg96D0vzN+Ry73sOefebhYr9f94wwkMNN/9ouoU8pV1BqA1d1zGk8928cx0rg==",
+      "version": "7.3.2",
+      "resolved": "https://registry.npmjs.org/vite/-/vite-7.3.2.tgz",
+      "integrity": "sha512-Bby3NOsna2jsjfLVOHKes8sGwgl4TT0E6vvpYgnAYDIF/tie7MRaFthmKuHx1NSXjiTueXH3do80FMQgvEktRg==",
       "dev": true,
       "license": "MIT",
       "dependencies": {
diff --git a/frontend/package.json b/frontend/package.json
index 2268980..62fb80b 100644
--- a/frontend/package.json
+++ b/frontend/package.json
@@ -1,6 +1,6 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.4",
+  "version": "1.0.5",
   "description": "Frontend UI for MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "author": "Intrafere LLC",
   "license": "MIT",
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index 2a63048..9d32b8c 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -1,4 +1,4 @@
-import React, { useState, useEffect } from 'react';
+import React, { useState, useEffect, useRef, useCallback } from 'react';
 import AggregatorInterface from './components/aggregator/AggregatorInterface';
 import AggregatorSettings from './components/aggregator/AggregatorSettings';
 import AggregatorLogs from './components/aggregator/AggregatorLogs';
@@ -11,6 +11,7 @@ import {
   AutonomousResearchInterface,
   BrainstormList,
   PaperLibrary,
+  Stage2PaperHistory,
   AutonomousResearchSettings,
   AutonomousResearchLogs,
   FinalAnswerView,
@@ -19,23 +20,79 @@ import {
 import WorkflowPanel from './components/WorkflowPanel';
 import BoostControlModal from './components/BoostControlModal';
 import BoostLogs from './components/BoostLogs';
+import StartupProviderSetupModal from './components/StartupProviderSetupModal';
 import OpenRouterApiKeyModal from './components/OpenRouterApiKeyModal';
 import OpenRouterPrivacyWarningModal from './components/OpenRouterPrivacyWarningModal';
 import CritiqueNotificationStack from './components/CritiqueNotificationStack';
+import CreditExhaustionNotificationStack from './components/CreditExhaustionNotificationStack';
+import HungConnectionNotificationStack from './components/HungConnectionNotificationStack';
 import PaperCritiqueModal from './components/PaperCritiqueModal';
 import { websocket } from './services/websocket';
 import { api, autonomousAPI, openRouterAPI } from './services/api';
+import {
+  LM_STUDIO_STARTUP_CHOICE,
+  RECOMMENDED_PROFILE_KEY,
+  STARTUP_PROVIDER_CHOICE_STORAGE_KEY,
+  applyAutonomousProfileSelection,
+  applyLmStudioStartupDefaults,
+  getStoredAutonomousSettings,
+  settingsToAutonomousConfig,
+  persistAutonomousSettings,
+} from './utils/autonomousProfiles';
+
+const APP_MODE_STORAGE_KEY = 'appMode';
+const AUTONOMOUS_TAB_STORAGE_KEY = 'autonomousActiveTab';
+const MANUAL_TAB_STORAGE_KEY = 'manualActiveTab';
+const LEGACY_SINGLE_PAPER_WRITER_STORAGE_KEY = 'singlePaperWriterExpanded';
+const EMBEDDING_MODEL_HINTS = ['embed', 'embedding', 'nomic', 'bge', 'e5', 'gte'];
+
+function normalizeLoadedLmStudioModelId(modelId = '') {
+  return String(modelId).replace(/:\d+$/, ''); // drop a trailing ":<digits>" suffix, if present
+}
+
+function isLikelyEmbeddingModel(modelId = '') {
+  const normalizedModelId = normalizeLoadedLmStudioModelId(modelId).toLowerCase(); // lowercase so hint matching is case-insensitive
+  return EMBEDDING_MODEL_HINTS.some((hint) => normalizedModelId.includes(hint)); // substring heuristic: true if any hint occurs anywhere in the id
+}
+
+function getUsableLoadedLmStudioChatModelId(loadedModels = []) {
+  for (const loadedModelId of loadedModels) { // first usable entry wins, in list order
+    const normalizedModelId = normalizeLoadedLmStudioModelId(loadedModelId);
+    if (!normalizedModelId || isLikelyEmbeddingModel(normalizedModelId)) {
+      continue; // skip empty ids and ids that look like embedding models
+    }
+    return normalizedModelId;
+  }
+
+  return ''; // no usable chat model among the loaded models
+}
 
 function App() {
-  const [activeTab, setActiveTab] = useState('auto-interface');
-  
-  // Single Paper Writer expandable section state
-  const [showSinglePaperWriter, setShowSinglePaperWriter] = useState(() => {
-    const saved = localStorage.getItem('singlePaperWriterExpanded');
-    return saved ? JSON.parse(saved) : false;
-  });
+  const [appMode, setAppMode] = useState(() => {
+    const savedMode = localStorage.getItem(APP_MODE_STORAGE_KEY);
+    if (savedMode === 'autonomous' || savedMode === 'manual') {
+      return savedMode;
+    }
+
+    const legacyExpanded = localStorage.getItem(LEGACY_SINGLE_PAPER_WRITER_STORAGE_KEY);
+    if (!legacyExpanded) {
+      return 'autonomous';
+    }
 
-  const [singlePaperWriterActiveTab, setSinglePaperWriterActiveTab] = useState('aggregator-interface');
+    try {
+      return JSON.parse(legacyExpanded) ? 'manual' : 'autonomous';
+    } catch {
+      return 'autonomous';
+    }
+  });
+  const [autonomousActiveTab, setAutonomousActiveTab] = useState(
+    () => localStorage.getItem(AUTONOMOUS_TAB_STORAGE_KEY) || 'auto-interface'
+  );
+  const [manualActiveTab, setManualActiveTab] = useState(
+    () => localStorage.getItem(MANUAL_TAB_STORAGE_KEY) || 'aggregator-interface'
+  );
+  const [utilityActiveTab, setUtilityActiveTab] = useState(null);
+  const activeTab = utilityActiveTab || (appMode === 'manual' ? manualActiveTab : autonomousActiveTab);
   
   // Models list (fetched from API)
   const [models, setModels] = useState([]);
@@ -49,6 +106,15 @@ function App() {
   
   // LM Studio availability state (for determining default provider)
   const [lmStudioAvailable, setLmStudioAvailable] = useState(true);
+  const [lmStudioStatus, setLmStudioStatus] = useState({
+    available: true,
+    has_models: false,
+    model_count: 0,
+    models: [],
+    error: null,
+    usable_chat_model_id: '',
+    has_usable_chat_model: false,
+  });
   const [hasOpenRouterKey, setHasOpenRouterKey] = useState(false);
   
   // Track if any workflow is running (for WorkflowPanel visibility)
@@ -59,6 +125,22 @@ function App() {
     const savedState = localStorage.getItem('workflow_panel_collapsed');
     return savedState === 'true';
   });
+
+  useEffect(() => {
+    localStorage.setItem(APP_MODE_STORAGE_KEY, appMode);
+    localStorage.setItem(
+      LEGACY_SINGLE_PAPER_WRITER_STORAGE_KEY,
+      JSON.stringify(appMode === 'manual')
+    );
+  }, [appMode]);
+
+  useEffect(() => {
+    localStorage.setItem(AUTONOMOUS_TAB_STORAGE_KEY, autonomousActiveTab);
+  }, [autonomousActiveTab]);
+
+  useEffect(() => {
+    localStorage.setItem(MANUAL_TAB_STORAGE_KEY, manualActiveTab);
+  }, [manualActiveTab]);
   
   // Initialize config from localStorage or use defaults
   // CRITICAL: Read from 'aggregator_settings' (used by AggregatorSettings component)
@@ -157,6 +239,9 @@ function App() {
   
   // Disclaimer modal state (shows on every app load)
   const [showDisclaimer, setShowDisclaimer] = useState(true);
+  const [showStartupSetupModal, setShowStartupSetupModal] = useState(false);
+  const [startupSetupMessage, setStartupSetupMessage] = useState('');
+  const [checkingLmStudioStartupChoice, setCheckingLmStudioStartupChoice] = useState(false);
   
   // OpenRouter privacy warning modal state
   const [showPrivacyWarning, setShowPrivacyWarning] = useState(false);
@@ -170,96 +255,40 @@ function App() {
   const [selectedCritiquePaper, setSelectedCritiquePaper] = useState(null);
   const [showCritiqueModal, setShowCritiqueModal] = useState(false);
 
+  // Credit exhaustion notification state (persistent until dismissed)
+  const [creditExhaustionNotifications, setCreditExhaustionNotifications] = useState([]);
+
+  // Hung connection notification state (persistent until dismissed)
+  const [hungConnectionNotifications, setHungConnectionNotifications] = useState([]);
+
+  // Live refs used by websocket listeners (which are registered once)
+  const autonomousRunningRef = useRef(autonomousRunning);
+  const autonomousTierRef = useRef(autonomousStatus?.current_tier || null);
+  const openRouterKeyJustSavedRef = useRef(false);
+
+  useEffect(() => {
+    autonomousRunningRef.current = autonomousRunning;
+  }, [autonomousRunning]);
+
+  useEffect(() => {
+    autonomousTierRef.current = autonomousStatus?.current_tier || null;
+  }, [autonomousStatus]);
+
   // Autonomous config with localStorage persistence
   // CRITICAL: Read from 'autonomous_research_settings' (used by AutonomousResearchSettings component)
   const [autonomousConfig, setAutonomousConfig] = useState(() => {
-    // Try to load from the settings component key first
-    const settingsConfig = localStorage.getItem('autonomous_research_settings');
-    if (settingsConfig) {
-      try {
-        const settings = JSON.parse(settingsConfig);
-        const localConfig = settings.localConfig || {};
-        return {
-          submitter_configs: settings.submitterConfigs || [
-            { submitterId: 1, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-            { submitterId: 2, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-            { submitterId: 3, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 }
-          ],
-          validator_provider: localConfig.validator_provider,
-          validator_model: localConfig.validator_model,
-          validator_openrouter_provider: localConfig.validator_openrouter_provider,
-          validator_lm_studio_fallback: localConfig.validator_lm_studio_fallback,
-          validator_context_window: localConfig.validator_context_window,
-          validator_max_tokens: localConfig.validator_max_tokens,
-          high_context_provider: localConfig.high_context_provider,
-          high_context_model: localConfig.high_context_model,
-          high_context_openrouter_provider: localConfig.high_context_openrouter_provider,
-          high_context_lm_studio_fallback: localConfig.high_context_lm_studio_fallback,
-          high_context_context_window: localConfig.high_context_context_window,
-          high_context_max_tokens: localConfig.high_context_max_tokens,
-          high_param_provider: localConfig.high_param_provider,
-          high_param_model: localConfig.high_param_model,
-          high_param_openrouter_provider: localConfig.high_param_openrouter_provider,
-          high_param_lm_studio_fallback: localConfig.high_param_lm_studio_fallback,
-          high_param_context_window: localConfig.high_param_context_window,
-          high_param_max_tokens: localConfig.high_param_max_tokens,
-          critique_submitter_provider: localConfig.critique_submitter_provider,
-          critique_submitter_model: localConfig.critique_submitter_model,
-          critique_submitter_openrouter_provider: localConfig.critique_submitter_openrouter_provider,
-          critique_submitter_lm_studio_fallback: localConfig.critique_submitter_lm_studio_fallback,
-          critique_submitter_context_window: localConfig.critique_submitter_context_window,
-          critique_submitter_max_tokens: localConfig.critique_submitter_max_tokens,
-          tier3_enabled: settings.tier3Enabled ?? false
-        };
-      } catch (e) {
-        console.error('Failed to parse autonomous_research_settings:', e);
-      }
-    }
-    
-    // Final fallback - use ACTUAL working defaults (OpenRouter API IDs)
-    return {
-      submitter_configs: [
-        { submitterId: 1, provider: 'openrouter', modelId: 'openai/gpt-oss-120b', openrouterProvider: 'Google', lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-        { submitterId: 2, provider: 'openrouter', modelId: 'openai/gpt-oss-20b', openrouterProvider: 'Groq', lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-        { submitterId: 3, provider: 'openrouter', modelId: 'openai/gpt-oss-120b', openrouterProvider: 'Google', lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 }
-      ],
-      validator_provider: 'openrouter',
-      validator_model: 'openai/gpt-oss-120b',
-      validator_openrouter_provider: 'Google',
-      validator_lm_studio_fallback: null,
-      validator_context_window: 131072,
-      validator_max_tokens: 25000,
-      high_context_provider: 'openrouter',
-      high_context_model: 'openai/gpt-oss-120b',
-      high_context_openrouter_provider: 'Google',
-      high_context_lm_studio_fallback: null,
-      high_context_context_window: 131072,
-      high_context_max_tokens: 25000,
-      high_param_provider: 'openrouter',
-      high_param_model: 'openai/gpt-oss-120b',
-      high_param_openrouter_provider: 'Google',
-      high_param_lm_studio_fallback: null,
-      high_param_context_window: 131072,
-      high_param_max_tokens: 25000,
-      critique_submitter_provider: 'openrouter',
-      critique_submitter_model: 'openai/gpt-oss-120b',
-      critique_submitter_openrouter_provider: 'Google',
-      critique_submitter_lm_studio_fallback: null,
-      critique_submitter_context_window: 131072,
-      critique_submitter_max_tokens: 25000,
-      tier3_enabled: false
-    };
+    return settingsToAutonomousConfig(getStoredAutonomousSettings());
   });
 
   // Save autonomous config to localStorage
-  // CRITICAL: Save to BOTH keys to maintain backward compatibility
   useEffect(() => {
-    localStorage.setItem('autonomousConfig', JSON.stringify(autonomousConfig));
-    // Also save to autonomous_research_settings in the format expected by AutonomousResearchSettings
-    const settingsToSave = {
-      numSubmitters: autonomousConfig.submitter_configs?.length || 3,
-      submitterConfigs: autonomousConfig.submitter_configs || [],
+    const existingSettings = getStoredAutonomousSettings();
+    persistAutonomousSettings({
+      ...existingSettings,
+      numSubmitters: autonomousConfig.submitter_configs?.length || existingSettings.numSubmitters || 3,
+      submitterConfigs: autonomousConfig.submitter_configs || existingSettings.submitterConfigs,
       localConfig: {
+        ...existingSettings.localConfig,
         validator_provider: autonomousConfig.validator_provider,
         validator_model: autonomousConfig.validator_model,
         validator_openrouter_provider: autonomousConfig.validator_openrouter_provider,
@@ -283,67 +312,137 @@ function App() {
         critique_submitter_openrouter_provider: autonomousConfig.critique_submitter_openrouter_provider,
         critique_submitter_lm_studio_fallback: autonomousConfig.critique_submitter_lm_studio_fallback,
         critique_submitter_context_window: autonomousConfig.critique_submitter_context_window,
-        critique_submitter_max_tokens: autonomousConfig.critique_submitter_max_tokens
+        critique_submitter_max_tokens: autonomousConfig.critique_submitter_max_tokens,
       },
-      freeOnly: false, // Default value
-      tier3Enabled: autonomousConfig.tier3_enabled ?? false
-    };
-    localStorage.setItem('autonomous_research_settings', JSON.stringify(settingsToSave));
+      tier3Enabled: autonomousConfig.tier3_enabled ?? existingSettings.tier3Enabled ?? false,
+    });
   }, [autonomousConfig]);
 
-  // Check LM Studio availability and fetch models on mount
+  // Probe LM Studio and the OpenRouter key, mirror the results into state,
+  // and return the same snapshot so callers can act on it without waiting
+  // for a re-render. A stored OpenRouter key is re-sent to the backend when
+  // the backend reports none.
+  const syncProviderAvailability = useCallback(async () => {
+    let lmResult;
+    try {
+      lmResult = await openRouterAPI.checkLMStudioAvailability();
+    } catch (err) {
+      console.error('Failed to check LM Studio availability:', err);
+      lmResult = {
+        available: false,
+        has_models: false,
+        model_count: 0,
+        models: [],
+        error: err.message || 'Failed to check LM Studio availability.',
+      };
+    }
+
+    const usableLmStudioChatModelId = getUsableLoadedLmStudioChatModelId(lmResult.models || []);
+    const hasUsableLmStudioChatModel = Boolean(usableLmStudioChatModelId);
+    const lmAvailable = Boolean(lmResult.available && lmResult.has_models);
+    const lmStudioStatus = {
+      ...lmResult,
+      usable_chat_model_id: usableLmStudioChatModelId,
+      has_usable_chat_model: hasUsableLmStudioChatModel,
+    };
+    setLmStudioStatus(lmStudioStatus);
+    setLmStudioAvailable(lmAvailable);
+
+    let keyStatus = { has_key: false };
+    let keyStatusKnown = true;
+    try {
+      keyStatus = await openRouterAPI.getApiKeyStatus();
+    } catch (err) {
+      console.error('Failed to check OpenRouter key status:', err);
+      keyStatusKnown = false;
+    }
+
+    let finalHasOpenRouterKey = Boolean(keyStatus.has_key);
+    const storedKey = localStorage.getItem('openrouter_api_key');
+    if (storedKey && !finalHasOpenRouterKey) {
+      try {
+        await openRouterAPI.setApiKey(storedKey);
+        finalHasOpenRouterKey = true;
+      } catch (err) {
+        console.error('Failed to restore OpenRouter key:', err);
+        // Only discard the saved key when the status check itself succeeded;
+        // if that failed too, the backend is likely just unreachable.
+        if (keyStatusKnown) {
+          localStorage.removeItem('openrouter_api_key');
+        }
+      }
+    }
+    setHasOpenRouterKey(finalHasOpenRouterKey);
+
+    let availableModels = [];
+    if (lmAvailable) {
+      try {
+        const data = await api.getModels();
+        availableModels = data.models || data || [];
+        setModels(availableModels);
+      } catch (err) {
+        console.error('Failed to fetch LM Studio models:', err);
+        setModels([]);
+      }
+    } else {
+      setModels([]);
+    }
+
+    return {
+      lmAvailable,
+      hasOpenRouterKey: finalHasOpenRouterKey,
+      hasUsableLmStudioChatModel,
+      lmStudioStatus,
+      defaultLmStudioModelId: usableLmStudioChatModelId,
+    };
+  }, []);
+
+  useEffect(() => {
+    syncProviderAvailability();
+  }, [syncProviderAvailability]);
+
   useEffect(() => {
-    const checkAvailability = async () => {
+    const restoreWolframKey = async () => {
+      const storedWolframKey = localStorage.getItem('wolfram_alpha_api_key');
+      if (!storedWolframKey) {
+        return;
+      }
+
+      try {
+        await api.setWolframApiKey(storedWolframKey);
+      } catch (err) {
+        console.error('Failed to restore Wolfram Alpha key:', err);
+        localStorage.removeItem('wolfram_alpha_api_key');
+      }
+    };
+
+    restoreWolframKey();
+  }, []);
+
+  // Periodically re-check OpenRouter key status to keep indicator in sync
+  useEffect(() => {
+    const interval = setInterval(async () => {
       try {
-        // Check LM Studio availability
-        const lmResult = await openRouterAPI.checkLMStudioAvailability();
-        const lmAvailable = lmResult.available && lmResult.has_models;
-        setLmStudioAvailable(lmAvailable);
-        
-        // Check if OpenRouter API key is configured
         const keyStatus = await openRouterAPI.getApiKeyStatus();
         setHasOpenRouterKey(keyStatus.has_key);
-        
-        // Also check localStorage for saved key and sync with backend
-        const storedKey = localStorage.getItem('openrouter_api_key');
-        if (storedKey && !keyStatus.has_key) {
-          // Restore key to backend from localStorage
-          try {
-            await openRouterAPI.setApiKey(storedKey);
-            setHasOpenRouterKey(true);
-          } catch (err) {
-            console.error('Failed to restore OpenRouter key:', err);
-            localStorage.removeItem('openrouter_api_key');
+
+        if (!keyStatus.has_key) {
+          const storedKey = localStorage.getItem('openrouter_api_key');
+          if (storedKey) {
+            try {
+              await openRouterAPI.setApiKey(storedKey);
+              setHasOpenRouterKey(true);
+            } catch {
+              // Silent retry next interval
+            }
           }
         }
-        
-        // If LM Studio not available and no OpenRouter key, prompt for key
-        if (!lmAvailable && !keyStatus.has_key && !storedKey) {
-          console.log('LM Studio not available, prompting for OpenRouter API key...');
-          setOpenRouterKeyReason('lm_studio_unavailable');
-          setShowOpenRouterKeyModal(true);
-        }
-        
-        // Fetch LM Studio models if available
-        if (lmAvailable) {
-          api.getModels().then(data => {
-            setModels(data.models || data);
-          }).catch(err => {
-            console.error('Failed to fetch LM Studio models:', err);
-          });
-        }
-      } catch (err) {
-        console.error('Failed to check availability:', err);
-        // Fallback to fetching models directly
-        api.getModels().then(data => {
-          setModels(data.models || data);
-        }).catch(modelErr => {
-          console.error('Failed to fetch models:', modelErr);
-        });
+      } catch {
+        // Backend unreachable, skip this cycle
       }
-    };
-    
-    checkAvailability();
+    }, 30000);
+
+    return () => clearInterval(interval);
   }, []);
 
   // Check autonomous research status on mount (handles page refresh while running)
@@ -399,6 +498,86 @@ function App() {
     const addActivity = (event) => {
       setAutonomousActivity(prev => [...prev, event].slice(-MAX_ACTIVITY_EVENTS));
     };
+    const isAutonomousTier2Active = () =>
+      autonomousRunningRef.current && autonomousTierRef.current === 'tier2_paper_writing';
+    // Human-readable label for a compiler mode id; unrecognised ids pass
+    // through unchanged and a missing id is shown as "Compiler".
+    const formatCompilerMode = (mode) => {
+      const labelsByMode = new Map([
+        ['outline_create', 'Outline creation'],
+        ['construction', 'Construction'],
+        ['outline_update', 'Outline update'],
+        ['review', 'Review'],
+        ['rigor', 'Rigor'],
+      ]);
+      if (labelsByMode.has(mode)) {
+        return labelsByMode.get(mode);
+      }
+      // Fallback: echo the raw id, or "Compiler" when the id is falsy.
+      return mode || 'Compiler';
+    };
+    // Collapse whitespace runs, trim, and cut to maxLen chars plus "..."; '' when nothing is left.
+    const formatReason = (reasoning, maxLen = 140) => {
+      const cleaned = reasoning ? String(reasoning).replace(/\s+/g, ' ').trim() : '';
+      if (!cleaned || !(cleaned.length > maxLen)) return cleaned;
+      return `${cleaned.slice(0, maxLen)}...`;
+    };
+    
+    // Topic exploration events (pre-brainstorm candidate collection)
+    unsubscribers.push(websocket.on('topic_exploration_started', (data) => {
+      addActivity({
+        event: 'topic_exploration_started',
+        timestamp: new Date().toISOString(),
+        message: `Topic exploration started (target: ${data.target || 5} candidates${data.resumed_count ? `, resuming with ${data.resumed_count}` : ''})`,
+        data
+      });
+    }));
+    // Progress line; the question is shortened by formatReason, so "..." appears only when it was cut.
+    unsubscribers.push(websocket.on('topic_exploration_progress', (data) => {
+      addActivity({
+        event: 'topic_exploration_progress',
+        timestamp: new Date().toISOString(),
+        message: `Exploration candidate ${data.accepted}/${data.target} accepted${data.latest_question ? `: ${formatReason(data.latest_question, 100)}` : ''}`,
+        data
+      });
+    }));
+    
+    unsubscribers.push(websocket.on('topic_exploration_complete', (data) => {
+      addActivity({
+        event: 'topic_exploration_complete',
+        timestamp: new Date().toISOString(),
+        message: `Topic exploration complete: ${data.accepted_count} candidates collected from ${data.total_attempts} attempts`,
+        data
+      });
+    }));
+    
+    // Paper title exploration events (pre-title-selection candidate collection)
+    unsubscribers.push(websocket.on('paper_title_exploration_started', (data) => {
+      addActivity({
+        event: 'paper_title_exploration_started',
+        timestamp: new Date().toISOString(),
+        message: `Title exploration started (target: ${data.target || 5} candidate titles)`,
+        data
+      });
+    }));
+    
+    unsubscribers.push(websocket.on('paper_title_exploration_progress', (data) => {
+      addActivity({
+        event: 'paper_title_exploration_progress',
+        timestamp: new Date().toISOString(),
+        message: `Title candidate ${data.accepted}/${data.target} accepted`,
+        data
+      });
+    }));
+    
+    unsubscribers.push(websocket.on('paper_title_exploration_complete', (data) => {
+      addActivity({
+        event: 'paper_title_exploration_complete',
+        timestamp: new Date().toISOString(),
+        message: `Title exploration complete: ${data.accepted_count} candidates collected from ${data.total_attempts} attempts`,
+        data
+      });
+    }));
     
     // Topic selection events
     unsubscribers.push(websocket.on('topic_selected', (data) => {
@@ -470,6 +649,7 @@ function App() {
     
     // Paper events
     unsubscribers.push(websocket.on('paper_writing_started', (data) => {
+      autonomousTierRef.current = 'tier2_paper_writing';
       addActivity({
         event: 'paper_writing_started',
         timestamp: new Date().toISOString(),
@@ -477,6 +657,54 @@ function App() {
         data
       });
     }));
+
+    // Compiler writing activity events (Tier 2 paper writing internals)
+    unsubscribers.push(websocket.on('compiler_acceptance', (data) => {
+      if (!isAutonomousTier2Active()) return;
+      const modeLabel = formatCompilerMode(data.mode);
+      const iterationSuffix = data.iteration ? ` (iteration ${data.iteration})` : '';
+      addActivity({
+        event: 'compiler_acceptance',
+        timestamp: new Date().toISOString(),
+        message: `${modeLabel}: ✓ ACCEPTED${iterationSuffix}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('compiler_rejection', (data) => {
+      if (!isAutonomousTier2Active()) return;
+      const modeLabel = formatCompilerMode(data.mode);
+      const iterationSuffix = data.iteration ? ` (iteration ${data.iteration})` : '';
+      const reason = formatReason(data.reasoning);
+      addActivity({
+        event: 'compiler_rejection',
+        timestamp: new Date().toISOString(),
+        message: `${modeLabel}: ✗ REJECTED${iterationSuffix}${reason ? ` - ${reason}` : ''}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('compiler_decline', (data) => {
+      if (!isAutonomousTier2Active()) return;
+      const modeLabel = formatCompilerMode(data.mode);
+      const reason = formatReason(data.reasoning, 100);
+      addActivity({
+        event: 'compiler_decline',
+        timestamp: new Date().toISOString(),
+        message: `${modeLabel}: ↷ DECLINED${reason ? ` - ${reason}` : ''}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('outline_locked', (data) => {
+      if (!isAutonomousTier2Active()) return;
+      addActivity({
+        event: 'outline_locked',
+        timestamp: new Date().toISOString(),
+        message: `Outline locked after ${data.total_iterations || data.iteration || '?'} iteration(s)`,
+        data
+      });
+    }));
     
     // Critique phase events (paper writing substages)
     unsubscribers.push(websocket.on('critique_phase_started', (data) => {
@@ -578,6 +806,9 @@ function App() {
       // Handle resume after crash/restart - sync running state
       console.log('Autonomous research resumed:', data);
       setAutonomousRunning(true);
+      if (data?.tier) {
+        autonomousTierRef.current = data.tier;
+      }
       addActivity({
         event: 'auto_research_resumed',
         timestamp: new Date().toISOString(),
@@ -592,10 +823,13 @@ function App() {
     
     unsubscribers.push(websocket.on('auto_research_stopped', () => {
       setAutonomousRunning(false);
+      autonomousTierRef.current = null;
+      setHungConnectionNotifications([]);
     }));
     
     // Tier 3 events
     unsubscribers.push(websocket.on('tier3_started', (data) => {
+      autonomousTierRef.current = 'tier3_final_answer';
       addActivity({
         event: 'tier3_started',
         timestamp: new Date().toISOString(),
@@ -701,6 +935,7 @@ function App() {
     
     // Paper writing resumed (after crash recovery)
     unsubscribers.push(websocket.on('paper_writing_resumed', (data) => {
+      autonomousTierRef.current = 'tier2_paper_writing';
       addActivity({
         event: 'paper_writing_resumed',
         timestamp: new Date().toISOString(),
@@ -847,6 +1082,111 @@ function App() {
         message: `❌ Account free credits depleted: ${data.message}`,
         ...data
       });
+      setCreditExhaustionNotifications(prev => {
+        const roleId = data.role_id || 'Account';
+        if (prev.some(n => n.role_id === roleId && n.reason === 'account_credits_exhausted')) return prev;
+        return [...prev, {
+          id: `account_exhausted_${Date.now()}`,
+          role_id: roleId,
+          reason: 'account_credits_exhausted',
+          message: data.message || 'Account free credits depleted.',
+          timestamp: new Date().toISOString()
+        }];
+      });
+    }));
+
+    // OpenRouter fallback event (credit exhaustion triggered fallback to LM Studio)
+    unsubscribers.push(websocket.on('openrouter_fallback', (data) => {
+      console.warn('OpenRouter fallback triggered:', data);
+      addActivity({
+        event: 'openrouter_fallback',
+        timestamp: new Date().toISOString(),
+        message: `⚠️ OpenRouter credits exhausted for ${data.role_id} — fell back to ${data.fallback_model || 'LM Studio'}`,
+        ...data
+      });
+      setCreditExhaustionNotifications(prev => {
+        const reason = data.reason || 'credit_exhaustion';
+        if (prev.some(n => n.role_id === data.role_id && n.reason === reason)) return prev;
+        return [...prev, {
+          id: `fallback_${data.role_id}_${Date.now()}`,
+          role_id: data.role_id,
+          reason,
+          message: data.message,
+          fallback_model: data.fallback_model,
+          timestamp: new Date().toISOString()
+        }];
+      });
+    }));
+
+    // OpenRouter fallback failed (no fallback configured — role stopped)
+    unsubscribers.push(websocket.on('openrouter_fallback_failed', (data) => {
+      console.error('OpenRouter fallback failed:', data);
+      addActivity({
+        event: 'openrouter_fallback_failed',
+        timestamp: new Date().toISOString(),
+        message: `🛑 OpenRouter credits exhausted for ${data.role_id} — NO FALLBACK configured!`,
+        ...data
+      });
+      setCreditExhaustionNotifications(prev => {
+        if (prev.some(n => n.role_id === data.role_id && n.reason === 'no_fallback_configured')) return prev;
+        return [...prev, {
+          id: `fallback_failed_${data.role_id}_${Date.now()}`,
+          role_id: data.role_id,
+          reason: 'no_fallback_configured',
+          message: data.message,
+          timestamp: new Date().toISOString()
+        }];
+      });
+    }));
+
+    // Boost credits exhausted
+    unsubscribers.push(websocket.on('boost_credits_exhausted', (data) => {
+      console.warn('Boost credits exhausted:', data);
+      addActivity({
+        event: 'boost_credits_exhausted',
+        timestamp: new Date().toISOString(),
+        message: `⚠️ Boost credits exhausted for task ${data.task_id}`,
+        ...data
+      });
+      setCreditExhaustionNotifications(prev => {
+        if (prev.some(n => n.reason === 'boost_credits_exhausted')) return prev;
+        return [...prev, {
+          id: `boost_exhausted_${Date.now()}`,
+          role_id: `Boost (${data.task_id || 'unknown'})`,
+          reason: 'boost_credits_exhausted',
+          message: data.message || 'Boost API credits exhausted. Falling back to primary model.',
+          timestamp: new Date().toISOString()
+        }];
+      });
+    }));
+
+    unsubscribers.push(websocket.on('openrouter_fallbacks_reset', (data) => {
+      console.info('OpenRouter fallbacks reset:', data);
+      addActivity({
+        event: 'openrouter_fallbacks_reset',
+        timestamp: new Date().toISOString(),
+        message: `OpenRouter reset: ${data.message}`,
+        ...data
+      });
+      setCreditExhaustionNotifications([]);
+      setHungConnectionNotifications([]);
+    }));
+
+    unsubscribers.push(websocket.on('hung_connection_alert', (data) => {
+      console.warn('Hung connection alert:', data);
+      addLog({
+        type: 'warning',
+        message: `⏳ Possible hung connection: ${data.model} via ${data.provider} (${data.elapsed_minutes}+ min)`,
+        ...data
+      });
+      setHungConnectionNotifications(prev => {
+        if (prev.some(n => n.role_id === data.role_id)) return prev;
+        return [...prev, {
+          id: `hung_${data.role_id}_${Date.now()}`,
+          ...data,
+          timestamp: Date.now()
+        }];
+      });
     }));
 
     unsubscribers.push(websocket.on('final_answer_complete', (data) => {
@@ -1001,7 +1341,7 @@ function App() {
       setAutonomousRunning(true);
       setAutonomousActivity([]);
     } catch (error) {
-      alert(`Failed to start autonomous research: ${error.message}`);
+      alert(`Failed to start autonomous research: ${error.details || error.message}`);
     }
   };
 
@@ -1061,7 +1401,7 @@ function App() {
   // Determine Final Answer tab label based on Tier 3 status
   const getFinalAnswerLabel = () => {
     if (autonomousStatus?.is_tier3_active) {
-      return 'Stage 3:FINAL ANSWER IN PROGRESS';
+      return 'Autonomous Stage 3: FINAL ANSWER IN PROGRESS';
     }
     if (autonomousStatus?.tier3_status === 'complete') {
       return 'Stage 3: FINAL ANSWER COMPLETE ✓';
@@ -1083,6 +1423,41 @@ function App() {
     setShowCritiqueModal(false);
     setSelectedCritiquePaper(null);
   };
+
+  const handleModeChange = (nextMode) => {
+    setAppMode(nextMode);
+    setUtilityActiveTab(null);
+  };
+
+  const handleAutonomousTabSelect = (tabId) => {
+    setAutonomousActiveTab(tabId);
+    setUtilityActiveTab(null);
+    if (appMode !== 'autonomous') {
+      setAppMode('autonomous');
+    }
+  };
+
+  const handleManualTabSelect = (tabId) => {
+    setManualActiveTab(tabId);
+    setUtilityActiveTab(null);
+    if (appMode !== 'manual') {
+      setAppMode('manual');
+    }
+  };
+
+  const handleUtilityTabSelect = (tabId) => {
+    setUtilityActiveTab(tabId);
+  };
+
+  // Credit exhaustion notification handler
+  const handleDismissCreditNotification = (notificationId) => {
+    setCreditExhaustionNotifications(prev => prev.filter(n => n.id !== notificationId));
+  };
+
+  // Hung connection notification handler
+  const handleDismissHungNotification = (notificationId) => {
+    setHungConnectionNotifications(prev => prev.filter(n => n.id !== notificationId));
+  };
   
   // Critique modal API functions
   const handleGenerateCritique = async (customPrompt, validatorConfig) => {
@@ -1103,35 +1478,126 @@ function App() {
     return response;
   };
 
+  const handleDisclaimerAcknowledge = async () => {
+    setShowDisclaimer(false);
+    setStartupSetupMessage('');
+
+    const {
+      lmAvailable,
+      hasOpenRouterKey: keyPresent,
+      hasUsableLmStudioChatModel,
+    } = await syncProviderAvailability();
+    if (keyPresent) {
+      return;
+    }
+
+    const startupChoice = localStorage.getItem(STARTUP_PROVIDER_CHOICE_STORAGE_KEY);
+    if (startupChoice === LM_STUDIO_STARTUP_CHOICE && lmAvailable && hasUsableLmStudioChatModel) {
+      return;
+    }
+
+    if (startupChoice === LM_STUDIO_STARTUP_CHOICE && (!lmAvailable || !hasUsableLmStudioChatModel)) {
+      setStartupSetupMessage(
+        'LM Studio was previously selected, but it is not fully ready. Start LM Studio, load nomic-ai/nomic-embed-text-v1.5 and at least one usable local chat model, then try again.'
+      );
+    }
+
+    setShowStartupSetupModal(true);
+  };
+
+  const handleStartupOpenRouterChoice = () => {
+    setStartupSetupMessage('');
+    setShowStartupSetupModal(false);
+    setOpenRouterKeyReason('startup_setup');
+    setShowOpenRouterKeyModal(true);
+  };
+
+  const handleCloseOpenRouterKeyModal = () => {
+    const keyWasJustSaved = openRouterKeyJustSavedRef.current;
+    const shouldReturnToStartup = openRouterKeyReason === 'startup_setup' && !keyWasJustSaved && !hasOpenRouterKey;
+    openRouterKeyJustSavedRef.current = false;
+    setShowOpenRouterKeyModal(false);
+
+    if (shouldReturnToStartup) {
+      setShowStartupSetupModal(true);
+    }
+  };
+
+  const handleStartupLmStudioChoice = async () => {
+    setCheckingLmStudioStartupChoice(true);
+    setStartupSetupMessage('');
+
+    try {
+      const { lmAvailable, hasUsableLmStudioChatModel, defaultLmStudioModelId } = await syncProviderAvailability();
+
+      if (!lmAvailable) {
+        setStartupSetupMessage(
+          'LM Studio is not detected with a loaded model yet. Install LM Studio, start the local server, load nomic-ai/nomic-embed-text-v1.5, and then try again.'
+        );
+        return;
+      }
+
+      if (!hasUsableLmStudioChatModel || !defaultLmStudioModelId) {
+        setStartupSetupMessage(
+          'LM Studio is running, but no usable chat model is currently loaded. Load at least one local chat model in addition to nomic-ai/nomic-embed-text-v1.5, then try again.'
+        );
+        return;
+      }
+
+      const { config: nextAutonomousConfig } = applyLmStudioStartupDefaults(defaultLmStudioModelId);
+      setAutonomousConfig(nextAutonomousConfig);
+      localStorage.setItem(STARTUP_PROVIDER_CHOICE_STORAGE_KEY, LM_STUDIO_STARTUP_CHOICE);
+      setShowStartupSetupModal(false);
+    } finally {
+      setCheckingLmStudioStartupChoice(false);
+    }
+  };
+
+  const handleOpenRouterKeySet = async () => {
+    // Flag the save before awaiting; the close handler reads this ref meanwhile.
+    openRouterKeyJustSavedRef.current = true;
+    setHasOpenRouterKey(true);
+    if (openRouterKeyReason === 'startup_setup') {
+      const { config: nextAutonomousConfig } = await applyAutonomousProfileSelection(RECOMMENDED_PROFILE_KEY);
+      setAutonomousConfig(nextAutonomousConfig);
+      setShowStartupSetupModal(false);
+      setStartupSetupMessage('');
+    }
+    console.log('OpenRouter API key set successfully');
+  };
+
   const mainTabs = [
     { id: 'auto-interface', label: 'Start Here: Autonomous Deep Research Controller', group: 'autonomous-main' },
-    { id: 'auto-brainstorms', label: 'Stage 1: Brainstorms', group: 'autonomous-main' },
-    { id: 'auto-papers', label: 'Stage 2: Short-Form Final Answer(s)', subtext: '(Less Hallucinatory - Short-Form Final Answers)', subtextClass: 'green', group: 'autonomous-main' },
+    { id: 'auto-brainstorms', label: 'Autonomous Stage 1: Brainstorms', group: 'autonomous-main' },
+    { id: 'auto-papers', label: 'Autonomous Stage 2: Papers', subtext: '(Less Hallucinatory - Recommended Output)', subtextClass: 'green', group: 'autonomous-main' },
     ...(autonomousConfig.tier3_enabled ? [
       { id: 'auto-final-answer', label: getFinalAnswerLabel(), subtext: '(Very Experimental and Hallucinatory)', group: 'autonomous-main' },
     ] : []),
   ];
 
   const autonomousSettingsTabs = [
-    { id: 'auto-final-answer-library', label: 'Long-Form Final Answer History', subtext: '(Very Experimental and Hallucinatory)', group: 'autonomous-settings' },
+    { id: 'auto-stage2-history', label: 'Stage 2 Final Answers History', group: 'autonomous-settings' },
+    { id: 'auto-final-answer-library', label: 'Stage 3 Final Answers History', subtext: '(Very Experimental and Hallucinatory)', group: 'autonomous-settings' },
     { id: 'auto-logs', label: 'API Call Logs', group: 'autonomous-settings' },
     { id: 'auto-settings', label: 'Autonomous Model Selection & Settings', group: 'autonomous-settings' },
   ];
 
-  const singlePaperWriterTabs = {
-    aggregator: [
-      { id: 'aggregator-interface', label: 'Interface' },
-      { id: 'aggregator-settings', label: 'Settings' },
-      { id: 'aggregator-logs', label: 'Logs' },
-      { id: 'aggregator-results', label: 'Live Results' },
-    ],
-    compiler: [
-      { id: 'compiler-interface', label: 'Interface' },
-      { id: 'compiler-settings', label: 'Settings' },
-      { id: 'compiler-logs', label: 'Logs' },
-      { id: 'compiler-live-paper', label: 'Live Paper' },
-    ]
-  };
+  const manualTabs = [
+    { id: 'aggregator-interface', label: 'Aggregator', subtext: 'Part 1', subtextClass: 'green', group: 'aggregator' },
+    { id: 'aggregator-settings', label: 'Aggregator Settings', group: 'aggregator' },
+    { id: 'aggregator-logs', label: 'Aggregator Logs', group: 'aggregator' },
+    { id: 'aggregator-results', label: 'Live Results', subtext: 'Part 1 Live Results', subtextClass: 'green', group: 'aggregator' },
+    { id: 'compiler-interface', label: 'Compiler', subtext: 'Part 2', subtextClass: 'green', group: 'compiler' },
+    { id: 'compiler-settings', label: 'Compiler Settings', group: 'compiler' },
+    { id: 'compiler-logs', label: 'Compiler Logs', group: 'compiler' },
+    { id: 'compiler-live-paper', label: 'Live Paper', subtext: 'Part 2 Live Results', subtextClass: 'green', group: 'compiler' },
+  ];
+
+  useEffect(() => {
+    if (!autonomousConfig.tier3_enabled && autonomousActiveTab === 'auto-final-answer') {
+      setAutonomousActiveTab('auto-interface');
+    }
+  }, [autonomousConfig.tier3_enabled, autonomousActiveTab]);
 
   // Sync with WorkflowPanel collapse state (stored in localStorage)
   useEffect(() => {
@@ -1177,10 +1643,10 @@ function App() {
         <div className="banner-content">
           <h1 className="banner-title">
             <span className="banner-moto">M.O.T.O.</span>
-            <span className="banner-subtitle">Deep Research Harness</span>
+            <span className="banner-subtitle">Autonomous ASI</span>
           </h1>
-          <p className="banner-variant"> A Prototype Super Intelligence - Creative Math Researcher Variant for S.T.E.M. (High Risk, High Reward Outputs)</p>
           <p className="banner-company">By Intrafere Research Group</p>
+          <p className="banner-variant">A Prototype Artificial Superintelligence - Novelty Seeking Autonomous S.T.E.M. Researcher For Automated Theorem Generation</p>
         </div>
       </div>
       
@@ -1189,6 +1655,20 @@ function App() {
       {/* They are visible at program launch and stay visible forever */}
       {/* Slide with WorkflowPanel collapse/expand animation */}
       <div className={`app-header ${workflowPanelCollapsed ? 'panel-collapsed' : ''}`}>
+        <div className="mode-switch-control">
+          <label className="mode-switch-label" htmlFor="app-mode-select">
+            Change Mode
+          </label>
+          <select
+            id="app-mode-select"
+            className="mode-switch-select"
+            value={appMode}
+            onChange={(e) => handleModeChange(e.target.value)}
+          >
+            <option value="autonomous">Autonomous S.T.E.M. ASI</option>
+            <option value="manual">Advanced Manual S.T.E.M. ASI</option>
+          </select>
+        </div>
         <button 
           className="boost-btn"
           onClick={() => setShowBoostModal(true)}
@@ -1199,8 +1679,7 @@ function App() {
         <button 
           className="boost-logs-btn"
           onClick={() => {
-            setActiveTab('boost-logs');
-            setShowSinglePaperWriter(false);
+            handleUtilityTabSelect('boost-logs');
           }}
           title="View Boost Logs"
         >
@@ -1216,8 +1695,8 @@ function App() {
           style={{
             marginLeft: '0.5rem',
             padding: '0.4rem 0.8rem',
-            backgroundColor: hasOpenRouterKey ? '#2d5a27' : '#4a3a00',
-            border: hasOpenRouterKey ? '1px solid #4CAF50' : '1px solid #f1c40f',
+            backgroundColor: hasOpenRouterKey ? '#2d5a27' : '#153815',
+            border: hasOpenRouterKey ? '1px solid #4CAF50' : '1px solid #1eff1c',
             borderRadius: '4px',
             color: '#fff',
             cursor: 'pointer',
@@ -1229,10 +1708,10 @@ function App() {
         {!lmStudioAvailable && (
           <span style={{ 
             marginLeft: '0.5rem', 
-            color: '#f1c40f', 
+            color: '#1eff1c', 
             fontSize: '0.8rem',
             padding: '0.25rem 0.5rem',
-            backgroundColor: 'rgba(241, 196, 15, 0.1)',
+            backgroundColor: 'rgba(30, 255, 28, 0.1)',
             borderRadius: '4px',
           }}>
             LM Studio Offline
@@ -1240,114 +1719,75 @@ function App() {
         )}
       </div>
       
-      <div className="tabs">
-        {mainTabs.map((tab, index) => {
-          const prevTab = mainTabs[index - 1];
-          const showSeparator = prevTab && prevTab.group !== tab.group;
-          
-          // Special styling for Final Answer tab
-          const isFinalAnswerTab = tab.id === 'auto-final-answer';
-          const tier3Classes = isFinalAnswerTab 
-            ? (autonomousStatus?.tier3_status === 'complete' 
-                ? 'tab-tier3-complete' 
-                : (autonomousStatus?.is_tier3_active ? 'tab-tier3-active' : ''))
-            : '';
-          
-          return (
-            <React.Fragment key={tab.id}>
-              {showSeparator && <div className="tab-separator" />}
-              <button
-                className={`tab ${activeTab === tab.id ? 'active' : ''} tab-${tab.group} ${tier3Classes} ${tab.subtext ? 'tab-with-subtext' : ''}`}
-                onClick={() => {
-                  setActiveTab(tab.id);
-                  setShowSinglePaperWriter(false);
-                }}
-              >
-                <div className="tab-content-wrapper">
-                  <span className="tab-main-label">{tab.label}</span>
-                  {tab.subtext && <span className={`tab-subtext ${tab.subtextClass || ''}`}>{tab.subtext}</span>}
-                </div>
-              </button>
-            </React.Fragment>
-          );
-        })}
-        
-        {/* Large spacer for settings group */}
-        <div className="tab-group-spacer-large"></div>
-        
-        {autonomousSettingsTabs.map(tab => {
-          return (
-            <React.Fragment key={tab.id}>
-              <button
-                className={`tab ${activeTab === tab.id ? 'active' : ''} tab-${tab.group}`}
-                onClick={() => {
-                  setActiveTab(tab.id);
-                  setShowSinglePaperWriter(false);
-                }}
-              >
-                {tab.label}
-              </button>
-            </React.Fragment>
-          );
-        })}
-      </div>
-      
-      {/* Expandable Single Paper Writer Section */}
-      <div className="expandable-section">
-        <button 
-          className={`expandable-trigger ${showSinglePaperWriter ? 'expanded' : ''}`}
-          onClick={() => {
-            const newState = !showSinglePaperWriter;
-            setShowSinglePaperWriter(newState);
-            localStorage.setItem('singlePaperWriterExpanded', JSON.stringify(newState));
-            if (newState && !singlePaperWriterActiveTab) {
-              setSinglePaperWriterActiveTab('aggregator-interface');
-            }
-          }}
-        >
-          <span className="expand-icon">{showSinglePaperWriter ? '▼' : '▶'}</span>
-          <span className="section-title">[Secondary Tool] SINGLE PAPER WRITER</span>
-          <span className="section-subtitle">(A manual brainstorm aggregator & paper compiler, an advanced controller mode with a "two user prompts" control mechanic, a separate optional mode from the Autonomous Deep Research mode above)</span>
-        </button>
-        
-        {showSinglePaperWriter && (
-          <div className="expandable-content">
-            <div className="subsection">
-              <div className="subsection-header">AGGREGATOR</div>
-              <div className="subsection-tabs">
-                {singlePaperWriterTabs.aggregator.map(tab => (
+      <div className={`tabs ${appMode === 'manual' ? 'tabs-manual' : ''}`}>
+        {appMode === 'autonomous' ? (
+          <>
+            {mainTabs.map((tab, index) => {
+              const prevTab = mainTabs[index - 1];
+              const showSeparator = prevTab && prevTab.group !== tab.group;
+              
+              // Special styling for Final Answer tab
+              const isFinalAnswerTab = tab.id === 'auto-final-answer';
+              const tier3Classes = isFinalAnswerTab 
+                ? (autonomousStatus?.tier3_status === 'complete' 
+                    ? 'tab-tier3-complete' 
+                    : (autonomousStatus?.is_tier3_active ? 'tab-tier3-active' : ''))
+                : '';
+              
+              return (
+                <React.Fragment key={tab.id}>
+                  {showSeparator && <div className="tab-separator" />}
                   <button
-                    key={tab.id}
-                    className={`subtab ${singlePaperWriterActiveTab === tab.id ? 'active' : ''}`}
-                    onClick={() => {
-                      setSinglePaperWriterActiveTab(tab.id);
-                      setActiveTab(null);
-                    }}
+                    className={`tab ${activeTab === tab.id ? 'active' : ''} tab-${tab.group} ${tier3Classes} ${tab.subtext ? 'tab-with-subtext' : ''}`}
+                    onClick={() => handleAutonomousTabSelect(tab.id)}
                   >
-                    {tab.label}
+                    <div className="tab-content-wrapper">
+                      <span className="tab-main-label">{tab.label}</span>
+                      {tab.subtext && <span className={`tab-subtext ${tab.subtextClass || ''}`}>{tab.subtext}</span>}
+                    </div>
                   </button>
-                ))}
-              </div>
-            </div>
+                </React.Fragment>
+              );
+            })}
+            
+            {/* Large spacer for settings group */}
+            <div className="tab-group-spacer-large"></div>
             
-            <div className="subsection">
-              <div className="subsection-header">COMPILER</div>
-              <div className="subsection-tabs">
-                {singlePaperWriterTabs.compiler.map(tab => (
+            {autonomousSettingsTabs.map(tab => {
+              return (
+                <React.Fragment key={tab.id}>
                   <button
-                    key={tab.id}
-                    className={`subtab ${singlePaperWriterActiveTab === tab.id ? 'active' : ''}`}
-                    onClick={() => {
-                      setSinglePaperWriterActiveTab(tab.id);
-                      setActiveTab(null);
-                    }}
+                    className={`tab ${activeTab === tab.id ? 'active' : ''} tab-${tab.group}`}
+                    onClick={() => handleAutonomousTabSelect(tab.id)}
                   >
                     {tab.label}
                   </button>
-                ))}
-              </div>
-            </div>
-          </div>
+                </React.Fragment>
+              );
+            })}
+          </>
+        ) : (
+          <>
+            {manualTabs.map((tab, index) => {
+              const prevTab = manualTabs[index - 1];
+              const showSeparator = prevTab && prevTab.group !== tab.group;
+
+              return (
+                <React.Fragment key={tab.id}>
+                  {showSeparator && <div className="tab-separator" />}
+                  <button
+                    className={`tab ${activeTab === tab.id ? 'active' : ''} tab-${tab.group} ${tab.subtext ? 'tab-with-subtext' : ''}`}
+                    onClick={() => handleManualTabSelect(tab.id)}
+                  >
+                    <div className="tab-content-wrapper">
+                      <span className="tab-main-label">{tab.label}</span>
+                      {tab.subtext && <span className={`tab-subtext ${tab.subtextClass || ''}`}>{tab.subtext}</span>}
+                    </div>
+                  </button>
+                </React.Fragment>
+              );
+            })}
+          </>
         )}
       </div>
       
@@ -1383,6 +1823,7 @@ function App() {
           {activeTab === 'auto-interface' && (
             <AutonomousResearchInterface
               isRunning={autonomousRunning}
+              anyWorkflowRunning={anyWorkflowRunning}
               status={autonomousStatus}
               activity={autonomousActivity}
               onStart={handleAutonomousStart}
@@ -1420,6 +1861,13 @@ function App() {
               status={autonomousStatus}
             />
           )}
+          {activeTab === 'auto-stage2-history' && (
+            <Stage2PaperHistory
+              onCurrentSessionDataChanged={async () => {
+                await Promise.all([refreshPapers(), refreshBrainstorms()]);
+              }}
+            />
+          )}
           {activeTab === 'auto-final-answer-library' && (
             <FinalAnswerLibrary />
           )}
@@ -1431,20 +1879,28 @@ function App() {
           )}
           {activeTab === 'boost-logs' && <BoostLogs />}
           
-          {/* Single Paper Writer Content - ONLY when section is expanded */}
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'aggregator-interface' && (
-            <AggregatorInterface config={config} setConfig={setConfig} />
+          {activeTab === 'aggregator-interface' && (
+            <AggregatorInterface
+              config={config}
+              setConfig={setConfig}
+              anyWorkflowRunning={anyWorkflowRunning}
+            />
           )}
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'aggregator-settings' && (
+          {activeTab === 'aggregator-settings' && (
             <AggregatorSettings config={config} setConfig={setConfig} />
           )}
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'aggregator-logs' && <AggregatorLogs />}
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'aggregator-results' && <LiveResults />}
+          {activeTab === 'aggregator-logs' && <AggregatorLogs />}
+          {activeTab === 'aggregator-results' && <LiveResults />}
           
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'compiler-interface' && <CompilerInterface activeTab={singlePaperWriterActiveTab} />}
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'compiler-settings' && <CompilerSettings />}
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'compiler-logs' && <CompilerLogs />}
-          {showSinglePaperWriter && singlePaperWriterActiveTab === 'compiler-live-paper' && <LivePaper />}
+          {activeTab === 'compiler-interface' && (
+            <CompilerInterface
+              activeTab={activeTab}
+              anyWorkflowRunning={anyWorkflowRunning}
+            />
+          )}
+          {activeTab === 'compiler-settings' && <CompilerSettings />}
+          {activeTab === 'compiler-logs' && <CompilerLogs />}
+          {activeTab === 'compiler-live-paper' && <LivePaper />}
         </div>
       </div>
       
@@ -1469,32 +1925,62 @@ function App() {
           <div className="disclaimer-overlay" onClick={(e) => e.stopPropagation()} />
           <div className="disclaimer-modal">
             <div className="disclaimer-content">
-              <h2 style={{ marginTop: 0, marginBottom: '1.5rem', color: '#f1c40f' }}>
-                  In-Development Program Disclaimer
+              <h2 style={{ marginTop: 0, marginBottom: '1.5rem', color: '#1eff1c' }}>
+                  Disclaimer & Quickstart
               </h2>
-              <p style={{ fontSize: '0.95rem', lineHeight: '1.5', marginBottom: '1.5rem' }}>
-                Disclaimer: This program is a prototype super intelligence and is actively in development. MOTO operates by forcing your selected AI to attempt to output novel solutions toward your user prompt. Quality, correctness or any other aspects of a given solution are not guaranteed and should be examined with care and scrutiny. MOTO is not meant to produce a single paper, the first paper may lack in quality, MOTO is intended to generate many papers and improve with each completely new paper, best results show after 10+ papers.
-                Monitor the harness, logs and API keys for infinite loops, wasted API calls, and any other bugs. The paper text rendering system is experimental—display issues are <em>not</em> reflective of paper quality. If formatting appears messy, try a 3rd-party LaTeX renderer or copy the raw text into another LLM chat for verification.
-              </p>
-              <p style={{ fontSize: '1.1rem', lineHeight: '1.6', marginBottom: '1.5rem', color: '#ffcc00' }}>
-                <strong>QUICKSTART:</strong> (Optional) Load your Nomic embedding agent on LM STUDIO, or use an OpenRouter API key-only instead of LM STUDIO and go straight to picking your models, and then start the program - expect it to run for at the VERY LEAST hours to days once you hit run. You must leave your PC on and awake during runtime.
-              </p>
-              <p style={{ fontSize: '0.95rem', lineHeight: '1.5', marginBottom: '1.5rem', color: '#bbb' }}>
-                Please report all bugs and issues to project the repo at <a href="https://github.com/Intrafere/MOTO-Autonomous-ASI" target="_blank" rel="noopener noreferrer" style={{ color: '#f1c40f', textDecoration: 'none' }}>GitHub</a>.
-              </p>
-              <p style={{ fontSize: '0.95rem', lineHeight: '1.5', marginBottom: '1.5rem', color: '#bbb' }}>
-                Trouble shoot and modify this program easily using the code's specialized rules for AIs and Cursor.com's agentic code editing app - no programming experience required!
+              <p style={{ fontSize: '1.1rem', lineHeight: '1.6', marginBottom: '1.5rem', color: '#1eff1c' }}>
+                <strong>QUICKSTART:</strong> In LM Studio, load the embedding model <code>nomic-ai/nomic-embed-text-v1.5</code> by <strong>Nomic AI</strong> (optional but recommended), or use only an OpenRouter API key instead of LM Studio. You must leave your PC on and awake during runtime, the program will often run for days without interruption.
               </p>
+              <div
+                style={{
+                  marginBottom: '1.5rem',
+                  padding: '1rem 1.1rem',
+                  border: '1px solid rgba(30, 255, 28, 0.24)',
+                  borderRadius: '10px',
+                  background: 'rgba(30, 255, 28, 0.05)',
+                }}
+              >
+                <p
+                  style={{
+                    margin: '0 0 0.75rem 0',
+                    fontSize: '0.82rem',
+                    fontWeight: 700,
+                    letterSpacing: '0.06em',
+                    textTransform: 'uppercase',
+                    color: '#1eff1c',
+                  }}
+                >
+                  Legal Disclaimer
+                </p>
+                <p style={{ fontSize: '0.95rem', lineHeight: '1.5', margin: 0 }}>
+                  MOTO is an experimental prototype system and remains under active development. It directs selected AI models to generate novel solution attempts in response to your prompt. Outputs may be incorrect, incomplete, misleading, fabricated, poorly reasoned, or otherwise unsuitable for reliance without independent review, especially for high-stakes, academic, financial, legal, medical, engineering, or operational use.
+                  <br />
+                  <br />
+                  This software and all generated content are provided as-is and at your own risk. By using MOTO, you acknowledge that you are solely responsible for reviewing, validating, and deciding how to use any output, and that the developers, operators, and contributors are not responsible or liable for incorrect solutions, hallucinations, omissions, formatting issues, infinite loops, wasted API calls, model or provider failures, data loss, third-party charges, or any direct or indirect loss, damage, cost, or liability resulting from use of the program or its outputs.
+                </p>
+              </div>
               <button 
                 className="disclaimer-acknowledge-btn"
-                onClick={() => setShowDisclaimer(false)}
+                onClick={handleDisclaimerAcknowledge}
               >
-                Acknowledged
+                I Have Read and Acknowledge This Disclaimer
               </button>
             </div>
           </div>
         </>
       )}
+
+      <StartupProviderSetupModal
+        isOpen={showStartupSetupModal}
+        lmStudioAvailable={lmStudioAvailable}
+        hasUsableLmStudioChatModel={Boolean(lmStudioStatus.has_usable_chat_model)}
+        lmStudioModelCount={lmStudioStatus.model_count || 0}
+        lmStudioError={lmStudioStatus.error || ''}
+        statusMessage={startupSetupMessage}
+        isCheckingLmStudio={checkingLmStudioStartupChoice}
+        onChooseOpenRouter={handleStartupOpenRouterChoice}
+        onConfirmLmStudio={handleStartupLmStudioChoice}
+      />
       
       {/* Boost Control Modal */}
       <BoostControlModal 
@@ -1505,11 +1991,8 @@ function App() {
       {/* OpenRouter API Key Modal */}
       <OpenRouterApiKeyModal
         isOpen={showOpenRouterKeyModal}
-        onClose={() => setShowOpenRouterKeyModal(false)}
-        onKeySet={(key) => {
-          setHasOpenRouterKey(true);
-          console.log('OpenRouter API key set successfully');
-        }}
+        onClose={handleCloseOpenRouterKeyModal}
+        onKeySet={handleOpenRouterKeySet}
         reason={openRouterKeyReason}
       />
       
@@ -1527,6 +2010,19 @@ function App() {
         onClickNotification={handleClickNotification}
       />
       
+      {/* Credit Exhaustion Notification Stack - Persists until user dismisses */}
+      <CreditExhaustionNotificationStack
+        notifications={creditExhaustionNotifications}
+        onDismiss={handleDismissCreditNotification}
+        onDismissAll={() => setCreditExhaustionNotifications([])}
+      />
+
+      {/* Hung Connection Notification Stack - Persists until user dismisses */}
+      <HungConnectionNotificationStack
+        notifications={hungConnectionNotifications}
+        onDismiss={handleDismissHungNotification}
+      />
+      
       {/* Critique Modal - Opens when notification is clicked */}
       {showCritiqueModal && selectedCritiquePaper && (
         <PaperCritiqueModal
@@ -1557,7 +2053,7 @@ function App() {
               className="footer-link"
             >
               <span className="footer-icon">ℹ️</span>
-              About M.O.T.O.
+              Read More About MOTO ASI
             </a>
             <a
               href="https://intrafere.com/structured-brainstorming-validated-feedback/"
@@ -1576,6 +2072,23 @@ function App() {
             >
               MOTO News and Updates
             </a>
+            <a
+              href="https://intrafere.com/order-a-custom-orchestrator/"
+              target="_blank"
+              rel="noopener noreferrer"
+              className="footer-link footer-link-purchase"
+            >
+              Purchase a Custom ASI Program
+            </a>
+            <a
+              href="https://github.com/Intrafere/MOTO-Autonomous-ASI"
+              target="_blank"
+              rel="noopener noreferrer"
+              className="footer-link footer-link-github"
+            >
+              <span className="footer-icon">⭐</span>
+              Star Us on GitHub for More ASI Programs
+            </a>
           </div>
         </div>
       </footer>
diff --git a/frontend/src/components/BoostControlModal.css b/frontend/src/components/BoostControlModal.css
index 8c296bb..fbb5939 100644
--- a/frontend/src/components/BoostControlModal.css
+++ b/frontend/src/components/BoostControlModal.css
@@ -4,23 +4,24 @@
   left: 0;
   right: 0;
   bottom: 0;
-  background: rgba(0, 0, 0, 0.7);
+  background: rgba(0, 0, 0, 0.65);
   display: flex;
   align-items: center;
   justify-content: center;
   z-index: 2000;
+  backdrop-filter: blur(4px);
 }
 
 .boost-modal {
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 8px;
+  background: var(--surface-2, #1a1a22);
+  border: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
+  border-radius: var(--radius-lg, 14px);
   width: 90%;
   max-width: 600px;
   max-height: 90vh;
   display: flex;
   flex-direction: column;
-  box-shadow: 0 10px 40px rgba(0, 0, 0, 0.5);
+  box-shadow: var(--shadow-lg, 0 10px 40px rgba(0, 0, 0, 0.5));
 }
 
 .modal-header {
@@ -28,20 +29,21 @@
   justify-content: space-between;
   align-items: center;
   padding: 1.5rem;
-  border-bottom: 1px solid #333;
-  background: #0f0f0f;
+  border-bottom: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
+  background: var(--surface-0, #0b0b0f);
+  border-radius: var(--radius-lg, 14px) var(--radius-lg, 14px) 0 0;
 }
 
 .modal-header h2 {
   margin: 0;
   font-size: 1.5rem;
-  color: #ffd700;
+  color: var(--gold, #1eff1c);
 }
 
 .close-btn {
   background: none;
   border: none;
-  color: #888;
+  color: var(--text-muted, #666);
   font-size: 2rem;
   cursor: pointer;
   padding: 0;
@@ -54,7 +56,7 @@
 }
 
 .close-btn:hover {
-  color: #fff;
+  color: var(--text-primary, #e0e0e0);
 }
 
 .modal-body {
@@ -76,14 +78,14 @@
 }
 
 .boost-status-banner.enabled {
-  background: linear-gradient(135deg, #ffd700 0%, #ffed4e 100%);
+  background: linear-gradient(135deg, #1eff1c 0%, #7dff6f 100%);
   color: #000;
 }
 
 .boost-status-banner.disabled {
-  background: #2a2a2a;
-  color: #888;
-  border: 1px solid #444;
+  background: var(--surface-3, #22222c);
+  color: var(--text-muted, #666);
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
 }
 
 .boost-model {
@@ -108,41 +110,42 @@
   border-radius: 4px;
 }
 
-.form-group {
+.boost-form-group {
   margin-bottom: 1.5rem;
 }
 
-.form-group label {
+.boost-form-group label {
   display: block;
   margin-bottom: 0.5rem;
   font-weight: 600;
   color: #fff;
 }
 
-.form-group input,
-.form-group select {
+.boost-form-group input,
+.boost-form-group select {
   width: 100%;
   padding: 0.75rem;
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 4px;
-  color: #fff;
+  background: var(--surface-3, #22222c);
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
+  border-radius: var(--radius-sm, 6px);
+  color: var(--text-primary, #e0e0e0);
   font-size: 1rem;
 }
 
-.form-group input:focus,
-.form-group select:focus {
+.boost-form-group input:focus,
+.boost-form-group select:focus {
   outline: none;
-  border-color: #ffd700;
+  border-color: var(--gold, #1eff1c);
+  box-shadow: 0 0 0 3px var(--gold-glow, rgba(30, 255, 28, 0.12));
 }
 
-.form-group input:disabled,
-.form-group select:disabled {
+.boost-form-group input:disabled,
+.boost-form-group select:disabled {
   opacity: 0.5;
   cursor: not-allowed;
 }
 
-.form-group small {
+.boost-form-group small {
   display: block;
   margin-top: 0.5rem;
   color: #888;
@@ -155,13 +158,13 @@
   gap: 1rem;
 }
 
-.button-group {
+.boost-button-group {
   display: flex;
   gap: 0.75rem;
   margin-bottom: 1.5rem;
 }
 
-.button-group button {
+.boost-button-group button {
   flex: 1;
 }
 
@@ -185,23 +188,23 @@
 }
 
 .info-box {
-  background: #242424;
-  border: 1px solid #444;
-  border-radius: 6px;
+  background: var(--surface-3, #22222c);
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
+  border-radius: var(--radius-sm, 6px);
   padding: 1rem;
   margin-top: 1.5rem;
 }
 
 .info-box h4 {
   margin: 0 0 0.75rem 0;
-  color: #4CAF50;
+  color: var(--accent-green, #4CAF50);
   font-size: 1rem;
 }
 
 .info-box ul {
   margin: 0;
   padding-left: 1.5rem;
-  color: #aaa;
+  color: var(--text-secondary, #9d9db0);
 }
 
 .info-box li {
@@ -214,8 +217,9 @@
   justify-content: flex-end;
   gap: 0.75rem;
   padding: 1.5rem;
-  border-top: 1px solid #333;
-  background: #0f0f0f;
+  border-top: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
+  background: var(--surface-0, #0b0b0f);
+  border-radius: 0 0 var(--radius-lg, 14px) var(--radius-lg, 14px);
 }
 
 button {
@@ -234,23 +238,23 @@ button:disabled {
 }
 
 button.primary {
-  background: linear-gradient(135deg, #ffd700 0%, #ffed4e 100%);
+  background: linear-gradient(135deg, #1eff1c 0%, #7dff6f 100%);
   color: #000;
 }
 
 button.primary:hover:not(:disabled) {
   transform: translateY(-1px);
-  box-shadow: 0 4px 12px rgba(255, 215, 0, 0.3);
+  box-shadow: 0 4px 12px rgba(30, 255, 28, 0.3);
 }
 
 button.secondary {
-  background: #2a2a2a;
-  color: #fff;
-  border: 1px solid #444;
+  background: var(--surface-3, #22222c);
+  color: var(--text-primary, #e0e0e0);
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
 }
 
 button.secondary:hover:not(:disabled) {
-  background: #333;
+  background: var(--surface-4, #2a2a36);
 }
 
 button.danger {
diff --git a/frontend/src/components/BoostControlModal.jsx b/frontend/src/components/BoostControlModal.jsx
index 14371f0..62f736d 100644
--- a/frontend/src/components/BoostControlModal.jsx
+++ b/frontend/src/components/BoostControlModal.jsx
@@ -1,5 +1,5 @@
 import React, { useState, useEffect } from 'react';
-import { api, boostAPI } from '../services/api';
+import { boostAPI, openRouterAPI } from '../services/api';
 import './BoostControlModal.css';
 
 export default function BoostControlModal({ isOpen, onClose }) {
@@ -17,49 +17,21 @@ export default function BoostControlModal({ isOpen, onClose }) {
   const [success, setSuccess] = useState('');
   const [boostStatus, setBoostStatus] = useState(null);
   const [freeOnly, setFreeOnly] = useState(false);
+  const [hasGlobalKey, setHasGlobalKey] = useState(false);
 
-  // Load saved API key from localStorage
-  useEffect(() => {
-    const savedKey = localStorage.getItem('openrouter_api_key');
-    if (savedKey) {
-      setApiKey(savedKey);
-    }
-  }, []);
-
-  // Fetch boost status
-  useEffect(() => {
-    if (isOpen) {
-      fetchBoostStatus();
-    }
-  }, [isOpen]);
+  const hasAvailableKey = Boolean(apiKey.trim() || hasGlobalKey);
 
-  const fetchBoostStatus = async () => {
-    try {
-      const response = await boostAPI.getStatus();
-      if (response.status) {
-        setBoostStatus(response.status);
-        if (response.status.enabled) {
-          setBoostModel(response.status.model_id);
-          setSelectedProvider(response.status.provider || '');
-          setContextWindow(response.status.context_window);
-          setMaxOutputTokens(response.status.max_output_tokens);
-        }
-      }
-    } catch (error) {
-      console.error('Failed to fetch boost status:', error);
-    }
-  };
-
-  // Fetch providers when model is selected
-  const fetchProviders = async (modelId) => {
-    if (!apiKey || !modelId) {
+  const fetchProviders = async (modelId, keyOverride = undefined) => {
+    if (!modelId) {
       setProviders([]);
       return;
     }
 
+    const effectiveKey = keyOverride === undefined ? apiKey.trim() : keyOverride;
+
     setLoadingProviders(true);
     try {
-      const response = await boostAPI.getModelProviders(apiKey, modelId);
+      const response = await boostAPI.getModelProviders(effectiveKey || null, modelId);
       if (response.providers) {
         setProviders(response.providers);
       } else {
@@ -73,6 +45,30 @@ export default function BoostControlModal({ isOpen, onClose }) {
     }
   };
 
+  const fetchBoostStatus = async (keyOverride = undefined) => { // Sync modal state with the backend boost status.
+    const effectiveKey = keyOverride === undefined ? apiKey.trim() : keyOverride; // undefined => typed key; an explicit null is kept as null
+
+    try {
+      const response = await boostAPI.getStatus();
+      if (response.status) {
+        setBoostStatus(response.status);
+        if (response.status.enabled) { // mirror the active boost config into the form fields
+          setBoostModel(response.status.model_id);
+          setSelectedProvider(response.status.provider || '');
+          setContextWindow(response.status.context_window);
+          setMaxOutputTokens(response.status.max_output_tokens);
+          if (response.status.model_id) {
+            await fetchProviders(response.status.model_id, effectiveKey); // effectiveKey is only used for this provider lookup
+          }
+        } else {
+          setProviders([]); // boost is off: clear the provider list
+        }
+      }
+    } catch (error) {
+      console.error('Failed to fetch boost status:', error); // best-effort: failure is only logged, never surfaced in the UI
+    }
+  };
+
   // Handle model selection change
   const handleModelChange = (modelId) => {
     setBoostModel(modelId);
@@ -84,53 +80,96 @@ export default function BoostControlModal({ isOpen, onClose }) {
     }
   };
 
-  const fetchModels = async (freeFilter = freeOnly) => {
-    if (!apiKey) {
-      setError('Please enter an API key first');
-      return;
-    }
+  const fetchModels = async (
+    freeFilter = freeOnly,
+    { silent = false, keyOverride = undefined } = {}
+  ) => {
+    const effectiveKey = keyOverride === undefined ? apiKey.trim() : keyOverride;
 
     setLoading(true);
-    setError('');
+    if (!silent) {
+      setError('');
+      setSuccess('');
+    }
 
     try {
-      const response = await boostAPI.getOpenRouterModels(apiKey);
+      const response = await boostAPI.getOpenRouterModels(effectiveKey || null);
       if (response.models) {
-        // Filter for free models only if enabled
-        const filtered = freeFilter 
+        const filtered = freeFilter
           ? response.models.filter(model => model.pricing && model.pricing.prompt === '0' && model.pricing.completion === '0')
           : response.models;
         setModels(filtered);
-        setSuccess(`Models loaded successfully (${filtered.length} ${freeFilter ? 'free ' : ''}models)`);
+        if (!silent) {
+          setSuccess(`Models loaded successfully (${filtered.length} ${freeFilter ? 'free ' : ''}models)`);
+        }
       }
     } catch (error) {
-      setError(error.message || 'Failed to fetch models');
+      // Silent refreshes must not touch the error banner, but the failure is still logged.
+      if (silent) console.error('Failed to fetch models:', error);
+      else setError(error.message || 'Failed to fetch models');
     } finally {
       setLoading(false);
     }
   };
 
+  useEffect(() => { // Initialise the modal each time it opens.
+    if (!isOpen) {
+      return;
+    }
+
+    const initializeModal = async () => {
+      const savedKey = (localStorage.getItem('openrouter_api_key') || '').trim();
+      setApiKey(savedKey); // seed apiKey state from localStorage ('' when nothing is saved)
+      setError('');
+      setSuccess('');
+
+      let useGlobalKey = false;
+      try {
+        const keyStatus = await openRouterAPI.getApiKeyStatus();
+        useGlobalKey = Boolean(keyStatus.has_key);
+        setHasGlobalKey(useGlobalKey);
+      } catch (error) {
+        console.error('Failed to check OpenRouter key status for boost modal:', error);
+        setHasGlobalKey(false); // a failed status check is treated as "no active key"
+      }
+
+      const preferredKey = useGlobalKey ? null : savedKey; // null => send no key; presumably the backend then uses the active OpenRouter key (confirm)
+      await fetchBoostStatus(preferredKey);
+
+      if (useGlobalKey || savedKey) {
+        await fetchModels(freeOnly, { silent: true, keyOverride: preferredKey }); // silent skips the success/error messages
+      } else {
+        setModels([]); // no key of either kind: start with an empty model list
+      }
+    };
+
+    initializeModal(); // NOTE(review): not awaited and no cleanup returned, so setters can still run after the modal closes
+  }, [isOpen]); // re-runs only when isOpen changes
+
   // Refetch models when free-only toggle changes
   useEffect(() => {
-    if (apiKey && models.length > 0) {
-      fetchModels(freeOnly);
+    if (isOpen && hasAvailableKey && models.length > 0) { // only refetch when the open modal already has a loaded list
+      fetchModels(freeOnly, { silent: true }); // NOTE(review): no keyOverride, so the typed key (or null) is used, unlike the open-time load which prefers the active key - confirm intended
     }
   }, [freeOnly]);
 
   const testConnection = async () => {
-    if (!apiKey) {
-      setError('Please enter an API key');
+    if (!hasAvailableKey) {
+      setError('Please enter an API key or use an active OpenRouter key');
       return;
     }
 
+    const effectiveKey = apiKey.trim() || null;
+    const usingGlobalKey = !apiKey.trim() && hasGlobalKey;
+
     setTesting(true);
     setError('');
     setSuccess('');
 
     try {
-      const response = await boostAPI.getOpenRouterModels(apiKey);
+      const response = await boostAPI.getOpenRouterModels(effectiveKey);
       if (response.models && response.models.length > 0) {
-        setSuccess(`✓ Connected successfully! Found ${response.models.length} models.`);
+        setSuccess(`✓ Connected successfully${usingGlobalKey ? ' using the active OpenRouter key' : ''}! Found ${response.models.length} models.`);
         setModels(response.models);
       } else {
         setError('Connected but no models found');
@@ -143,11 +182,13 @@ export default function BoostControlModal({ isOpen, onClose }) {
   };
 
   const enableBoost = async () => {
-    if (!apiKey || !boostModel) {
-      setError('Please enter API key and select a model');
+    if (!boostModel) {
+      setError('Please select a model');
       return;
     }
 
+    const trimmedApiKey = apiKey.trim();
+
     setLoading(true);
     setError('');
     setSuccess('');
@@ -155,7 +196,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
     try {
       const config = {
         enabled: true,
-        openrouter_api_key: apiKey,
+        openrouter_api_key: trimmedApiKey,
         boost_model_id: boostModel,
         boost_provider: selectedProvider || null,
         boost_context_window: contextWindow,
@@ -171,8 +212,9 @@ export default function BoostControlModal({ isOpen, onClose }) {
         response = await boostAPI.updateModel(config);
         
         if (response.success) {
-          // Save API key to localStorage
-          localStorage.setItem('openrouter_api_key', apiKey);
+          if (trimmedApiKey) {
+            localStorage.setItem('openrouter_api_key', trimmedApiKey);
+          }
           
           setSuccess(`✓ Boost model updated! State preserved: ${response.preserved_state.boost_next_count} next calls`);
           await fetchBoostStatus();
@@ -185,8 +227,9 @@ export default function BoostControlModal({ isOpen, onClose }) {
         response = await boostAPI.enable(config);
         
         if (response.success) {
-          // Save API key to localStorage
-          localStorage.setItem('openrouter_api_key', apiKey);
+          if (trimmedApiKey) {
+            localStorage.setItem('openrouter_api_key', trimmedApiKey);
+          }
           
           setSuccess('✓ Boost enabled successfully!');
           await fetchBoostStatus();
@@ -254,7 +297,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
             </div>
           )}
 
-          <div className="form-group">
+          <div className="boost-form-group">
             <label>OpenRouter API Key</label>
             <input
               type="password"
@@ -263,20 +306,20 @@ export default function BoostControlModal({ isOpen, onClose }) {
               placeholder="sk-or-..."
               disabled={loading}
             />
-            <small>Your API key is stored locally and never sent to our servers</small>
+            <small>Leave this blank to reuse the active OpenRouter key, or paste a different key just for boost.</small>
           </div>
 
-          <div className="button-group">
+          <div className="boost-button-group">
             <button 
               onClick={testConnection} 
-              disabled={testing || !apiKey}
+              disabled={testing || !hasAvailableKey}
               className="secondary"
             >
               {testing ? 'Testing...' : 'Test Connection'}
             </button>
             <button 
               onClick={() => fetchModels(freeOnly)} 
-              disabled={loading || !apiKey}
+              disabled={loading || !hasAvailableKey}
               className="secondary"
             >
               {loading ? 'Loading...' : 'Load Models'}
@@ -292,7 +335,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
             </label>
           </div>
 
-          <div className="form-group">
+          <div className="boost-form-group">
             <label>Boost Model</label>
             <select
               value={boostModel}
@@ -307,12 +350,12 @@ export default function BoostControlModal({ isOpen, onClose }) {
               ))}
             </select>
             {models.length === 0 && (
-              <small>Click "Load Models" to fetch available models</small>
+              <small>Models load automatically when an OpenRouter key is active. Use "Load Models" to refresh.</small>
             )}
           </div>
 
           {boostModel && (
-            <div className="form-group">
+            <div className="boost-form-group">
               <label>Provider</label>
               <select
                 value={selectedProvider}
@@ -339,7 +382,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
           )}
 
           <div className="form-row">
-            <div className="form-group">
+            <div className="boost-form-group">
               <label>Context Window</label>
               <input
                 type="number"
@@ -352,7 +395,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
               />
             </div>
 
-            <div className="form-group">
+            <div className="boost-form-group">
               <label>Max Output Tokens</label>
               <input
                 type="number"
@@ -384,7 +427,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
               <li>Click tasks in the MOTO Workflow panel to toggle boost</li>
               <li>Boosted tasks use your OpenRouter model instead of LM Studio</li>
               <li>If credits run out, system falls back to LM Studio automatically</li>
-              <li>You can continuously select which tasks use the boost</li>
+              <li>You can toggle which tasks use the boost at any time</li>
             </ul>
           </div>
         </div>
@@ -394,7 +437,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
             <>
               <button 
                 onClick={enableBoost} 
-                disabled={loading || !apiKey || !boostModel}
+                disabled={loading || !boostModel}
                 className="primary"
                 title="Update boost model (preserves boost_next_count and categories)"
               >
@@ -411,7 +454,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
           ) : (
             <button 
               onClick={enableBoost} 
-              disabled={loading || !apiKey || !boostModel}
+              disabled={loading || !boostModel}
               className="primary"
             >
               {loading ? 'Enabling...' : 'Enable Boost'}
diff --git a/frontend/src/components/BoostLogs.css b/frontend/src/components/BoostLogs.css
index 7c2593f..720dd46 100644
--- a/frontend/src/components/BoostLogs.css
+++ b/frontend/src/components/BoostLogs.css
@@ -13,7 +13,7 @@
 
 .boost-logs-header h2 {
   margin: 0;
-  color: #ffd700;
+  color: var(--gold, #1eff1c);
   font-size: 1.5rem;
 }
 
@@ -80,26 +80,26 @@
 }
 
 .stat-card {
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 8px;
+  background: var(--surface-3, #22222c);
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
+  border-radius: var(--radius-md, 10px);
   padding: 1rem;
   text-align: center;
 }
 
 .stat-card.success {
-  border-color: #4CAF50;
+  border-color: rgba(76, 175, 80, 0.35);
 }
 
 .stat-card.error {
-  border-color: #dc3545;
+  border-color: rgba(220, 53, 69, 0.35);
 }
 
 .stat-value {
   display: block;
   font-size: 1.75rem;
   font-weight: 700;
-  color: #ffd700;
+  color: var(--gold, #1eff1c);
   margin-bottom: 0.25rem;
 }
 
@@ -142,8 +142,8 @@
 
 /* Logs List */
 .boost-logs-list {
-  border: 1px solid #333;
-  border-radius: 8px;
+  border: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
+  border-radius: var(--radius-md, 10px);
   overflow: hidden;
 }
 
@@ -163,20 +163,20 @@
   font-style: italic;
 }
 
-.log-entry {
-  border-bottom: 1px solid #333;
-  background: #1a1a1a;
+.boost-log-entry {
+  border-bottom: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
+  background: var(--surface-2, #1a1a22);
 }
 
-.log-entry:last-child {
+.boost-log-entry:last-child {
   border-bottom: none;
 }
 
-.log-entry.success {
-  border-left: 3px solid #4CAF50;
+.boost-log-entry.success {
+  border-left: 3px solid var(--accent-green, #4CAF50);
 }
 
-.log-entry.error {
+.boost-log-entry.error {
   border-left: 3px solid #dc3545;
 }
 
@@ -191,7 +191,7 @@
 }
 
 .log-summary:hover {
-  background: #242424;
+  background: var(--surface-3, #22222c);
 }
 
 .log-status {
@@ -204,11 +204,11 @@
   font-weight: 700;
 }
 
-.log-entry.success .log-status {
+.boost-log-entry.success .log-status {
   color: #4CAF50;
 }
 
-.log-entry.error .log-status {
+.boost-log-entry.error .log-status {
   color: #dc3545;
 }
 
@@ -233,10 +233,10 @@
 }
 
 .log-mode-badge {
-  background: #ffd700;
+  background: var(--gold, #1eff1c);
   color: #000;
   padding: 0.15rem 0.4rem;
-  border-radius: 3px;
+  border-radius: var(--radius-sm, 6px);
   font-size: 0.7rem;
   font-weight: 600;
   text-transform: uppercase;
@@ -270,8 +270,8 @@
 /* Log Details (Expanded) */
 .log-details {
   padding: 1rem;
-  background: #0f0f0f;
-  border-top: 1px solid #333;
+  background: var(--surface-0, #0b0b0f);
+  border-top: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
 }
 
 .log-detail-section {
diff --git a/frontend/src/components/BoostLogs.jsx b/frontend/src/components/BoostLogs.jsx
index 08fd336..f0def8e 100644
--- a/frontend/src/components/BoostLogs.jsx
+++ b/frontend/src/components/BoostLogs.jsx
@@ -178,7 +178,7 @@ export default function BoostLogs() {
           logs.map((log, index) => (
             <div 
               key={index} 
-              className={`log-entry ${log.success ? 'success' : 'error'} ${expandedIndex === index ? 'expanded' : ''}`}
+              className={`boost-log-entry ${log.success ? 'success' : 'error'} ${expandedIndex === index ? 'expanded' : ''}`}
             >
               <div 
                 className="log-summary"
diff --git a/frontend/src/components/CreditExhaustionNotificationStack.jsx b/frontend/src/components/CreditExhaustionNotificationStack.jsx
new file mode 100644
index 0000000..8c6f78a
--- /dev/null
+++ b/frontend/src/components/CreditExhaustionNotificationStack.jsx
@@ -0,0 +1,259 @@
+import React from 'react';
+import { openRouterAPI } from '../services/api';
+
+const IconX = ({ className }) => (
+  <svg className={className} width="16" height="16" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
+    <line x1="18" y1="6" x2="6" y2="18"></line>
+    <line x1="6" y1="6" x2="18" y2="18"></line>
+  </svg>
+);
+
+const IconAlert = ({ className, style }) => (
+  <svg className={className} style={style} width="18" height="18" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
+    <path d="M10.29 3.86L1.82 18a2 2 0 0 0 1.71 3h16.94a2 2 0 0 0 1.71-3L13.71 3.86a2 2 0 0 0-3.42 0z"></path>
+    <line x1="12" y1="9" x2="12" y2="13"></line>
+    <line x1="12" y1="17" x2="12.01" y2="17"></line>
+  </svg>
+);
+
+/**
+ * Persistent notification stack for OpenRouter credit exhaustion alerts (fixed, bottom-left).
+ * Red-themed, stays visible until the user explicitly dismisses each notification; renders nothing when empty.
+ * Includes a "Retry OpenRouter" button that resets exhaustion flags so roles resume; on success, onDismissAll runs after 2s.
+ *
+ * Props:
+ * - notifications: Array of { id, role_id, message, reason, timestamp, fallback_model? }
+ * - onDismiss: (id) => void
+ * - onDismissAll: () => void (optional)
+ */
+export default function CreditExhaustionNotificationStack({ notifications, onDismiss, onDismissAll }) {
+  const [resetting, setResetting] = React.useState(false); // true while the reset request is in flight
+  const [resetResult, setResetResult] = React.useState(null); // { success, message } for the banner above the button, or null
+
+  if (!notifications || notifications.length === 0) { // hooks are declared above so they still run on every render
+    return null;
+  }
+
+  const handleRetryOpenRouter = async () => {
+    setResetting(true);
+    setResetResult(null);
+    try {
+      const result = await openRouterAPI.resetCreditExhaustion();
+      setResetResult({ success: true, message: result.message });
+      setTimeout(() => { // leave the success banner up briefly before clearing the stack
+        if (onDismissAll) onDismissAll();
+        setResetResult(null);
+      }, 2000); // NOTE(review): this timer is never cancelled (unmount or repeated clicks)
+    } catch (err) {
+      setResetResult({ success: false, message: err.message || 'Reset failed' });
+    } finally {
+      setResetting(false);
+    }
+  };
+
+  return (
+    <div
+      style={{
+        position: 'fixed',
+        bottom: '20px',
+        left: '20px',
+        zIndex: 999999,
+        display: 'flex',
+        flexDirection: 'column',
+        gap: '8px',
+        pointerEvents: 'none', // container lets clicks pass through; cards and the button wrapper set 'auto'
+      }}
+    >
+      {notifications.map((notification) => (
+        <CreditExhaustionNotification
+          key={notification.id}
+          notification={notification}
+          onDismiss={onDismiss}
+        />
+      ))}
+
+      {/* Retry OpenRouter button, preceded by the result banner of the last reset attempt */}
+      <div style={{ pointerEvents: 'auto' }}>
+        {resetResult && (
+          <div style={{
+            padding: '8px 12px',
+            borderRadius: '8px',
+            fontSize: '11px',
+            fontWeight: '500',
+            textAlign: 'center',
+            backgroundColor: resetResult.success ? 'rgba(76, 175, 80, 0.15)' : 'rgba(244, 67, 54, 0.15)',
+            color: resetResult.success ? '#4CAF50' : '#f44336',
+            border: `1px solid ${resetResult.success ? 'rgba(76, 175, 80, 0.4)' : 'rgba(244, 67, 54, 0.4)'}`,
+          }}>
+            {resetResult.message}
+          </div>
+        )}
+        <button
+          onClick={handleRetryOpenRouter}
+          disabled={resetting}
+          style={{
+            width: '320px',
+            padding: '10px 16px',
+            backgroundColor: resetting ? '#333' : 'rgba(108, 92, 231, 0.9)',
+            border: '1px solid rgba(108, 92, 231, 0.6)',
+            borderRadius: '10px',
+            color: '#fff',
+            fontSize: '13px',
+            fontWeight: '600',
+            cursor: resetting ? 'not-allowed' : 'pointer',
+            opacity: resetting ? 0.6 : 1,
+            transition: 'all 0.2s',
+          }}
+          onMouseEnter={(e) => { if (!resetting) e.currentTarget.style.backgroundColor = 'rgba(108, 92, 231, 1)'; }}
+          onMouseLeave={(e) => { if (!resetting) e.currentTarget.style.backgroundColor = 'rgba(108, 92, 231, 0.9)'; }}
+        >
+          {resetting ? 'Resetting...' : 'Retry OpenRouter (Credits Added)'}
+        </button>
+      </div>
+    </div>
+  );
+}
+
+function CreditExhaustionNotification({ notification, onDismiss }) { // one red alert card in the credit-exhaustion stack
+  const [isHovered, setIsHovered] = React.useState(false); // switches to the brighter gradient/shadow and 1.02 scale
+  const [isExiting, setIsExiting] = React.useState(false); // set on dismiss so the slide-out plays before removal
+
+  const handleDismiss = (e) => {
+    e.stopPropagation();
+    setIsExiting(true);
+    setTimeout(() => {
+      onDismiss(notification.id);
+    }, 300); // matches the 0.3s transition declared on the card
+  };
+
+  const roleLabel = notification.role_id // snake_case id -> Title Case, e.g. "topic_selector" -> "Topic Selector"
+    ? notification.role_id.replace(/_/g, ' ').replace(/\b\w/g, c => c.toUpperCase())
+    : 'Unknown Role';
+
+  const isNoFallback = notification.reason === 'no_fallback_configured'; // selects the "role has stopped" message below
+
+  return (
+    <div
+      onMouseEnter={() => setIsHovered(true)}
+      onMouseLeave={() => setIsHovered(false)}
+      style={{
+        width: '320px',
+        minHeight: '90px',
+        background: `linear-gradient(135deg, ${isHovered ? 'rgba(180, 30, 30, 0.97)' : 'rgba(60, 15, 15, 0.96)'}, ${isHovered ? 'rgba(140, 20, 20, 0.97)' : 'rgba(40, 10, 10, 0.96)'})`,
+        backdropFilter: 'blur(8px)',
+        borderRadius: '12px',
+        padding: '14px',
+        boxShadow: isHovered
+          ? '0 20px 40px -12px rgba(231, 76, 60, 0.6), 0 0 0 1px rgba(231, 76, 60, 0.5)'
+          : '0 10px 30px -12px rgba(0, 0, 0, 0.8), 0 0 0 1px rgba(231, 76, 60, 0.4)',
+        border: `1px solid ${isHovered ? 'rgba(231, 76, 60, 0.7)' : 'rgba(231, 76, 60, 0.5)'}`,
+        transition: 'all 0.3s cubic-bezier(0.4, 0, 0.2, 1)',
+        transform: isExiting
+          ? 'translateX(-360px) scale(0.8)' // slide out to the left while fading
+          : `scale(${isHovered ? 1.02 : 1})`,
+        opacity: isExiting ? 0 : 1,
+        pointerEvents: 'auto', // the parent stack sets 'none'; re-enable interaction for the card
+        animation: isExiting ? 'none' : 'creditSlideIn 0.4s cubic-bezier(0.4, 0, 0.2, 1)', // keyframes come from the inline <style> at the end of this card
+      }}
+    >
+      {/* Header: alert icon, "Credits Exhausted" caption and dismiss button */}
+      <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between', marginBottom: '8px' }}>
+        <div style={{ display: 'flex', alignItems: 'center', gap: '8px' }}>
+          <div
+            style={{
+              padding: '6px',
+              backgroundColor: 'rgba(231, 76, 60, 0.35)',
+              borderRadius: '8px',
+              display: 'flex',
+              alignItems: 'center',
+              justifyContent: 'center',
+            }}
+          >
+            <IconAlert style={{ color: '#ff6b6b' }} />
+          </div>
+          <div>
+            <div style={{ fontSize: '10px', color: '#ff9999', textTransform: 'uppercase', letterSpacing: '0.05em', fontWeight: '600' }}>
+              Credits Exhausted
+            </div>
+            <div style={{ fontSize: '14px', fontWeight: '700', lineHeight: '1.2', color: '#ff6b6b' }}>
+              OpenRouter
+            </div>
+          </div>
+        </div>
+
+        {/* Dismiss button (hover colors are applied directly to the element's inline style) */}
+        <button
+          onClick={handleDismiss}
+          style={{
+            padding: '4px',
+            backgroundColor: 'transparent',
+            border: 'none',
+            borderRadius: '6px',
+            cursor: 'pointer',
+            color: '#ff9999',
+            transition: 'all 0.2s',
+            display: 'flex',
+            alignItems: 'center',
+            justifyContent: 'center',
+          }}
+          onMouseEnter={(e) => {
+            e.currentTarget.style.backgroundColor = 'rgba(255, 100, 100, 0.25)';
+            e.currentTarget.style.color = '#ffffff';
+          }}
+          onMouseLeave={(e) => {
+            e.currentTarget.style.backgroundColor = 'transparent';
+            e.currentTarget.style.color = '#ff9999';
+          }}
+        >
+          <IconX />
+        </button>
+      </div>
+
+      {/* Role info: humanized role_id, or "Unknown Role" when it is missing */}
+      <div
+        style={{
+          fontSize: '12px',
+          fontWeight: '500',
+          color: '#f3f4f6',
+          lineHeight: '1.4',
+          marginBottom: '4px',
+        }}
+      >
+        {roleLabel}
+      </div>
+
+      {/* Message: no-fallback notice, else the fallback model, else notification.message or a default; clamped to 3 lines */}
+      <div
+        style={{
+          fontSize: '11px',
+          color: '#ffbbbb',
+          lineHeight: '1.4',
+          overflow: 'hidden',
+          textOverflow: 'ellipsis',
+          display: '-webkit-box',
+          WebkitLineClamp: 3,
+          WebkitBoxOrient: 'vertical',
+        }}
+      >
+        {isNoFallback
+          ? 'No LM Studio fallback configured. This role has stopped. Configure a fallback model or add credits.'
+          : notification.fallback_model
+            ? `Fell back to LM Studio model: ${notification.fallback_model}`
+            : (notification.message || 'OpenRouter credits have been exhausted for this role.')}
+      </div>
+
+      <style>{`
+        @keyframes creditSlideIn {
+          from {
+            transform: translateX(-360px) scale(0.8);
+            opacity: 0;
+          }
+          to {
+            transform: translateX(0) scale(1);
+            opacity: 1;
+          }
+        }
+      `}</style>
+    </div>
+  );
+}
diff --git a/frontend/src/components/CritiqueNotificationStack.jsx b/frontend/src/components/CritiqueNotificationStack.jsx
index 1237003..01e5f31 100644
--- a/frontend/src/components/CritiqueNotificationStack.jsx
+++ b/frontend/src/components/CritiqueNotificationStack.jsx
@@ -18,9 +18,9 @@ const IconStar = ({ className }) => (
  * Get color classes based on average rating
  */
 function getRatingColor(rating) {
-  if (rating >= 8) return { text: 'text-emerald-400', bg: 'bg-emerald-500', gradient: 'from-emerald-600 to-emerald-500' };
-  if (rating >= 6.25) return { text: 'text-blue-400', bg: 'bg-blue-500', gradient: 'from-blue-600 to-blue-500' };
-  return { text: 'text-gray-400', bg: 'bg-gray-500', gradient: 'from-gray-600 to-gray-500' };
+  if (rating >= 8) return { text: '#34d399', bg: '#10b981' };
+  if (rating >= 6.25) return { text: '#60a5fa', bg: '#3b82f6' };
+  return { text: '#9ca3af', bg: '#6b7280' };
 }
 
 /**
@@ -98,14 +98,14 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
       style={{
         width: '280px',
         minHeight: '80px',
-        background: `linear-gradient(135deg, ${isHovered ? 'rgba(88, 28, 135, 0.95)' : 'rgba(26, 26, 46, 0.95)'}, ${isHovered ? 'rgba(30, 58, 138, 0.95)' : 'rgba(17, 24, 39, 0.95)'})`,
+        background: `linear-gradient(135deg, ${isHovered ? 'rgba(20, 83, 45, 0.95)' : 'rgba(26, 26, 46, 0.95)'}, ${isHovered ? 'rgba(15, 60, 15, 0.95)' : 'rgba(17, 24, 39, 0.95)'})`,
         backdropFilter: 'blur(8px)',
         borderRadius: '12px',
         padding: '12px',
         boxShadow: isHovered 
-          ? '0 20px 40px -12px rgba(147, 51, 234, 0.6), 0 0 0 1px rgba(147, 51, 234, 0.5)'
-          : '0 10px 30px -12px rgba(0, 0, 0, 0.8), 0 0 0 1px rgba(147, 51, 234, 0.3)',
-        border: `1px solid ${isHovered ? 'rgba(147, 51, 234, 0.6)' : 'rgba(147, 51, 234, 0.4)'}`,
+          ? '0 20px 40px -12px rgba(30, 255, 28, 0.5), 0 0 0 1px rgba(30, 255, 28, 0.5)'
+          : '0 10px 30px -12px rgba(0, 0, 0, 0.8), 0 0 0 1px rgba(30, 255, 28, 0.3)',
+        border: `1px solid ${isHovered ? 'rgba(30, 255, 28, 0.6)' : 'rgba(30, 255, 28, 0.4)'}`,
         cursor: 'pointer',
         transition: 'all 0.3s cubic-bezier(0.4, 0, 0.2, 1)',
         transform: isExiting 
@@ -122,20 +122,20 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
           <div
             style={{
               padding: '6px',
-              backgroundColor: 'rgba(147, 51, 234, 0.3)',
+              backgroundColor: 'rgba(30, 255, 28, 0.2)',
               borderRadius: '8px',
               display: 'flex',
               alignItems: 'center',
               justifyContent: 'center',
             }}
           >
-            <IconStar className={`w-4 h-4 ${colors.text}`} />
+            <IconStar style={{ color: colors.text }} />
           </div>
           <div>
             <div style={{ fontSize: '10px', color: '#9ca3af', textTransform: 'uppercase', letterSpacing: '0.05em' }}>
               High Score
             </div>
-            <div className={colors.text} style={{ fontSize: '18px', fontWeight: '700', lineHeight: '1' }}>
+            <div style={{ color: colors.text, fontSize: '18px', fontWeight: '700', lineHeight: '1' }}>
               {notification.average_rating.toFixed(1)}/10
             </div>
           </div>
@@ -165,7 +165,7 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
             e.target.style.color = '#9ca3af';
           }}
         >
-          <IconX className="w-3 h-3" />
+          <IconX />
         </button>
       </div>
 
@@ -191,7 +191,7 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
       <div
         style={{
           fontSize: '10px',
-          color: '#a78bfa',
+          color: '#1eff1c',
           marginTop: '6px',
           opacity: isHovered ? 1 : 0.7,
           transition: 'opacity 0.2s',
diff --git a/frontend/src/components/HungConnectionNotificationStack.jsx b/frontend/src/components/HungConnectionNotificationStack.jsx
new file mode 100644
index 0000000..765f8d8
--- /dev/null
+++ b/frontend/src/components/HungConnectionNotificationStack.jsx
@@ -0,0 +1,188 @@
+import React from 'react';
+
+const IconX = ({ className }) => (
+  <svg className={className} width="16" height="16" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
+    <line x1="18" y1="6" x2="6" y2="18"></line>
+    <line x1="6" y1="6" x2="18" y2="18"></line>
+  </svg>
+);
+
+const IconClock = ({ style }) => (
+  <svg style={style} width="18" height="18" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
+    <circle cx="12" cy="12" r="10"></circle>
+    <polyline points="12 6 12 12 16 14"></polyline>
+  </svg>
+);
+
+/**
+ * Persistent notification stack for hung API connection alerts (fixed, bottom-left); renders nothing when empty.
+ * Amber-themed, stays visible until the user explicitly dismisses each notification.
+ *
+ * Props:
+ * - notifications: Array of { id, role_id, model, provider, elapsed_minutes, message, timestamp } (cards read id, model, provider, elapsed_minutes)
+ * - onDismiss: (id) => void
+ */
+export default function HungConnectionNotificationStack({ notifications, onDismiss }) {
+  if (!notifications || notifications.length === 0) {
+    return null;
+  }
+
+  return (
+    <div
+      style={{
+        position: 'fixed',
+        bottom: '20px',
+        left: '360px', // NOTE(review): presumably offset to sit beside the 320px-wide credit-exhaustion stack at left 20px — confirm
+        zIndex: 999999,
+        display: 'flex',
+        flexDirection: 'column',
+        gap: '8px',
+        pointerEvents: 'none', // container lets clicks pass through; each card sets 'auto'
+      }}
+    >
+      {notifications.map((notification) => (
+        <HungConnectionNotification
+          key={notification.id}
+          notification={notification}
+          onDismiss={onDismiss}
+        />
+      ))}
+    </div>
+  );
+}
+
+function HungConnectionNotification({ notification, onDismiss }) { // one amber alert card in the hung-connection stack
+  const [isHovered, setIsHovered] = React.useState(false); // switches to the brighter gradient/shadow and 1.02 scale
+  const [isExiting, setIsExiting] = React.useState(false); // set on dismiss so the slide-out plays before removal
+
+  const handleDismiss = (e) => {
+    e.stopPropagation();
+    setIsExiting(true);
+    setTimeout(() => {
+      onDismiss(notification.id);
+    }, 300); // matches the 0.3s transition declared on the card
+  };
+
+  const modelLabel = notification.model || 'Unknown Model'; // placeholder when the field is missing or empty
+  const providerLabel = notification.provider || 'Unknown Provider'; // placeholder when the field is missing or empty
+
+  return (
+    <div
+      onMouseEnter={() => setIsHovered(true)}
+      onMouseLeave={() => setIsHovered(false)}
+      style={{
+        width: '320px',
+        minHeight: '90px',
+        background: `linear-gradient(135deg, ${isHovered ? 'rgba(180, 120, 20, 0.97)' : 'rgba(60, 40, 10, 0.96)'}, ${isHovered ? 'rgba(140, 90, 10, 0.97)' : 'rgba(40, 25, 5, 0.96)'})`,
+        backdropFilter: 'blur(8px)',
+        borderRadius: '12px',
+        padding: '14px',
+        boxShadow: isHovered
+          ? '0 20px 40px -12px rgba(255, 165, 0, 0.6), 0 0 0 1px rgba(255, 165, 0, 0.5)'
+          : '0 10px 30px -12px rgba(0, 0, 0, 0.8), 0 0 0 1px rgba(255, 165, 0, 0.4)',
+        border: `1px solid ${isHovered ? 'rgba(255, 165, 0, 0.7)' : 'rgba(255, 165, 0, 0.5)'}`,
+        transition: 'all 0.3s cubic-bezier(0.4, 0, 0.2, 1)',
+        transform: isExiting
+          ? 'translateX(-360px) scale(0.8)' // slide out to the left while fading
+          : `scale(${isHovered ? 1.02 : 1})`,
+        opacity: isExiting ? 0 : 1,
+        pointerEvents: 'auto', // the parent stack sets 'none'; re-enable interaction for the card
+        animation: isExiting ? 'none' : 'hungSlideIn 0.4s cubic-bezier(0.4, 0, 0.2, 1)', // keyframes come from the inline <style> at the end of this card
+      }}
+    >
+      {/* Header: clock icon, caption, elapsed minutes and dismiss button */}
+      <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between', marginBottom: '8px' }}>
+        <div style={{ display: 'flex', alignItems: 'center', gap: '8px' }}>
+          <div
+            style={{
+              padding: '6px',
+              backgroundColor: 'rgba(255, 165, 0, 0.35)',
+              borderRadius: '8px',
+              display: 'flex',
+              alignItems: 'center',
+              justifyContent: 'center',
+            }}
+          >
+            <IconClock style={{ color: '#ffb347' }} />
+          </div>
+          <div>
+            <div style={{ fontSize: '10px', color: '#ffd699', textTransform: 'uppercase', letterSpacing: '0.05em', fontWeight: '600' }}>
+              Possible Hung Connection
+            </div>
+            <div style={{ fontSize: '14px', fontWeight: '700', lineHeight: '1.2', color: '#ffb347' }}>
+              {notification.elapsed_minutes}+ Minutes
+            </div>
+          </div>
+        </div>
+
+        <button
+          onClick={handleDismiss}
+          style={{
+            padding: '4px',
+            backgroundColor: 'transparent',
+            border: 'none',
+            borderRadius: '6px',
+            cursor: 'pointer',
+            color: '#ffd699',
+            transition: 'all 0.2s',
+            display: 'flex',
+            alignItems: 'center',
+            justifyContent: 'center',
+          }}
+          onMouseEnter={(e) => {
+            e.currentTarget.style.backgroundColor = 'rgba(255, 180, 50, 0.25)';
+            e.currentTarget.style.color = '#ffffff';
+          }}
+          onMouseLeave={(e) => {
+            e.currentTarget.style.backgroundColor = 'transparent';
+            e.currentTarget.style.color = '#ffd699';
+          }}
+        >
+          <IconX />
+        </button>
+      </div>
+
+      {/* Model info: "<model> via <provider>", with placeholders for missing fields */}
+      <div
+        style={{
+          fontSize: '12px',
+          fontWeight: '500',
+          color: '#f3f4f6',
+          lineHeight: '1.4',
+          marginBottom: '4px',
+        }}
+      >
+        {modelLabel} via {providerLabel}
+      </div>
+
+      {/* Message: static advice text; notification.message is not rendered here */}
+      <div
+        style={{
+          fontSize: '11px',
+          color: '#ffe0a3',
+          lineHeight: '1.4',
+          overflow: 'hidden',
+          textOverflow: 'ellipsis',
+          display: '-webkit-box',
+          WebkitLineClamp: 3,
+          WebkitBoxOrient: 'vertical',
+        }}
+      >
+        Connection may be hung. Consider stopping and trying a different host/provider.
+      </div>
+
+      <style>{`
+        @keyframes hungSlideIn {
+          from {
+            transform: translateX(-360px) scale(0.8);
+            opacity: 0;
+          }
+          to {
+            transform: translateX(0) scale(1);
+            opacity: 1;
+          }
+        }
+      `}</style>
+    </div>
+  );
+}
diff --git a/frontend/src/components/LatexRenderer.css b/frontend/src/components/LatexRenderer.css
index 025f22a..5b163f2 100644
--- a/frontend/src/components/LatexRenderer.css
+++ b/frontend/src/components/LatexRenderer.css
@@ -10,28 +10,28 @@
   align-items: center;
   justify-content: space-between;
   padding: 0.5rem 1rem;
-  background: #1a1a1a;
-  border-bottom: 1px solid #333;
+  background: var(--surface-2, #1a1a22);
+  border-bottom: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
   flex-shrink: 0;
 }
 
 .latex-toggle-buttons {
   display: flex;
   gap: 0.25rem;
-  background: #0f0f0f;
+  background: var(--surface-0, #0b0b0f);
   padding: 0.25rem;
-  border-radius: 6px;
+  border-radius: var(--radius-sm, 6px);
 }
 
 .latex-toggle-btn {
   padding: 0.5rem 1rem;
   background: transparent;
   border: none;
-  color: #999;
+  color: var(--text-secondary, #999);
   cursor: pointer;
   font-size: 0.85rem;
   font-weight: 500;
-  border-radius: 4px;
+  border-radius: var(--radius-sm, 6px);
   transition: all 0.2s ease;
   display: flex;
   align-items: center;
@@ -39,33 +39,33 @@
 }
 
 .latex-toggle-btn:hover {
-  color: #fff;
-  background: rgba(255, 255, 255, 0.1);
+  color: var(--text-primary, #fff);
+  background: rgba(255, 255, 255, 0.06);
 }
 
 .latex-toggle-btn.active {
-  background: #4CAF50;
+  background: var(--accent-green, #4CAF50);
   color: white;
   font-weight: 600;
 }
 
 .latex-indicator {
   font-size: 0.8rem;
-  color: #4CAF50;
+  color: var(--accent-green, #4CAF50);
   display: flex;
   align-items: center;
   gap: 0.25rem;
 }
 
 .latex-indicator.no-latex {
-  color: #666;
+  color: var(--text-muted, #666);
 }
 
 .latex-content-container {
   flex: 1;
   overflow-y: visible;
   padding: 3rem 4.5rem;
-  background: #0a0a0a;
+  background: var(--surface-1, #131318);
   min-height: 400px;
 }
 
@@ -194,12 +194,12 @@
 }
 
 .latex-theorem {
-  border-color: #ffd700;
-  background: rgba(255, 215, 0, 0.05);
+  border-color: #1eff1c;
+  background: rgba(30, 255, 28, 0.05);
 }
 
 .latex-theorem strong {
-  color: #ffd700;
+  color: #1eff1c;
 }
 
 .latex-lemma {
@@ -326,11 +326,11 @@
 
 .latex-chapter {
   font-size: 2rem !important;
-  border-bottom: 3px solid #ffd700 !important;
+  border-bottom: 3px solid #1eff1c !important;
   padding-bottom: 1rem !important;
   margin-top: 3rem !important;
   margin-bottom: 1.5rem !important;
-  color: #ffd700 !important;
+  color: #1eff1c !important;
 }
 
 .latex-section {
@@ -596,18 +596,18 @@
 }
 
 .latex-content-container::-webkit-scrollbar-track {
-  background: #1a1a1a;
+  background: var(--surface-2, #1a1a22);
   border-radius: 5px;
 }
 
 .latex-content-container::-webkit-scrollbar-thumb {
-  background: #444;
+  background: var(--surface-4, #2a2a36);
   border-radius: 5px;
-  border: 2px solid #1a1a1a;
+  border: 2px solid var(--surface-2, #1a1a22);
 }
 
 .latex-content-container::-webkit-scrollbar-thumb:hover {
-  background: #555;
+  background: var(--border-strong, rgba(255,255,255,0.16));
 }
 
 /* ================================
diff --git a/frontend/src/components/LatexRenderer.jsx b/frontend/src/components/LatexRenderer.jsx
index 43fe6ce..f746ac5 100644
--- a/frontend/src/components/LatexRenderer.jsx
+++ b/frontend/src/components/LatexRenderer.jsx
@@ -1121,14 +1121,14 @@ const LatexRenderer = ({
               }}
               title="Show rendered LaTeX"
             >
-              📐 Rendered {isLargeDoc ? '' : '(Experimental)'}
+              Rendered View
             </button>
             <button
               className={`latex-toggle-btn ${viewMode === 'raw' ? 'active' : ''}`}
               onClick={() => setInternalViewMode('raw')}
               title="Show raw text"
             >
-              Raw Text
+              Raw Text View
             </button>
           </div>
           {viewMode === 'rendered' && chunks.length > 1 && (
diff --git a/frontend/src/components/OpenRouterApiKeyModal.jsx b/frontend/src/components/OpenRouterApiKeyModal.jsx
index dd1414a..87d52a0 100644
--- a/frontend/src/components/OpenRouterApiKeyModal.jsx
+++ b/frontend/src/components/OpenRouterApiKeyModal.jsx
@@ -1,9 +1,10 @@
 import React, { useState, useEffect } from 'react';
 import { openRouterAPI } from '../services/api';
+import './settings-common.css';
 
 /**
  * Modal for configuring the global OpenRouter API key.
- * This key is used for per-role OpenRouter model selection (separate from boost).
+ * This key is used for per-role OpenRouter model selection and can also be reused by boost.
  * 
  * Shows when:
  * 1. User clicks "Use OpenRouter" on any role but no API key is configured
@@ -76,7 +77,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
       
       // Notify parent
       if (onKeySet) {
-        onKeySet(apiKey.trim());
+        await onKeySet(apiKey.trim());
       }
       
       onClose();
@@ -103,38 +104,29 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
 
   const reasonMessages = {
     setup: 'Configure your OpenRouter API key to use OpenRouter models for any role.',
+    startup_setup: 'Save your OpenRouter API key to unlock cloud models. MOTO will apply the recommended default profile immediately, and you can switch to your team profile or another default profile later in Settings.',
     lm_studio_unavailable: 'LM Studio is not available. Configure OpenRouter to continue.',
     no_key: 'An OpenRouter API key is required to use OpenRouter models.',
   };
 
   return (
     <div 
+      className="inline-modal-overlay"
       style={{
-        position: 'fixed',
-        top: 0,
-        left: 0,
-        right: 0,
-        bottom: 0,
-        backgroundColor: 'rgba(0, 0, 0, 0.75)',
-        display: 'flex',
-        alignItems: 'center',
-        justifyContent: 'center',
         zIndex: 10000,
       }}
       onClick={(e) => e.target === e.currentTarget && onClose()}
     >
       <div 
+        className="inline-modal-content"
         style={{
-          backgroundColor: '#1a1a2e',
-          borderRadius: '12px',
-          padding: '2rem',
           width: '500px',
           maxWidth: '90vw',
-          boxShadow: '0 8px 32px rgba(0, 0, 0, 0.4)',
-          border: '1px solid #333',
+          backgroundColor: '#1a1a2e',
+          borderRadius: '12px',
         }}
       >
-        <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center', marginBottom: '1.5rem' }}>
+        <div className="settings-header-row" style={{ marginBottom: '1.5rem' }}>
           <h2 style={{ margin: 0, color: '#fff', fontSize: '1.4rem' }}>
             OpenRouter API Key
           </h2>
@@ -167,18 +159,12 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
             value={apiKey}
             onChange={(e) => setApiKey(e.target.value)}
             placeholder="sk-or-v1-..."
+            className="input-dark"
             style={{
-              width: '100%',
-              padding: '0.75rem',
-              backgroundColor: '#0d0d1a',
-              border: '1px solid #333',
-              borderRadius: '6px',
-              color: '#fff',
               fontSize: '0.95rem',
-              boxSizing: 'border-box',
             }}
           />
-          <small style={{ color: '#666', display: 'block', marginTop: '0.5rem' }}>
+          <small className="hint-text hint-text--dim">
             Get your API key at{' '}
             <a 
               href="https://openrouter.ai/keys" 
@@ -193,14 +179,8 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
 
         {/* Error Message */}
         {error && (
-          <div style={{
-            backgroundColor: 'rgba(244, 67, 54, 0.1)',
-            border: '1px solid #f44336',
-            borderRadius: '6px',
-            padding: '0.75rem',
+          <div className="test-result-banner test-result-banner--error" style={{
             marginBottom: '1rem',
-            color: '#f44336',
-            fontSize: '0.9rem',
           }}>
             {error}
           </div>
@@ -208,14 +188,8 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
 
         {/* Test Result */}
         {testResult && testResult.connected && (
-          <div style={{
-            backgroundColor: 'rgba(76, 175, 80, 0.1)',
-            border: '1px solid #4CAF50',
-            borderRadius: '6px',
-            padding: '0.75rem',
+          <div className="test-result-banner test-result-banner--success" style={{
             marginBottom: '1rem',
-            color: '#4CAF50',
-            fontSize: '0.9rem',
           }}>
             Connection successful! {testResult.model_count} models available.
           </div>
@@ -265,15 +239,10 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
         {apiKey && (
           <button
             onClick={handleClearKey}
+            className="btn-ghost"
             style={{
               width: '100%',
               marginTop: '1rem',
-              padding: '0.5rem',
-              backgroundColor: 'transparent',
-              border: '1px solid #444',
-              borderRadius: '6px',
-              color: '#888',
-              cursor: 'pointer',
               fontSize: '0.85rem',
             }}
           >
@@ -291,7 +260,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
           borderRadius: '6px',
         }}>
           This API key is stored locally and sent to the backend for OpenRouter API calls.
-          It's separate from the Boost API key used for boost mode.
+          API Boost can reuse this key automatically, or you can override it inside the boost modal.
         </p>
       </div>
     </div>
diff --git a/frontend/src/components/OpenRouterPrivacyWarningModal.jsx b/frontend/src/components/OpenRouterPrivacyWarningModal.jsx
index ecd08d1..a610ff0 100644
--- a/frontend/src/components/OpenRouterPrivacyWarningModal.jsx
+++ b/frontend/src/components/OpenRouterPrivacyWarningModal.jsx
@@ -1,4 +1,5 @@
 import React from 'react';
+import './settings-common.css';
 
 /**
  * Modal that displays OpenRouter privacy policy warning.
@@ -21,20 +22,11 @@ function OpenRouterPrivacyWarningModal({ isOpen, onClose, errorData }) {
 
   return (
     <div 
-      className="modal-overlay"
+      className="inline-modal-overlay"
       onClick={handleOverlayClick}
       style={{
-        position: 'fixed',
-        top: 0,
-        left: 0,
-        right: 0,
-        bottom: 0,
-        backgroundColor: 'rgba(0, 0, 0, 0.75)',
-        display: 'flex',
-        alignItems: 'center',
-        justifyContent: 'center',
-        zIndex: 10000,
-        padding: '20px'
+        padding: '20px',
+        zIndex: 10000
       }}
     >
       <div 
@@ -190,37 +182,26 @@ function OpenRouterPrivacyWarningModal({ isOpen, onClose, errorData }) {
         }}>
           <button
             onClick={handleOpenSettings}
+            className="btn-success-sm"
             style={{
               padding: '12px 24px',
-              backgroundColor: '#4caf50',
-              color: 'white',
-              border: 'none',
-              borderRadius: '6px',
               fontSize: '14px',
-              fontWeight: '600',
-              cursor: 'pointer',
-              transition: 'background-color 0.2s'
+              fontWeight: '600'
             }}
-            onMouseEnter={(e) => e.target.style.backgroundColor = '#45a049'}
-            onMouseLeave={(e) => e.target.style.backgroundColor = '#4caf50'}
           >
             Open Privacy Settings
           </button>
           <button
             onClick={onClose}
+            className="btn-ghost"
             style={{
               padding: '12px 24px',
-              backgroundColor: '#555',
-              color: 'white',
-              border: 'none',
-              borderRadius: '6px',
               fontSize: '14px',
               fontWeight: '600',
-              cursor: 'pointer',
-              transition: 'background-color 0.2s'
+              backgroundColor: '#555',
+              color: 'white',
+              border: 'none'
             }}
-            onMouseEnter={(e) => e.target.style.backgroundColor = '#666'}
-            onMouseLeave={(e) => e.target.style.backgroundColor = '#555'}
           >
             OK, I Understand
           </button>
diff --git a/frontend/src/components/PaperCritiqueModal.jsx b/frontend/src/components/PaperCritiqueModal.jsx
index e86a445..fed01df 100644
--- a/frontend/src/components/PaperCritiqueModal.jsx
+++ b/frontend/src/components/PaperCritiqueModal.jsx
@@ -1,5 +1,6 @@
 import React, { useState, useEffect } from 'react';
 import { createPortal } from 'react-dom';
+import './critique-modal.css';
 
 // Simple inline icon components
 const IconX = ({ className }) => (
@@ -39,54 +40,20 @@ const IconAlertCircle = ({ className }) => (
   </svg>
 );
 
-/**
- * Get color class based on rating value (1-10)
- */
 function getRatingColor(rating) {
-  if (rating >= 8) return 'text-emerald-400';
-  if (rating >= 6) return 'text-blue-400';
-  if (rating >= 4) return 'text-yellow-400';
-  if (rating >= 2) return 'text-orange-400';
-  return 'text-red-400';
+  if (rating >= 8) return 'critique-color--emerald';
+  if (rating >= 6) return 'critique-color--blue';
+  if (rating >= 4) return 'critique-color--yellow';
+  if (rating >= 2) return 'critique-color--orange';
+  return 'critique-color--red';
 }
 
 function getRatingBgColor(rating) {
-  if (rating >= 8) return 'bg-emerald-500';
-  if (rating >= 6) return 'bg-blue-500';
-  if (rating >= 4) return 'bg-yellow-500';
-  if (rating >= 2) return 'bg-orange-500';
-  return 'bg-red-500';
-}
-
-/**
- * Rating display component with progress bar
- */
-function RatingDisplay({ label, rating, feedback }) {
-  const percentage = (rating / 10) * 100;
-  
-  return (
-    <div className="bg-gray-800/50 rounded-lg p-4">
-      <div className="flex items-center justify-between mb-2">
-        <span className="text-sm font-medium text-gray-300">{label}</span>
-        <span className={`text-2xl font-bold ${getRatingColor(rating)}`}>
-          {rating > 0 ? rating : '—'}/10
-        </span>
-      </div>
-      
-      {/* Progress bar */}
-      <div className="h-2 bg-gray-700 rounded-full mb-3 overflow-hidden">
-        <div 
-          className={`h-full rounded-full transition-all duration-500 ${getRatingBgColor(rating)}`}
-          style={{ width: `${percentage}%` }}
-        />
-      </div>
-      
-      {/* Feedback text */}
-      {feedback && (
-        <p className="text-sm text-gray-400 leading-relaxed">{feedback}</p>
-      )}
-    </div>
-  );
+  if (rating >= 8) return 'critique-bg--emerald';
+  if (rating >= 6) return 'critique-bg--blue';
+  if (rating >= 4) return 'critique-bg--yellow';
+  if (rating >= 2) return 'critique-bg--orange';
+  return 'critique-bg--red';
 }
 
 /**
@@ -201,20 +168,6 @@ export default function PaperCritiqueModal({
   const modalContent = (
     <div 
       className="critique-modal-overlay"
-      style={{
-        position: 'fixed',
-        top: 0,
-        left: 0,
-        right: 0,
-        bottom: 0,
-        backgroundColor: 'rgba(0, 0, 0, 0.7)',
-        backdropFilter: 'blur(4px)',
-        display: 'flex',
-        alignItems: 'center',
-        justifyContent: 'center',
-        zIndex: 999999, // Very high z-index to ensure visibility
-        padding: '20px',
-      }}
       onClick={(e) => {
         // Close when clicking the backdrop
         if (e.target === e.currentTarget) {
@@ -223,144 +176,64 @@ export default function PaperCritiqueModal({
       }}
     >
       <div 
-        className="critique-modal-content"
-        style={{
-          backgroundColor: '#1a1a2e',
-          borderRadius: '12px',
-          width: '100%',
-          maxWidth: '1200px',
-          height: '85vh',
-          display: 'flex',
-          flexDirection: 'column',
-          boxShadow: '0 25px 50px -12px rgba(0, 0, 0, 0.8), 0 0 0 1px rgba(147, 51, 234, 0.3)',
-          border: '1px solid rgba(147, 51, 234, 0.4)',
-          overflow: 'hidden',
-        }}
+        className="critique-modal-panel"
         onClick={(e) => e.stopPropagation()}
       >
         {/* Header - Compact */}
-        <div style={{
-          display: 'flex',
-          alignItems: 'center',
-          justifyContent: 'space-between',
-          padding: '12px 16px',
-          borderBottom: '1px solid rgba(75, 85, 99, 0.5)',
-          backgroundColor: 'rgba(147, 51, 234, 0.1)',
-        }}>
-          <div style={{ display: 'flex', alignItems: 'center', gap: '10px' }}>
-            <div style={{
-              padding: '6px',
-              backgroundColor: 'rgba(147, 51, 234, 0.2)',
-              borderRadius: '8px',
-            }}>
-              <IconStar className="w-4 h-4 text-purple-400" />
+        <div className="critique-modal-header">
+          <div className="critique-header-left">
+            <div className="critique-header-icon">
+              <IconStar className="critique-icon--green" />
             </div>
             <div>
-              <h2 style={{ 
-                fontSize: '14px', 
-                fontWeight: '600', 
-                color: '#f3f4f6',
-                margin: 0,
-              }}>Validator Critique</h2>
-              <p style={{ 
-                fontSize: '11px', 
-                color: '#9ca3af',
-                margin: 0,
-                maxWidth: '300px',
-                overflow: 'hidden',
-                textOverflow: 'ellipsis',
-                whiteSpace: 'nowrap',
-              }} title={paperTitle}>
+              <h2 className="critique-modal-title">Validator Critique</h2>
+              <p className="critique-modal-subtitle" title={paperTitle}>
                 {paperTitle || 'Paper'}
               </p>
             </div>
           </div>
           <button
             onClick={onClose}
-            style={{
-              color: '#9ca3af',
-              padding: '6px',
-              backgroundColor: 'transparent',
-              border: 'none',
-              borderRadius: '6px',
-              cursor: 'pointer',
-              transition: 'all 0.2s',
-            }}
-            onMouseEnter={(e) => {
-              e.target.style.backgroundColor = 'rgba(75, 85, 99, 0.5)';
-              e.target.style.color = '#f3f4f6';
-            }}
-            onMouseLeave={(e) => {
-              e.target.style.backgroundColor = 'transparent';
-              e.target.style.color = '#9ca3af';
-            }}
+            className="critique-close-btn"
           >
-            <IconX className="w-4 h-4" />
+            <IconX className="critique-icon--close" />
           </button>
         </div>
 
         {/* Content - Scrollable */}
-        <div style={{
-          flex: 1,
-          overflowY: 'auto',
-          padding: '16px',
-          minHeight: '500px',
-        }}>
+        <div className="critique-modal-body">
           {loading ? (
-            <div style={{ 
-              display: 'flex', 
-              alignItems: 'center', 
-              justifyContent: 'center',
-              height: '150px',
-            }}>
-              <div style={{ textAlign: 'center' }}>
-                <div style={{
-                  width: '28px',
-                  height: '28px',
-                  border: '2px solid #a855f7',
-                  borderTopColor: 'transparent',
-                  borderRadius: '50%',
-                  margin: '0 auto 10px',
-                  animation: 'spin 1s linear infinite',
-                }}></div>
-                <p style={{ color: '#9ca3af', fontSize: '13px' }}>Loading critiques...</p>
+            <div className="critique-loading-wrapper">
+              <div className="critique-loading-inner">
+                <div className="critique-spinner"></div>
+                <p className="critique-loading-text">Loading critiques...</p>
               </div>
             </div>
           ) : error ? (
-            <div style={{
-              backgroundColor: 'rgba(127, 29, 29, 0.2)',
-              border: '1px solid rgba(239, 68, 68, 0.3)',
-              borderRadius: '8px',
-              padding: '12px',
-            }}>
-              <div style={{ display: 'flex', alignItems: 'flex-start', gap: '10px' }}>
-                <IconAlertCircle className="w-4 h-4 text-red-400" style={{ flexShrink: 0, marginTop: '2px' }} />
+            <div className="critique-error-box">
+              <div className="critique-error-row">
+                <IconAlertCircle className="critique-icon--red" style={{ flexShrink: 0, marginTop: '2px' }} />
                 <div>
-                  <h4 style={{ color: '#f87171', fontWeight: '500', marginBottom: '4px', fontSize: '13px' }}>Error</h4>
-                  <p style={{ fontSize: '12px', color: 'rgba(252, 165, 165, 0.8)' }}>{error}</p>
+                  <h4 className="critique-error-title">Error</h4>
+                  <p className="critique-error-message">{error}</p>
                 </div>
               </div>
             </div>
           ) : selectedCritique ? (
-            <div style={{ display: 'flex', flexDirection: 'column', gap: '12px', height: '100%' }}>
+            <div className="critique-content-layout">
               {/* Critic Identity - Compact */}
-              <div style={{
-                background: 'linear-gradient(to right, rgba(88, 28, 135, 0.3), rgba(30, 58, 138, 0.3))',
-                borderRadius: '8px',
-                padding: '10px 12px',
-                border: '1px solid rgba(147, 51, 234, 0.2)',
-              }}>
-                <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between' }}>
+              <div className="critique-identity-card">
+                <div className="critique-identity-row">
                   <div>
-                    <p style={{ fontSize: '10px', color: '#9ca3af', textTransform: 'uppercase', letterSpacing: '0.05em', marginBottom: '2px' }}>Critique by</p>
-                    <p style={{ fontSize: '14px', fontWeight: '600', color: '#f3f4f6' }}>{selectedCritique.model_id}</p>
+                    <p className="critique-identity-label">Critique by</p>
+                    <p className="critique-model-name">{selectedCritique.model_id}</p>
                     {selectedCritique.host_provider && (
-                      <p style={{ fontSize: '11px', color: '#c4b5fd' }}>via {selectedCritique.host_provider}</p>
+                      <p className="critique-host-provider">via {selectedCritique.host_provider}</p>
                     )}
                   </div>
-                  <div style={{ textAlign: 'right' }}>
-                    <div style={{ display: 'flex', alignItems: 'center', gap: '4px', color: '#9ca3af', fontSize: '11px' }}>
-                      <IconClock className="w-3 h-3" />
+                  <div className="critique-date-area">
+                    <div className="critique-date-row">
+                      <IconClock className="critique-icon--sm" />
                       {formatDate(selectedCritique.date)}
                     </div>
                   </div>
@@ -368,7 +241,7 @@ export default function PaperCritiqueModal({
               </div>
 
               {/* Ratings - Compact Grid */}
-              <div style={{ display: 'grid', gridTemplateColumns: 'repeat(3, 1fr)', gap: '8px' }}>
+              <div className="critique-ratings-grid">
                 <CompactRating label="Novelty" rating={selectedCritique.novelty_rating} feedback={selectedCritique.novelty_feedback} />
                 <CompactRating label="Correctness" rating={selectedCritique.correctness_rating} feedback={selectedCritique.correctness_feedback} />
                 <CompactRating label="Impact" rating={selectedCritique.impact_rating} feedback={selectedCritique.impact_feedback} />
@@ -376,24 +249,9 @@ export default function PaperCritiqueModal({
 
               {/* Full Critique - Expanded to fill space */}
               {selectedCritique.full_critique && (
-                <div style={{
-                  backgroundColor: 'rgba(31, 41, 55, 0.5)',
-                  borderRadius: '8px',
-                  padding: '10px 12px',
-                  flex: 1,
-                  display: 'flex',
-                  flexDirection: 'column',
-                  minHeight: '200px',
-                }}>
-                  <h3 style={{ fontSize: '11px', fontWeight: '500', color: '#d1d5db', marginBottom: '8px' }}>Full Critique</h3>
-                  <p style={{ 
-                    color: '#d1d5db', 
-                    lineHeight: '1.5', 
-                    whiteSpace: 'pre-wrap',
-                    fontSize: '12px',
-                    flex: 1,
-                    overflowY: 'auto',
-                  }}>
+                <div className="critique-full-box">
+                  <h3 className="critique-section-label">Full Critique</h3>
+                  <p className="critique-full-text">
                     {selectedCritique.full_critique}
                   </p>
                 </div>
@@ -401,45 +259,21 @@ export default function PaperCritiqueModal({
 
               {/* History - Compact */}
               {critiques.length > 1 && (
-                <div style={{
-                  border: '1px solid rgba(75, 85, 99, 0.5)',
-                  borderRadius: '8px',
-                  overflow: 'hidden',
-                }}>
+                <div className="critique-history-container">
                   <button
                     onClick={() => setHistoryOpen(!historyOpen)}
-                    style={{
-                      width: '100%',
-                      display: 'flex',
-                      alignItems: 'center',
-                      justifyContent: 'space-between',
-                      padding: '8px 12px',
-                      backgroundColor: 'rgba(31, 41, 55, 0.3)',
-                      border: 'none',
-                      cursor: 'pointer',
-                      transition: 'background-color 0.2s',
-                    }}
-                    onMouseEnter={(e) => e.target.style.backgroundColor = 'rgba(31, 41, 55, 0.5)'}
-                    onMouseLeave={(e) => e.target.style.backgroundColor = 'rgba(31, 41, 55, 0.3)'}
+                    className="critique-history-toggle"
                   >
-                    <span style={{ fontSize: '12px', fontWeight: '500', color: '#d1d5db' }}>
+                    <span className="critique-history-label">
                       History ({critiques.length})
                     </span>
                     <IconChevronDown 
-                      className="w-3 h-3 text-gray-400"
-                      style={{ 
-                        transition: 'transform 0.2s',
-                        transform: historyOpen ? 'rotate(180deg)' : 'rotate(0deg)',
-                      }}
+                      className={`critique-icon--sm critique-icon--muted critique-history-chevron ${historyOpen ? 'critique-history-chevron--open' : ''}`}
                     />
                   </button>
                   
                   {historyOpen && (
-                    <div style={{ 
-                      borderTop: '1px solid rgba(75, 85, 99, 0.5)',
-                      maxHeight: '120px',
-                      overflowY: 'auto',
-                    }}>
+                    <div className="critique-history-list">
                       {critiques.map((critique, idx) => (
                         <button
                           key={critique.critique_id || idx}
@@ -447,32 +281,13 @@ export default function PaperCritiqueModal({
                             setSelectedCritique(critique);
                             setHistoryOpen(false);
                           }}
-                          style={{
-                            width: '100%',
-                            textAlign: 'left',
-                            padding: '8px 12px',
-                            backgroundColor: selectedCritique?.critique_id === critique.critique_id ? 'rgba(88, 28, 135, 0.2)' : 'transparent',
-                            border: 'none',
-                            borderBottom: idx < critiques.length - 1 ? '1px solid rgba(75, 85, 99, 0.3)' : 'none',
-                            cursor: 'pointer',
-                            transition: 'background-color 0.2s',
-                          }}
-                          onMouseEnter={(e) => {
-                            if (selectedCritique?.critique_id !== critique.critique_id) {
-                              e.target.style.backgroundColor = 'rgba(31, 41, 55, 0.5)';
-                            }
-                          }}
-                          onMouseLeave={(e) => {
-                            if (selectedCritique?.critique_id !== critique.critique_id) {
-                              e.target.style.backgroundColor = 'transparent';
-                            }
-                          }}
+                          className={`critique-history-item ${selectedCritique?.critique_id === critique.critique_id ? 'critique-history-item--selected' : ''}`}
                         >
-                          <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between' }}>
-                            <span style={{ fontSize: '11px', color: '#d1d5db' }}>{critique.model_id}</span>
-                            <span style={{ fontSize: '10px', color: '#6b7280' }}>{formatDate(critique.date)}</span>
+                          <div className="critique-history-item-row">
+                            <span className="critique-history-model">{critique.model_id}</span>
+                            <span className="critique-history-date">{formatDate(critique.date)}</span>
                           </div>
-                          <div style={{ display: 'flex', gap: '8px', marginTop: '2px', fontSize: '10px' }}>
+                          <div className="critique-history-ratings">
                             <span className={getRatingColor(critique.novelty_rating)}>N: {critique.novelty_rating}</span>
                             <span className={getRatingColor(critique.correctness_rating)}>C: {critique.correctness_rating}</span>
                             <span className={getRatingColor(critique.impact_rating)}>I: {critique.impact_rating}</span>
@@ -485,24 +300,12 @@ export default function PaperCritiqueModal({
               )}
             </div>
           ) : (
-            <div style={{ 
-              display: 'flex', 
-              flexDirection: 'column', 
-              alignItems: 'center', 
-              justifyContent: 'center',
-              height: '150px',
-              textAlign: 'center',
-            }}>
-              <div style={{
-                padding: '12px',
-                backgroundColor: 'rgba(31, 41, 55, 0.5)',
-                borderRadius: '50%',
-                marginBottom: '12px',
-              }}>
-                <IconStar className="w-8 h-8 text-gray-600" />
+            <div className="critique-empty-state">
+              <div className="critique-empty-icon">
+                <IconStar className="critique-icon--lg critique-icon--muted" />
               </div>
-              <h3 style={{ fontSize: '14px', fontWeight: '500', color: '#d1d5db', marginBottom: '6px' }}>No Critique Yet</h3>
-              <p style={{ fontSize: '11px', color: '#6b7280', maxWidth: '280px' }}>
+              <h3 className="critique-empty-title">No Critique Yet</h3>
+              <p className="critique-empty-desc">
                 Click "Generate Critique" to have your validator model provide an honest assessment of this paper.
               </p>
             </div>
@@ -510,80 +313,30 @@ export default function PaperCritiqueModal({
         </div>
 
         {/* Footer - Compact */}
-        <div style={{
-          display: 'flex',
-          alignItems: 'center',
-          justifyContent: 'space-between',
-          padding: '10px 16px',
-          borderTop: '1px solid rgba(75, 85, 99, 0.5)',
-          backgroundColor: 'rgba(31, 41, 55, 0.3)',
-        }}>
-          <p style={{ fontSize: '10px', color: '#6b7280' }}>
+        <div className="critique-modal-footer">
+          <p className="critique-footer-note">
             {critiques.length > 0 && 'Up to 10 critiques saved'}
           </p>
-          <div style={{ display: 'flex', alignItems: 'center', gap: '8px' }}>
+          <div className="critique-footer-actions">
             <button
               onClick={onClose}
-              style={{
-                padding: '6px 12px',
-                fontSize: '12px',
-                color: '#d1d5db',
-                backgroundColor: 'transparent',
-                border: 'none',
-                cursor: 'pointer',
-                borderRadius: '6px',
-                transition: 'all 0.2s',
-              }}
-              onMouseEnter={(e) => {
-                e.target.style.backgroundColor = 'rgba(75, 85, 99, 0.3)';
-                e.target.style.color = '#f3f4f6';
-              }}
-              onMouseLeave={(e) => {
-                e.target.style.backgroundColor = 'transparent';
-                e.target.style.color = '#d1d5db';
-              }}
+              className="critique-btn-secondary"
             >
               Close
             </button>
             <button
               onClick={handleGenerateCritique}
               disabled={generating}
-              style={{
-                display: 'flex',
-                alignItems: 'center',
-                gap: '6px',
-                padding: '6px 12px',
-                backgroundColor: generating ? '#6b21a8' : '#9333ea',
-                color: 'white',
-                border: 'none',
-                borderRadius: '6px',
-                fontSize: '12px',
-                fontWeight: '500',
-                cursor: generating ? 'not-allowed' : 'pointer',
-                transition: 'background-color 0.2s',
-              }}
-              onMouseEnter={(e) => {
-                if (!generating) e.target.style.backgroundColor = '#a855f7';
-              }}
-              onMouseLeave={(e) => {
-                if (!generating) e.target.style.backgroundColor = '#9333ea';
-              }}
+              className="critique-btn-primary"
             >
               {generating ? (
                 <>
-                  <div style={{
-                    width: '12px',
-                    height: '12px',
-                    border: '2px solid white',
-                    borderTopColor: 'transparent',
-                    borderRadius: '50%',
-                    animation: 'spin 1s linear infinite',
-                  }}></div>
+                  <div className="critique-spinner--sm"></div>
                   Generating...
                 </>
               ) : (
                 <>
-                  <IconRefresh className="w-3 h-3" />
+                  <IconRefresh className="critique-icon--sm" />
                   {selectedCritique ? 'Regenerate' : 'Generate Critique'}
                 </>
               )}
@@ -591,14 +344,6 @@ export default function PaperCritiqueModal({
           </div>
         </div>
       </div>
-      
-      {/* Keyframes for spinner animation */}
-      <style>{`
-        @keyframes spin {
-          from { transform: rotate(0deg); }
-          to { transform: rotate(360deg); }
-        }
-      `}</style>
     </div>
   );
 
@@ -613,46 +358,25 @@ function CompactRating({ label, rating, feedback }) {
   const percentage = (rating / 10) * 100;
   
   return (
-    <div style={{
-      backgroundColor: 'rgba(31, 41, 55, 0.5)',
-      borderRadius: '8px',
-      padding: '8px 10px',
-    }}>
-      <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between', marginBottom: '4px' }}>
-        <span style={{ fontSize: '10px', fontWeight: '500', color: '#d1d5db' }}>{label}</span>
-        <span className={getRatingColor(rating)} style={{ fontSize: '14px', fontWeight: '700' }}>
+    <div className="critique-compact-card">
+      <div className="critique-compact-header">
+        <span className="critique-compact-label">{label}</span>
+        <span className={`${getRatingColor(rating)} critique-compact-value`}>
           {rating > 0 ? rating : '—'}
         </span>
       </div>
       
       {/* Progress bar */}
-      <div style={{
-        height: '4px',
-        backgroundColor: 'rgba(55, 65, 81, 1)',
-        borderRadius: '9999px',
-        overflow: 'hidden',
-        marginBottom: feedback ? '6px' : '0',
-      }}>
+      <div className="critique-compact-track" style={{ marginBottom: feedback ? '6px' : '0' }}>
         <div 
-          className={getRatingBgColor(rating)}
-          style={{ 
-            height: '100%', 
-            width: `${percentage}%`,
-            borderRadius: '9999px',
-            transition: 'width 0.5s',
-          }}
+          className={`${getRatingBgColor(rating)} critique-compact-fill`}
+          style={{ width: `${percentage}%` }}
         />
       </div>
       
       {/* Feedback text - full display */}
       {feedback && (
-        <p style={{ 
-          fontSize: '11px', 
-          color: '#9ca3af', 
-          lineHeight: '1.5',
-          maxHeight: '250px',
-          overflowY: 'auto',
-        }}>{feedback}</p>
+        <p className="critique-compact-feedback">{feedback}</p>
       )}
     </div>
   );
diff --git a/frontend/src/components/StartupProviderSetupModal.jsx b/frontend/src/components/StartupProviderSetupModal.jsx
new file mode 100644
index 0000000..259c5ec
--- /dev/null
+++ b/frontend/src/components/StartupProviderSetupModal.jsx
@@ -0,0 +1,163 @@
+import React from 'react';
+import './settings-common.css';
+/** Startup modal listing OpenRouter and LM Studio setup steps plus the LM Studio detection status passed in via props; renders nothing when isOpen is false. */
+export default function StartupProviderSetupModal({
+  isOpen,
+  lmStudioAvailable,
+  hasUsableLmStudioChatModel = false,
+  lmStudioModelCount = 0,
+  lmStudioError = '',
+  statusMessage = '',
+  isCheckingLmStudio = false,
+  onChooseOpenRouter,
+  onConfirmLmStudio,
+}) {
+  if (!isOpen) return null;
+  const lmStudioReady = lmStudioAvailable && hasUsableLmStudioChatModel; // server detected AND a usable chat model is loaded
+  return (
+    <div
+      className="inline-modal-overlay"
+      style={{ zIndex: 10000 }}
+      onClick={(e) => e.stopPropagation()}
+    >
+      <div
+        className="inline-modal-content"
+        style={{
+          width: '760px',
+          maxWidth: '92vw',
+          backgroundColor: '#141426',
+          borderRadius: '14px',
+        }}
+      >
+        <div className="settings-header-row" style={{ marginBottom: '1rem' }}>
+          <h2 style={{ margin: 0, color: '#fff', fontSize: '1.45rem' }}>
+            Choose Your Startup Setup
+          </h2>
+        </div>
+
+        <p style={{ color: '#ddd', lineHeight: '1.6', marginBottom: '0.9rem' }}>
+          MOTO needs <strong>an OpenRouter API key or a running LM Studio server</strong> before you start.
+          The best experience is to use both: OpenRouter for cloud models and LM Studio for free, faster local RAG and embeddings.
+        </p>
+
+        <div
+          style={{
+            marginBottom: '1rem',
+            padding: '0.9rem 1rem',
+            borderRadius: '8px',
+            backgroundColor: 'rgba(30, 255, 28, 0.08)',
+            border: '1px solid rgba(30, 255, 28, 0.25)',
+            color: '#d8ffd8',
+            lineHeight: '1.55',
+          }}
+        >
+          <strong>Highly recommended:</strong> install LM Studio even if you plan to use OpenRouter. LM Studio
+          gives MOTO free local embedding/RAG calls and noticeably faster retrieval than OpenRouter embeddings.
+        </div>
+
+        <div style={{ display: 'grid', gap: '1rem', gridTemplateColumns: 'repeat(auto-fit, minmax(280px, 1fr))' }}>
+          <div
+            style={{
+              padding: '1rem',
+              borderRadius: '10px',
+              backgroundColor: '#1c1c33',
+              border: '1px solid #34345c',
+            }}
+          >
+            <h3 style={{ marginTop: 0, color: '#a29bfe' }}>OpenRouter Setup</h3>
+            <ol style={{ margin: '0 0 1rem 1.1rem', padding: 0, color: '#d7d7e8', lineHeight: '1.55' }}>
+              <li>Create or sign in to your account at <a href="https://openrouter.ai/" target="_blank" rel="noopener noreferrer" style={{ color: '#8ab4ff' }}>openrouter.ai</a>.</li>
+              <li>Generate an API key at <a href="https://openrouter.ai/keys" target="_blank" rel="noopener noreferrer" style={{ color: '#8ab4ff' }}>openrouter.ai/keys</a>.</li>
+              <li>Paste that key into MOTO. The recommended default profile will be applied right away.</li>
+            </ol>
+            <button
+              type="button"
+              onClick={onChooseOpenRouter}
+              style={{
+                width: '100%',
+                padding: '0.8rem 1rem',
+                backgroundColor: '#6c5ce7',
+                border: 'none',
+                borderRadius: '8px',
+                color: '#fff',
+                fontSize: '0.95rem',
+                fontWeight: '600',
+                cursor: 'pointer',
+              }}
+            >
+              Enter OpenRouter Key
+            </button>
+          </div>
+
+          <div
+            style={{
+              padding: '1rem',
+              borderRadius: '10px',
+              backgroundColor: '#1c1c33',
+              border: '1px solid #2f5c36',
+            }}
+          >
+            <h3 style={{ marginTop: 0, color: '#7CFC90' }}>LM Studio Setup</h3>
+            <ol style={{ margin: '0 0 1rem 1.1rem', padding: 0, color: '#d7d7e8', lineHeight: '1.55' }}>
+              <li>Install LM Studio from <a href="https://lmstudio.ai/" target="_blank" rel="noopener noreferrer" style={{ color: '#8ab4ff' }}>lmstudio.ai</a>.</li>
+              <li>Enable Developer or Power User mode if needed, then open the server tab.</li>
+              <li>Load the embedding model <code>nomic-ai/nomic-embed-text-v1.5</code>.</li>
+              <li>Optionally load one or more local chat models, then start the local server on <code>http://127.0.0.1:1234</code>.</li>
+            </ol>
+            <button
+              type="button"
+              onClick={onConfirmLmStudio}
+              disabled={isCheckingLmStudio}
+              style={{
+                width: '100%',
+                padding: '0.8rem 1rem',
+                backgroundColor: lmStudioReady ? '#1f7a33' : '#21492a',
+                border: '1px solid #2f8f45',
+                borderRadius: '8px',
+                color: '#fff',
+                fontSize: '0.95rem',
+                fontWeight: '600',
+                cursor: isCheckingLmStudio ? 'not-allowed' : 'pointer',
+                opacity: isCheckingLmStudio ? 0.7 : 1,
+              }}
+            >
+              {isCheckingLmStudio ? 'Checking LM Studio...' : "I'm Running LM Studio"}
+            </button>
+          </div>
+        </div>
+
+        <div
+          style={{
+            marginTop: '1rem',
+            padding: '0.9rem 1rem',
+            borderRadius: '8px',
+            backgroundColor: lmStudioReady ? 'rgba(30, 255, 28, 0.08)' : 'rgba(255, 184, 77, 0.08)', // success colors only when fully ready; both "action needed" messages stay amber
+            border: lmStudioReady ? '1px solid rgba(30, 255, 28, 0.25)' : '1px solid rgba(255, 184, 77, 0.28)',
+            color: lmStudioReady ? '#dbffdd' : '#ffe1ad',
+            lineHeight: '1.5',
+          }}
+        >
+          {lmStudioReady
+            ? `LM Studio is currently detected with ${lmStudioModelCount} loaded model${lmStudioModelCount === 1 ? '' : 's'}, including a usable chat model.`
+            : lmStudioAvailable
+              ? 'LM Studio is running, but you still need at least one loaded chat model in addition to embeddings.'
+              : `LM Studio is not detected yet${lmStudioError ? `: ${lmStudioError}` : '.'}`}
+        </div>
+
+        {statusMessage && (
+          <div
+            className="test-result-banner test-result-banner--error"
+            style={{ marginTop: '1rem' }}
+          >
+            {statusMessage}
+          </div>
+        )}
+
+        <p style={{ color: '#aaa', lineHeight: '1.55', marginTop: '1rem', marginBottom: 0 }}>
+          After setup, open <strong>Autonomous Model Selection &amp; Settings</strong> to pick your saved team
+          profile or switch to any built-in default profile.
+        </p>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/TextFileUploader.css b/frontend/src/components/TextFileUploader.css
index 0d33804..0d19392 100644
--- a/frontend/src/components/TextFileUploader.css
+++ b/frontend/src/components/TextFileUploader.css
@@ -8,15 +8,15 @@
 
 /* Upload Button - Matches button.secondary pattern */
 .text-upload-btn {
-  background: #666;           /* Matches button.secondary from index.css line 345 */
+  background: var(--surface-4, #2a2a36);
   color: white;
-  padding: 0.75rem 1.5rem;    /* Standard button padding from index.css line 324 */
+  padding: 0.75rem 1.5rem;
   border: none;
-  border-radius: 4px;
+  border-radius: var(--radius-sm, 6px);
   cursor: pointer;
   font-size: 0.95rem;
   font-weight: 600;
-  transition: background 0.2s;
+  transition: all var(--transition-fast, 0.15s);
   display: inline-flex;
   align-items: center;
   gap: 0.5rem;
@@ -25,17 +25,17 @@
 }
 
 .text-upload-btn:hover:not(:disabled) {
-  background: #777;           /* Matches button.secondary:hover from index.css line 348 */
+  filter: brightness(1.2);
 }
 
 .text-upload-btn:disabled {
-  background: #555;           /* Matches button:disabled from index.css line 340 */
+  background: var(--surface-3, #22222c);
   cursor: not-allowed;
   opacity: 0.7;
 }
 
 .text-upload-btn:focus {
-  outline: 2px solid #4CAF50;
+  outline: 2px solid var(--accent-green, #4CAF50);
   outline-offset: 2px;
 }
 
diff --git a/frontend/src/components/WorkflowPanel.css b/frontend/src/components/WorkflowPanel.css
index 20047f9..36f885f 100644
--- a/frontend/src/components/WorkflowPanel.css
+++ b/frontend/src/components/WorkflowPanel.css
@@ -4,12 +4,13 @@
   top: 0;
   height: 100vh;
   width: 320px;
-  background: #1a1a1a;
-  border-left: 1px solid #333;
+  background: var(--surface-1);
+  border-left: 1px solid var(--border-subtle);
   display: flex;
   flex-direction: column;
   z-index: 1000;
   transition: width 0.15s ease;
+  box-shadow: -4px 0 20px rgba(0, 0, 0, 0.3);
 }
 
 .workflow-panel.collapsed {
@@ -21,27 +22,27 @@
   justify-content: space-between;
   align-items: center;
   padding: 1rem;
-  border-bottom: 1px solid #333;
-  background: #0f0f0f;
+  border-bottom: 1px solid var(--border-subtle);
+  background: var(--surface-0);
 }
 
 .workflow-header h3 {
   margin: 0;
   font-size: 1.1rem;
-  color: #4CAF50;
+  color: var(--accent-green);
 }
 
 .collapse-btn {
   background: none;
   border: none;
-  color: #888;
+  color: var(--text-muted);
   font-size: 1.2rem;
   cursor: pointer;
   padding: 0.25rem 0.5rem;
 }
 
 .collapse-btn:hover {
-  color: #fff;
+  color: var(--text-primary);
 }
 
 .workflow-panel.collapsed .workflow-header h3 {
@@ -50,14 +51,14 @@
 
 .workflow-mode {
   padding: 0.75rem 1rem;
-  background: #242424;
-  border-bottom: 1px solid #333;
+  background: var(--surface-2);
+  border-bottom: 1px solid var(--border-subtle);
   font-size: 0.9rem;
-  color: #aaa;
+  color: var(--text-secondary);
 }
 
-.mode-badge {
-  color: #4CAF50;
+.wf-mode-badge {
+  color: var(--accent-green);
   font-weight: 600;
   text-transform: capitalize;
 }
@@ -65,8 +66,8 @@
 /* Boost Controls */
 .boost-controls {
   padding: 0.75rem 1rem;
-  background: #1f1f1f;
-  border-bottom: 1px solid #333;
+  background: var(--surface-1);
+  border-bottom: 1px solid var(--border-subtle);
 }
 
 .boost-section {
@@ -80,7 +81,7 @@
 .boost-label {
   display: block;
   font-size: 0.75rem;
-  color: #888;
+  color: var(--text-muted);
   margin-bottom: 0.5rem;
   text-transform: uppercase;
   letter-spacing: 0.5px;
@@ -95,49 +96,49 @@
 .boost-next-input {
   width: 60px;
   padding: 0.4rem 0.5rem;
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 4px;
-  color: #fff;
+  background: var(--surface-3);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-sm);
+  color: var(--text-primary);
   font-size: 0.9rem;
 }
 
 .boost-next-input:focus {
   outline: none;
-  border-color: #ffd700;
+  border-color: var(--gold-dim);
 }
 
 .boost-next-input::placeholder {
-  color: #666;
+  color: var(--text-muted);
 }
 
 .boost-apply-btn {
   padding: 0.4rem 0.75rem;
-  background: #ffd700;
+  background: var(--gold);
   border: none;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   color: #000;
   font-size: 0.8rem;
   font-weight: 600;
   cursor: pointer;
-  transition: background 0.2s;
+  transition: all var(--transition-fast);
 }
 
 .boost-apply-btn:hover:not(:disabled) {
-  background: #ffed4e;
+  background: #7dff6f;
 }
 
 .boost-apply-btn:disabled {
-  background: #555;
-  color: #888;
+  background: var(--surface-4);
+  color: var(--text-muted);
   cursor: not-allowed;
 }
 
 .boost-count-badge {
-  background: #ffd700;
+  background: var(--gold);
   color: #000;
   padding: 0.25rem 0.5rem;
-  border-radius: 10px;
+  border-radius: var(--radius-pill);
   font-size: 0.7rem;
   font-weight: 600;
 }
@@ -150,34 +151,34 @@
 
 .category-btn {
   padding: 0.3rem 0.6rem;
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 4px;
-  color: #aaa;
+  background: var(--surface-3);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-sm);
+  color: var(--text-secondary);
   font-size: 0.75rem;
   cursor: pointer;
-  transition: all 0.2s;
+  transition: all var(--transition-fast);
 }
 
 .category-btn:hover {
-  background: #333;
-  border-color: #555;
-  color: #fff;
+  background: var(--surface-4);
+  border-color: var(--border-strong);
+  color: var(--text-primary);
 }
 
 .category-btn.active {
-  background: linear-gradient(135deg, #ffd700 0%, #ffed4e 100%);
-  border-color: #ffd700;
+  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
+  border-color: var(--gold);
   color: #000;
   font-weight: 600;
 }
 
 .boost-disabled-notice {
   padding: 0.75rem 1rem;
-  background: #1f1f1f;
-  border-bottom: 1px solid #333;
+  background: var(--surface-1);
+  border-bottom: 1px solid var(--border-subtle);
   font-size: 0.8rem;
-  color: #666;
+  color: var(--text-muted);
   text-align: center;
   font-style: italic;
 }
@@ -191,32 +192,32 @@
 .no-tasks {
   text-align: center;
   padding: 2rem 1rem;
-  color: #666;
+  color: var(--text-muted);
   font-style: italic;
 }
 
 .task-card {
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 6px;
+  background: var(--surface-3);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-sm);
   padding: 0.75rem;
   margin-bottom: 0.5rem;
   display: grid;
   grid-template-columns: auto 1fr auto auto;
   gap: 0.75rem;
   align-items: center;
-  transition: all 0.2s ease;
+  transition: all var(--transition-fast);
 }
 
 .task-card:hover:not(.completed) {
-  background: #333;
-  border-color: #555;
+  background: var(--surface-4);
+  border-color: var(--border-default);
   transform: translateX(-2px);
 }
 
 .task-card.boosted {
-  background: linear-gradient(135deg, #ffd700 0%, #ffed4e 100%);
-  border-color: #ffd700;
+  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
+  border-color: var(--gold);
   color: #000;
 }
 
@@ -242,15 +243,15 @@
 }
 
 .task-card.completed {
-  background: #2d5f2d;
-  border-color: #4CAF50;
+  background: rgba(76, 175, 80, 0.1);
+  border-color: rgba(76, 175, 80, 0.3);
   opacity: 0.7;
 }
 
 .task-number {
   font-weight: 700;
   font-size: 0.85rem;
-  color: #888;
+  color: var(--text-muted);
   min-width: 30px;
 }
 
@@ -277,7 +278,7 @@
 
 .task-mode {
   font-size: 0.75rem;
-  color: #aaa;
+  color: var(--text-secondary);
 }
 
 .task-card.boosted .task-mode {
@@ -318,10 +319,10 @@
 .task-provider {
   font-size: 0.7rem;
   font-weight: 600;
-  color: #666;
-  background: #1a1a1a;
+  color: var(--text-muted);
+  background: var(--surface-2);
   padding: 0.25rem 0.5rem;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
 }
 
 .task-card.boosted .task-provider {
@@ -331,8 +332,8 @@
 
 .workflow-legend {
   padding: 0.75rem 1rem;
-  border-top: 1px solid #333;
-  background: #0f0f0f;
+  border-top: 1px solid var(--border-subtle);
+  background: var(--surface-0);
   display: grid;
   grid-template-columns: 1fr 1fr;
   gap: 0.5rem;
@@ -343,22 +344,22 @@
   display: flex;
   align-items: center;
   gap: 0.5rem;
-  color: #aaa;
+  color: var(--text-secondary);
 }
 
 .legend-color {
   width: 16px;
   height: 16px;
-  border-radius: 3px;
-  border: 1px solid #444;
+  border-radius: var(--radius-sm);
+  border: 1px solid var(--border-default);
 }
 
 .legend-color.default {
-  background: #2a2a2a;
+  background: var(--surface-3);
 }
 
 .legend-color.boosted {
-  background: linear-gradient(135deg, #ffd700 0%, #ffed4e 100%);
+  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
 }
 
 .legend-color.active {
@@ -366,7 +367,143 @@
 }
 
 .legend-color.completed {
-  background: #2d5f2d;
+  background: rgba(76, 175, 80, 0.25);
+}
+
+/* Token Stats & Research Timer */
+.token-stats-section {
+  padding: 0.75rem 1rem;
+  background: var(--surface-0);
+  border-bottom: 1px solid var(--border-subtle);
+}
+
+.research-timer {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  margin-bottom: 0.6rem;
+  padding-bottom: 0.6rem;
+  border-bottom: 1px solid var(--border-subtle);
+}
+
+.timer-label {
+  font-size: 0.75rem;
+  color: var(--text-muted);
+  text-transform: uppercase;
+  letter-spacing: 0.5px;
+}
+
+.timer-value {
+  font-family: 'Courier New', Courier, monospace;
+  font-size: 1rem;
+  font-weight: 700;
+  color: var(--accent-green);
+}
+
+.token-totals {
+  display: flex;
+  flex-direction: column;
+  gap: 0.25rem;
+  margin-bottom: 0.5rem;
+}
+
+.token-row {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+}
+
+.token-label {
+  font-size: 0.75rem;
+  color: var(--text-muted);
+}
+
+.token-value {
+  font-family: 'Courier New', Courier, monospace;
+  font-size: 0.85rem;
+  color: var(--text-secondary);
+}
+
+.token-total-row {
+  border-top: 1px solid var(--border-subtle);
+  padding-top: 0.3rem;
+  margin-top: 0.15rem;
+}
+
+.token-total-row .token-label {
+  color: var(--text-secondary);
+  font-weight: 600;
+}
+
+.token-total-row .token-value {
+  color: var(--text-primary);
+  font-weight: 600;
+}
+
+.per-model-section {
+  margin-top: 0.25rem;
+}
+
+.per-model-toggle {
+  background: none;
+  border: none;
+  color: var(--text-muted);
+  font-size: 0.75rem;
+  cursor: pointer;
+  padding: 0.25rem 0;
+  transition: color var(--transition-fast);
+}
+
+.per-model-toggle:hover {
+  color: var(--text-secondary);
+}
+
+.per-model-list {
+  margin-top: 0.4rem;
+  display: flex;
+  flex-direction: column;
+  gap: 0.35rem;
+  max-height: 180px;
+  overflow-y: auto;
+}
+
+.per-model-list::-webkit-scrollbar {
+  width: 4px;
+}
+
+.per-model-list::-webkit-scrollbar-thumb {
+  background: var(--surface-4); /* same token as the .workflow-tasks scrollbar thumb, instead of a hard-coded #444 */
+  border-radius: 2px;
+}
+
+.model-row {
+  background: var(--surface-1);
+  border-radius: var(--radius-sm);
+  padding: 0.4rem 0.5rem;
+}
+
+.model-name {
+  font-size: 0.7rem;
+  color: var(--text-secondary);
+  white-space: nowrap;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  margin-bottom: 0.15rem;
+}
+
+.model-tokens {
+  display: flex;
+  gap: 0.75rem;
+  font-family: 'Courier New', Courier, monospace;
+  font-size: 0.7rem;
+}
+
+.model-in {
+  color: #6aa7e8;
+}
+
+.model-out {
+  color: #e8a86a;
 }
 
 /* Scrollbar styling */
@@ -375,15 +512,15 @@
 }
 
 .workflow-tasks::-webkit-scrollbar-track {
-  background: #1a1a1a;
+  background: var(--surface-1);
 }
 
 .workflow-tasks::-webkit-scrollbar-thumb {
-  background: #444;
+  background: var(--surface-4);
   border-radius: 3px;
 }
 
 .workflow-tasks::-webkit-scrollbar-thumb:hover {
-  background: #555;
+  background: var(--border-strong);
 }
 
diff --git a/frontend/src/components/WorkflowPanel.jsx b/frontend/src/components/WorkflowPanel.jsx
index dfc3640..efe0569 100644
--- a/frontend/src/components/WorkflowPanel.jsx
+++ b/frontend/src/components/WorkflowPanel.jsx
@@ -1,8 +1,17 @@
-import React, { useState, useEffect, useCallback } from 'react';
+import React, { useState, useEffect, useCallback, useRef } from 'react';
 import { websocket } from '../services/websocket';
 import { boostAPI, workflowAPI } from '../services/api';
 import './WorkflowPanel.css';
 
+const formatNumber = (n) => (Number(n) || 0).toLocaleString(); // missing/NaN counts render as 0 instead of throwing during render
+
+const formatTime = (totalSeconds) => { // seconds -> "HHh MMm SSs", each field zero-padded to two digits
+  const n = Number(totalSeconds);
+  const secs = Number.isFinite(n) && n > 0 ? Math.floor(n) : 0; // missing/NaN/negative input renders as zero
+  const pad = (value) => String(value).padStart(2, '0');
+  return `${pad(Math.floor(secs / 3600))}h ${pad(Math.floor((secs % 3600) / 60))}m ${pad(secs % 60)}s`;
+};
+
 export default function WorkflowPanel({ isRunning }) {
   const [tasks, setTasks] = useState([]);
   const [collapsed, setCollapsed] = useState(false);
@@ -15,6 +24,17 @@ export default function WorkflowPanel({ isRunning }) {
   const [availableCategories, setAvailableCategories] = useState([]);
   const [boostEnabled, setBoostEnabled] = useState(false);
 
+  // Token tracking & timer state
+  const [tokenStats, setTokenStats] = useState({ total_input: 0, total_output: 0, by_model: {}, elapsed_seconds: 0 });
+  const [showPerModel, setShowPerModel] = useState(false);
+  const [localElapsed, setLocalElapsed] = useState(0);
+  const lastSyncRef = useRef(Date.now());
+
+  const expandPanel = useCallback(() => {
+    setCollapsed(false);
+    localStorage.setItem('workflow_panel_collapsed', 'false');
+  }, []);
+
   // Fetch boost status and categories when running
   const fetchBoostStatus = useCallback(async () => {
     try {
@@ -45,6 +65,12 @@ export default function WorkflowPanel({ isRunning }) {
     return () => clearInterval(interval);
   }, [fetchBoostStatus]);
 
+  useEffect(() => {
+    if (boostEnabled) {
+      expandPanel();
+    }
+  }, [boostEnabled, expandPanel]);
+
   // Handle setting boost next count
   const handleSetBoostNextCount = async () => {
     const count = parseInt(boostNextInput, 10);
@@ -73,6 +99,41 @@ export default function WorkflowPanel({ isRunning }) {
     }
   };
 
+  // Token stats: initial fetch on mount and when isRunning changes
+  useEffect(() => {
+    const fetchTokenStats = async () => {
+      try {
+        const resp = await workflowAPI.getTokenStats();
+        if (resp.success) {
+          setTokenStats(resp);
+          setLocalElapsed(resp.elapsed_seconds || 0);
+          lastSyncRef.current = Date.now();
+        }
+      } catch { /* ignore */ }
+    };
+    fetchTokenStats();
+  }, [isRunning]);
+
+  // Token stats: listen for real-time WebSocket updates
+  useEffect(() => {
+    const handleTokenUpdate = (data) => {
+      setTokenStats(data);
+      setLocalElapsed(data.elapsed_seconds || 0);
+      lastSyncRef.current = Date.now();
+    };
+    websocket.on('token_usage_updated', handleTokenUpdate);
+    return () => websocket.off('token_usage_updated', handleTokenUpdate);
+  }, []);
+
+  // Local 1-second timer tick for smooth elapsed display
+  useEffect(() => {
+    if (!isRunning) return;
+    const interval = setInterval(() => {
+      setLocalElapsed(prev => prev + 1);
+    }, 1000);
+    return () => clearInterval(interval);
+  }, [isRunning]);
+
   // Poll for workflow predictions when running
   useEffect(() => {
     if (!isRunning) {
@@ -288,6 +349,7 @@ export default function WorkflowPanel({ isRunning }) {
     // NEW: Handle boost enabled/disabled
     const handleBoostEnabled = () => {
       setBoostEnabled(true);
+      expandPanel();
       fetchBoostStatus();
     };
 
@@ -318,7 +380,7 @@ export default function WorkflowPanel({ isRunning }) {
       websocket.off('boost_enabled', handleBoostEnabled);
       websocket.off('boost_disabled', handleBoostDisabled);
     };
-  }, [isRunning, fetchBoostStatus]);
+  }, [isRunning, fetchBoostStatus, expandPanel]);
 
   const handleTaskClick = async (task) => {
     if (task.completed) return; // Can't toggle completed tasks
@@ -379,7 +441,7 @@ export default function WorkflowPanel({ isRunning }) {
       {!collapsed && (
         <>
           <div className="workflow-mode">
-            Mode: <span className="mode-badge">{mode}</span>
+            Mode: <span className="wf-mode-badge">{mode}</span>
           </div>
 
           {/* BOOST CONTROLS - ETERNAL (always visible, even when boost not enabled) */}
@@ -443,6 +505,55 @@ export default function WorkflowPanel({ isRunning }) {
             )}
           </div>
 
+          {/* RESEARCH TIMER & TOKEN STATS */}
+          <div className="token-stats-section">
+            <div className="research-timer">
+              <span className="timer-label">Elapsed</span>
+              <span className="timer-value">{formatTime(localElapsed)}</span>
+            </div>
+
+            <div className="token-totals">
+              <div className="token-row">
+                <span className="token-label">Input</span>
+                <span className="token-value">{formatNumber(tokenStats.total_input)}</span>
+              </div>
+              <div className="token-row">
+                <span className="token-label">Output</span>
+                <span className="token-value">{formatNumber(tokenStats.total_output)}</span>
+              </div>
+              <div className="token-row token-total-row">
+                <span className="token-label">Total</span>
+                <span className="token-value">{formatNumber(tokenStats.total_input + tokenStats.total_output)}</span>
+              </div>
+            </div>
+
+            {Object.keys(tokenStats.by_model || {}).length > 0 && (
+              <div className="per-model-section">
+                <button
+                  className="per-model-toggle"
+                  onClick={() => setShowPerModel(prev => !prev)}
+                >
+                  {showPerModel ? '▾' : '▸'} Per Model ({Object.keys(tokenStats.by_model).length})
+                </button>
+                {showPerModel && (
+                  <div className="per-model-list">
+                    {Object.entries(tokenStats.by_model)
+                      .sort((a, b) => (b[1].input + b[1].output) - (a[1].input + a[1].output))
+                      .map(([modelId, usage]) => (
+                        <div key={modelId} className="model-row">
+                          <div className="model-name" title={modelId}>{modelId}</div>
+                          <div className="model-tokens">
+                            <span className="model-in">In: {formatNumber(usage.input)}</span>
+                            <span className="model-out">Out: {formatNumber(usage.output)}</span>
+                          </div>
+                        </div>
+                      ))}
+                  </div>
+                )}
+              </div>
+            )}
+          </div>
+
           <div className="workflow-tasks">
             {tasks.length === 0 ? (
               <div className="no-tasks">Loading workflow...</div>
diff --git a/frontend/src/components/aggregator/AggregatorInterface.jsx b/frontend/src/components/aggregator/AggregatorInterface.jsx
index 9701ec4..343790d 100644
--- a/frontend/src/components/aggregator/AggregatorInterface.jsx
+++ b/frontend/src/components/aggregator/AggregatorInterface.jsx
@@ -1,8 +1,9 @@
 import React, { useState, useEffect } from 'react';
 import { api } from '../../services/api';
 import TextFileUploader from '../TextFileUploader';
+import '../settings-common.css';
 
-export default function AggregatorInterface({ config, setConfig }) {
+export default function AggregatorInterface({ config, setConfig, anyWorkflowRunning = false }) {
   const [isRunning, setIsRunning] = useState(false);
   const [status, setStatus] = useState(null);
   const [uploadedFiles, setUploadedFiles] = useState([]);
@@ -49,6 +50,11 @@ export default function AggregatorInterface({ config, setConfig }) {
   };
 
   const handleStart = async () => {
+    if (anyWorkflowRunning && !isRunning) {
+      alert('Another workflow is already running. Stop it before starting the Aggregator.');
+      return;
+    }
+
     if (!config.userPrompt.trim()) {
       alert('Please enter a user prompt');
       return;
@@ -97,7 +103,7 @@ export default function AggregatorInterface({ config, setConfig }) {
       setIsRunning(true);
     } catch (error) {
       console.error('Failed to start aggregator:', error);
-      alert('Failed to start aggregator. Check console for details.');
+      alert(`Failed to start aggregator: ${error.details || error.message}`);
     }
   };
 
@@ -159,7 +165,9 @@ export default function AggregatorInterface({ config, setConfig }) {
 
       <div className="button-group">
         {!isRunning ? (
-          <button onClick={handleStart}>Start Aggregator</button>
+          <button onClick={handleStart} disabled={anyWorkflowRunning && !isRunning}>
+            Start Aggregator
+          </button>
         ) : (
           <button onClick={handleStop} className="danger">Stop Aggregator</button>
         )}
@@ -179,7 +187,7 @@ export default function AggregatorInterface({ config, setConfig }) {
           </div>
           <div className="metric-card">
             <div className="metric-label">Rejected</div>
-            <div className="metric-value" style={{ color: '#f44336' }}>
+            <div className="metric-value error-text">
               {status.total_rejections}
             </div>
           </div>
diff --git a/frontend/src/components/aggregator/AggregatorLogs.jsx b/frontend/src/components/aggregator/AggregatorLogs.jsx
index 34746a0..c1eebec 100644
--- a/frontend/src/components/aggregator/AggregatorLogs.jsx
+++ b/frontend/src/components/aggregator/AggregatorLogs.jsx
@@ -1,6 +1,7 @@
 import React, { useState, useEffect } from 'react';
 import { websocket } from '../../services/websocket';
 import { api } from '../../services/api';
+import '../settings-common.css';
 
 export default function AggregatorLogs() {
   const [events, setEvents] = useState([]);
@@ -213,16 +214,16 @@ export default function AggregatorLogs() {
 
           {recoveryStatus && recoveryStatus.in_recovery && (
             <div style={{ 
-              backgroundColor: '#fff3cd', 
-              border: '2px solid #ffc107',
+              backgroundColor: 'rgba(30, 255, 28, 0.1)', 
+              border: '2px solid #1eff1c',
               borderRadius: '8px',
               padding: '1rem',
               margin: '1rem 0'
             }}>
-              <h2 style={{ color: '#856404', margin: '0 0 0.5rem 0' }}>
+              <h2 style={{ color: '#1eff1c', margin: '0 0 0.5rem 0' }}>
                 Model Recovery in Progress
               </h2>
-              <div style={{ color: '#856404' }}>
+              <div style={{ color: '#c6ffc5' }}>
                 <div><strong>Model:</strong> {recoveryStatus.recovering_model}</div>
                 <div><strong>Stage:</strong> {recoveryStatus.recovery_stage}</div>
                 <div style={{ marginTop: '0.5rem', fontSize: '0.9rem' }}>
@@ -246,7 +247,7 @@ export default function AggregatorLogs() {
                   <div key={model} className="metric-card" style={{ 
                     borderColor: count >= recoveryStatus.corruption_threshold ? '#f44336' : '#ff9800'
                   }}>
-                    <div className="metric-label" style={{ fontSize: '0.85rem' }}>{model}</div>
+                    <div className="metric-label label--sm">{model}</div>
                     <div style={{ fontSize: '0.9rem', marginTop: '0.5rem' }}>
                       <div style={{ color: count >= recoveryStatus.corruption_threshold ? '#f44336' : '#ff9800' }}>
                         Failures: {count}/{recoveryStatus.corruption_threshold}
@@ -271,7 +272,7 @@ export default function AggregatorLogs() {
                 <div style={{ fontSize: '0.9rem', marginTop: '0.5rem' }}>
                   <div>Submissions: {submitter.total_submissions}</div>
                   <div style={{ color: '#4CAF50' }}>Acceptances: {submitter.total_acceptances}</div>
-                  <div style={{ color: '#f44336' }}>Consecutive Rejections: {submitter.consecutive_rejections}</div>
+                  <div className="error-text">Consecutive Rejections: {submitter.consecutive_rejections}</div>
                 </div>
               </div>
             ))}
diff --git a/frontend/src/components/aggregator/AggregatorSettings.jsx b/frontend/src/components/aggregator/AggregatorSettings.jsx
index ed5ca1d..a7baffb 100644
--- a/frontend/src/components/aggregator/AggregatorSettings.jsx
+++ b/frontend/src/components/aggregator/AggregatorSettings.jsx
@@ -1,5 +1,6 @@
 import React, { useState, useEffect } from 'react';
 import { api, openRouterAPI } from '../../services/api';
+import '../settings-common.css';
 
 const DEFAULT_SUBMITTER_CONFIG = {
   submitterId: 1,
@@ -294,22 +295,13 @@ export default function AggregatorSettings({ config, setConfig }) {
     return (
       <>
         {/* Provider Toggle */}
-        <div className="form-group" style={{ margin: 0 }}>
-          <label style={{ fontSize: '0.85rem' }}>Provider</label>
-          <div style={{ display: 'flex', gap: '0.5rem' }}>
+        <div className="form-group form-group--compact">
+          <label className="label--sm">Provider</label>
+          <div className="provider-toggle-group">
             <button
               type="button"
               onClick={() => onProviderChange('lm_studio')}
-              style={{
-                flex: 1,
-                padding: '0.5rem',
-                backgroundColor: provider === 'lm_studio' ? '#4CAF50' : '#333',
-                border: 'none',
-                borderRadius: '4px',
-                color: '#fff',
-                cursor: 'pointer',
-                fontSize: '0.8rem'
-              }}
+              className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
             >
               LM Studio
             </button>
@@ -317,16 +309,7 @@ export default function AggregatorSettings({ config, setConfig }) {
               type="button"
               onClick={() => hasOpenRouterKey && onProviderChange('openrouter')}
               disabled={!hasOpenRouterKey}
-              style={{
-                flex: 1,
-                padding: '0.5rem',
-                backgroundColor: provider === 'openrouter' ? '#6c5ce7' : '#333',
-                border: 'none',
-                borderRadius: '4px',
-                color: hasOpenRouterKey ? '#fff' : '#666',
-                cursor: hasOpenRouterKey ? 'pointer' : 'not-allowed',
-                fontSize: '0.8rem'
-              }}
+              className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
               title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
             >
               OpenRouter
@@ -335,12 +318,12 @@ export default function AggregatorSettings({ config, setConfig }) {
         </div>
 
         {/* Model Selection */}
-        <div className="form-group" style={{ margin: 0 }}>
-          <label style={{ fontSize: '0.85rem' }}>{label}</label>
+        <div className="form-group form-group--compact">
+          <label className="label--sm">{label}</label>
           <select
             value={modelId || ''}
             onChange={(e) => onModelChange(e.target.value)}
-            style={{ fontSize: '0.85rem' }}
+            className="select--sm"
           >
             <option value="">Select model...</option>
             {models.map(model => {
@@ -361,12 +344,12 @@ export default function AggregatorSettings({ config, setConfig }) {
 
         {/* OpenRouter Provider Selection (only for OpenRouter) */}
         {provider === 'openrouter' && modelId && (
-          <div className="form-group" style={{ margin: 0 }}>
-            <label style={{ fontSize: '0.85rem' }}>Host Provider (optional)</label>
+          <div className="form-group form-group--compact">
+            <label className="label--sm">Host Provider (optional)</label>
             <select
               value={orProvider || ''}
               onChange={(e) => onOpenrouterProviderChange(e.target.value || null)}
-              style={{ fontSize: '0.85rem' }}
+              className="select--sm"
             >
               <option value="">Auto (let OpenRouter choose)</option>
               {providers.map(p => (
@@ -378,21 +361,21 @@ export default function AggregatorSettings({ config, setConfig }) {
 
         {/* LM Studio Fallback (only for OpenRouter) */}
         {provider === 'openrouter' && (
-          <div className="form-group" style={{ margin: 0 }}>
-            <label style={{ fontSize: '0.85rem', color: '#999' }}>
+          <div className="form-group form-group--compact">
+            <label className="label--sm label--muted">
               LM Studio Fallback (optional)
             </label>
             <select
               value={lmStudioFallbackId || ''}
               onChange={(e) => onFallbackChange(e.target.value || null)}
-              style={{ fontSize: '0.85rem', borderColor: '#444' }}
+              className="select--sm"
             >
               <option value="">No fallback</option>
               {lmStudioModels.map(model => (
                 <option key={model.id} value={model.id}>{model.id}</option>
               ))}
             </select>
-            <small style={{ color: '#666', display: 'block', marginTop: '0.25rem' }}>
+            <small className="hint-text hint-text--dim" style={{ marginTop: '0.25rem' }}>
               Used if OpenRouter credits run out
             </small>
           </div>
@@ -403,10 +386,10 @@ export default function AggregatorSettings({ config, setConfig }) {
 
   return (
     <div>
-      <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center' }}>
+      <div className="settings-header-row">
         <h1>Aggregator Settings</h1>
         {saveMessage && (
-          <div style={{ color: '#4CAF50', fontSize: '0.9rem', fontWeight: '500' }}>
+          <div className="save-message">
             {saveMessage}
           </div>
         )}
@@ -414,14 +397,8 @@ export default function AggregatorSettings({ config, setConfig }) {
 
       {/* OpenRouter Status Banner */}
       {!hasOpenRouterKey && (
-        <div style={{
-          backgroundColor: 'rgba(108, 92, 231, 0.1)',
-          border: '1px solid #6c5ce7',
-          borderRadius: '8px',
-          padding: '1rem',
-          marginBottom: '1.5rem'
-        }}>
-          <p style={{ color: '#a29bfe', margin: 0 }}>
+        <div className="openrouter-banner">
+          <p className="openrouter-banner__text">
             <strong>💡 OpenRouter Available:</strong> Set your OpenRouter API key in the header to enable cloud model selection for any role.
           </p>
         </div>
@@ -430,15 +407,15 @@ export default function AggregatorSettings({ config, setConfig }) {
       {loading ? (
         <div>Loading models...</div>
       ) : lmStudioModels.length === 0 && !hasOpenRouterKey ? (
-        <div style={{ color: '#f44336' }}>
+        <div className="error-text">
           <p>No models found. Make sure LM Studio is running on http://127.0.0.1:1234 or configure OpenRouter.</p>
           <button onClick={fetchModels} className="secondary">Retry</button>
         </div>
       ) : (
         <>
           {/* Number of Submitters Slider */}
-          <div className="form-group" style={{ marginBottom: '2rem', padding: '1rem', background: '#1a2332', borderRadius: '8px' }}>
-            <label style={{ fontSize: '1.1rem', fontWeight: '600' }}>
+          <div className="form-group settings-panel settings-panel--blue">
+            <label className="label--lg">
               Number of Aggregator Submitters: {numSubmitters}
             </label>
             <input
@@ -447,62 +424,46 @@ export default function AggregatorSettings({ config, setConfig }) {
               max="10"
               value={numSubmitters}
               onChange={(e) => handleNumSubmittersChange(e.target.value)}
-              style={{ width: '100%', marginTop: '0.5rem' }}
+              className="range-slider"
             />
-            <div style={{ display: 'flex', justifyContent: 'space-between', fontSize: '0.8rem', color: '#888' }}>
+            <div className="range-labels">
               <span>1</span>
               <span>5</span>
               <span>10</span>
             </div>
-            <small style={{ color: '#999', display: 'block', marginTop: '0.5rem' }}>
+            <small className="hint-text">
               Multiple submitters run in parallel exploring different avenues. Each can use a different model.
             </small>
           </div>
 
           {/* Per-Submitter Configuration Cards */}
-          <div style={{ marginBottom: '2rem' }}>
-            <h3 style={{ marginBottom: '1rem', borderBottom: '1px solid #333', paddingBottom: '0.5rem' }}>
+          <div className="mb-2">
+            <h3 className="section-heading--bordered">
               Submitter Configurations
             </h3>
             
             {submitterConfigs.map((cfg, idx) => (
               <div 
                 key={cfg.submitterId}
-                style={{
-                  background: cfg.submitterId === 1 ? '#1a2838' : '#1a1a24',
-                  border: cfg.provider === 'openrouter' 
-                    ? '2px solid #6c5ce7' 
-                    : (cfg.submitterId === 1 ? '2px solid #4CAF50' : '1px solid #333'),
-                  borderRadius: '8px',
-                  padding: '1rem',
-                  marginBottom: '1rem'
-                }}
+                className={`role-config-card${cfg.provider === 'openrouter' ? ' role-config-card--openrouter role-config-card--highlight' : (cfg.submitterId === 1 ? ' role-config-card--main role-config-card--highlight' : '')}`}
               >
-                <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center', marginBottom: '1rem' }}>
-                  <h4 style={{ margin: 0, color: cfg.provider === 'openrouter' ? '#a29bfe' : (cfg.submitterId === 1 ? '#4CAF50' : '#fff') }}>
+                <div className="card-header-row">
+                  <h4 style={{ margin: 0 }} className={cfg.provider === 'openrouter' ? 'card-title--purple' : (cfg.submitterId === 1 ? 'card-title--green' : '')}>
                     Submitter {cfg.submitterId} 
-                    {cfg.submitterId === 1 && <span style={{ fontWeight: 'normal' }}> (Main Submitter)</span>}
-                    {cfg.provider === 'openrouter' && <span style={{ fontWeight: 'normal', color: '#6c5ce7' }}> [OpenRouter]</span>}
+                    {cfg.submitterId === 1 && <span className="provider-badge-inline"> (Main Submitter)</span>}
+                    {cfg.provider === 'openrouter' && <span className="provider-badge-inline" style={{ color: '#6c5ce7' }}> [OpenRouter]</span>}
                   </h4>
                   {cfg.submitterId === 1 && numSubmitters > 1 && (
                     <button 
                       onClick={() => applyToAll(1)}
-                      style={{ 
-                        fontSize: '0.8rem', 
-                        padding: '0.3rem 0.6rem',
-                        background: '#4CAF50',
-                        border: 'none',
-                        borderRadius: '4px',
-                        cursor: 'pointer',
-                        color: '#fff'
-                      }}
+                      className="btn-apply-all"
                     >
                       Apply to All
                     </button>
                   )}
                 </div>
 
-                <div style={{ display: 'grid', gridTemplateColumns: cfg.provider === 'openrouter' ? '1fr 1fr' : '1fr 1fr 1fr', gap: '1rem' }}>
+                <div className={`config-grid ${cfg.provider === 'openrouter' ? 'config-grid--2col' : 'config-grid--3col'}`}>
                   <ModelSelector
                     provider={cfg.provider}
                     modelId={cfg.modelId}
@@ -514,8 +475,8 @@ export default function AggregatorSettings({ config, setConfig }) {
                     onFallbackChange={(f) => updateSubmitterConfig(cfg.submitterId, 'lmStudioFallbackId', f)}
                   />
 
-                  <div className="form-group" style={{ margin: 0 }}>
-                    <label style={{ fontSize: '0.85rem' }}>Context Window</label>
+                  <div className="form-group form-group--compact">
+                    <label className="label--sm">Context Window</label>
                     <input
                       type="number"
                       value={cfg.contextWindow}
@@ -523,12 +484,12 @@ export default function AggregatorSettings({ config, setConfig }) {
                       min="4096"
                       max="999999"
                       step="1024"
-                      style={{ fontSize: '0.85rem' }}
+                      className="input--sm"
                     />
                   </div>
 
-                  <div className="form-group" style={{ margin: 0 }}>
-                    <label style={{ fontSize: '0.85rem' }}>Max Output Tokens</label>
+                  <div className="form-group form-group--compact">
+                    <label className="label--sm">Max Output Tokens</label>
                     <input
                       type="number"
                       value={cfg.maxOutputTokens}
@@ -536,7 +497,7 @@ export default function AggregatorSettings({ config, setConfig }) {
                       min="1000"
                       max="100000"
                       step="1000"
-                      style={{ fontSize: '0.85rem' }}
+                      className="input--sm"
                     />
                   </div>
                 </div>
@@ -545,22 +506,16 @@ export default function AggregatorSettings({ config, setConfig }) {
           </div>
 
           {/* Validator Configuration (Single) */}
-          <div style={{ 
-            marginBottom: '2rem', 
-            padding: '1rem', 
-            background: validatorProvider === 'openrouter' ? '#1a1a2e' : '#241a1a', 
-            border: validatorProvider === 'openrouter' ? '2px solid #6c5ce7' : '1px solid #663333', 
-            borderRadius: '8px' 
-          }}>
-            <h3 style={{ marginBottom: '1rem', color: validatorProvider === 'openrouter' ? '#a29bfe' : '#ff6b6b' }}>
+          <div className={`role-config-card${validatorProvider === 'openrouter' ? ' role-config-card--openrouter role-config-card--highlight' : ' settings-panel--validator'}`}>
+            <h3 className={validatorProvider === 'openrouter' ? 'card-title--purple' : ''} style={{ marginBottom: '1rem', color: validatorProvider === 'openrouter' ? undefined : '#ff6b6b' }}>
               Validator Configuration (Single)
-              {validatorProvider === 'openrouter' && <span style={{ fontWeight: 'normal', marginLeft: '0.5rem' }}>[OpenRouter]</span>}
+              {validatorProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
             </h3>
-            <small style={{ color: '#999', display: 'block', marginBottom: '1rem' }}>
-              Only one validator is allowed to maintain single Markov chain evolution of the database.
+            <small className="hint-text" style={{ marginBottom: '1rem' }}>
+              Only one validator is allowed to maintain a single Markov chain evolution of the database.
             </small>
 
-            <div style={{ display: 'grid', gridTemplateColumns: validatorProvider === 'openrouter' ? '1fr 1fr' : '1fr', gap: '1rem' }}>
+            <div className={`config-grid ${validatorProvider === 'openrouter' ? 'config-grid--2col' : 'config-grid--1col'}`}>
               <ModelSelector
                 provider={validatorProvider}
                 modelId={config.validatorModel}
@@ -598,7 +553,7 @@ export default function AggregatorSettings({ config, setConfig }) {
                 max="999999"
                 step="1024"
               />
-              <small style={{ color: '#999', display: 'block', marginTop: '0.5rem' }}>
+              <small className="hint-text">
                 {validatorProvider === 'lm_studio' 
                   ? 'Must match the context length you set in LM Studio for this model.'
                   : 'Set based on the OpenRouter model\'s context window.'
@@ -609,10 +564,7 @@ export default function AggregatorSettings({ config, setConfig }) {
             <div className="form-group">
               <label>
                 Validator Max Output Tokens{' '}
-                <span 
-                  title="Default: 25000"
-                  style={{ cursor: 'help', marginLeft: '0.5rem', color: '#888' }}
-                >
+                <span className="help-hint" title="Default: 25000">
                   ℹ️
                 </span>
               </label>
@@ -632,25 +584,24 @@ export default function AggregatorSettings({ config, setConfig }) {
             </div>
           </div>
 
-          <button onClick={fetchModels} className="secondary" style={{ marginRight: '0.5rem' }}>
+          <button onClick={fetchModels} className="secondary mr-05">
             Refresh LM Studio Models
           </button>
           {hasOpenRouterKey && (
             <>
-              <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary" disabled={loadingOpenRouter} style={{ marginRight: '0.5rem' }}>
+              <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary mr-05" disabled={loadingOpenRouter}>
                 {loadingOpenRouter ? 'Loading...' : 'Refresh OpenRouter Models'}
               </button>
-              <label style={{ display: 'inline-flex', alignItems: 'center', marginLeft: '1rem', fontSize: '0.9rem' }}>
+              <label className="settings-checkbox-label" style={{ marginLeft: '1rem' }}>
                 <input
                   type="checkbox"
                   checked={freeOnly}
                   onChange={(e) => setFreeOnly(e.target.checked)}
-                  style={{ marginRight: '0.5rem' }}
                 />
                 Show only free models
               </label>
-              <div style={{ display: 'flex', flexDirection: 'column', gap: '0.4rem', marginTop: '0.5rem' }}>
-                <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
+              <div className="checkbox-group-col">
+                <label className="settings-checkbox-label">
                   <input
                     type="checkbox"
                     checked={freeModelLooping}
@@ -658,15 +609,11 @@ export default function AggregatorSettings({ config, setConfig }) {
                       setFreeModelLooping(e.target.checked);
                       openRouterAPI.setFreeModelSettings(e.target.checked, freeModelAutoSelector).catch(() => {});
                     }}
-                    style={{ marginRight: '0.5rem' }}
                   />
                   Enable Free Model Looping
-                  <span
-                    title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits."
-                    style={{ marginLeft: '0.4rem', cursor: 'help', color: '#888', fontSize: '0.85rem' }}
-                  >(?)</span>
+                  <span className="help-hint" title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.">(?)</span>
                 </label>
-                <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
+                <label className="settings-checkbox-label">
                   <input
                     type="checkbox"
                     checked={freeModelAutoSelector}
@@ -674,13 +621,9 @@ export default function AggregatorSettings({ config, setConfig }) {
                       setFreeModelAutoSelector(e.target.checked);
                       openRouterAPI.setFreeModelSettings(freeModelLooping, e.target.checked).catch(() => {});
                     }}
-                    style={{ marginRight: '0.5rem' }}
                   />
                   Use OpenRouter Free Models Auto-Selector as Backup
-                  <span
-                    title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping."
-                    style={{ marginLeft: '0.4rem', cursor: 'help', color: '#888', fontSize: '0.85rem' }}
-                  >(?)</span>
+                  <span className="help-hint" title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping.">(?)</span>
                 </label>
               </div>
             </>
@@ -689,9 +632,9 @@ export default function AggregatorSettings({ config, setConfig }) {
       )}
 
       {/* Current Configuration Summary */}
-      <div style={{ marginTop: '2rem', padding: '1rem', background: '#1a1a1a', borderRadius: '6px' }}>
+      <div className="settings-panel mt-1">
         <h3>Current Configuration Summary</h3>
-        <pre style={{ color: '#4CAF50', fontSize: '0.85rem', overflow: 'auto' }}>
+        <pre className="config-summary-pre">
           {JSON.stringify({
             numSubmitters: submitterConfigs.length,
             submitterConfigs: submitterConfigs.map(s => ({
diff --git a/frontend/src/components/aggregator/LiveResults.jsx b/frontend/src/components/aggregator/LiveResults.jsx
index 1cf0211..6a970db 100644
--- a/frontend/src/components/aggregator/LiveResults.jsx
+++ b/frontend/src/components/aggregator/LiveResults.jsx
@@ -5,6 +5,7 @@ import React, { useState, useEffect, useRef } from 'react';
 import { api } from '../../services/api';
 import { websocket } from '../../services/websocket';
 import LatexRenderer from '../LatexRenderer';
+import { prependDisclaimer } from '../../utils/disclaimerHelper';
 
 export default function LiveResults() {
   const [results, setResults] = useState('');
@@ -74,7 +75,7 @@ export default function LiveResults() {
       return;
     }
     
-    const blob = new Blob([results], { type: 'text/plain' });
+    const blob = new Blob([prependDisclaimer(results, 'brainstorm')], { type: 'text/plain' });
     const url = URL.createObjectURL(blob);
     const a = document.createElement('a');
     a.href = url;
@@ -118,7 +119,7 @@ export default function LiveResults() {
 
       <div className="results-container" ref={resultsRef}>
         <LatexRenderer
-          content={results}
+          content={prependDisclaimer(results, 'brainstorm')}
           className="results-latex-renderer"
           showToggle={false}
           showLatex={showLatex}
diff --git a/frontend/src/components/autonomous/ArchiveViewerModal.css b/frontend/src/components/autonomous/ArchiveViewerModal.css
new file mode 100644
index 0000000..86ba3c2
--- /dev/null
+++ b/frontend/src/components/autonomous/ArchiveViewerModal.css
@@ -0,0 +1,264 @@
+/* ============================================
+   ArchiveViewerModal — Research lineage viewer
+   ============================================ */
+
+/* Overlay: fixed, full-viewport dimmed backdrop that centers its child */
+.archive-overlay {
+  position: fixed;
+  inset: 0; /* shorthand for top/right/bottom/left: 0 */
+  background: rgba(0, 0, 0, 0.5);
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  z-index: 50;
+}
+
+/* Panel: the modal body; a column flex container for its sections */
+.archive-panel {
+  background: #111827;
+  border-radius: 8px;
+  width: 91.666%; /* 11/12 of the containing block */
+  height: 83.333%; /* 5/6 of the containing block */
+  max-width: 72rem;
+  display: flex;
+  flex-direction: column;
+}
+
+/* Header: row with children pushed to opposite ends, separated from what follows by a bottom border */
+.archive-header {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  padding: 1rem;
+  border-bottom: 1px solid #374151;
+}
+
+.archive-title { /* heading laid out as an inline row so an icon can sit beside the text */
+  font-size: 1.25rem;
+  font-weight: 600;
+  color: #f3f4f6;
+  display: flex;
+  align-items: center;
+  gap: 0.5rem;
+  margin: 0;
+}
+
+.archive-close-btn { /* chrome-less button: no background or border, only a color change on hover */
+  color: #9ca3af;
+  background: transparent;
+  border: none;
+  cursor: pointer;
+  padding: 4px;
+  transition: color 0.2s;
+}
+
+.archive-close-btn:hover {
+  color: #e5e7eb;
+}
+
+/* Tabs: horizontal tab strip; the active tab is marked with a blue underline */
+.archive-tabs {
+  display: flex;
+  border-bottom: 1px solid #374151;
+}
+
+.archive-tab {
+  padding: 0.75rem 1.5rem;
+  font-weight: 500;
+  background: transparent;
+  border: none;
+  border-bottom: 2px solid transparent; /* reserves the underline so activating a tab does not shift layout */
+  cursor: pointer;
+  transition: color 0.2s, border-color 0.2s;
+  color: #9ca3af;
+}
+
+.archive-tab:hover {
+  color: #e5e7eb;
+}
+
+.archive-tab--active { /* modifier: recolors the text and the reserved underline */
+  color: #60a5fa;
+  border-bottom-color: #60a5fa;
+}
+
+.archive-tab-icon {
+  display: inline;
+  width: 16px;
+  height: 16px;
+  margin-right: 0.5rem;
+}
+
+/* Content area: grows to fill the remaining space of its flex parent and scrolls vertically */
+.archive-content {
+  flex: 1;
+  overflow-y: auto;
+  padding: 1rem;
+}
+
+.archive-placeholder { /* centered, muted message block */
+  text-align: center;
+  color: #9ca3af;
+  padding: 2rem 0;
+}
+
+/* List items: vertical stack of clickable cards */
+.archive-list {
+  display: flex;
+  flex-direction: column;
+  gap: 0.75rem;
+}
+
+.archive-card {
+  background: #1f2937;
+  padding: 1rem;
+  border-radius: 8px;
+  cursor: pointer;
+  transition: background-color 0.2s;
+}
+
+.archive-card:hover {
+  background: #283344;
+}
+
+.archive-card-row {
+  display: flex;
+  align-items: flex-start;
+  justify-content: space-between;
+}
+
+.archive-card-body {
+  flex: 1; /* body takes all row width not used by its siblings */
+}
+
+.archive-card-title {
+  font-size: 1.125rem;
+  font-weight: 600;
+  color: #f3f4f6;
+  margin-bottom: 0.5rem;
+}
+
+.archive-card-desc { /* multi-line truncation: the four properties after color work together */
+  font-size: 0.875rem;
+  color: #9ca3af;
+  display: -webkit-box;
+  -webkit-line-clamp: 2; /* show at most two lines */
+  -webkit-box-orient: vertical;
+  overflow: hidden;
+}
+
+.archive-card-meta {
+  margin-top: 0.5rem;
+  font-size: 0.75rem;
+  color: #6b7280;
+}
+
+.archive-card-chevron {
+  width: 20px;
+  height: 20px;
+  color: #6b7280;
+  margin-left: 1rem;
+  flex-shrink: 0; /* keep the icon at full size when the row is tight */
+}
+
+/* Detail view: back link, detail card, and the sections inside it */
+.archive-back-btn { /* button styled as a plain blue text link */
+  color: #60a5fa;
+  background: transparent;
+  border: none;
+  cursor: pointer;
+  display: flex;
+  align-items: center;
+  gap: 0.25rem;
+  margin-bottom: 1rem;
+  padding: 0;
+  font-size: inherit; /* take the parent's font size instead of the button default */
+  transition: color 0.2s;
+}
+
+.archive-back-btn:hover {
+  color: #93c5fd;
+}
+
+.archive-detail {
+  background: #1f2937;
+  padding: 1.5rem;
+  border-radius: 8px;
+}
+
+.archive-detail-divider { /* block closed off by a bottom rule */
+  margin-bottom: 1rem;
+  padding-bottom: 1rem;
+  border-bottom: 1px solid #374151;
+}
+
+.archive-badge-readonly { /* small amber pill: amber text on a 10%-opacity amber fill */
+  font-size: 0.75rem;
+  color: #eab308;
+  background: rgba(234, 179, 8, 0.1);
+  padding: 0.25rem 0.5rem;
+  border-radius: 4px;
+}
+
+.archive-detail-title {
+  font-size: 1.5rem;
+  font-weight: 700;
+  color: #f3f4f6;
+  margin-bottom: 1rem;
+}
+
+.archive-section {
+  margin-bottom: 1.5rem;
+}
+
+.archive-section-heading {
+  font-size: 0.875rem;
+  font-weight: 600;
+  color: #9ca3af;
+  margin-bottom: 0.5rem;
+}
+
+.archive-section-text {
+  color: #d1d5db;
+}
+
+.archive-section-meta {
+  font-size: 0.875rem;
+  color: #9ca3af;
+}
+
+.archive-section-meta div { /* spacing between the stacked child rows */
+  margin-bottom: 0.25rem;
+}
+
+.archive-content-viewer { /* height-capped, independently scrolling box */
+  background: #111827;
+  border-radius: 4px;
+  max-height: 24rem;
+  overflow-y: auto;
+}
+
+.archive-pre-content { /* monospace text block with the same height cap and scrolling */
+  color: #d1d5db;
+  white-space: pre-wrap; /* keep source line breaks but still wrap long lines */
+  font-family: monospace;
+  font-size: 0.875rem;
+  background: #111827;
+  padding: 1rem;
+  border-radius: 4px;
+  max-height: 24rem;
+  overflow-y: auto;
+  margin: 0;
+}
+
+/* Icon sizing: fixed pixel boxes for the SVG icons that receive these class names */
+.archive-icon-header { /* 20px, blue */
+  width: 20px;
+  height: 20px;
+  color: #60a5fa;
+}
+
+.archive-icon-close { /* 24px; sets no color of its own */
+  width: 24px;
+  height: 24px;
+}
diff --git a/frontend/src/components/autonomous/ArchiveViewerModal.jsx b/frontend/src/components/autonomous/ArchiveViewerModal.jsx
index da67b45..e07d440 100644
--- a/frontend/src/components/autonomous/ArchiveViewerModal.jsx
+++ b/frontend/src/components/autonomous/ArchiveViewerModal.jsx
@@ -1,8 +1,8 @@
 import React, { useState, useEffect } from 'react';
 import { api } from '../../services/api';
 import LatexRenderer from '../LatexRenderer';
+import './ArchiveViewerModal.css';
 
-// Simple inline icon components (no external dependency)
 const IconX = ({ className }) => (
   <svg className={className} viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
     <line x1="18" y1="6" x2="6" y2="18"></line>
@@ -30,12 +30,8 @@ const IconChevronRight = ({ className }) => (
   </svg>
 );
 
-/**
- * Modal overlay for viewing archived research lineage (papers + brainstorms).
- * Read-only view that looks similar to live interface but can't be continued.
- */
 export default function ArchiveViewerModal({ answerId, onClose }) {
-  const [activeTab, setActiveTab] = useState('papers'); // 'papers' | 'brainstorms'
+  const [activeTab, setActiveTab] = useState('papers');
   const [papers, setPapers] = useState([]);
   const [brainstorms, setBrainstorms] = useState([]);
   const [selectedPaper, setSelectedPaper] = useState(null);
@@ -49,15 +45,10 @@ export default function ArchiveViewerModal({ answerId, onClose }) {
   const loadArchive = async () => {
     try {
       setLoading(true);
-      
-      // Load papers list
-      const papersRes = await api.get(`/auto-research/final-answer/${answerId}/archive/papers`);
-      setPapers(papersRes.data.papers);
-      
-      // Load brainstorms list
-      const brainstormsRes = await api.get(`/auto-research/final-answer/${answerId}/archive/brainstorms`);
-      setBrainstorms(brainstormsRes.data.brainstorms);
-      
+      const papersRes = await api.get(`/api/auto-research/final-answer/${answerId}/archive/papers`);
+      setPapers(papersRes.papers);
+      const brainstormsRes = await api.get(`/api/auto-research/final-answer/${answerId}/archive/brainstorms`);
+      setBrainstorms(brainstormsRes.brainstorms);
     } catch (error) {
       console.error('Failed to load archive:', error);
     } finally {
@@ -67,8 +58,8 @@ export default function ArchiveViewerModal({ answerId, onClose }) {
 
   const loadPaperDetails = async (paperId) => {
     try {
-      const res = await api.get(`/auto-research/final-answer/${answerId}/archive/papers/${paperId}`);
-      setSelectedPaper(res.data);
+      const res = await api.get(`/api/auto-research/final-answer/${answerId}/archive/papers/${paperId}`);
+      setSelectedPaper(res);
     } catch (error) {
       console.error('Failed to load paper:', error);
     }
@@ -76,66 +67,46 @@ export default function ArchiveViewerModal({ answerId, onClose }) {
 
   const loadBrainstormDetails = async (topicId) => {
     try {
-      const res = await api.get(`/auto-research/final-answer/${answerId}/archive/brainstorms/${topicId}`);
-      setSelectedBrainstorm(res.data);
+      const res = await api.get(`/api/auto-research/final-answer/${answerId}/archive/brainstorms/${topicId}`);
+      setSelectedBrainstorm(res);
     } catch (error) {
       console.error('Failed to load brainstorm:', error);
     }
   };
 
   return (
-    <div className="fixed inset-0 bg-black bg-opacity-50 flex items-center justify-center z-50">
-      <div className="bg-gray-900 rounded-lg w-11/12 h-5/6 max-w-6xl flex flex-col">
-        {/* Header */}
-        <div className="flex items-center justify-between p-4 border-b border-gray-700">
-          <h2 className="text-xl font-semibold text-gray-100 flex items-center gap-2">
-            <IconDatabase className="w-5 h-5 text-blue-400" />
+    <div className="archive-overlay">
+      <div className="archive-panel">
+        <div className="archive-header">
+          <h2 className="archive-title">
+            <IconDatabase className="archive-icon-header" />
             Research Archive (Read-Only)
           </h2>
-          <button
-            onClick={onClose}
-            className="text-gray-400 hover:text-gray-200"
-          >
-            <IconX className="w-6 h-6" />
+          <button onClick={onClose} className="archive-close-btn">
+            <IconX className="archive-icon-close" />
           </button>
         </div>
 
-        {/* Tabs */}
-        <div className="flex border-b border-gray-700">
+        <div className="archive-tabs">
           <button
-            onClick={() => {
-              setActiveTab('papers');
-              setSelectedPaper(null);
-            }}
-            className={`px-6 py-3 font-medium transition-colors ${
-              activeTab === 'papers'
-                ? 'text-blue-400 border-b-2 border-blue-400'
-                : 'text-gray-400 hover:text-gray-200'
-            }`}
+            onClick={() => { setActiveTab('papers'); setSelectedPaper(null); }}
+            className={`archive-tab ${activeTab === 'papers' ? 'archive-tab--active' : ''}`}
           >
-            <IconFileText className="inline w-4 h-4 mr-2" />
+            <IconFileText className="archive-tab-icon" />
             Papers ({papers.length})
           </button>
           <button
-            onClick={() => {
-              setActiveTab('brainstorms');
-              setSelectedBrainstorm(null);
-            }}
-            className={`px-6 py-3 font-medium transition-colors ${
-              activeTab === 'brainstorms'
-                ? 'text-blue-400 border-b-2 border-blue-400'
-                : 'text-gray-400 hover:text-gray-200'
-            }`}
+            onClick={() => { setActiveTab('brainstorms'); setSelectedBrainstorm(null); }}
+            className={`archive-tab ${activeTab === 'brainstorms' ? 'archive-tab--active' : ''}`}
           >
-            <IconDatabase className="inline w-4 h-4 mr-2" />
+            <IconDatabase className="archive-tab-icon" />
             Brainstorms ({brainstorms.length})
           </button>
         </div>
 
-        {/* Content */}
-        <div className="flex-1 overflow-y-auto p-4">
+        <div className="archive-content">
           {loading ? (
-            <div className="text-center text-gray-400 py-8">Loading archive...</div>
+            <div className="archive-placeholder">Loading archive...</div>
           ) : (
             <>
               {activeTab === 'papers' && (
@@ -145,7 +116,6 @@ export default function ArchiveViewerModal({ answerId, onClose }) {
                   <PapersListView papers={papers} onSelectPaper={loadPaperDetails} />
                 )
               )}
-              
               {activeTab === 'brainstorms' && (
                 selectedBrainstorm ? (
                   <BrainstormDetailView brainstorm={selectedBrainstorm} onBack={() => setSelectedBrainstorm(null)} />
@@ -161,29 +131,24 @@ export default function ArchiveViewerModal({ answerId, onClose }) {
   );
 }
 
-// Papers list view
 function PapersListView({ papers, onSelectPaper }) {
   if (papers.length === 0) {
-    return <div className="text-gray-400 text-center py-8">No papers in archive</div>;
+    return <div className="archive-placeholder">No papers in archive</div>;
   }
 
   return (
-    <div className="space-y-3">
+    <div className="archive-list">
       {papers.map((paper) => (
-        <div
-          key={paper.paper_id}
-          onClick={() => onSelectPaper(paper.paper_id)}
-          className="bg-gray-800 p-4 rounded-lg cursor-pointer hover:bg-gray-750 transition-colors"
-        >
-          <div className="flex items-start justify-between">
-            <div className="flex-1">
-              <h3 className="text-lg font-semibold text-gray-100 mb-2">{paper.title}</h3>
-              <p className="text-sm text-gray-400 line-clamp-2">{paper.abstract}</p>
-              <div className="mt-2 text-xs text-gray-500">
-                {paper.word_count} words • Paper ID: {paper.paper_id}
+        <div key={paper.paper_id} onClick={() => onSelectPaper(paper.paper_id)} className="archive-card">
+          <div className="archive-card-row">
+            <div className="archive-card-body">
+              <h3 className="archive-card-title">{paper.title}</h3>
+              <p className="archive-card-desc">{paper.abstract}</p>
+              <div className="archive-card-meta">
+                {paper.word_count} words &bull; Paper ID: {paper.paper_id}
               </div>
             </div>
-            <IconChevronRight className="w-5 h-5 text-gray-500 ml-4 flex-shrink-0" />
+            <IconChevronRight className="archive-card-chevron" />
           </div>
         </div>
       ))}
@@ -191,34 +156,24 @@ function PapersListView({ papers, onSelectPaper }) {
   );
 }
 
-// Paper detail view
 function PaperDetailView({ paper, onBack }) {
   return (
     <div>
-      <button
-        onClick={onBack}
-        className="text-blue-400 hover:text-blue-300 mb-4 flex items-center gap-1"
-      >
-        ← Back to Papers
+      <button onClick={onBack} className="archive-back-btn">
+        &larr; Back to Papers
       </button>
-      
-      <div className="bg-gray-800 p-6 rounded-lg">
-        <div className="mb-4 pb-4 border-b border-gray-700">
-          <span className="text-xs text-yellow-500 bg-yellow-500/10 px-2 py-1 rounded">
-            ARCHIVED - READ ONLY
-          </span>
+      <div className="archive-detail">
+        <div className="archive-detail-divider">
+          <span className="archive-badge-readonly">ARCHIVED - READ ONLY</span>
         </div>
-        
-        <h2 className="text-2xl font-bold text-gray-100 mb-4">{paper.metadata.title}</h2>
-        
-        <div className="mb-6">
-          <h3 className="text-sm font-semibold text-gray-400 mb-2">Abstract</h3>
-          <p className="text-gray-300">{paper.abstract}</p>
+        <h2 className="archive-detail-title">{paper.metadata.title}</h2>
+        <div className="archive-section">
+          <h3 className="archive-section-heading">Abstract</h3>
+          <p className="archive-section-text">{paper.abstract}</p>
         </div>
-        
-        <div className="mb-6">
-          <h3 className="text-sm font-semibold text-gray-400 mb-2">Paper Content</h3>
-          <div className="bg-gray-900 rounded max-h-96 overflow-y-auto">
+        <div className="archive-section">
+          <h3 className="archive-section-heading">Paper Content</h3>
+          <div className="archive-content-viewer">
             <LatexRenderer
               content={
                 paper.outline
@@ -236,31 +191,26 @@ function PaperDetailView({ paper, onBack }) {
   );
 }
 
-// Brainstorms list view
 function BrainstormsListView({ brainstorms, onSelectBrainstorm }) {
   if (brainstorms.length === 0) {
-    return <div className="text-gray-400 text-center py-8">No brainstorms in archive</div>;
+    return <div className="archive-placeholder">No brainstorms in archive</div>;
   }
 
   return (
-    <div className="space-y-3">
+    <div className="archive-list">
       {brainstorms.map((brainstorm) => (
-        <div
-          key={brainstorm.topic_id}
-          onClick={() => onSelectBrainstorm(brainstorm.topic_id)}
-          className="bg-gray-800 p-4 rounded-lg cursor-pointer hover:bg-gray-750 transition-colors"
-        >
-          <div className="flex items-start justify-between">
-            <div className="flex-1">
-              <h3 className="text-lg font-semibold text-gray-100 mb-2">{brainstorm.topic_prompt}</h3>
-              <div className="text-sm text-gray-400">
-                {brainstorm.submission_count} submissions • Status: {brainstorm.status}
+        <div key={brainstorm.topic_id} onClick={() => onSelectBrainstorm(brainstorm.topic_id)} className="archive-card">
+          <div className="archive-card-row">
+            <div className="archive-card-body">
+              <h3 className="archive-card-title">{brainstorm.topic_prompt}</h3>
+              <div className="archive-card-desc">
+                {brainstorm.submission_count} submissions &bull; Status: {brainstorm.status}
               </div>
-              <div className="mt-2 text-xs text-gray-500">
+              <div className="archive-card-meta">
                 Topic ID: {brainstorm.topic_id}
               </div>
             </div>
-            <IconChevronRight className="w-5 h-5 text-gray-500 ml-4 flex-shrink-0" />
+            <IconChevronRight className="archive-card-chevron" />
           </div>
         </div>
       ))}
@@ -268,40 +218,27 @@ function BrainstormsListView({ brainstorms, onSelectBrainstorm }) {
   );
 }
 
-// Brainstorm detail view
 function BrainstormDetailView({ brainstorm, onBack }) {
   return (
     <div>
-      <button
-        onClick={onBack}
-        className="text-blue-400 hover:text-blue-300 mb-4 flex items-center gap-1"
-      >
-        ← Back to Brainstorms
+      <button onClick={onBack} className="archive-back-btn">
+        &larr; Back to Brainstorms
       </button>
-      
-      <div className="bg-gray-800 p-6 rounded-lg">
-        <div className="mb-4 pb-4 border-b border-gray-700">
-          <span className="text-xs text-yellow-500 bg-yellow-500/10 px-2 py-1 rounded">
-            ARCHIVED - READ ONLY
-          </span>
+      <div className="archive-detail">
+        <div className="archive-detail-divider">
+          <span className="archive-badge-readonly">ARCHIVED - READ ONLY</span>
         </div>
-        
-        <h2 className="text-2xl font-bold text-gray-100 mb-4">{brainstorm.metadata.topic_prompt}</h2>
-        
-        <div className="mb-6 text-sm text-gray-400">
+        <h2 className="archive-detail-title">{brainstorm.metadata.topic_prompt}</h2>
+        <div className="archive-section archive-section-meta">
           <div>Status: {brainstorm.metadata.status}</div>
           <div>Submissions: {brainstorm.metadata.submission_count}</div>
           <div>Topic ID: {brainstorm.topic_id}</div>
         </div>
-        
         <div>
-          <h3 className="text-sm font-semibold text-gray-400 mb-2">Brainstorm Database</h3>
-          <pre className="text-gray-300 whitespace-pre-wrap font-mono text-sm bg-gray-900 p-4 rounded max-h-96 overflow-y-auto">
-            {brainstorm.content}
-          </pre>
+          <h3 className="archive-section-heading">Brainstorm Database</h3>
+          <pre className="archive-pre-content">{brainstorm.content}</pre>
         </div>
       </div>
     </div>
   );
 }
-
diff --git a/frontend/src/components/autonomous/AutonomousResearch.css b/frontend/src/components/autonomous/AutonomousResearch.css
index 8c95059..ebbf347 100644
--- a/frontend/src/components/autonomous/AutonomousResearch.css
+++ b/frontend/src/components/autonomous/AutonomousResearch.css
@@ -7,7 +7,7 @@
 .api-logs-section {
   margin-top: 2rem;
   padding-top: 2rem;
-  border-top: 2px solid #333;
+  border-top: 1px solid var(--border-default);
 }
 
 .api-logs-header {
@@ -19,7 +19,7 @@
 
 .api-logs-header h3 {
   margin: 0;
-  color: #4CAF50;
+  color: var(--accent-green);
   font-size: 1.3rem;
 }
 
@@ -45,30 +45,30 @@
 }
 
 .phase-stats-label {
-  color: #888;
+  color: var(--text-secondary);
   font-size: 0.85rem;
 }
 
 .phase-stat-badge {
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 4px;
+  background: var(--surface-3);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-sm);
   padding: 0.25rem 0.5rem;
   font-size: 0.8rem;
-  color: #4CAF50;
+  color: var(--accent-green);
 }
 
 .api-logs-list {
-  border: 1px solid #333;
-  border-radius: 8px;
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   overflow: hidden;
   max-height: 600px;
   overflow-y: auto;
 }
 
 .api-log-entry {
-  border-bottom: 1px solid #333;
-  background: #1a1a1a;
+  border-bottom: 1px solid var(--border-subtle);
+  background: var(--surface-2);
 }
 
 .api-log-entry:last-child {
@@ -76,7 +76,7 @@
 }
 
 .api-log-entry.success {
-  border-left: 3px solid #4CAF50;
+  border-left: 3px solid var(--accent-green);
 }
 
 .api-log-entry.error {
@@ -87,40 +87,40 @@
   background: #2563eb;
   color: #fff;
   padding: 0.15rem 0.4rem;
-  border-radius: 3px;
+  border-radius: var(--radius-sm);
   font-size: 0.7rem;
   font-weight: 600;
   text-transform: uppercase;
 }
 
 .log-provider-badge {
-  background: #666;
-  color: #fff;
+  background: var(--surface-4);
+  color: var(--text-primary);
   padding: 0.15rem 0.4rem;
-  border-radius: 3px;
+  border-radius: var(--radius-sm);
   font-size: 0.7rem;
   font-weight: 600;
 }
 
 .log-tokens {
-  color: #ffd700;
+  color: var(--gold);
 }
 
 .copy-btn {
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 4px;
+  background: var(--surface-3);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-sm);
   padding: 0.3rem 0.6rem;
-  color: #888;
+  color: var(--text-secondary);
   font-size: 0.8rem;
   cursor: pointer;
-  transition: all 0.2s;
+  transition: all var(--transition-fast);
 }
 
 .copy-btn:hover {
-  background: #333;
-  border-color: #555;
-  color: #fff;
+  background: var(--surface-4);
+  border-color: var(--border-strong);
+  color: var(--text-primary);
 }
 
 /* ============================================================
@@ -296,8 +296,8 @@
 }
 
 .status-tier3 {
-  background: linear-gradient(135deg, rgba(241, 196, 15, 0.3), rgba(230, 126, 34, 0.3));
-  color: #f1c40f;
+  background: linear-gradient(135deg, rgba(30, 255, 28, 0.22), rgba(24, 204, 23, 0.24));
+  color: #1eff1c;
   animation: tier3-status-pulse 2s infinite;
 }
 
@@ -369,9 +369,9 @@
 }
 
 .brainstorm-stats .submission-count.queue {
-  background: rgba(241, 196, 15, 0.15);
-  color: #f1c40f;
-  border: 1px solid rgba(241, 196, 15, 0.3);
+  background: rgba(30, 255, 28, 0.15);
+  color: #7dff6f;
+  border: 1px solid rgba(30, 255, 28, 0.3);
 }
 
 /* Statistics */
@@ -487,10 +487,10 @@
 }
 
 .activity-tier3-complete {
-  background: linear-gradient(135deg, rgba(46, 204, 113, 0.2), rgba(241, 196, 15, 0.2));
-  color: #f1c40f;
+  background: linear-gradient(135deg, rgba(46, 204, 113, 0.2), rgba(30, 255, 28, 0.2));
+  color: #1eff1c;
   font-weight: 600;
-  border: 1px solid rgba(241, 196, 15, 0.3);
+  border: 1px solid rgba(30, 255, 28, 0.3);
 }
 
 /* Brainstorm List */
@@ -558,8 +558,8 @@
 }
 
 .brainstorm-status.in-progress {
-  background: rgba(241, 196, 15, 0.2);
-  color: #f1c40f;
+  background: rgba(30, 255, 28, 0.2);
+  color: #7dff6f;
 }
 
 .brainstorm-card-prompt {
@@ -863,7 +863,9 @@
   font-weight: 600;
   display: flex;
   align-items: center;
+  justify-content: center;
   gap: 0.5rem;
+  text-align: center;
 }
 
 .models-list {
@@ -873,6 +875,27 @@
   padding: 0 0.75rem;
 }
 
+.models-podium { /* Green-tinted, bordered container that stacks its children in a column with a 0.5rem gap. */
+  background: linear-gradient(180deg, rgba(30, 255, 28, 0.06) 0%, rgba(24, 204, 23, 0.04) 100%);
+  border: 1px solid rgba(30, 255, 28, 0.15);
+  border-radius: 8px;
+  padding: 0.6rem 0.5rem 0.5rem;
+  margin-bottom: 0.6rem;
+  display: flex;
+  flex-direction: column;
+  gap: 0.5rem;
+}
+
+.models-podium-label { /* Small, centered, uppercase caption with wide letter spacing, in translucent green. */
+  text-align: center;
+  font-size: 0.65rem;
+  font-weight: 700;
+  text-transform: uppercase;
+  letter-spacing: 1.5px;
+  color: rgba(30, 255, 28, 0.55);
+  margin-bottom: 0.1rem;
+}
+
 .model-item {
   background: var(--bg-secondary, #252525);
   border: 1px solid rgba(52, 152, 219, 0.2);
@@ -1095,11 +1118,11 @@
 }
 
 .settings-notice {
-  background: rgba(241, 196, 15, 0.1);
-  border: 1px solid rgba(241, 196, 15, 0.3);
+  background: rgba(30, 255, 28, 0.1);
+  border: 1px solid rgba(30, 255, 28, 0.3);
   border-radius: 6px;
   padding: 0.75rem 1rem;
-  color: #f1c40f;
+  color: #1eff1c;
   font-size: 0.9rem;
   text-align: center;
 }
@@ -1324,7 +1347,7 @@
   overflow-y: auto;
 }
 
-.log-entry {
+.auto-log-entry {
   display: flex;
   gap: 0.75rem;
   padding: 0.5rem 0.75rem;
@@ -1334,21 +1357,21 @@
   border-radius: 2px;
 }
 
-.log-entry:last-child {
+.auto-log-entry:last-child {
   border-bottom: none;
 }
 
-.log-entry.log-success {
+.auto-log-entry.log-success {
   border-left-color: #2ecc71;
   background: rgba(46, 204, 113, 0.08);
 }
 
-.log-entry.log-reject {
+.auto-log-entry.log-reject {
   border-left-color: #e74c3c;
   background: rgba(231, 76, 60, 0.08);
 }
 
-.log-entry.log-info {
+.auto-log-entry.log-info {
   border-left-color: #3498db;
   background: rgba(52, 152, 219, 0.08);
 }
@@ -1368,11 +1391,11 @@
   font-family: 'Fira Code', monospace;
 }
 
-.log-entry.log-success .log-event {
+.auto-log-entry.log-success .log-event {
   color: #2ecc71;
 }
 
-.log-entry.log-reject .log-event {
+.auto-log-entry.log-reject .log-event {
   color: #e74c3c;
 }
 
@@ -1484,7 +1507,7 @@
   font-style: italic;
 }
 
-.empty-state {
+.auto-empty-state {
   text-align: center;
   padding: 2rem;
   color: var(--text-secondary, #888);
@@ -1670,8 +1693,8 @@
 .manual-controls {
   margin-top: 15px;
   padding: 15px;
-  background: rgba(156, 39, 176, 0.1);
-  border: 1px solid rgba(156, 39, 176, 0.3);
+  background: rgba(231, 76, 60, 0.1);
+  border: 1px solid rgba(231, 76, 60, 0.3);
   border-radius: 8px;
   display: flex;
   flex-direction: column;
@@ -1680,7 +1703,7 @@
 
 .btn-force-paper {
   padding: 10px 20px;
-  background: linear-gradient(135deg, #9c27b0 0%, #673ab7 100%);
+  background: linear-gradient(135deg, #e74c3c 0%, #c0392b 100%);
   color: white;
   border: none;
   border-radius: 6px;
@@ -1691,7 +1714,7 @@
 
 .btn-force-paper:hover:not(:disabled) {
   transform: translateY(-2px);
-  box-shadow: 0 4px 12px rgba(156, 39, 176, 0.4);
+  box-shadow: 0 4px 12px rgba(231, 76, 60, 0.4);
 }
 
 .btn-force-paper:disabled {
@@ -2341,7 +2364,7 @@
   display: flex;
   align-items: center;
   justify-content: center;
-  z-index: 1000;
+  z-index: 2000;
   backdrop-filter: blur(4px);
 }
 
diff --git a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
index 721690f..5478c1d 100644
--- a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
@@ -10,6 +10,7 @@ import TextFileUploader from '../TextFileUploader';
 
 const AutonomousResearchInterface = ({
   isRunning,
+  anyWorkflowRunning,
   status,
   activity,
   onStart,
@@ -31,6 +32,8 @@ const AutonomousResearchInterface = ({
   const [critiquePhaseActive, setCritiquePhaseActive] = useState(false);
   const [isSkipping, setIsSkipping] = useState(false);
   const [skipQueued, setSkipQueued] = useState(false);  // Skip has been queued pre-emptively
+  const [explorationProgress, setExplorationProgress] = useState(null);  // Topic exploration phase tracking
+  const [titleExplorationProgress, setTitleExplorationProgress] = useState(null);  // Paper title exploration tracking
   const activityEndRef = useRef(null);
 
   // Save research prompt to localStorage
@@ -54,14 +57,29 @@ const AutonomousResearchInterface = ({
       setCritiquePhaseActive(true);
     } else if (lastEvent.event === 'critique_phase_ended') {
       setCritiquePhaseActive(false);
-      // Only reset if critique ended without skip (e.g., rewrite happened)
-      // If skipQueued is true, the skip worked, so keep showing checkmark
     } else if (lastEvent.event === 'critique_phase_skipped') {
       setCritiquePhaseActive(false);
-      // Skip worked! Keep skipQueued=true to show checkmark
     } else if (lastEvent.event === 'paper_writing_started' || lastEvent.event === 'paper_completed') {
       setSkipQueued(false);  // Reset skip state for new paper
     }
+    
+    // Topic exploration phase tracking
+    if (lastEvent.event === 'topic_exploration_started') {
+      setExplorationProgress({ accepted: lastEvent.data?.resumed_count || 0, target: lastEvent.data?.target || 5 });
+    } else if (lastEvent.event === 'topic_exploration_progress') {
+      setExplorationProgress({ accepted: lastEvent.data?.accepted || 0, target: lastEvent.data?.target || 5 });
+    } else if (lastEvent.event === 'topic_exploration_complete' || lastEvent.event === 'topic_selected') {
+      setExplorationProgress(null);
+    }
+    
+    // Paper title exploration phase tracking
+    if (lastEvent.event === 'paper_title_exploration_started') {
+      setTitleExplorationProgress({ accepted: lastEvent.data?.resumed_count || 0, target: lastEvent.data?.target || 5 });
+    } else if (lastEvent.event === 'paper_title_exploration_progress') {
+      setTitleExplorationProgress({ accepted: lastEvent.data?.accepted || 0, target: lastEvent.data?.target || 5 });
+    } else if (lastEvent.event === 'paper_title_exploration_complete' || lastEvent.event === 'paper_writing_started') {
+      setTitleExplorationProgress(null);
+    }
   }, [activity]);
 
   // Reset skip state when tier changes away from paper writing
@@ -80,6 +98,11 @@ const AutonomousResearchInterface = ({
   };
 
   const handleStart = () => {
+    if (anyWorkflowRunning && !isRunning) {
+      alert('Another workflow is already running. Stop it before starting Autonomous Research.');
+      return;
+    }
+
     if (!researchPrompt.trim()) {
       alert('Please enter a research prompt');
       return;
@@ -186,13 +209,32 @@ const AutonomousResearchInterface = ({
   const getActivityIcon = (event) => {
     switch (event) {
       case 'brainstorm_submission_accepted':
+      case 'submission_accepted':
+      case 'compiler_acceptance':
+      case 'outline_locked':
         return '✓';
       case 'brainstorm_submission_rejected':
+      case 'submission_rejected':
+      case 'compiler_rejection':
         return '✗';
       case 'topic_selected':
         return '»';
       case 'topic_selection_rejected':
         return '⚠';
+      case 'topic_exploration_started':
+        return '◉';
+      case 'topic_exploration_progress':
+        return '◈';
+      case 'topic_exploration_rejected':
+        return '⚠';
+      case 'topic_exploration_complete':
+        return '✓';
+      case 'paper_title_exploration_started':
+        return '◉';
+      case 'paper_title_exploration_progress':
+        return '◈';
+      case 'paper_title_exploration_complete':
+        return '✓';
       case 'completion_review_started':
         return '◎';
       case 'completion_review_result':
@@ -215,6 +257,7 @@ const AutonomousResearchInterface = ({
       case 'critique_phase_ended':
         return '✓';
       case 'critique_phase_skipped':
+      case 'compiler_decline':
         return '↷';
       case 'phase_transition':
         return '□';
@@ -222,6 +265,12 @@ const AutonomousResearchInterface = ({
         return '⊟';
       case 'paper_redundancy_review':
         return '◇';
+      case 'brainstorm_continuation_started':
+        return '◎';
+      case 'brainstorm_continuation_decided':
+        return '⊞';
+      case 'brainstorm_paper_limit_reached':
+        return '⊘';
       // Reference selection events
       case 'reference_selection_started':
         return '▭';
@@ -270,8 +319,12 @@ const AutonomousResearchInterface = ({
     }
     // Success events
     if (event.includes('accepted') || 
+        event === 'compiler_acceptance' ||
+        event === 'outline_locked' ||
         event === 'paper_completed' || 
         event === 'partial_revision_complete' ||
+        event === 'topic_exploration_complete' ||
+        event === 'paper_title_exploration_complete' ||
         event === 'tier3_chapter_complete' ||
         event === 'tier3_short_form_complete' ||
         event === 'tier3_long_form_complete' ||
@@ -279,7 +332,7 @@ const AutonomousResearchInterface = ({
       return 'activity-success';
     }
     // Rejection events
-    if (event.includes('rejected') || event === 'tier3_rejection') {
+    if (event.includes('rejected') || event === 'compiler_rejection' || event === 'tier3_rejection') {
       return 'activity-reject';
     }
     // Info events (reviews, starts, tier3 progress, etc.)
@@ -297,8 +350,11 @@ const AutonomousResearchInterface = ({
         event === 'tier3_volume_organized' ||
         event === 'topic_selected' ||
         event === 'reference_selection_started' ||
+        event === 'compiler_decline' ||
         event === 'critique_phase_ended' ||
-        event === 'critique_phase_skipped') {
+        event === 'critique_phase_skipped' ||
+        event === 'brainstorm_continuation_decided' ||
+        event === 'brainstorm_paper_limit_reached') {
       return 'activity-info';
     }
     return 'activity-neutral';
@@ -314,7 +370,10 @@ const AutonomousResearchInterface = ({
             <button 
               className="btn-start"
               onClick={handleStart}
-              disabled={!config?.submitter_configs?.some(s => s.modelId)}
+              disabled={
+                !config?.submitter_configs?.some(s => s.modelId) ||
+                (anyWorkflowRunning && !isRunning)
+              }
             >
               Start Research
             </button>
@@ -348,7 +407,7 @@ const AutonomousResearchInterface = ({
           id="research-prompt"
           value={researchPrompt}
           onChange={(e) => setResearchPrompt(e.target.value)}
-          placeholder="Enter your high level research goal on any topic that related to S.T.E.M. mathematics, anything event remotely related to mathematics (e.g., 'Explore the connections between modular forms and the Langlands program' or )"
+          placeholder="Enter your high level research goal on any topic that relates to S.T.E.M. mathematics, anything remotely related to mathematics (e.g., 'Advance desalination technology' or 'Solve physics unification')"
           disabled={isRunning}
           rows={3}
         />
@@ -371,6 +430,34 @@ const AutonomousResearchInterface = ({
           </span>
         </div>
 
+        {explorationProgress && ( /* Topic-exploration status card: rendered only while explorationProgress is set; the activity effect clears it on 'topic_exploration_complete' or 'topic_selected'. */
+          <div className="current-brainstorm" style={{ borderLeft: '3px solid #a855f7' }}>
+            <span className="status-label">Topic Exploration:</span>
+            <p className="brainstorm-prompt" style={{ color: '#c4b5fd' }}>
+              Brainstorming candidate directions ({explorationProgress.accepted}/{explorationProgress.target} accepted)
+            </p>
+            <div className="brainstorm-stats">
+              <span className="submission-count accepted">
+                ◈ {explorationProgress.accepted} / {explorationProgress.target} candidates validated
+              </span>
+            </div>
+          </div>
+        )}
+
+        {titleExplorationProgress && ( /* Title-exploration status card: rendered only while titleExplorationProgress is set; the activity effect clears it on 'paper_title_exploration_complete' or 'paper_writing_started'. NOTE(review): amber border (#f59e0b) sits next to green text (#7dff6f) - confirm the mix is intended. */
+          <div className="current-brainstorm" style={{ borderLeft: '3px solid #f59e0b' }}>
+            <span className="status-label">Title Exploration:</span>
+            <p className="brainstorm-prompt" style={{ color: '#7dff6f' }}>
+              Exploring candidate paper titles ({titleExplorationProgress.accepted}/{titleExplorationProgress.target} accepted)
+            </p>
+            <div className="brainstorm-stats">
+              <span className="submission-count accepted">
+                ◈ {titleExplorationProgress.accepted} / {titleExplorationProgress.target} titles validated
+              </span>
+            </div>
+          </div>
+        )}
+
         {status?.current_brainstorm && (
           <div className="current-brainstorm">
             <span className="status-label">Current Brainstorm:</span>
@@ -433,7 +520,7 @@ const AutonomousResearchInterface = ({
         {status?.current_tier === 'tier2_paper_writing' && (
           <div className="paper-status-banner" style={{
             backgroundColor: critiquePhaseActive ? '#2a2a2a' : '#1a1a1a',
-            border: critiquePhaseActive ? '2px solid #ffd700' : '2px solid #666',
+            border: critiquePhaseActive ? '2px solid #1eff1c' : '2px solid #666',
             borderRadius: '8px',
             padding: '1rem',
             marginTop: '1rem',
@@ -445,12 +532,12 @@ const AutonomousResearchInterface = ({
               {critiquePhaseActive ? '◎' : '▬'}
             </span>
             <div style={{ flex: 1 }}>
-              <strong style={{ color: critiquePhaseActive ? '#ffd700' : '#ccc', fontSize: '1.1rem' }}>
+              <strong style={{ color: critiquePhaseActive ? '#1eff1c' : '#ccc', fontSize: '1.1rem' }}>
                 {critiquePhaseActive ? 'Critique Phase in Progress' : 'Paper Writing in Progress'}
               </strong>
               {critiquePhaseActive ? (
                 <p style={{ margin: '0.25rem 0 0 0', fontSize: '0.85rem', color: '#888' }}>
-                  Collecting peer review feedback on body section...
+                  Collecting peer review feedback on the body section...
                 </p>
               ) : (
                 <p style={{ margin: '0.25rem 0 0 0', fontSize: '0.85rem', color: '#888' }}>
diff --git a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
index 61bba03..fd3c03e 100644
--- a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
@@ -7,6 +7,16 @@ import React, { useRef, useEffect, useMemo, useState, useCallback } from 'react'
 import { autonomousAPI } from '../../services/api';
 import './AutonomousResearch.css';
 
+const EMPTY_API_STATS = Object.freeze({ // Zeroed stats placeholder used when the API response has no stats and after logs are cleared.
+  total_calls: 0,
+  successful_calls: 0,
+  failed_calls: 0,
+  success_rate: 0,
+  by_phase: {}, // Object.freeze is shallow: these nested maps are shared and not themselves frozen, so treat them as read-only.
+  by_model: {},
+  by_provider: {},
+});
+
 const AutonomousResearchLogs = ({ stats, events }) => {
   const eventsEndRef = useRef(null);
   const [expandedSubmitters, setExpandedSubmitters] = useState({});
@@ -33,21 +43,32 @@ const AutonomousResearchLogs = ({ stats, events }) => {
     }
     
     // Create new abort controller for this request
-    abortControllerRef.current = new AbortController();
+    const controller = new AbortController();
+    abortControllerRef.current = controller;
     
     try {
-      const response = await autonomousAPI.getApiLogs(100);
+      const response = await autonomousAPI.getApiLogs(100, { signal: controller.signal });
+      if (abortControllerRef.current !== controller) {
+        return;
+      }
+
       if (response.success) {
         setApiLogs(response.logs || []);
-        setApiStats(response.stats || null);
+        setApiStats(response.stats || EMPTY_API_STATS);
       }
     } catch (error) {
+      if (abortControllerRef.current !== controller) {
+        return;
+      }
+
       // Don't log abort errors as they're expected on cleanup
       if (error.name !== 'AbortError') {
         console.error('Failed to fetch autonomous API logs:', error);
       }
     } finally {
-      setApiLogsLoading(false);
+      if (abortControllerRef.current === controller) {
+        setApiLogsLoading(false);
+      }
     }
   }, []);
 
@@ -66,6 +87,7 @@ const AutonomousResearchLogs = ({ stats, events }) => {
       // Cancel any pending requests on unmount
       if (abortControllerRef.current) {
         abortControllerRef.current.abort();
+        abortControllerRef.current = null;
       }
     };
   }, [fetchApiLogs, apiAutoRefresh]);
@@ -77,10 +99,16 @@ const AutonomousResearchLogs = ({ stats, events }) => {
     }
 
     try {
+      if (abortControllerRef.current) {
+        abortControllerRef.current.abort();
+        abortControllerRef.current = null;
+      }
+
       await autonomousAPI.clearApiLogs();
       setApiLogs([]);
-      setApiStats(null);
+      setApiStats(EMPTY_API_STATS);
       setExpandedApiLogIdx(null);
+      setApiLogsLoading(false);
     } catch (error) {
       console.error('Failed to clear API logs:', error);
     }
@@ -191,6 +219,24 @@ const AutonomousResearchLogs = ({ stats, events }) => {
         return 'Autonomous research started';
       case 'auto_research_stopped':
         return `Research stopped. Total: ${data.final_stats?.total_papers_completed || 0} papers`;
+      // Topic exploration events (pre-brainstorm)
+      case 'topic_exploration_started':
+        return `Topic exploration started (target: ${data.target || 5} candidates${data.resumed_count ? `, resumed: ${data.resumed_count}` : ''})`;
+      case 'topic_exploration_progress': {
+        const question = data.latest_question ? data.latest_question.substring(0, 80) + '...' : '';
+        return `Exploration candidate ${data.accepted}/${data.target} accepted${question ? `: ${question}` : ''}`;
+      }
+      case 'topic_exploration_rejected':
+        return `Exploration candidate rejected (${data.accepted_so_far || 0}/${data.target || 5} accepted)`;
+      case 'topic_exploration_complete':
+        return `Topic exploration complete: ${data.accepted_count} candidates (${data.total_attempts} attempts)`;
+      // Paper title exploration events
+      case 'paper_title_exploration_started':
+        return `Title exploration started (target: ${data.target || 5} candidate titles)`;
+      case 'paper_title_exploration_progress':
+        return `Title candidate ${data.accepted}/${data.target} accepted`;
+      case 'paper_title_exploration_complete':
+        return `Title exploration complete: ${data.accepted_count} candidates (${data.total_attempts} attempts)`;
       case 'topic_selected':
         return `Topic selected: ${data.action} - ${data.topic_prompt || data.topic_id}`;
       case 'topic_selection_rejected':
@@ -225,13 +271,13 @@ const AutonomousResearchLogs = ({ stats, events }) => {
 
   const getEventClass = (event) => {
     const eventName = event.event || '';
-    if (eventName.includes('completed') || eventName.includes('accepted') || eventName === 'submission_accepted') {
+    if (eventName.includes('completed') || eventName.includes('accepted') || eventName === 'submission_accepted' || eventName === 'topic_exploration_complete' || eventName === 'paper_title_exploration_complete') {
       return 'log-success';
     }
-    if (eventName.includes('rejected') || eventName === 'submission_rejected') {
+    if (eventName.includes('rejected') || eventName === 'submission_rejected' || eventName === 'topic_exploration_rejected') {
       return 'log-reject';
     }
-    if (eventName.includes('started') || eventName.includes('review')) {
+    if (eventName.includes('started') || eventName.includes('review') || eventName.includes('progress')) {
       return 'log-info';
     }
     return '';
@@ -305,7 +351,7 @@ const AutonomousResearchLogs = ({ stats, events }) => {
       <h4 style={{ marginTop: '20px' }}>Per-Submitter Statistics</h4>
       <div className="submitter-stats-container">
         {Object.keys(submitterStats).length === 0 ? (
-          <div className="empty-state">
+          <div className="auto-empty-state">
             No submission data yet.
           </div>
         ) : (
@@ -552,14 +598,14 @@ const AutonomousResearchLogs = ({ stats, events }) => {
       <h4 style={{ marginTop: '20px' }}>Event Log</h4>
       <div className="logs-events">
         {(!events || events.length === 0) ? (
-          <div className="empty-state">
+          <div className="auto-empty-state">
             No events recorded yet.
           </div>
         ) : (
           events.map((event, index) => (
             <div 
               key={index} 
-              className={`log-entry ${getEventClass(event)}`}
+              className={`auto-log-entry ${getEventClass(event)}`}
             >
               <span className="log-time">
                 {new Date(event.timestamp).toLocaleTimeString()}
diff --git a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
index a9bacf1..fa7110e 100644
--- a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
@@ -5,9 +5,17 @@
  * Now supports per-role OpenRouter model selection with provider and fallback options.
  */
 import React, { useState, useEffect } from 'react';
-import { openRouterAPI, api } from '../../services/api';
-import { loadModelCache, getModelApiId } from '../../utils/modelCache';
+import { openRouterAPI, api, autonomousAPI } from '../../services/api';
+import {
+  AUTONOMOUS_SETTINGS_STORAGE_KEY,
+  AUTONOMOUS_PROFILES_STORAGE_KEY,
+  RECOMMENDED_PROFILE_KEYS,
+  RECOMMENDED_PROFILES,
+  applyAutonomousProfileSelection,
+  getStoredAutonomousSettings,
+} from '../../utils/autonomousProfiles';
 import './AutonomousResearch.css';
+import '../settings-common.css';
 
 const DEFAULT_SUBMITTER_CONFIG = {
   submitterId: 1,
@@ -19,134 +27,6 @@ const DEFAULT_SUBMITTER_CONFIG = {
   maxOutputTokens: 25000
 };
 
-// Recommended profiles with hard-coded model IDs (NO pattern matching)
-const RECOMMENDED_PROFILES = {
-  'recommended_fastest_cheapest': {
-    name: 'Fastest, cheapest, least knowledge',
-    numSubmitters: 3,
-    submitters: [
-      { 
-        modelId: 'openai/gpt-oss-120b',
-        provider: 'openrouter',
-        openrouterProvider: 'Google',
-        lmStudioFallbackId: null,
-        contextWindow: 131000,
-        maxOutputTokens: 25000
-      },
-      { 
-        modelId: 'openai/gpt-oss-20b',
-        provider: 'openrouter',
-        openrouterProvider: 'Groq',
-        lmStudioFallbackId: null,
-        contextWindow: 131000,
-        maxOutputTokens: 25000
-      },
-      { 
-        modelId: 'openai/gpt-oss-120b',
-        provider: 'openrouter',
-        openrouterProvider: 'Google',
-        lmStudioFallbackId: null,
-        contextWindow: 131000,
-        maxOutputTokens: 25000
-      }
-    ],
-    validator: { 
-      modelId: 'openai/gpt-oss-120b',
-      provider: 'openrouter',
-      openrouterProvider: 'Google',
-      lmStudioFallbackId: null,
-      contextWindow: 131000,
-      maxOutputTokens: 25000
-    },
-    highContext: { 
-      modelId: 'openai/gpt-oss-120b',
-      provider: 'openrouter',
-      openrouterProvider: 'Google',
-      lmStudioFallbackId: null,
-      contextWindow: 131000,
-      maxOutputTokens: 25000
-    },
-    highParam: { 
-      modelId: 'openai/gpt-oss-120b',
-      provider: 'openrouter',
-      openrouterProvider: 'Google',
-      lmStudioFallbackId: null,
-      contextWindow: 131000,
-      maxOutputTokens: 25000
-    },
-    critique: { 
-      modelId: 'openai/gpt-oss-120b',
-      provider: 'openrouter',
-      openrouterProvider: 'Google',
-      lmStudioFallbackId: null,
-      contextWindow: 131000,
-      maxOutputTokens: 25000
-    }
-  },
-  'recommended_fast_affordable_mid': {
-    name: 'Fast, affordable, mid-tier knowledge',
-    numSubmitters: 3,
-    submitters: [
-      {
-        modelId: 'moonshotai/kimi-k2.5',
-        provider: 'openrouter',
-        openrouterProvider: 'SiliconFlow',
-        lmStudioFallbackId: null,
-        contextWindow: 262000,
-        maxOutputTokens: 40000
-      },
-      {
-        modelId: 'openai/gpt-oss-120b',
-        provider: 'openrouter',
-        openrouterProvider: 'Groq',
-        lmStudioFallbackId: null,
-        contextWindow: 131072,
-        maxOutputTokens: 25000
-      },
-      {
-        modelId: 'deepseek/deepseek-v3.2',
-        provider: 'openrouter',
-        openrouterProvider: 'AtlasCloud',
-        lmStudioFallbackId: null,
-        contextWindow: 163800,
-        maxOutputTokens: 30000
-      }
-    ],
-    validator: {
-      modelId: 'x-ai/grok-4.1-fast',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 2000000,
-      maxOutputTokens: 30000
-    },
-    highContext: {
-      modelId: 'moonshotai/kimi-k2.5',
-      provider: 'openrouter',
-      openrouterProvider: 'SiliconFlow',
-      lmStudioFallbackId: null,
-      contextWindow: 262000,
-      maxOutputTokens: 40000
-    },
-    highParam: {
-      modelId: 'google/gemini-3.1-pro-preview',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 1048576,
-      maxOutputTokens: 65500
-    },
-    critique: {
-      modelId: 'google/gemini-3.1-pro-preview',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 1048576,
-      maxOutputTokens: 65500
-    }
-  }
-};
-
 // ModelSelector component - extracted outside to prevent recreation on every render
 const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProviderChange, onModelChange, onOpenrouterProviderChange, onFallbackChange, lmStudioModels, openRouterModels, modelProviders, hasOpenRouterKey, isRunning }) => {
   const currentModels = provider === 'openrouter' ? openRouterModels : lmStudioModels;
@@ -157,38 +37,21 @@ const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProvider
       {/* Provider Toggle */}
       <div className="settings-row">
         <label>Provider</label>
-        <div style={{ display: 'flex', gap: '0.5rem' }}>
+        <div className="provider-toggle-group">
           <button
             type="button"
+            className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
             onClick={() => onProviderChange('lm_studio')}
             disabled={isRunning}
-            style={{
-              flex: 1,
-              padding: '0.5rem',
-              backgroundColor: provider === 'lm_studio' ? '#4CAF50' : '#333',
-              border: 'none',
-              borderRadius: '4px',
-              color: '#fff',
-              cursor: isRunning ? 'not-allowed' : 'pointer',
-              opacity: isRunning ? 0.6 : 1
-            }}
           >
             LM Studio
           </button>
           <button
             type="button"
+            className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or-orange' : ''}`}
             onClick={() => hasOpenRouterKey && onProviderChange('openrouter')}
             disabled={isRunning || !hasOpenRouterKey}
-            style={{
-              flex: 1,
-              padding: '0.5rem',
-              backgroundColor: provider === 'openrouter' ? '#FF6700' : '#333',
-              border: 'none',
-              borderRadius: '4px',
-              color: hasOpenRouterKey ? '#fff' : '#666',
-              cursor: (isRunning || !hasOpenRouterKey) ? 'not-allowed' : 'pointer',
-              opacity: (isRunning || !hasOpenRouterKey) ? 0.6 : 1
-            }}
+            style={!hasOpenRouterKey ? { color: '#666' } : undefined}
             title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
           >
             OpenRouter
@@ -241,7 +104,7 @@ const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProvider
       {/* LM Studio Fallback (if OpenRouter) */}
       {provider === 'openrouter' && (
         <div className="settings-row">
-          <label style={{ color: '#888' }}>LM Studio Fallback (optional)</label>
+          <label className="label--muted">LM Studio Fallback (optional)</label>
           <select
             value={fallback || ''}
             onChange={(e) => onFallbackChange(e.target.value || null)}
@@ -269,12 +132,12 @@ const RoleConfig = ({ title, hint, rolePrefix, borderColor = '#333', localConfig
   const maxTokens = localConfig[`${rolePrefix}_max_tokens`] || 25000;
 
   return (
-    <div className="submitter-config-section" style={{
-      borderColor: provider === 'openrouter' ? '#FF6700' : borderColor
+    <div className={`submitter-config-section${provider === 'openrouter' ? ' role-config-card--openrouter-orange' : ''}`} style={{
+      borderColor: provider === 'openrouter' ? undefined : borderColor
     }}>
-      <h5 style={{ color: provider === 'openrouter' ? '#FF6700' : borderColor }}>
+      <h5 className={provider === 'openrouter' ? 'card-title--orange' : ''} style={provider !== 'openrouter' ? { color: borderColor } : undefined}>
         {title}
-        {provider === 'openrouter' && <span style={{ fontWeight: 'normal', marginLeft: '0.5rem' }}>[OpenRouter]</span>}
+        {provider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
       </h5>
       {hint && <p className="settings-hint">{hint}</p>}
 
@@ -353,11 +216,19 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
   const [testingWolfram, setTestingWolfram] = useState(false);
   
   // Critique prompt editor state
+  const [advancedSettingsExpanded, setAdvancedSettingsExpanded] = useState(false);
   const [critiquePromptExpanded, setCritiquePromptExpanded] = useState(false);
   const [customCritiquePrompt, setCustomCritiquePrompt] = useState('');
   const [critiquePromptSaved, setCritiquePromptSaved] = useState(false);
   const [defaultCritiquePrompt, setDefaultCritiquePrompt] = useState('');
 
+  const handleCollapsibleKeyDown = (event, toggleFn) => {
+    if (event.key === 'Enter' || event.key === ' ') {
+      event.preventDefault();
+      toggleFn();
+    }
+  };
+
   // Parse submitter configs from config
   const parseSubmitterConfigs = (cfg) => {
     if (cfg?.submitter_configs && Array.isArray(cfg.submitter_configs)) {
@@ -461,7 +332,7 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
   useEffect(() => {
     const init = async () => {
       // Load user profiles from localStorage
-      const savedProfiles = localStorage.getItem('autonomous_research_profiles');
+      const savedProfiles = localStorage.getItem(AUTONOMOUS_PROFILES_STORAGE_KEY);
       if (savedProfiles) {
         try {
           let profiles = JSON.parse(savedProfiles);
@@ -473,7 +344,7 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
           setUserProfiles(normalized);
           // Save normalized profiles back to localStorage if any changes were made
           if (JSON.stringify(normalized) !== JSON.stringify(profiles)) {
-            localStorage.setItem('autonomous_research_profiles', JSON.stringify(normalized));
+            localStorage.setItem(AUTONOMOUS_PROFILES_STORAGE_KEY, JSON.stringify(normalized));
             console.log('[Profile Normalization] Profiles updated and saved to localStorage');
           }
         } catch (err) {
@@ -481,25 +352,18 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
         }
       }
 
-      // Load settings from localStorage
-      const savedSettings = localStorage.getItem('autonomous_research_settings');
-      if (savedSettings) {
-        try {
-          const settings = JSON.parse(savedSettings);
-          if (settings.numSubmitters) setNumSubmitters(settings.numSubmitters);
-          if (settings.submitterConfigs) setSubmitterConfigs(settings.submitterConfigs);
-          if (settings.localConfig) {
-            setLocalConfig(prev => ({ ...prev, ...settings.localConfig }));
-          }
-          if (settings.freeOnly !== undefined) setFreeOnly(settings.freeOnly);
-          if (settings.freeModelLooping !== undefined) setFreeModelLooping(settings.freeModelLooping);
-          if (settings.freeModelAutoSelector !== undefined) setFreeModelAutoSelector(settings.freeModelAutoSelector);
-          if (settings.tier3Enabled !== undefined) setTier3Enabled(settings.tier3Enabled);
-          if (settings.modelProviders) setModelProviders(settings.modelProviders);
-        } catch (err) {
-          console.error('Failed to load autonomous research settings:', err);
-        }
+      const settings = getStoredAutonomousSettings();
+      if (settings.numSubmitters) setNumSubmitters(settings.numSubmitters);
+      if (settings.submitterConfigs) setSubmitterConfigs(settings.submitterConfigs);
+      if (settings.localConfig) {
+        setLocalConfig(prev => ({ ...prev, ...settings.localConfig }));
       }
+      setSelectedProfile(settings.selectedProfile || '');
+      if (settings.freeOnly !== undefined) setFreeOnly(settings.freeOnly);
+      if (settings.freeModelLooping !== undefined) setFreeModelLooping(settings.freeModelLooping);
+      if (settings.freeModelAutoSelector !== undefined) setFreeModelAutoSelector(settings.freeModelAutoSelector);
+      if (settings.tier3Enabled !== undefined) setTier3Enabled(settings.tier3Enabled);
+      if (settings.modelProviders) setModelProviders(settings.modelProviders);
       
       try {
         const status = await openRouterAPI.getApiKeyStatus();
@@ -511,14 +375,20 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
         console.error('Failed to check OpenRouter key:', err);
       }
       
-      // Load Wolfram Alpha status from backend
-      try {
-        const wolframStatus = await api.getWolframStatus();
-        if (wolframStatus.enabled) {
-          setWolframEnabled(true);
+      // Restore Wolfram Alpha key from localStorage
+      const storedWolframKey = localStorage.getItem('wolfram_alpha_api_key');
+      if (storedWolframKey) {
+        setWolframApiKey(storedWolframKey);
+        setWolframEnabled(true);
+      } else {
+        try {
+          const wolframStatus = await api.getWolframStatus();
+          if (wolframStatus.enabled) {
+            setWolframEnabled(true);
+          }
+        } catch (err) {
+          console.error('Failed to load Wolfram Alpha status:', err);
         }
-      } catch (err) {
-        console.error('Failed to load Wolfram Alpha status:', err);
       }
 
       // Try to fetch fresh LM Studio models
@@ -578,10 +448,11 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
       freeModelLooping,
       freeModelAutoSelector,
       tier3Enabled,
-      modelProviders
+      modelProviders,
+      selectedProfile,
     };
-    localStorage.setItem('autonomous_research_settings', JSON.stringify(settings));
-  }, [isLoadedFromStorage, numSubmitters, submitterConfigs, localConfig, freeOnly, freeModelLooping, freeModelAutoSelector, tier3Enabled, modelProviders]);
+    localStorage.setItem(AUTONOMOUS_SETTINGS_STORAGE_KEY, JSON.stringify(settings));
+  }, [isLoadedFromStorage, numSubmitters, submitterConfigs, localConfig, freeOnly, freeModelLooping, freeModelAutoSelector, tier3Enabled, modelProviders, selectedProfile]);
 
   // Update LM Studio models when prop changes
   useEffect(() => {
@@ -639,7 +510,6 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
     // Fetch default prompt from backend
     const fetchDefaultPrompt = async () => {
       try {
-        const { autonomousAPI } = await import('../../services/api');
         const response = await autonomousAPI.getDefaultCritiquePrompt();
         if (response.prompt) {
           setDefaultCritiquePrompt(response.prompt);
@@ -680,6 +550,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     }
   };
 
+  const markProfileAsCustom = () => {
+    if (selectedProfile) {
+      setSelectedProfile('');
+    }
+  };
+
   const handleChange = (field, value) => {
     const numericFields = [
       'validator_context_window', 'high_context_context_window', 
@@ -696,6 +572,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     }
     
     const newConfig = { ...localConfig, [field]: newValue };
+    markProfileAsCustom();
     setLocalConfig(newConfig);
     
     // CRITICAL FIX: Don't propagate numeric field changes to parent on every keystroke
@@ -720,6 +597,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       const finalValue = isNaN(parsed) ? (isContextField ? 131072 : 25000) : parsed;
       
       const newConfig = { ...localConfig, [field]: finalValue };
+      markProfileAsCustom();
       setLocalConfig(newConfig);
       onConfigChange({ ...newConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
     }
@@ -732,6 +610,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       // Keep existing model, openrouter_provider, and lm_studio_fallback - don't reset them
     };
     const newConfig = { ...localConfig, ...updates };
+    markProfileAsCustom();
     setLocalConfig(newConfig);
     onConfigChange({ ...newConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
   };
@@ -747,6 +626,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   // Handle number of submitters change
   const handleNumSubmittersChange = (newCount) => {
     const count = Math.max(1, Math.min(10, parseInt(newCount, 10) || 1));
+    markProfileAsCustom();
     setNumSubmitters(count);
     
     // Expand or contract submitter configs
@@ -767,6 +647,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   // Handler for when user finishes editing number of submitters
   const handleNumSubmittersBlur = (value) => {
     const count = Math.max(1, Math.min(10, parseInt(value, 10) || 1));
+    markProfileAsCustom();
     setNumSubmitters(count);
     
     const newConfigs = [...submitterConfigs];
@@ -815,6 +696,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       fetchProvidersForModel(newValue);
     }
     
+    markProfileAsCustom();
     setSubmitterConfigs(newConfigs);
     
     // CRITICAL FIX: Don't propagate numeric field changes on every keystroke
@@ -837,6 +719,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         [field]: finalValue
       };
       
+      markProfileAsCustom();
       setSubmitterConfigs(newConfigs);
       onConfigChange({ ...localConfig, submitter_configs: newConfigs.slice(0, numSubmitters) });
     }
@@ -855,6 +738,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         contextWindow: main.contextWindow,
         maxOutputTokens: main.maxOutputTokens
       }));
+      markProfileAsCustom();
       setSubmitterConfigs(newConfigs);
       onConfigChange({ ...localConfig, submitter_configs: newConfigs.slice(0, numSubmitters) });
     }
@@ -885,8 +769,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       
       if (response.success) {
         setWolframTestResult(`✓ Success! Result: ${response.result}`);
-        // Save the key to backend
         await api.setWolframApiKey(wolframApiKey);
+        localStorage.setItem('wolfram_alpha_api_key', wolframApiKey);
         setWolframEnabled(true);
       } else {
         setWolframTestResult('✗ Failed: ' + response.message);
@@ -902,6 +786,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   const handleClearWolframKey = async () => {
     try {
       await api.clearWolframApiKey();
+      localStorage.removeItem('wolfram_alpha_api_key');
       setWolframApiKey('');
       setWolframEnabled(false);
       setWolframTestResult('Key cleared');
@@ -921,120 +806,25 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
   // Apply a profile (recommended or user-saved)
   const applyProfile = async (profileKey) => {
-    const isRecommended = profileKey.startsWith('recommended_');
-    const profile = isRecommended
-      ? RECOMMENDED_PROFILES[profileKey]
-      : userProfiles[profileKey];
-    
-    if (!profile) {
-      console.error(`Profile not found: ${profileKey}`);
-      return;
-    }
-
-    console.log(`Applying profile: ${profile.name} (${isRecommended ? 'recommended' : 'user'})`);
-
-    // Load model cache to convert display names to API IDs
-    const modelCache = await loadModelCache();
-    
-    // Helper to convert display name to API ID
-    const convertToApiId = (displayNameOrId) => {
-      if (!displayNameOrId) return '';
-      const apiId = getModelApiId(displayNameOrId);
-      if (apiId !== displayNameOrId) {
-        console.log(`  Converted "${displayNameOrId}" -> "${apiId}"`);
-      }
-      return apiId;
-    };
-
-    // Apply submitter configs using hard-coded modelId values (NO pattern matching)
-    const newSubmitterConfigs = [];
-    for (let i = 0; i < profile.numSubmitters; i++) {
-      const submitterProfile = profile.submitters[i];
-      
-      let modelId, provider, openrouterProv, fallback;
-      
-      if (isRecommended) {
-        // Recommended profiles: convert display name to API ID
-        modelId = convertToApiId(submitterProfile.modelId || '');
-        provider = submitterProfile.provider || 'openrouter';
-        openrouterProv = submitterProfile.openrouterProvider || null;
-        fallback = null; // No fallback for recommended
-      } else {
-        // User profile: use stored settings directly (already in API format)
-        modelId = submitterProfile.modelId || '';
-        provider = submitterProfile.provider || 'openrouter';
-        openrouterProv = submitterProfile.openrouterProvider || null;
-        fallback = submitterProfile.lmStudioFallbackId || null;
-      }
-      
-      newSubmitterConfigs.push({
-        submitterId: i + 1,
-        provider,
-        modelId,
-        openrouterProvider: openrouterProv,
-        lmStudioFallbackId: fallback,
-        contextWindow: submitterProfile.contextWindow,
-        maxOutputTokens: submitterProfile.maxOutputTokens
-      });
+    try {
+      const { profile, settings, config: nextConfig } = await applyAutonomousProfileSelection(profileKey, userProfiles);
+      const isRecommended = profileKey.startsWith('recommended_');
+
+      console.log(`Applying profile: ${profile.name} (${isRecommended ? 'recommended' : 'user'})`);
+
+      setNumSubmitters(settings.numSubmitters);
+      setSubmitterConfigs(settings.submitterConfigs);
+      setLocalConfig(settings.localConfig);
+      setFreeOnly(settings.freeOnly);
+      setFreeModelLooping(settings.freeModelLooping);
+      setFreeModelAutoSelector(settings.freeModelAutoSelector);
+      setTier3Enabled(settings.tier3Enabled);
+      setModelProviders(settings.modelProviders || {});
+      setSelectedProfile(settings.selectedProfile);
+      onConfigChange(nextConfig);
+    } catch (err) {
+      console.error('Failed to apply profile:', err); // fixed label keeps the log identifiable; err itself carries the message
     }
-
-    // Helper to get model ID (convert display name to API ID for recommended profiles)
-    const getModelId = (roleProfile) => {
-      if (isRecommended) {
-        return convertToApiId(roleProfile.modelId || '');
-      }
-      return roleProfile.modelId || '';
-    };
-
-    // Helper to get OpenRouter provider
-    const getOpenrouterProvider = (roleProfile) => {
-      if (isRecommended) {
-        return roleProfile.openrouterProvider || null;
-      }
-      return roleProfile.openrouterProvider || null;
-    };
-
-    // Apply validator, high-context, high-param, and critique configs
-    const validatorModelId = getModelId(profile.validator);
-    const highContextModelId = getModelId(profile.highContext);
-    const highParamModelId = getModelId(profile.highParam);
-    const critiqueModelId = getModelId(profile.critique);
-
-    // Update all state
-    setNumSubmitters(profile.numSubmitters);
-    setSubmitterConfigs(newSubmitterConfigs);
-    
-    const newConfig = {
-      ...localConfig,
-      validator_provider: isRecommended ? 'openrouter' : (profile.validator.provider || 'openrouter'),
-      validator_model: validatorModelId,
-      validator_openrouter_provider: getOpenrouterProvider(profile.validator),
-      validator_lm_studio_fallback: isRecommended ? null : (profile.validator.lmStudioFallbackId || null),
-      validator_context_window: profile.validator.contextWindow,
-      validator_max_tokens: profile.validator.maxOutputTokens,
-      high_context_provider: isRecommended ? 'openrouter' : (profile.highContext.provider || 'openrouter'),
-      high_context_model: highContextModelId,
-      high_context_openrouter_provider: getOpenrouterProvider(profile.highContext),
-      high_context_lm_studio_fallback: isRecommended ? null : (profile.highContext.lmStudioFallbackId || null),
-      high_context_context_window: profile.highContext.contextWindow,
-      high_context_max_tokens: profile.highContext.maxOutputTokens,
-      high_param_provider: isRecommended ? 'openrouter' : (profile.highParam.provider || 'openrouter'),
-      high_param_model: highParamModelId,
-      high_param_openrouter_provider: getOpenrouterProvider(profile.highParam),
-      high_param_lm_studio_fallback: isRecommended ? null : (profile.highParam.lmStudioFallbackId || null),
-      high_param_context_window: profile.highParam.contextWindow,
-      high_param_max_tokens: profile.highParam.maxOutputTokens,
-      critique_submitter_provider: isRecommended ? 'openrouter' : (profile.critique.provider || 'openrouter'),
-      critique_submitter_model: critiqueModelId,
-      critique_submitter_openrouter_provider: getOpenrouterProvider(profile.critique),
-      critique_submitter_lm_studio_fallback: isRecommended ? null : (profile.critique.lmStudioFallbackId || null),
-      critique_submitter_context_window: profile.critique.contextWindow,
-      critique_submitter_max_tokens: profile.critique.maxOutputTokens
-    };
-    
-    setLocalConfig(newConfig);
-    onConfigChange({ ...newConfig, submitter_configs: newSubmitterConfigs });
-    setSelectedProfile(profileKey);
   };
 
   // Save current settings as a new profile
@@ -1092,7 +882,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
     const updatedProfiles = { ...userProfiles, [profileKey]: newProfile };
     setUserProfiles(updatedProfiles);
-    localStorage.setItem('autonomous_research_profiles', JSON.stringify(updatedProfiles));
+    localStorage.setItem(AUTONOMOUS_PROFILES_STORAGE_KEY, JSON.stringify(updatedProfiles));
     setSelectedProfile(profileKey);
     setShowSaveDialog(false);
     setNewProfileName('');
@@ -1119,7 +909,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     const updatedProfiles = { ...userProfiles };
     delete updatedProfiles[profileKey];
     setUserProfiles(updatedProfiles);
-    localStorage.setItem('autonomous_research_profiles', JSON.stringify(updatedProfiles));
+    localStorage.setItem(AUTONOMOUS_PROFILES_STORAGE_KEY, JSON.stringify(updatedProfiles));
     
     if (selectedProfile === profileKey) {
       setSelectedProfile('');
@@ -1131,200 +921,86 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       {/* Left Sidebar - Known Compatible Models */}
       <div className="settings-left-sidebar">
         <div className="known-models-sidebar">
-          <h3 style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
-            <span>📦 Tested Compatible Models</span>
-            <div style={{ position: 'relative', display: 'inline-block' }}>
+          <h3 className="flex-row-center">
+            <span>Highlighted Models</span>
+            <div className="tooltip-anchor">
               <button
-                style={{
-                  backgroundColor: 'transparent',
-                  border: '2px solid #FF6700',
-                  color: '#FF6700',
-                  padding: '0',
-                  borderRadius: '4px',
-                  cursor: 'pointer',
-                  fontSize: '0.7rem',
-                  fontWeight: 'bold',
-                  width: '16px',
-                  height: '16px',
-                  display: 'flex',
-                  alignItems: 'center',
-                  justifyContent: 'center',
-                  boxShadow: '0 0 8px rgba(255, 103, 0, 0.3)',
-                  transition: 'all 0.2s ease'
-                }}
+                className="info-tooltip-btn info-tooltip-btn--orange"
                 onMouseEnter={() => setShowTestedModelsTooltip(true)}
                 onMouseLeave={() => setShowTestedModelsTooltip(false)}
               >
                 ?
               </button>
               {showTestedModelsTooltip && (
-                <div style={{
-                  position: 'absolute',
-                  backgroundColor: '#1a1a1a',
-                  border: '2px solid #FF6700',
-                  borderRadius: '6px',
-                  padding: '12px 16px',
-                  fontSize: '0.85rem',
-                  color: '#FF6700',
-                  fontWeight: '500',
-                  maxWidth: '280px',
-                  width: '260px',
-                  zIndex: 1000,
-                  boxShadow: '0 8px 24px rgba(255, 103, 0, 0.4)',
-                  textShadow: '0 1px 2px rgba(0, 0, 0, 0.5)',
-                  pointerEvents: 'none',
-                  top: 'calc(100% + 8px)',
-                  left: '50%',
-                  transform: 'translateX(-50%)'
-                }}>
-                  These models and/or hosts are not affiliated with the MOTO program, or Intrafere LLC. This chart contains compatible models to help guide users through developer-tested configurations. Any statements about pricing, cost, models, roles, rankings, effects, or otherwise are speculative and based on individual developer testing experience. Intrafere LLC (Intrafere Research Group), and the MOTO developement team make no guarantees or warranties about the accuracy or truth of this chart. MOTO is a harness that works with the majority of models, including many more models that are not listed here.
+                /* sidebar-escape: fixed positioning so the tooltip breaks out of the
+                   322px sidebar and renders freely. See settings-common.css for coords. */
+                <div className="tooltip-popup tooltip-popup--sidebar-escape">
+                  The models and hosts listed here are not affiliated with MOTO or Intrafere LLC. This chart reflects developer-tested configurations intended to help guide model selection. All statements regarding pricing, performance, roles, rankings, or capabilities are speculative and based on individual testing experience. Intrafere LLC and the MOTO development team make no guarantees about the accuracy of this chart. MOTO is compatible with the majority of models, including many not listed here.
                 </div>
               )}
             </div>
           </h3>
-          <p style={{ fontSize: '.70rem', color: '#888', marginTop: '0.5rem', marginBottom: '1rem', lineHeight: '1.4', marginLeft: '20px' }}>
-            Note: Computer science and/or non-general purpose models may have trouble performing as validators, critique submitters, or in the tier 2 compilation stage. These models generally perform fine for brainstorming. Most text based models over 20 billion parameters are compatible with MOSO, including ones not shown.
+          <p className="hint-text hint-text--dim" style={{ marginLeft: '20px', marginBottom: '0.45rem' }}>
+            Note: Most models over 20 billion parameters are compatible with MOTO.
           </p>
           <div className="models-list">
-            {/* King of the Hill - Gold */}
-            <div className="model-item" style={{ 
-              backgroundColor: 'linear-gradient(135deg, rgba(212, 175, 55, 0.35) 0%, rgba(212, 175, 55, 0.15) 100%)',
-              borderLeft: '5px solid #d4af37',
-              borderRadius: '6px',
-              boxShadow: '0 0 15px rgba(212, 175, 55, 0.3), inset 0 1px 0 rgba(255, 255, 255, 0.15)',
-              paddingLeft: '12px'
-            }}>
-              <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
-                <div className="model-item-name">GPT OSS 120B</div>
-                <div style={{
-                  background: 'linear-gradient(135deg, #e8c547 0%, #d4af37 50%, #c9a227 100%)',
-                  color: '#000',
-                  padding: '2px 8px',
-                  borderRadius: '12px',
-                  fontSize: '0.7rem',
-                  fontWeight: 'bold',
-                  boxShadow: '0 2px 8px rgba(212, 175, 55, 0.4), inset 0 1px 0 rgba(255, 255, 255, 0.3)',
-                  textShadow: '0 1px 1px rgba(0, 0, 0, 0.1)'
-                }}>👑 KING OF THE HILL</div>
-                <div style={{ position: 'relative', display: 'inline-block', zIndex: 100 }}>
-                  <button
-                    style={{
-                      backgroundColor: 'transparent',
-                      border: '2px solid #d4af37',
-                      color: '#d4af37',
-                      padding: '2px 6px',
-                      borderRadius: '4px',
-                      cursor: 'pointer',
-                      fontSize: '0.8rem',
-                      fontWeight: 'bold',
-                      width: '20px',
-                      height: '20px',
-                      display: 'flex',
-                      alignItems: 'center',
-                      justifyContent: 'center',
-                      boxShadow: '0 0 8px rgba(212, 175, 55, 0.3)',
-                      transition: 'all 0.2s ease'
-                    }}
-                    onMouseEnter={() => setShowKothTooltip(true)}
-                    onMouseLeave={() => setShowKothTooltip(false)}
-                  >
-                    ?
-                  </button>
-                  {showKothTooltip && (
-                    <div style={{
-                      position: 'fixed',
-                      backgroundColor: '#1a1a1a',
-                      border: '2px solid #FF6700',
-                      borderRadius: '6px',
-                      padding: '12px 16px',
-                      fontSize: '0.85rem',
-                      color: '#FF6700',
-                      fontWeight: '500',
-                      maxWidth: '300px',
-                      width: '280px',
-                      zIndex: 2147483647,
-                      boxShadow: '0 8px 24px rgba(255, 103, 0, 0.4)',
-                      textShadow: '0 1px 2px rgba(0, 0, 0, 0.5)',
-                      pointerEvents: 'none',
-                      top: '50px',
-                      right: '20px'
-                    }}>
-                      This model was chosen by the Intrafere developers as the CURRENT best overall performer in the MOTO harness, optimized for cost, speed, and knowledge.
-                    </div>
-                  )}
+            {/* Podium - Top 3 */}
+            <div className="models-podium">
+              <div className="models-podium-label">Leaderboard</div>
+              <div className="model-item model-item--ranked model-item--gold">
+                <div className="flex-row-center">
+                  <div className="model-item-name">Kimi K2.5</div>
+                  <div className="ranking-badge ranking-badge--gold">👑 KING OF THE HILL</div>
+                  <div className="tooltip-anchor" style={{ zIndex: 100 }}>
+                    <button
+                      className="info-tooltip-btn info-tooltip-btn--gold"
+                      onMouseEnter={() => setShowKothTooltip(true)}
+                      onMouseLeave={() => setShowKothTooltip(false)}
+                    >
+                      ?
+                    </button>
+                    {showKothTooltip && (
+                      <div className="tooltip-popup tooltip-popup--fixed" style={{ top: '50px', right: '20px' }}>
+                        This model was chosen by the Intrafere developers as the best overall performer in the MOTO harness, optimized for cost, speed, and knowledge.
+                      </div>
+                    )}
+                  </div>
                 </div>
+                <div className="model-item-badge">Highly knowledgeable and balanced cost</div>
               </div>
-              <div className="model-item-badge">Balanced knowledge and speed</div>
-              <div className="model-item-note">(outputs may corrupt over time depending on host)</div>
-            </div>
 
-            {/* Runner Up - Silver */}
-            <div className="model-item" style={{ 
-              backgroundColor: 'linear-gradient(135deg, rgba(192, 192, 192, 0.35) 0%, rgba(192, 192, 192, 0.15) 100%)',
-              borderLeft: '5px solid #c0c0c0',
-              borderRadius: '6px',
-              boxShadow: '0 0 15px rgba(192, 192, 192, 0.3), inset 0 1px 0 rgba(255, 255, 255, 0.15)',
-              paddingLeft: '12px'
-            }}>
-              <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
-                <div className="model-item-name">Grok 4.1 Fast</div>
-                <div style={{
-                  background: 'linear-gradient(135deg, #e8e8e8 0%, #c0c0c0 50%, #a9a9a9 100%)',
-                  color: '#000',
-                  padding: '2px 8px',
-                  borderRadius: '12px',
-                  fontSize: '0.7rem',
-                  fontWeight: 'bold',
-                  boxShadow: '0 2px 8px rgba(192, 192, 192, 0.4), inset 0 1px 0 rgba(255, 255, 255, 0.3)',
-                  textShadow: '0 1px 1px rgba(0, 0, 0, 0.1)'
-                }}>🥈 SILVER</div>
+              <div className="model-item model-item--ranked model-item--silver">
+                <div className="flex-row-center">
+                  <div className="model-item-name">Grok 4.1 Fast</div>
+                  <div className="ranking-badge ranking-badge--silver">🥈 SILVER</div>
+                </div>
+                <div className="model-item-badge">Fast validator</div>
               </div>
-              <div className="model-item-badge">Fast validator</div>
-            </div>
 
-            {/* Bronze - DeepSeek V3.2 */}
-            <div className="model-item" style={{ 
-              backgroundColor: 'linear-gradient(135deg, rgba(205, 127, 50, 0.35) 0%, rgba(205, 127, 50, 0.15) 100%)',
-              borderLeft: '5px solid #cd7f32',
-              borderRadius: '6px',
-              boxShadow: '0 0 15px rgba(205, 127, 50, 0.3), inset 0 1px 0 rgba(255, 255, 255, 0.15)',
-              paddingLeft: '12px'
-            }}>
-              <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
-                <div className="model-item-name">DeepSeek V3.2</div>
-                <div style={{
-                  background: 'linear-gradient(135deg, #d9a574 0%, #cd7f32 50%, #b86f28 100%)',
-                  color: '#fff',
-                  padding: '2px 8px',
-                  borderRadius: '12px',
-                  fontSize: '0.7rem',
-                  fontWeight: 'bold',
-                  boxShadow: '0 2px 8px rgba(205, 127, 50, 0.4), inset 0 1px 0 rgba(255, 255, 255, 0.2)',
-                  textShadow: '0 1px 2px rgba(0, 0, 0, 0.3)'
-                }}>🥉 BRONZE</div>
+              <div className="model-item model-item--ranked model-item--bronze">
+                <div className="flex-row-center">
+                  <div className="model-item-name">GPT OSS 120B</div>
+                  <div className="ranking-badge ranking-badge--bronze">🥉 BRONZE</div>
+                </div>
+                <div className="model-item-badge">Balanced knowledge and speed at low cost</div>
+                <div className="model-item-note">(outputs may corrupt over time depending on host)</div>
               </div>
-              <div className="model-item-badge">Highly knowledgeable</div>
             </div>
 
             {/* Alphabetical list (rest of models) */}
             
             <div className="model-item">
-              <div className="model-item-name">Amazon Nova</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">Claude Opus</div>
+              <div className="model-item-name">Amazon Nova Pro/Premier</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
             <div className="model-item">
-              <div className="model-item-name">Claude Sonnet</div>
+              <div className="model-item-name">Claude Opus/Sonnet</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
             <div className="model-item">
-              <div className="model-item-name">DeepSeek Speciale</div>
+              <div className="model-item-name">DeepSeek</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
@@ -1334,13 +1010,13 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             </div>
             
             <div className="model-item">
-              <div className="model-item-name">Gemini Flash Light</div>
-              <div className="model-item-badge">Fast validator</div>
+              <div className="model-item-name">Gemini Pro</div>
+              <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
             <div className="model-item">
-              <div className="model-item-name">Gemini Pro</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
+              <div className="model-item-name">Google's Gemma</div>
+              <div className="model-item-badge">Balanced knowledge and speed</div>
             </div>
             
             <div className="model-item">
@@ -1348,6 +1024,11 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
+            <div className="model-item">
+              <div className="model-item-name">GLM Turbo</div>
+              <div className="model-item-badge">Fast validator</div>
+            </div>
+            
             <div className="model-item">
               <div className="model-item-name">GPT Codex</div>
               <div className="model-item-badge">Computer science</div>
@@ -1365,13 +1046,18 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             </div>
             
             <div className="model-item">
-              <div className="model-item-name">Kimi K</div>
+              <div className="model-item-name">ChatGPT</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
-            
+
             <div className="model-item">
-              <div className="model-item-name">ChatGPT</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
+              <div className="model-item-name">Inception's Mercury</div>
+              <div className="model-item-badge">Rapid knowledge</div>
+            </div>
+
+            <div className="model-item">
+              <div className="model-item-name">Nemotron Super</div>
+              <div className="model-item-badge">Balanced knowledge and speed</div>
             </div>
 
             <div className="model-item">
@@ -1380,14 +1066,19 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             </div>
             
             <div className="model-item">
-              <div className="model-item-name">Perplexity: Sonar</div>
-              <div className="model-item-badge">Internet search capability</div>
+              <div className="model-item-name">Perplexity's Sonar</div>
+              <div className="model-item-badge">Native internet search capability</div>
             </div>
             
             <div className="model-item">
               <div className="model-item-name">Microsoft's Phi</div>
               <div className="model-item-badge">Balanced knowledge and speed</div>
             </div>
+
+            <div className="model-item">
+              <div className="model-item-name">MiniMax</div>
+              <div className="model-item-badge">Highly knowledgeable</div>
+            </div>
             
             <div className="model-item">
               <div className="model-item-name">Qwen Coder</div>
@@ -1417,23 +1108,26 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             value={selectedProfile}
             onChange={(e) => {
               const value = e.target.value;
-              if (value) {
-                if (!hasOpenRouterKey) {
-                  alert('OpenRouter API key required to use profiles. Please set your API key first.');
-                  return;
-                }
-                if (openRouterModels.length === 0) {
-                  alert('Please wait for OpenRouter models to load, or click "Refresh OpenRouter Models" button below.');
-                  return;
-                }
-                applyProfile(value);
+              if (!value) {
+                setSelectedProfile('');
+                return;
               }
+
+              if (!hasOpenRouterKey) {
+                alert('OpenRouter API key required to use profiles. Please set your API key first.');
+                return;
+              }
+              if (openRouterModels.length === 0) {
+                alert('Please wait for OpenRouter models to load, or click "Refresh OpenRouter Models" button below.');
+                return;
+              }
+              applyProfile(value);
             }}
             disabled={isRunning}
           >
             <option value="">-- Custom Settings --</option>
             <optgroup label="Recommended Profiles">
-              {['recommended_fastest_cheapest', 'recommended_fast_affordable_mid']
+              {RECOMMENDED_PROFILE_KEYS
                 .filter(key => RECOMMENDED_PROFILES[key])
                 .map(key => (
                   <option key={key} value={key}>
@@ -1455,10 +1149,9 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           </select>
           
           <button
-            className="secondary"
+            className="secondary ml-05"
             onClick={() => setShowSaveDialog(true)}
             disabled={isRunning}
-            style={{ marginLeft: '0.5rem' }}
             title="Save current settings as a profile"
           >
             Save as Profile
@@ -1480,27 +1173,10 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
       {/* Save Profile Dialog */}
       {showSaveDialog && (
-        <div style={{
-          position: 'fixed',
-          top: 0,
-          left: 0,
-          right: 0,
-          bottom: 0,
-          backgroundColor: 'rgba(0, 0, 0, 0.7)',
-          display: 'flex',
-          alignItems: 'center',
-          justifyContent: 'center',
-          zIndex: 9999
-        }}>
-          <div style={{
-            backgroundColor: '#1e1e1e',
-            padding: '2rem',
-            borderRadius: '8px',
-            border: '1px solid #333',
-            minWidth: '400px'
-          }}>
+        <div className="inline-modal-overlay">
+          <div className="inline-modal-content">
             <h3 style={{ marginTop: 0 }}>Save Profile</h3>
-            <p style={{ color: '#888' }}>
+            <p className="label--muted">
               Enter a name for this profile. Current settings will be saved.
             </p>
             <input
@@ -1508,15 +1184,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               value={newProfileName}
               onChange={(e) => setNewProfileName(e.target.value)}
               placeholder="Profile name..."
-              style={{
-                width: '100%',
-                padding: '0.5rem',
-                marginBottom: '1rem',
-                backgroundColor: '#2a2a2a',
-                border: '1px solid #444',
-                borderRadius: '4px',
-                color: '#fff'
-              }}
+              className="input-dark"
               onKeyPress={(e) => {
                 if (e.key === 'Enter') {
                   saveCurrentAsProfile();
@@ -1535,15 +1203,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 Cancel
               </button>
               <button
+                className="btn-success-sm"
                 onClick={saveCurrentAsProfile}
-                style={{
-                  padding: '0.5rem 1rem',
-                  backgroundColor: '#4CAF50',
-                  border: 'none',
-                  borderRadius: '4px',
-                  color: '#fff',
-                  cursor: 'pointer'
-                }}
               >
                 Save Profile
               </button>
@@ -1554,21 +1215,15 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
       {/* OpenRouter Status Banner */}
       {!hasOpenRouterKey && (
-        <div style={{
-          backgroundColor: 'rgba(255, 103, 0, 0.1)',
-          border: '1px solid #FF6700',
-          borderRadius: '8px',
-          padding: '1rem',
-          marginBottom: '1.5rem'
-        }}>
-          <p style={{ color: '#FF6700', margin: 0 }}>
+        <div className="openrouter-banner openrouter-banner--orange">
+          <p className="openrouter-banner__text">
             <strong>💡 OpenRouter Available:</strong> Set your OpenRouter API key in the header to enable cloud model selection for any role.
           </p>
         </div>
       )}
 
       {/* Show only free models + model refresh controls — grouped at top */}
-      <div style={{ display: 'flex', flexWrap: 'wrap', alignItems: 'center', gap: '0.5rem', marginBottom: '1rem' }}>
+      <div className="model-refresh-controls">
         <button 
           className="secondary"
           onClick={async () => {
@@ -1599,7 +1254,10 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             >
               🔗 OpenRouter Model List
             </button>
-            <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem', cursor: isRunning ? 'not-allowed' : 'pointer' }}>
+            <label
+              className="settings-checkbox-label model-refresh-controls__toggle"
+              style={{ cursor: isRunning ? 'not-allowed' : 'pointer' }}
+            >
               <input
                 type="checkbox"
                 checked={freeOnly}
@@ -1607,7 +1265,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 disabled={isRunning}
                 style={{ marginRight: '0.5rem' }}
               />
-              Show only free models
+              Free models only
             </label>
           </>
         )}
@@ -1650,14 +1308,11 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         {submitterConfigs.slice(0, numSubmitters).map((cfg, idx) => (
           <div 
             key={idx} 
-            className="submitter-config-section"
-            style={{
-              borderColor: cfg.provider === 'openrouter' ? '#FF6700' : (idx === 0 ? '#4CAF50' : '#333')
-            }}
+            className={`submitter-config-section${cfg.provider === 'openrouter' ? ' role-config-card--openrouter-orange' : (idx === 0 ? ' role-config-card--main' : '')}`}
           >
-            <h5 style={{ color: cfg.provider === 'openrouter' ? '#FF6700' : (idx === 0 ? '#4CAF50' : '#fff') }}>
+            <h5 className={cfg.provider === 'openrouter' ? 'card-title--orange' : (idx === 0 ? 'card-title--green' : '')}>
               {idx === 0 ? 'Submitter 1 (Main Submitter)' : `Submitter ${idx + 1}`}
-              {cfg.provider === 'openrouter' && <span style={{ fontWeight: 'normal', marginLeft: '0.5rem' }}>[OpenRouter]</span>}
+              {cfg.provider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
             </h5>
             
             <ModelSelector
@@ -1711,7 +1366,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       <div className="settings-group">
         <h4>Validator (Single Instance)</h4>
         <p className="settings-info">
-          Single validator maintains coherent Markov chain evolution for database alignment. This models speed will be your biggest bottleneck for the system, however their knowledge is also very important. Choose this model wisely, about half of all API calls will be to this model. A single validator as the markov chain bottleneck for the solution progression is important to mitigate the "alignment problem" with AI and user prompts. This is the model that will reject wrong answers, off-track answers, etc. at all stages of solution creation.
+          This single validator model is the gatekeeper of what gets accepted. This model's speed will be your biggest bottleneck for the system, however its knowledge capability is also very important. Choose this model wisely, about half of all API calls will be to this model so it will also greatly control system cost. This is the model that will reject wrong answers, off-track answers, etc. at all stages of solution creation and all solutions run through a single instance to ensure user alignment (markov-chain style bottleneck).
         </p>
 
         <RoleConfig
@@ -1759,7 +1414,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           title="High-Parameter Submitter"
           hint="Handles mathematical rigor enhancement."
           rolePrefix="high_param"
-          borderColor="#f1c40f"
+          borderColor="#1eff1c"
           localConfig={localConfig}
           handleProviderChange={handleProviderChange}
           handleModelChange={handleModelChange}
@@ -1790,305 +1445,302 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         />
       </div>
 
-      {/* Wolfram Alpha Integration */}
       <div className="settings-group">
-        <h3>Wolfram Alpha Integration (Optional)</h3>
-        <small style={{ color: '#888', display: 'block', marginBottom: '1rem' }}>
-          Enable Wolfram Alpha API for computational verification in rigor mode. Shared with manual compiler mode.
-          Get your API key from <a href="https://products.wolframalpha.com/api" target="_blank" rel="noopener noreferrer">developer.wolframalpha.com</a>
-        </small>
-        
-        <label style={{ display: 'flex', alignItems: 'center', marginBottom: '1rem' }}>
-          <input
-            type="checkbox"
-            checked={wolframEnabled}
-            onChange={async (e) => {
-              const checked = e.target.checked;
-              if (!checked) {
-                // Unchecking - clear key from backend
-                await handleClearWolframKey();
-              } else {
-                // Checking - just show UI (key will be saved on Test Connection)
-                setWolframEnabled(true);
-              }
-            }}
-            style={{ marginRight: '0.75rem' }}
-          />
-          <span style={{ fontWeight: '500' }}>Enable Wolfram Alpha Verification in Rigor Mode</span>
-        </label>
-        
-        {wolframEnabled && (
-          <div style={{ marginLeft: '1.75rem', marginTop: '1rem' }}>
-            <div className="form-group">
-              <label>Wolfram Alpha API Key:</label>
-              <input
-                type="password"
-                value={wolframApiKey}
-                onChange={(e) => setWolframApiKey(e.target.value)}
-                placeholder="Enter your Wolfram Alpha App ID"
-                style={{
-                  padding: '0.6rem',
-                  backgroundColor: '#1e1e1e',
-                  border: '1px solid #444',
-                  borderRadius: '4px',
-                  color: '#fff',
-                  width: '100%',
-                  marginBottom: '0.75rem'
-                }}
-              />
-            </div>
-            
-            <div style={{ display: 'flex', gap: '0.75rem', marginTop: '1rem' }}>
-              <button 
-                onClick={handleTestWolframConnection}
-                disabled={testingWolfram}
-                style={{
-                  padding: '0.6rem 1.25rem',
-                  backgroundColor: '#4CAF50',
-                  border: 'none',
-                  borderRadius: '4px',
-                  color: '#fff',
-                  cursor: testingWolfram ? 'wait' : 'pointer',
-                  opacity: testingWolfram ? 0.6 : 1,
-                  fontWeight: '500'
-                }}
-              >
-                {testingWolfram ? 'Testing...' : 'Test Connection'}
-              </button>
-              
-              <button 
-                onClick={handleClearWolframKey}
-                style={{
-                  padding: '0.6rem 1.25rem',
-                  backgroundColor: 'transparent',
-                  border: '1px solid #666',
-                  borderRadius: '4px',
-                  color: '#888',
-                  cursor: 'pointer'
-                }}
-              >
-                Clear Key
-              </button>
-            </div>
-            
-            {wolframTestResult && (
-              <div style={{ 
-                marginTop: '1rem', 
-                padding: '0.75rem', 
-                borderRadius: '4px',
-                backgroundColor: wolframTestResult.includes('✓') ? '#1a3a1a' : '#3a1a1a',
-                color: wolframTestResult.includes('✓') ? '#4CAF50' : '#ff6b6b',
-                fontSize: '0.9rem'
-              }}>
-                {wolframTestResult}
+        <div
+          className="collapsible-trigger settings-trigger--multiline"
+          onClick={() => setAdvancedSettingsExpanded(prev => !prev)}
+          onKeyDown={(event) => handleCollapsibleKeyDown(event, () => setAdvancedSettingsExpanded(prev => !prev))}
+          role="button"
+          tabIndex={0}
+          aria-expanded={advancedSettingsExpanded}
+          aria-controls="advanced-settings-panel"
+          style={{ marginBottom: advancedSettingsExpanded ? '1rem' : 0 }}
+        >
+          <div className="settings-heading-stack">
+            <h4 className="form-group--compact">Advanced Settings</h4>
+            <p className="settings-subsection-description">
+              Optional integrations, Stage 3 controls, prompt customization, interface polish, and OpenRouter fallback behavior.
+            </p>
+          </div>
+          <span className={`collapse-chevron${advancedSettingsExpanded ? ' collapse-chevron--open' : ''}`} aria-hidden="true">▼</span>{/* decorative glyph; expanded state is exposed via aria-expanded on the trigger */}
+        </div>
+
+        {advancedSettingsExpanded && (
+          <div className="collapsible-body settings-advanced-content" id="advanced-settings-panel">
+            {isRunning && (
+              <div className="settings-notice">
+                Settings cannot be changed while autonomous research is running.
               </div>
             )}
-            
-            <small style={{ color: '#888', display: 'block', marginTop: '1rem', lineHeight: '1.5' }}>
-              In rigor mode, the AI can request Wolfram Alpha verification of mathematical claims. 
-              This enables computational checking of theorems, solving equations, and verifying properties.
-              This setting is shared with the manual compiler mode.
-            </small>
-          </div>
-        )}
-      </div>
 
-      {/* Tier 3 Final Answer Toggle */}
-      <div className="settings-group" style={{ borderLeft: '4px solid #ff6b6b', paddingLeft: '12px' }}>
-        <h4>Stage 3: Final Answer Generation</h4>
-        <p className="settings-info">
-          Feature in construction. Enabling this is optional and not recommended. Stage 3 is a highly experimental mode. Most users should not enable this feature — it is expensive and wasteful at this current stage of development. When enabled, the system will automatically synthesize all completed Stage 2 papers into a final answer that is often book-length or greater. This feature is highly hallucinatory — Stage 2 papers are the recommended final output. Disabled by default; final paper quality is currently much lower than Stage 2 papers. Once optimized and better-functioning, this mode will be advertised more.
-        </p>
-        <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.95rem', cursor: isRunning ? 'not-allowed' : 'pointer' }}>
-          <input
-            type="checkbox"
-            checked={tier3Enabled}
-            onChange={(e) => setTier3Enabled(e.target.checked)}
-            disabled={isRunning}
-            style={{ marginRight: '0.5rem' }}
-          />
-          Enable Stage 3 Final Answer Generation (Very Experimental)
-        </label>
-      </div>
+            {/* Wolfram Alpha Integration */}
+            <div className="settings-subsection">
+              <div className="settings-subsection-header">
+                <h5 className="settings-subsection-title">Integrations</h5>
+                <p className="settings-subsection-description">
+                  Optional external verification tools used by rigor mode.
+                </p>
+              </div>
 
-      {/* Validator Critique Prompt Editor */}
-      <div className="settings-group">
-        <div 
-          className="collapsible-header"
-          onClick={() => setCritiquePromptExpanded(!critiquePromptExpanded)}
-          style={{
-            display: 'flex',
-            alignItems: 'center',
-            justifyContent: 'space-between',
-            cursor: 'pointer',
-            padding: '0.75rem',
-            backgroundColor: '#1e1e1e',
-            borderRadius: '6px',
-            border: '1px solid #333',
-            marginBottom: critiquePromptExpanded ? '1rem' : 0,
-            width: '100%',
-            maxWidth: '100%',
-            boxSizing: 'border-box'
-          }}
-        >
-          <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
-            <h4 style={{ margin: 0 }}>[OPTIONAL] Edit Validator Critique Prompt (for the user feedback mode on individual papers - this is not for the critique submitter used for the internal research workflow)</h4>
-            {isUsingCustomCritiquePrompt && (
-              <span style={{
-                backgroundColor: '#9b59b6',
-                color: '#fff',
-                padding: '2px 8px',
-                borderRadius: '12px',
-                fontSize: '0.7rem',
-                fontWeight: 'bold'
-              }}>CUSTOM</span>
-            )}
-          </div>
-          <span style={{ 
-            transform: critiquePromptExpanded ? 'rotate(180deg)' : 'rotate(0deg)',
-            transition: 'transform 0.2s',
-            fontSize: '1.2rem'
-          }}>▼</span>
-        </div>
+              <h4 className="form-group--compact">Wolfram Alpha Integration (Optional)</h4>
+              <small className="hint-text">
+                Enable Wolfram Alpha API for computational verification in rigor mode. Shared with manual compiler mode.
+                Get your API key from <a href="https://products.wolframalpha.com/api" target="_blank" rel="noopener noreferrer">products.wolframalpha.com/api</a>{/* link text mirrors the href so the visible destination is accurate */}
+              </small>
+
+              <label className="settings-checkbox-label settings-checkbox-label--stacked">
+                <input
+                  type="checkbox"
+                  checked={wolframEnabled}
+                  onChange={async (e) => {
+                    const checked = e.target.checked;
+                    if (!checked) {
+                      await handleClearWolframKey(); // Unchecking - clear key from backend
+                    } else {
+                      setWolframEnabled(true); // Checking - just show UI (key will be saved on Test Connection)
+                    }
+                  }}
+                />
+                <span className="settings-option-copy">
+                  <span className="settings-option-title">Enable Wolfram Alpha Verification in Rigor Mode</span>
+                  <span className="settings-option-description">
+                    Lets rigor mode request computational verification for equations, properties, and theorem checks.
+                  </span>
+                </span>
+              </label>
+
+              {wolframEnabled && (
+                <div className="indented-section">
+                  <div className="form-group">
+                    <label>Wolfram Alpha API Key:</label>
+                    <input
+                      type="password"
+                      value={wolframApiKey}
+                      onChange={(e) => setWolframApiKey(e.target.value)}
+                      placeholder="Enter your Wolfram Alpha App ID"
+                      className="input-dark"
+                    />
+                  </div>
+
+                  <div style={{ display: 'flex', gap: '0.75rem', marginTop: '1rem' }}>
+                    <button
+                      className="btn-success-sm"
+                      onClick={handleTestWolframConnection}
+                      disabled={testingWolfram}
+                      style={testingWolfram ? { cursor: 'wait', opacity: 0.6 } : undefined}
+                    >
+                      {testingWolfram ? 'Testing...' : 'Test Connection'}
+                    </button>
+
+                    <button
+                      className="btn-ghost"
+                      onClick={handleClearWolframKey}
+                    >
+                      Clear Key
+                    </button>
+                  </div>
+
+                  {wolframTestResult && (
+                    <div className={`test-result-banner ${wolframTestResult.includes('✓') ? 'test-result-banner--success' : 'test-result-banner--error'}`}>
+                      {wolframTestResult}
+                    </div>
+                  )}
 
-        {critiquePromptExpanded && (
-          <div style={{
-            padding: '1rem',
-            backgroundColor: '#1a1a1a',
-            borderRadius: '6px',
-            border: '1px solid #333'
-          }}>
-            <p style={{ color: '#888', fontSize: '0.85rem', marginBottom: '1rem' }}>
-              Customize the prompt sent to your validator when requesting a paper critique. 
-              The JSON output schema is automatically appended and cannot be modified.
-            </p>
+                  <small className="hint-text">
+                    In rigor mode, the AI can request Wolfram Alpha verification of mathematical claims.
+                    This enables computational checking of theorems, solving equations, and verifying properties.
+                    This setting is shared with the manual compiler mode.
+                  </small>
+                </div>
+              )}
+            </div>
 
-            <textarea
-              value={customCritiquePrompt}
-              onChange={(e) => setCustomCritiquePrompt(e.target.value)}
-              style={{
-                width: '100%',
-                minHeight: '200px',
-                padding: '0.75rem',
-                backgroundColor: '#2a2a2a',
-                border: '1px solid #444',
-                borderRadius: '4px',
-                color: '#fff',
-                fontFamily: 'monospace',
-                fontSize: '0.85rem',
-                resize: 'vertical',
-                lineHeight: '1.5'
-              }}
-              placeholder="Enter your custom critique prompt..."
-            />
+            {/* Tier 3 Final Answer Toggle */}
+            <div className="settings-subsection settings-subsection--accent-danger">
+              <div className="settings-subsection-header">
+                <h5 className="settings-subsection-title">Experimental / Ending Options</h5>
+              </div>
+              <h4 className="form-group--compact">Stage 3: Final Answer Generation</h4>
+              <p className="settings-info">
+                Feature in construction. Enabling this is optional and not recommended. Stage 3 is a highly experimental mode. Most users should not enable this feature — it is expensive and wasteful at this current stage of development. When enabled, the system will automatically synthesize all completed Stage 2 papers into a final answer that is often book-length or greater. This feature is highly hallucinatory — Stage 2 papers are the recommended final output. Disabled by default; final paper quality is currently much lower than Stage 2 papers. Once optimized and better-functioning, this mode will be advertised more.
+              </p>
+              <label className="settings-checkbox-label settings-checkbox-label--stacked" style={{ cursor: isRunning ? 'not-allowed' : 'pointer' }}>
+                <input
+                  type="checkbox"
+                  checked={tier3Enabled}
+                  onChange={(e) => setTier3Enabled(e.target.checked)}
+                  disabled={isRunning}
+                />
+                <span className="settings-option-copy">
+                  <span className="settings-option-title">Enable Stage 3 Final Answer Generation (Very Experimental)</span>
+                  <span className="settings-option-description">
+                    Allows the system to synthesize completed Stage 2 papers into a final answer after enough papers accumulate.
+                  </span>
+                </span>
+              </label>
+            </div>
 
-            <div style={{ 
-              display: 'flex', 
-              justifyContent: 'space-between', 
-              alignItems: 'center',
-              marginTop: '1rem' 
-            }}>
-              <button
-                onClick={handleRestoreCritiquePrompt}
-                style={{
-                  padding: '0.5rem 1rem',
-                  backgroundColor: 'transparent',
-                  border: '1px solid #666',
-                  borderRadius: '4px',
-                  color: '#888',
-                  cursor: 'pointer',
-                  fontSize: '0.85rem'
-                }}
+            {/* Validator Critique Prompt Editor */}
+            <div className="settings-subsection">
+              <div className="settings-subsection-header">
+                <h5 className="settings-subsection-title">Prompt Customization</h5>
+                <p className="settings-subsection-description">
+                  Optional tweaks for the user-facing paper critique prompt only.
+                </p>
+              </div>
+
+              <div
+                className="collapsible-trigger settings-trigger--multiline"
+                onClick={() => setCritiquePromptExpanded(prev => !prev)}
+                onKeyDown={(event) => handleCollapsibleKeyDown(event, () => setCritiquePromptExpanded(prev => !prev))}
+                role="button"
+                tabIndex={0}
+                aria-expanded={critiquePromptExpanded}
+                aria-controls="critique-prompt-panel"
+                style={{ marginBottom: critiquePromptExpanded ? '1rem' : 0 }}
               >
-                Restore to Default
-              </button>
+                <div className="settings-trigger-copy">
+                  <div className="settings-trigger-title-row">
+                    <h4 className="form-group--compact settings-trigger-title">Edit Validator Critique Prompt</h4>
+                    {isUsingCustomCritiquePrompt && (
+                      <span className="tag-badge tag-badge--purple">CUSTOM</span>
+                    )}
+                  </div>
+                  <p className="settings-subsection-description">
+                    Optional prompt customization for the user-facing paper critique mode only. This does not affect the internal critique submitter used during autonomous research.
+                  </p>
+                </div>
+                <span className={`collapse-chevron${critiquePromptExpanded ? ' collapse-chevron--open' : ''}`} aria-hidden="true">▼</span>{/* decorative glyph; expanded state is exposed via aria-expanded on the trigger */}
+              </div>
 
-              <div style={{ display: 'flex', alignItems: 'center', gap: '0.75rem' }}>
-                {critiquePromptSaved && (
-                  <span style={{ color: '#4CAF50', fontSize: '0.85rem' }}>✓ Saved!</span>
-                )}
-                <button
-                  onClick={handleSaveCritiquePrompt}
-                  style={{
-                    padding: '0.5rem 1.5rem',
-                    backgroundColor: '#9b59b6',
-                    border: 'none',
-                    borderRadius: '4px',
-                    color: '#fff',
-                    cursor: 'pointer',
-                    fontWeight: '500',
-                    fontSize: '0.85rem'
-                  }}
-                >
-                  Save Prompt
-                </button>
+              {critiquePromptExpanded && (
+                <div className="collapsible-body" id="critique-prompt-panel">
+                  <p className="hint-text">
+                    Customize the prompt sent to your validator when requesting a paper critique.
+                    The JSON output schema is automatically appended and cannot be modified.
+                  </p>
+
+                  <textarea
+                    value={customCritiquePrompt}
+                    onChange={(e) => setCustomCritiquePrompt(e.target.value)}
+                    className="textarea-dark-mono"
+                    placeholder="Enter your custom critique prompt..."
+                  />
+
+                  <div className="actions-row">
+                    <button
+                      className="btn-ghost"
+                      onClick={handleRestoreCritiquePrompt}
+                    >
+                      Restore to Default
+                    </button>
+
+                    <div style={{ display: 'flex', alignItems: 'center', gap: '0.75rem' }}>
+                      {critiquePromptSaved && (
+                        <span className="status-success-text">✓ Saved!</span>
+                      )}
+                      <button
+                        className="btn-accent-purple"
+                        onClick={handleSaveCritiquePrompt}
+                      >
+                        Save Prompt
+                      </button>
+                    </div>
+                  </div>
+                </div>
+              )}
+            </div>
+
+            <div className="settings-subsection">
+              <div className="settings-subsection-header">
+                <h5 className="settings-subsection-title">Interface</h5>
+                <p className="settings-subsection-description">
+                  Display-only controls for the autonomous research UI.
+                </p>
               </div>
+
+              <label className="settings-checkbox-label settings-checkbox-label--stacked">
+                <input
+                  type="checkbox"
+                  checked={(() => {
+                    const saved = localStorage.getItem('banner_shimmer_enabled');
+                    try { return saved === null ? true : Boolean(JSON.parse(saved)); } catch { return true; } // default on; a malformed stored value must not crash render
+                  })()}
+                  onChange={(e) => {
+                    localStorage.setItem('banner_shimmer_enabled', JSON.stringify(e.target.checked));
+                    window.location.reload(); // Reload to apply change
+                  }}
+                />
+                <span className="settings-option-copy">
+                  <span className="settings-option-title">Enable banner shimmer</span>
+                  <span className="settings-option-description">
+                    Keeps the animated banner shimmer on. Disable this when recording video to reduce motion and visual noise.
+                  </span>
+                </span>
+              </label>
             </div>
+
+            {/* Free model looping/auto-selector options */}
+            {hasOpenRouterKey && (
+              <div className="settings-subsection">
+                <div className="settings-subsection-header">
+                  <h5 className="settings-subsection-title">OpenRouter Fallback</h5>
+                  <p className="settings-subsection-description">
+                    Fallback behavior for OpenRouter free-model rate limits.
+                  </p>
+                </div>
+
+                <div className="checkbox-group-col">
+                  <label className="settings-checkbox-label settings-checkbox-label--stacked">
+                    <input
+                      type="checkbox"
+                      checked={freeModelLooping}
+                      onChange={(e) => {
+                        setFreeModelLooping(e.target.checked);
+                        openRouterAPI.setFreeModelSettings(e.target.checked, freeModelAutoSelector).catch((err) => console.warn('Failed to save free model settings:', err)); // still best-effort, but a failed save is now logged instead of silently dropped
+                      }}
+                    />
+                    <span className="settings-option-copy">
+                      <span className="settings-option-title">
+                        Enable Free Model Looping
+                        <span
+                          title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits."
+                          className="help-hint"
+                        >(?)</span>
+                      </span>
+                      <span className="settings-option-description">
+                        Automatically rotate to the next selected free model when one hits a rate limit.
+                      </span>
+                    </span>
+                  </label>
+                  <label className="settings-checkbox-label settings-checkbox-label--stacked">
+                    <input
+                      type="checkbox"
+                      checked={freeModelAutoSelector}
+                      onChange={(e) => {
+                        setFreeModelAutoSelector(e.target.checked);
+                        openRouterAPI.setFreeModelSettings(freeModelLooping, e.target.checked).catch((err) => console.warn('Failed to save free model settings:', err)); // still best-effort, but a failed save is now logged instead of silently dropped
+                      }}
+                    />
+                    <span className="settings-option-copy">
+                      <span className="settings-option-title">
+                        Use OpenRouter Free Models Auto-Selector as Backup
+                        <span
+                          title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping."
+                          className="help-hint"
+                        >(?)</span>
+                      </span>
+                      <span className="settings-option-description">
+                        Falls back to OpenRouter&apos;s free router when every selected free model is temporarily exhausted.
+                      </span>
+                    </span>
+                  </label>
+                </div>
+              </div>
+            )}
           </div>
         )}
       </div>
-
-      <div style={{ marginTop: '1rem' }}>
-        <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
-          <input
-            type="checkbox"
-            checked={(() => {
-              const saved = localStorage.getItem('banner_shimmer_enabled');
-              return saved !== null ? JSON.parse(saved) : true;
-            })()}
-            onChange={(e) => {
-              localStorage.setItem('banner_shimmer_enabled', JSON.stringify(e.target.checked));
-              window.location.reload(); // Reload to apply change
-            }}
-            style={{ marginRight: '0.5rem' }}
-          />
-          Enable banner shimmer (disable for video recording)
-        </label>
-      </div>
-
-      {isRunning && (
-        <div className="settings-notice">
-          Settings cannot be changed while autonomous research is running.
-        </div>
-      )}
-
-      {/* Free model looping/auto-selector options */}
-      {hasOpenRouterKey && (
-        <div style={{ display: 'flex', flexDirection: 'column', gap: '0.4rem', marginTop: '0.5rem' }}>
-          <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
-            <input
-              type="checkbox"
-              checked={freeModelLooping}
-              onChange={(e) => {
-                setFreeModelLooping(e.target.checked);
-                openRouterAPI.setFreeModelSettings(e.target.checked, freeModelAutoSelector).catch(() => {});
-              }}
-              style={{ marginRight: '0.5rem' }}
-            />
-            Enable Free Model Looping
-            <span
-              title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits."
-              style={{ marginLeft: '0.4rem', cursor: 'help', color: '#888', fontSize: '0.85rem' }}
-            >(?)</span>
-          </label>
-          <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
-            <input
-              type="checkbox"
-              checked={freeModelAutoSelector}
-              onChange={(e) => {
-                setFreeModelAutoSelector(e.target.checked);
-                openRouterAPI.setFreeModelSettings(freeModelLooping, e.target.checked).catch(() => {});
-              }}
-              style={{ marginRight: '0.5rem' }}
-            />
-            Use OpenRouter Free Models Auto-Selector as Backup
-            <span
-              title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping."
-              style={{ marginLeft: '0.4rem', cursor: 'help', color: '#888', fontSize: '0.85rem' }}
-            >(?)</span>
-          </label>
-        </div>
-      )}
     </div>
     </div>
   );
diff --git a/frontend/src/components/autonomous/BrainstormList.jsx b/frontend/src/components/autonomous/BrainstormList.jsx
index 461feec..40183b2 100644
--- a/frontend/src/components/autonomous/BrainstormList.jsx
+++ b/frontend/src/components/autonomous/BrainstormList.jsx
@@ -6,6 +6,7 @@ import React, { useState, useEffect, useRef } from 'react';
 import './AutonomousResearch.css';
 import { websocket } from '../../services/websocket';
 import LatexRenderer from '../LatexRenderer';
+import { prependDisclaimer } from '../../utils/disclaimerHelper';
 
 const BrainstormList = ({ brainstorms, onRefresh, api }) => {
   const [expandedId, setExpandedId] = useState(null);
@@ -117,7 +118,7 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
     e.stopPropagation();
     if (!fileContent) return;
     
-    const blob = new Blob([fileContent], { type: 'text/plain' });
+    const blob = new Blob([prependDisclaimer(fileContent, 'brainstorm')], { type: 'text/plain' });
     const url = URL.createObjectURL(blob);
     const a = document.createElement('a');
     a.href = url;
@@ -145,7 +146,7 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
         <div className="brainstorm-list-warning">
           (WARNING: Any given brainstorm idea may be pruned/deleted if the AI deems it to hurt the collective database quality)
         </div>
-        <div className="empty-state">
+        <div className="auto-empty-state">
           No brainstorm topics yet. Start autonomous research to create brainstorms.
         </div>
       </div>
@@ -186,7 +187,7 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
 
             <div className="brainstorm-card-meta">
               <span>{brainstorm.submission_count} submissions</span>
-              <span>{brainstorm.papers_generated?.length || 0} papers</span>
+              <span>{brainstorm.papers_generated?.length || 0}/3 papers</span>
               <span>Last: {formatDate(brainstorm.last_activity)}</span>
             </div>
 
@@ -249,7 +250,7 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
                   </div>
                   <div className="brainstorm-content-viewer" onClick={(e) => e.stopPropagation()}>
                     <LatexRenderer
-                      content={fileContent}
+                      content={prependDisclaimer(fileContent, 'brainstorm')}
                       className="brainstorm-latex-renderer"
                       showToggle={false}
                       showLatex={showLatex}
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.css b/frontend/src/components/autonomous/FinalAnswerLibrary.css
index 55852ff..013721b 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.css
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.css
@@ -17,7 +17,7 @@
 }
 
 .library-header h2 {
-  color: #ffd700;
+  color: var(--gold, #1eff1c);
   font-size: 2rem;
   margin-bottom: 10px;
 }
@@ -36,13 +36,13 @@
 }
 
 .stat-badge {
-  background: linear-gradient(135deg, #2a2a2a 0%, #3a3a3a 100%);
+  background: linear-gradient(135deg, var(--surface-3, #22222c) 0%, var(--surface-4, #2a2a36) 100%);
   padding: 8px 16px;
-  border-radius: 6px;
-  color: #ffd700;
+  border-radius: var(--radius-sm, 6px);
+  color: var(--gold, #1eff1c);
   font-weight: 600;
   font-size: 0.9rem;
-  border: 1px solid #444;
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
 }
 
 /* ============================================================================
@@ -61,17 +61,18 @@
   flex: 1;
   min-width: 250px;
   padding: 12px 16px;
-  background: #2a2a2a;
-  border: 2px solid #444;
-  border-radius: 8px;
-  color: #fff;
+  background: var(--surface-3, #22222c);
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
+  border-radius: var(--radius-md, 10px);
+  color: var(--text-primary, #e4e4ec);
   font-size: 0.95rem;
   transition: border-color 0.3s;
 }
 
 .search-input:focus {
   outline: none;
-  border-color: #ffd700;
+  border-color: var(--gold, #1eff1c);
+  box-shadow: 0 0 0 3px var(--gold-glow, rgba(30, 255, 28, 0.12));
 }
 
 .search-input::placeholder {
@@ -100,12 +101,99 @@
 }
 
 .filter-buttons button.active {
-  background: linear-gradient(135deg, #ffd700 0%, #ffed4e 100%);
-  border-color: #ffd700;
+  background: linear-gradient(135deg, #1eff1c 0%, #7dff6f 100%);
+  border-color: #1eff1c;
   color: #000;
   font-weight: 600;
 }
 
+/* ============================================================================
+   RESEARCH RUN GROUPS
+   ============================================================================ */
+
+.run-history-groups { /* vertical stack holding one section per research run */
+  display: flex;
+  flex-direction: column;
+  gap: 22px;
+}
+
+.run-history-group { /* card wrapping a single run: header plus its answer list */
+  background: linear-gradient(180deg, rgba(30, 255, 28, 0.05) 0%, rgba(34, 34, 44, 0.9) 100%);
+  border: 1px solid rgba(30, 255, 28, 0.14);
+  border-radius: 14px;
+  padding: 18px;
+  box-shadow: 0 10px 24px rgba(0, 0, 0, 0.16);
+}
+
+.run-history-group-header { /* heading block and badge block pushed to opposite ends */
+  display: flex;
+  justify-content: space-between;
+  gap: 16px;
+  align-items: flex-start;
+  margin-bottom: 16px;
+  padding-bottom: 14px;
+  border-bottom: 1px solid rgba(255, 255, 255, 0.08); /* divider above the group body */
+}
+
+.run-history-group-heading {
+  flex: 1;
+  min-width: 0; /* lets this flex item shrink below its content width */
+}
+
+.run-history-group-title {
+  margin: 0 0 8px;
+  color: var(--gold, #1eff1c); /* accent token; the literal is only the fallback */
+  font-size: 1.15rem;
+  line-height: 1.35;
+}
+
+.run-history-group-subtitle {
+  margin: 0;
+  color: #b9b9c6;
+  font-size: 0.88rem;
+  line-height: 1.45;
+}
+
+.run-history-group-subtitle + .run-history-group-subtitle { /* only between consecutive subtitles */
+  margin-top: 4px;
+}
+
+.run-history-group-badges {
+  display: flex;
+  flex-wrap: wrap;
+  justify-content: flex-end; /* wrapped rows stay aligned to the right edge */
+  gap: 8px;
+}
+
+.run-history-group-badge { /* neutral base badge; the modifiers below recolor it */
+  display: inline-flex;
+  align-items: center;
+  padding: 6px 12px;
+  border-radius: 999px; /* radius larger than the badge, giving a pill shape */
+  background: rgba(255, 255, 255, 0.07);
+  border: 1px solid rgba(255, 255, 255, 0.1);
+  color: #d7d7df;
+  font-size: 0.8rem;
+  font-weight: 600;
+  white-space: nowrap; /* keep each badge label on a single line */
+}
+
+.run-history-group-badge--current { /* green variant */
+  background: rgba(30, 255, 28, 0.16);
+  border-color: rgba(30, 255, 28, 0.32);
+  color: #b7ffb6;
+}
+
+.run-history-group-badge--linked { /* blue variant */
+  background: rgba(46, 134, 222, 0.18);
+  border-color: rgba(46, 134, 222, 0.34);
+  color: #b9ddff;
+}
+
+.run-history-group-body { /* wrapper around the run's answer list */
+  display: block;
+}
+
 /* ============================================================================
    ANSWER LIST
    ============================================================================ */
@@ -117,21 +205,25 @@
 }
 
 .answer-card {
-  background: #2a2a2a;
-  border: 2px solid #444;
-  border-radius: 10px;
+  background: var(--surface-3, #22222c);
+  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
+  border-radius: var(--radius-md, 10px);
   overflow: hidden;
   transition: all 0.3s;
 }
 
 .answer-card:hover {
-  border-color: #ffd700;
-  box-shadow: 0 4px 12px rgba(255, 215, 0, 0.1);
+  border-color: var(--gold-dim, #18cc17);
+  box-shadow: 0 4px 16px rgba(30, 255, 28, 0.08);
 }
 
 .answer-card.expanded {
-  border-color: #ffd700;
-  box-shadow: 0 8px 20px rgba(255, 215, 0, 0.15);
+  border-color: var(--gold-dim, #18cc17);
+  box-shadow: 0 8px 24px rgba(30, 255, 28, 0.12);
+}
+
+.run-history-group .answer-list {
+  gap: 14px;
 }
 
 /* ============================================================================
@@ -156,7 +248,7 @@
 }
 
 .answer-title {
-  color: #ffd700;
+  color: var(--gold, #1eff1c);
   font-size: 1.3rem;
   margin: 0;
   flex: 1;
@@ -165,7 +257,7 @@
 .expand-button {
   background: transparent;
   border: none;
-  color: #ffd700;
+  color: #1eff1c;
   font-size: 1.2rem;
   cursor: pointer;
   padding: 5px 10px;
@@ -216,7 +308,7 @@
 }
 
 .answer-prompt strong {
-  color: #ffd700;
+  color: var(--gold, #1eff1c); /* accent token, as used by .answer-title; literal is the fallback */
 }
 
 .answer-footer-info {
@@ -291,9 +383,9 @@
    ============================================================================ */
 
 .answer-content {
-  border-top: 2px solid #444;
+  border-top: 1px solid var(--border-default, rgba(255,255,255,0.1));
   padding: 20px;
-  background: #1a1a1a;
+  background: var(--surface-2, #1a1a22);
 }
 
 .content-actions {
@@ -329,7 +421,7 @@
 }
 
 .chapter-list h4 {
-  color: #ffd700;
+  color: var(--gold, #1eff1c); /* accent token, as used by .answer-title; literal is the fallback */
   margin-bottom: 10px;
 }
 
@@ -373,7 +465,7 @@
    EMPTY STATE
    ============================================================================ */
 
-.empty-state {
+.fal-empty-state {
   text-align: center;
   padding: 60px 20px;
   color: #888;
@@ -385,13 +477,13 @@
   margin-bottom: 20px;
 }
 
-.empty-state h3 {
+.fal-empty-state h3 {
   color: #ccc;
   font-size: 1.5rem;
   margin-bottom: 10px;
 }
 
-.empty-state p {
+.fal-empty-state p {
   font-size: 1rem;
 }
 
@@ -402,7 +494,7 @@
 .loading-spinner {
   text-align: center;
   padding: 40px;
-  color: #ffd700;
+  color: var(--gold, #1eff1c); /* accent token, as used by .library-header h2; literal is the fallback */
   font-size: 1.2rem;
   animation: spin 2s linear infinite;
 }
@@ -461,9 +553,9 @@
 .refresh-button {
   padding: 12px 24px;
   background: linear-gradient(135deg, #2a2a2a 0%, #3a3a3a 100%);
-  border: 2px solid #ffd700;
+  border: 2px solid #1eff1c;
   border-radius: 8px;
-  color: #ffd700;
+  color: #1eff1c;
   font-size: 0.95rem;
   font-weight: 600;
   cursor: pointer;
@@ -473,7 +565,7 @@
 .refresh-button:hover {
   background: linear-gradient(135deg, #3a3a3a 0%, #4a4a4a 100%);
   transform: translateY(-2px);
-  box-shadow: 0 4px 12px rgba(255, 215, 0, 0.2);
+  box-shadow: 0 4px 12px rgba(30, 255, 28, 0.2);
 }
 
 /* ============================================================================
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
index 6d2d9a4..24a963f 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
@@ -3,6 +3,8 @@ import LatexRenderer from '../LatexRenderer';
 import PaperCritiqueModal from '../PaperCritiqueModal';
 import { autonomousAPI } from '../../services/api';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
+import { prependDisclaimer } from '../../utils/disclaimerHelper';
+import { buildResearchRunGroups } from '../../utils/researchRunHistory';
 import './FinalAnswerLibrary.css';
 
 /**
@@ -21,6 +23,8 @@ import './FinalAnswerLibrary.css';
  */
 function FinalAnswerLibrary() {
   const [finalAnswers, setFinalAnswers] = useState([]);
+  const [stage2Papers, setStage2Papers] = useState([]);
+  const [sessionsResponse, setSessionsResponse] = useState(null);
   const [loading, setLoading] = useState(true);
   const [error, setError] = useState(null);
   const [expandedId, setExpandedId] = useState(null);
@@ -42,15 +46,41 @@ function FinalAnswerLibrary() {
     try {
       setLoading(true);
       setError(null);
-      
-      const response = await fetch('/api/auto-research/final-answer-library');
-      const data = await response.json();
-      
-      if (data.success) {
-        setFinalAnswers(data.final_answers || []);
+
+      const [answersResult, sessionsResult, papersResult] = await Promise.allSettled([
+        fetch('/api/auto-research/final-answer-library').then(async (response) => {
+          if (!response.ok) {
+            throw new Error('Failed to load final answer library');
+          }
+          return response.json();
+        }),
+        autonomousAPI.getSessions(),
+        autonomousAPI.getPaperHistory(),
+      ]);
+
+      if (answersResult.status !== 'fulfilled') {
+        throw answersResult.reason;
+      }
+
+      if (answersResult.value.success) {
+        setFinalAnswers(answersResult.value.final_answers || []);
       } else {
         setError('Failed to load final answer library');
       }
+
+      if (sessionsResult.status === 'fulfilled') {
+        setSessionsResponse(sessionsResult.value);
+      } else {
+        setSessionsResponse(null);
+        console.warn('Stage 3 history: failed to load sessions metadata', sessionsResult.reason);
+      }
+
+      if (papersResult.status === 'fulfilled') {
+        setStage2Papers(papersResult.value?.papers || []); // optional metadata: an empty payload must not fail the whole load
+      } else {
+        setStage2Papers([]);
+        console.warn('Stage 3 history: failed to load Stage 2 paper metadata', papersResult.reason);
+      }
     } catch (err) {
       setError(`Error loading library: ${err.message}`);
       console.error('Failed to load final answer library:', err);
@@ -89,7 +119,7 @@ function FinalAnswerLibrary() {
       return;
     }
 
-    const blob = new Blob([expandedContent.content], { type: 'text/plain' });
+    const blob = new Blob([prependDisclaimer(expandedContent.content, 'paper')], { type: 'text/plain' });
     const url = URL.createObjectURL(blob);
     const a = document.createElement('a');
     a.href = url;
@@ -110,7 +140,7 @@ function FinalAnswerLibrary() {
       
       if (data.success && data.content) {
         const filename = sanitizeFilename(`Final_Answer_${answer.title}`);
-        downloadRawText(data.content, filename, null);
+        downloadRawText(data.content, filename, null, 'paper');
       } else {
         alert('Failed to load content for download');
       }
@@ -157,6 +187,7 @@ function FinalAnswerLibrary() {
           console.error('PDF generation failed:', error);
           alert(`PDF generation failed: ${error.message}`);
         },
+        'paper',
       );
     } catch (error) {
       setDownloadingPDF(null);
@@ -188,30 +219,47 @@ function FinalAnswerLibrary() {
     }
   };
 
-  // Filter final answers
-  const filteredAnswers = finalAnswers.filter(answer => {
-    // Format filter
-    if (filterFormat !== 'all' && answer.format !== filterFormat) {
-      return false;
-    }
+  const runGroups = useMemo(() => (
+    buildResearchRunGroups({
+      sessionsResponse,
+      stage2Papers,
+      stage3Answers: finalAnswers,
+    })
+  ), [sessionsResponse, stage2Papers, finalAnswers]);
 
-    // Search filter
-    if (searchTerm) {
-      const searchLower = searchTerm.toLowerCase();
-      const matchesTitle = answer.title.toLowerCase().includes(searchLower);
-      const matchesPrompt = answer.user_prompt.toLowerCase().includes(searchLower);
-      return matchesTitle || matchesPrompt;
-    }
+  const visibleRunGroups = useMemo(() => {
+    const needle = searchTerm.trim().toLowerCase();
 
-    return true;
-  });
+    // Case-insensitive substring test that tolerates missing fields.
+    const hasNeedle = (field) => field?.toLowerCase().includes(needle);
+
+    // Shown when the format filter passes and, with an active search term,
+    // the term occurs in the title, prompt, or session id.
+    const isVisible = (answer) => {
+      const formatOk = filterFormat === 'all' || answer.format === filterFormat;
+      if (!formatOk) return false;
+      if (!needle) return true;
+      return (
+        hasNeedle(answer.title) ||
+        hasNeedle(answer.user_prompt) ||
+        hasNeedle(answer.session_id)
+      );
+    };
+
+    // Attach the filtered answers to each run and drop runs left empty.
+    const annotated = runGroups.map((group) => ({
+      ...group,
+      visibleStage3Answers: group.stage3Answers.filter(isVisible),
+    }));
+    return annotated.filter((group) => group.visibleStage3Answers.length > 0);
+  }, [runGroups, filterFormat, searchTerm]);
 
   if (loading) {
     return (
       <div className="final-answer-library">
         <div className="library-header">
-          <h2>Final Answer Library</h2>
-          <p>Loading your completed research volumes...</p>
+          <h2>Stage 3 Final Answers History</h2>
+          <p>Loading completed Stage 3 final answers...</p>
         </div>
         <div className="loading-spinner">⟳ Loading...</div>
       </div>
@@ -222,7 +270,7 @@ function FinalAnswerLibrary() {
     return (
       <div className="final-answer-library">
         <div className="library-header">
-          <h2>Final Answer Library</h2>
+          <h2>Stage 3 Final Answers History</h2>
         </div>
         <div className="error-message">
           <span>⚠</span>
@@ -239,17 +287,19 @@ function FinalAnswerLibrary() {
     <div className="final-answer-library">
       {/* Header */}
       <div className="library-header">
-        <h2>📚 Final Answer Library</h2>
-        <p>If you have enabled Tier 3 experimental final answer generation, any completed answers will appear here. Browse all completed research volumes and papers from your autonomous research sessions.</p>
+        <h2>📚 Stage 3 Final Answers History</h2>
+        <p>If you have enabled Tier 3 experimental final answer generation, completed Stage 3 answers will appear here. Browse all completed research volumes and short-form answers from your autonomous research sessions.</p>
         <div className="library-stats">
           <span className="stat-badge">
             {finalAnswers.length} {finalAnswers.length === 1 ? 'Answer' : 'Answers'}
           </span>
           <span className="stat-badge">
-            {finalAnswers.filter(a => a.format === 'long_form').length} Volumes
+            {runGroups.filter((runGroup) => runGroup.stage3AnswerCount > 0).length} Research Runs
           </span>
           <span className="stat-badge">
-            {finalAnswers.filter(a => a.format === 'short_form').length} Papers
+            {runGroups
+              .filter((runGroup) => runGroup.stage3AnswerCount > 0)
+              .reduce((total, runGroup) => total + runGroup.stage2PaperCount, 0)} Matching Stage 2 Papers
           </span>
         </div>
       </div>
@@ -287,10 +337,10 @@ function FinalAnswerLibrary() {
       </div>
 
       {/* List */}
-      {filteredAnswers.length === 0 ? (
-        <div className="empty-state">
+      {visibleRunGroups.length === 0 ? (
+        <div className="fal-empty-state">
           <span className="empty-icon">📭</span>
-          <h3>No final answers found</h3>
+          <h3>No Stage 3 final answers found</h3>
           <p>
             {searchTerm || filterFormat !== 'all'
               ? 'Try adjusting your search or filters'
@@ -298,140 +348,180 @@ function FinalAnswerLibrary() {
           </p>
         </div>
       ) : (
-        <div className="answer-list">
-          {filteredAnswers.map(answer => (
-            <div
-              key={answer.answer_id}
-              className={`answer-card ${expandedId === answer.answer_id ? 'expanded' : ''}`}
-            >
-              {/* Header */}
-              <div className="answer-header" onClick={() => loadFullContent(answer.answer_id)}>
-                <div className="answer-title-row">
-                  <h3 className="answer-title">
-                    {answer.format === 'long_form' ? '▭' : '⊟'} {answer.title}
-                  </h3>
-                  <button className="expand-button">
-                    {expandedId === answer.answer_id ? '▼' : '▶'}
-                  </button>
-                </div>
-                
-                <div className="answer-metadata">
-                  <span className="format-badge">
-                    {answer.format === 'long_form' ? 'Volume' : 'Paper'}
-                  </span>
-                  <span
-                    className="certainty-badge"
-                    style={{ backgroundColor: getCertaintyBadgeColor(answer.certainty_level) }}
-                  >
-                    {formatCertaintyLevel(answer.certainty_level)}
-                  </span>
-                  <span className="word-count">{answer.word_count.toLocaleString()} words</span>
-                  {answer.format === 'long_form' && (
-                    <span className="chapter-count">{answer.chapter_count} chapters</span>
+        <div className="run-history-groups">
+          {visibleRunGroups.map((runGroup) => (
+            <section key={runGroup.sessionId} className="run-history-group">
+              <div className="run-history-group-header">
+                <div className="run-history-group-heading">
+                  <h3 className="run-history-group-title">{runGroup.userPrompt}</h3>
+                  <p className="run-history-group-subtitle">
+                    Research Run: {runGroup.displaySessionId}
+                  </p>
+                  {runGroup.createdAt && (
+                    <p className="run-history-group-subtitle">
+                      Started: {formatDate(runGroup.createdAt)}
+                    </p>
                   )}
                 </div>
-
-                <div className="answer-prompt">
-                  <strong>Research Question:</strong> {answer.user_prompt}
-                </div>
-
-                <div className="answer-footer-info">
-                  <span className="completion-date">
-                    Completed: {formatDate(answer.completion_date)}
+                <div className="run-history-group-badges">
+                  {runGroup.isCurrent && (
+                    <span className="run-history-group-badge run-history-group-badge--current">
+                      Current Run
+                    </span>
+                  )}
+                  <span className="run-history-group-badge">
+                    Stage 2 Papers: {runGroup.stage2PaperCount}
                   </span>
-                  <span className="session-id">
-                    Session: {answer.session_id === 'legacy' ? 'Legacy' : answer.session_id}
+                  <span className="run-history-group-badge run-history-group-badge--linked">
+                    Stage 3 Answers: {runGroup.stage3AnswerCount}
                   </span>
-                </div>
-                
-                {/* Quick Download Buttons (no expand needed) */}
-                <div className="quick-download-buttons" onClick={(e) => e.stopPropagation()}>
-                  <button
-                    className="quick-download-raw"
-                    onClick={(e) => downloadAnswerRaw(e, answer)}
-                    title="Download raw text immediately"
-                  >
-                    📄 Download Raw
-                  </button>
-                  <button
-                    className="quick-download-pdf"
-                    onClick={(e) => downloadAnswerPDF(e, answer)}
-                    disabled={downloadingPDF === answer.answer_id}
-                    title="Generate and download PDF"
-                  >
-                    {downloadingPDF === answer.answer_id ? '⏳ Preparing PDF...' : '📑 Download PDF'}
-                  </button>
+                  {runGroup.brainstormCount !== null && runGroup.brainstormCount !== undefined && (
+                    <span className="run-history-group-badge">
+                      Brainstorms: {runGroup.brainstormCount}
+                    </span>
+                  )}
                 </div>
               </div>
 
-              {/* Expanded Content */}
-              {expandedId === answer.answer_id && expandedContent && (
-                <div className="answer-content">
-                  <div className="content-actions">
-                    <button onClick={() => downloadAnswer(answer)} className="download-button">
-                      💾 Download
-                    </button>
-                    <button
-                      className="critique-button"
-                      onClick={() => {
-                        setSelectedAnswerForCritique(answer);
-                        setCritiqueModalOpen(true);
-                      }}
-                      style={{
-                        background: 'linear-gradient(135deg, #9b59b6 0%, #8e44ad 100%)',
-                        border: 'none',
-                        color: '#fff',
-                        padding: '0.5rem 1rem',
-                        borderRadius: '4px',
-                        cursor: 'pointer',
-                        fontWeight: '500',
-                        fontSize: '0.85rem'
-                      }}
-                      title="Ask validator to critique this final answer"
+              <div className="run-history-group-body">
+                <div className="answer-list">
+                  {runGroup.visibleStage3Answers.map(answer => (
+                    <div
+                      key={answer.answer_id}
+                      className={`answer-card ${expandedId === answer.answer_id ? 'expanded' : ''}`}
                     >
-                      ⭐ Ask Validator to Critique
-                    </button>
-                    {/* View toggle for LaTeX rendering */}
-                    <div className="view-toggle">
-                      <button
-                        className={`btn ${showLatex ? '' : 'btn-secondary'}`}
-                        onClick={() => setShowLatex(true)}
-                      >
-                        Rendered View
-                      </button>
-                      <button
-                        className={`btn ${!showLatex ? '' : 'btn-secondary'}`}
-                        onClick={() => setShowLatex(false)}
-                      >
-                        Raw Text
-                      </button>
+                      {/* Header */}
+                      <div className="answer-header" onClick={() => loadFullContent(answer.answer_id)}>
+                        <div className="answer-title-row">
+                          <h3 className="answer-title">
+                            {answer.format === 'long_form' ? '▭' : '⊟'} {answer.title}
+                          </h3>
+                          <button className="expand-button">
+                            {expandedId === answer.answer_id ? '▼' : '▶'}
+                          </button>
+                        </div>
+                        
+                        <div className="answer-metadata">
+                          <span className="format-badge">
+                            {answer.format === 'long_form' ? 'Volume' : 'Paper'}
+                          </span>
+                          <span
+                            className="certainty-badge"
+                            style={{ backgroundColor: getCertaintyBadgeColor(answer.certainty_level) }}
+                          >
+                            {formatCertaintyLevel(answer.certainty_level)}
+                          </span>
+                          <span className="word-count">{answer.word_count.toLocaleString()} words</span>
+                          {answer.format === 'long_form' && (
+                            <span className="chapter-count">{answer.chapter_count} chapters</span>
+                          )}
+                        </div>
+
+                        <div className="answer-prompt">
+                          <strong>Research Question:</strong> {answer.user_prompt}
+                        </div>
+
+                        <div className="answer-footer-info">
+                          <span className="completion-date">
+                            Completed: {formatDate(answer.completion_date)}
+                          </span>
+                          <span className="session-id">
+                            Session: {answer.session_id === 'legacy' ? 'Legacy' : answer.session_id}
+                          </span>
+                        </div>
+                        
+                        {/* Quick Download Buttons (no expand needed) */}
+                        <div className="quick-download-buttons" onClick={(e) => e.stopPropagation()}>
+                          <button
+                            className="quick-download-raw"
+                            onClick={(e) => downloadAnswerRaw(e, answer)}
+                            title="Download raw text immediately"
+                          >
+                            📄 Download Raw
+                          </button>
+                          <button
+                            className="quick-download-pdf"
+                            onClick={(e) => downloadAnswerPDF(e, answer)}
+                            disabled={downloadingPDF === answer.answer_id}
+                            title="Generate and download PDF"
+                          >
+                            {downloadingPDF === answer.answer_id ? '⏳ Preparing PDF...' : '📑 Download PDF'}
+                          </button>
+                        </div>
+                      </div>
+
+                      {/* Expanded Content */}
+                      {expandedId === answer.answer_id && expandedContent && (
+                        <div className="answer-content">
+                          <div className="content-actions">
+                            <button onClick={() => downloadAnswer(answer)} className="download-button">
+                              💾 Download
+                            </button>
+                            <button
+                              className="critique-button"
+                              onClick={() => {
+                                setSelectedAnswerForCritique(answer);
+                                setCritiqueModalOpen(true);
+                              }}
+                              style={{
+                                background: 'linear-gradient(135deg, #1eff1c 0%, #0fcc0d 100%)',
+                                border: 'none',
+                                color: '#0b2e0b',
+                                padding: '0.5rem 1rem',
+                                borderRadius: '4px',
+                                cursor: 'pointer',
+                                fontWeight: '500',
+                                fontSize: '0.85rem'
+                              }}
+                              title="Ask validator to critique this final answer"
+                            >
+                              ⭐ Ask Validator to Critique
+                            </button>
+                            {/* View toggle for LaTeX rendering */}
+                            <div className="view-toggle">
+                              <button
+                                className={`btn ${showLatex ? '' : 'btn-secondary'}`}
+                                onClick={() => setShowLatex(true)}
+                              >
+                                Rendered View
+                              </button>
+                              <button
+                                className={`btn ${!showLatex ? '' : 'btn-secondary'}`}
+                                onClick={() => setShowLatex(false)}
+                              >
+                                Raw Text
+                              </button>
+                            </div>
+                          </div>
+
+                          {/* Chapter list (for volumes) */}
+                          {answer.format === 'long_form' && expandedContent.chapters && (
+                            <div className="chapter-list">
+                              <h4>Chapters:</h4>
+                              <ol>
+                                {expandedContent.chapters.map(ch => (
+                                  <li key={ch.order}>
+                                    <strong>{ch.title}</strong>
+                                    <span className="chapter-type">
+                                      [{ch.chapter_type.replace(/_/g, ' ')}]
+                                    </span>
+                                  </li>
+                                ))}
+                              </ol>
+                            </div>
+                          )}
+
+                          {/* Full content */}
+                          <div className="full-content">
+                            <LatexRenderer content={prependDisclaimer(expandedContent.content, 'paper')} showLatex={showLatex} />
+                          </div>
+                        </div>
+                      )}
                     </div>
-                  </div>
-
-                  {/* Chapter list (for volumes) */}
-                  {answer.format === 'long_form' && expandedContent.chapters && (
-                    <div className="chapter-list">
-                      <h4>Chapters:</h4>
-                      <ol>
-                        {expandedContent.chapters.map(ch => (
-                          <li key={ch.order}>
-                            <strong>{ch.title}</strong>
-                            <span className="chapter-type">
-                              [{ch.chapter_type.replace(/_/g, ' ')}]
-                            </span>
-                          </li>
-                        ))}
-                      </ol>
-                    </div>
-                  )}
-
-                  {/* Full content */}
-                  <div className="full-content">
-                    <LatexRenderer content={expandedContent.content} showLatex={showLatex} />
-                  </div>
+                  ))}
                 </div>
-              )}
-            </div>
+              </div>
+            </section>
           ))}
         </div>
       )}
diff --git a/frontend/src/components/autonomous/LivePaperProgress.jsx b/frontend/src/components/autonomous/LivePaperProgress.jsx
index 23ca5c8..23681d8 100644
--- a/frontend/src/components/autonomous/LivePaperProgress.jsx
+++ b/frontend/src/components/autonomous/LivePaperProgress.jsx
@@ -5,6 +5,7 @@ import React, { useState, useEffect, useRef, useCallback } from 'react';
 import { websocket } from '../../services/websocket';
 import LatexRenderer from '../LatexRenderer';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
+import { prependDisclaimer } from '../../utils/disclaimerHelper';
 
 const LivePaperProgress = ({ api, isCompiling }) => {
   const [paperData, setPaperData] = useState(null);
@@ -60,7 +61,7 @@ const LivePaperProgress = ({ api, isCompiling }) => {
   const handleDownloadRaw = () => {
     if (!paperData?.content) return;
     const filename = sanitizeFilename(paperData.title || paperData.paper_id || 'paper');
-    downloadRawText(paperData.content, filename, paperData.outline);
+    downloadRawText(paperData.content, filename, paperData.outline, 'paper');
   };
 
   const handleDownloadPdf = async () => {
@@ -86,6 +87,7 @@ const LivePaperProgress = ({ api, isCompiling }) => {
         console.error('PDF download failed:', error);
         alert('PDF generation failed: ' + error.message);
       },
+      'paper',
     );
   };
 
@@ -179,8 +181,8 @@ const LivePaperProgress = ({ api, isCompiling }) => {
                 <LatexRenderer 
                   content={
                     paperData.outline
-                      ? `${paperData.outline}\n\n${'='.repeat(80)}\n\n${paperData.content}`
-                      : paperData.content
+                      ? `${paperData.outline}\n\n${'='.repeat(80)}\n\n${prependDisclaimer(paperData.content, 'paper')}`
+                      : prependDisclaimer(paperData.content, 'paper')
                   }
                   className="live-paper-latex-renderer"
                   defaultRaw={true}
diff --git a/frontend/src/components/autonomous/LiveTier3Progress.jsx b/frontend/src/components/autonomous/LiveTier3Progress.jsx
index b1763fd..4627349 100644
--- a/frontend/src/components/autonomous/LiveTier3Progress.jsx
+++ b/frontend/src/components/autonomous/LiveTier3Progress.jsx
@@ -11,6 +11,7 @@ import React, { useState, useEffect, useRef, useCallback } from 'react';
 import { websocket } from '../../services/websocket';
 import LatexRenderer from '../LatexRenderer';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
+import { prependDisclaimer } from '../../utils/disclaimerHelper';
 
 const LiveTier3Progress = ({ api, status }) => {
   const [paperData, setPaperData] = useState(null);
@@ -103,7 +104,7 @@ const LiveTier3Progress = ({ api, status }) => {
   const handleDownloadRaw = () => {
     if (!paperData?.content) return;
     const filename = sanitizeFilename(paperData.title || 'tier3_final_answer');
-    downloadRawText(paperData.content, filename, paperData.outline);
+    downloadRawText(paperData.content, filename, paperData.outline, 'paper');
   };
 
   const handleDownloadPdf = async () => {
@@ -129,6 +130,7 @@ const LiveTier3Progress = ({ api, status }) => {
         console.error('PDF download failed:', error);
         alert('PDF generation failed: ' + error.message);
       },
+      'paper',
     );
   };
 
@@ -190,7 +192,7 @@ const LiveTier3Progress = ({ api, status }) => {
       'format_selecting': { label: 'Selecting Format', color: 'blue' },
       'organizing_volume': { label: 'Organizing Volume', color: 'purple' },
       'writing': { label: 'Writing', color: 'green' },
-      'complete': { label: 'Complete', color: 'gold' }
+      'complete': { label: 'Complete', color: 'green' }
     };
     
     const info = statusMap[tierStatus] || { label: tierStatus || 'Unknown', color: 'gray' };
@@ -327,8 +329,8 @@ const LiveTier3Progress = ({ api, status }) => {
                 <LatexRenderer 
                   content={
                     paperData.outline
-                      ? `${paperData.outline}\n\n${'='.repeat(80)}\n\n${paperData.content}`
-                      : paperData.content
+                      ? `${paperData.outline}\n\n${'='.repeat(80)}\n\n${prependDisclaimer(paperData.content, 'paper')}`
+                      : prependDisclaimer(paperData.content, 'paper')
                   }
                   className="live-tier3-latex-renderer"
                   defaultRaw={true}
@@ -353,7 +355,7 @@ const LiveTier3Progress = ({ api, status }) => {
       <style>{`
         .live-tier3-progress {
           background: linear-gradient(135deg, #1a1a2e 0%, #16213e 100%);
-          border: 1px solid #ffd700;
+          border: 1px solid #1eff1c;
           border-radius: 8px;
           margin: 1rem 0;
           overflow: hidden;
@@ -364,14 +366,14 @@ const LiveTier3Progress = ({ api, status }) => {
           justify-content: space-between;
           align-items: center;
           padding: 0.75rem 1rem;
-          background: linear-gradient(90deg, rgba(255, 215, 0, 0.15) 0%, rgba(255, 215, 0, 0.05) 100%);
+          background: linear-gradient(90deg, rgba(30, 255, 28, 0.15) 0%, rgba(30, 255, 28, 0.05) 100%);
           cursor: pointer;
-          border-bottom: 1px solid rgba(255, 215, 0, 0.3);
+          border-bottom: 1px solid rgba(30, 255, 28, 0.3);
         }
 
         .live-tier3-header h3 {
           margin: 0;
-          color: #ffd700;
+          color: #1eff1c;
           font-size: 1rem;
           display: flex;
           align-items: center;
@@ -402,7 +404,7 @@ const LiveTier3Progress = ({ api, status }) => {
         .tier3-status-blue { background: #1e40af; color: #93c5fd; }
         .tier3-status-purple { background: #6b21a8; color: #d8b4fe; }
         .tier3-status-green { background: #166534; color: #86efac; }
-        .tier3-status-gold { background: #854d0e; color: #fcd34d; }
+        .tier3-status-gold { background: #0f5a10; color: #7dff6f; }
 
         .tier3-format-badge {
           padding: 0.25rem 0.5rem;
@@ -419,7 +421,7 @@ const LiveTier3Progress = ({ api, status }) => {
 
         .tier3-chapter-list {
           padding: 0.75rem 1rem;
-          border-bottom: 1px solid rgba(255, 215, 0, 0.2);
+          border-bottom: 1px solid rgba(30, 255, 28, 0.2);
           background: rgba(0, 0, 0, 0.2);
         }
 
@@ -447,8 +449,8 @@ const LiveTier3Progress = ({ api, status }) => {
         }
 
         .chapter-item.chapter-active {
-          background: rgba(255, 215, 0, 0.2);
-          border: 1px solid rgba(255, 215, 0, 0.4);
+          background: rgba(30, 255, 28, 0.2);
+          border: 1px solid rgba(30, 255, 28, 0.4);
         }
 
         .chapter-item.chapter-complete {
@@ -464,7 +466,7 @@ const LiveTier3Progress = ({ api, status }) => {
           background: rgba(255, 255, 255, 0.1);
           border-radius: 50%;
           font-weight: 600;
-          color: #ffd700;
+          color: #1eff1c;
         }
 
         .chapter-type {
@@ -488,12 +490,12 @@ const LiveTier3Progress = ({ api, status }) => {
         }
 
         .chapter-status-complete { color: #86efac; }
-        .chapter-status-writing { color: #fcd34d; ${getBannerShimmerEnabled() ? 'animation: pulse 1s infinite;' : ''} }
+        .chapter-status-writing { color: #7dff6f; ${getBannerShimmerEnabled() ? 'animation: pulse 1s infinite;' : ''} }
         .chapter-status-pending { color: #6b7280; }
 
         .tier3-current-writing {
           padding: 0.5rem 1rem;
-          background: rgba(255, 215, 0, 0.1);
+          background: rgba(30, 255, 28, 0.1);
           display: flex;
           align-items: center;
           gap: 0.5rem;
@@ -501,7 +503,7 @@ const LiveTier3Progress = ({ api, status }) => {
         }
 
         .writing-indicator {
-          color: #fcd34d;
+          color: #7dff6f;
           ${getBannerShimmerEnabled() ? 'animation: pulse 1.5s infinite;' : ''}
         }
 
@@ -557,14 +559,14 @@ const LiveTier3Progress = ({ api, status }) => {
         }
 
         .btn-download-pdf {
-          background: #ffd700;
+          background: #1eff1c;
           border: none;
           color: #1a1a2e;
           font-weight: 600;
         }
 
         .btn-download-pdf:hover:not(:disabled) {
-          background: #ffed4e;
+          background: #7dff6f;
         }
 
         .btn-download-raw:disabled, .btn-download-pdf:disabled {
@@ -580,9 +582,9 @@ const LiveTier3Progress = ({ api, status }) => {
 
         .paper-section h4 {
           margin: 0 0 1rem 0;
-          color: #ffd700;
+          color: #1eff1c;
           font-size: 0.9rem;
-          border-bottom: 1px solid rgba(255, 215, 0, 0.2);
+          border-bottom: 1px solid rgba(30, 255, 28, 0.2);
           padding-bottom: 0.5rem;
         }
 
diff --git a/frontend/src/components/autonomous/PaperLibrary.jsx b/frontend/src/components/autonomous/PaperLibrary.jsx
index d1efcbf..16b1c02 100644
--- a/frontend/src/components/autonomous/PaperLibrary.jsx
+++ b/frontend/src/components/autonomous/PaperLibrary.jsx
@@ -156,7 +156,7 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
         <div className="paper-library-pruned-counter">
           Pruned Papers: {archivedCount}
         </div>
-        <div className="empty-state">
+        <div className="auto-empty-state">
           No papers completed yet. Autonomous research will generate papers from brainstorm databases.
         </div>
       </div>
@@ -269,9 +269,9 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
                     onClick={(e) => handleOpenCritique(e, paper)}
                     title="Ask validator to critique this paper"
                     style={{
-                      background: 'linear-gradient(135deg, #9b59b6 0%, #8e44ad 100%)',
+                      background: 'linear-gradient(135deg, #1eff1c 0%, #0fcc0d 100%)',
                       border: 'none',
-                      color: '#fff',
+                      color: '#0b2e0b',
                       padding: '0.35rem 0.7rem',
                       borderRadius: '4px',
                       cursor: 'pointer',
diff --git a/frontend/src/components/autonomous/Stage2PaperHistory.css b/frontend/src/components/autonomous/Stage2PaperHistory.css
new file mode 100644
index 0000000..a740f36
--- /dev/null
+++ b/frontend/src/components/autonomous/Stage2PaperHistory.css
@@ -0,0 +1,51 @@
+.stage2-paper-history .paper-grid {
+  margin-top: 0.5rem;
+}
+
+.stage2-paper-history .run-history-group .paper-grid {
+  margin-top: 0;
+}
+
+.stage2-history-card-identifiers {
+  display: flex;
+  align-items: center;
+  gap: 0.5rem;
+  flex-wrap: wrap;
+}
+
+.stage2-history-session-badge {
+  display: inline-flex;
+  align-items: center;
+  padding: 0.18rem 0.5rem;
+  border-radius: 999px;
+  background: rgba(30, 255, 28, 0.12);
+  border: 1px solid rgba(30, 255, 28, 0.2);
+  color: #9eff9e;
+  font-size: 0.7rem;
+  max-width: 220px;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+
+.stage2-history-critique-badge {
+  display: inline-block;
+  margin-left: 8px;
+  padding: 2px 8px;
+  border-radius: 4px;
+  font-size: 0.75rem;
+  font-weight: 600;
+  color: #fff;
+  vertical-align: middle;
+}
+
+.stage2-history-prompt {
+  margin-top: 0.75rem;
+  color: #ccc;
+  font-size: 0.85rem;
+  line-height: 1.45;
+}
+
+.stage2-history-prompt strong {
+  color: #1eff1c;
+}
diff --git a/frontend/src/components/autonomous/Stage2PaperHistory.jsx b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
new file mode 100644
index 0000000..bb02d89
--- /dev/null
+++ b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
@@ -0,0 +1,534 @@
+import React, { useEffect, useMemo, useState } from 'react';
+import LatexRenderer from '../LatexRenderer';
+import PaperCritiqueModal from '../PaperCritiqueModal';
+import { autonomousAPI } from '../../services/api';
+import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
+import { buildResearchRunGroups } from '../../utils/researchRunHistory';
+import './FinalAnswerLibrary.css';
+import './AutonomousResearch.css';
+import './Stage2PaperHistory.css';
+
+// Map a critique rating (shown as x/10) to a badge colour; bands are checked from the top down.
+function getCritiqueColor(rating) {
+  const bands = [[8, '#10b981'], [6.25, '#3b82f6'], [4, '#eab308'], [2, '#f97316']];
+  const hit = bands.find(([floor]) => rating >= floor);
+  // Below every band (or not comparable, e.g. undefined/NaN) falls back to red.
+  return hit ? hit[1] : '#ef4444';
+}
+
+function formatDate(dateStr) { // locale timestamp; 'N/A' if missing or unparseable
+  const parsed = dateStr ? new Date(dateStr) : null; // bad input yields a NaN time value
+  return parsed && !Number.isNaN(parsed.getTime()) ? parsed.toLocaleString() : 'N/A';
+}
+
+function truncateAbstract(abstract, maxLength = 220) { // clip long abstracts, appending '...'
+  const fits = !abstract || abstract.length <= maxLength; // empty or short text is returned untouched
+  return fits ? abstract : `${abstract.substring(0, maxLength)}...`;
+}
+
+export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
+  const [papers, setPapers] = useState([]);
+  const [finalAnswers, setFinalAnswers] = useState([]);
+  const [sessionsResponse, setSessionsResponse] = useState(null);
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState(null);
+  const [expandedId, setExpandedId] = useState(null);
+  const [expandedContent, setExpandedContent] = useState(null);
+  const [loadingContentId, setLoadingContentId] = useState(null);
+  const [searchTerm, setSearchTerm] = useState('');
+  const [deleteConfirmId, setDeleteConfirmId] = useState(null);
+  const [deletingId, setDeletingId] = useState(null);
+  const [generatingPdfId, setGeneratingPdfId] = useState(null);
+  const [critiqueModalOpen, setCritiqueModalOpen] = useState(false);
+  const [critiquePaper, setCritiquePaper] = useState(null);
+
+  useEffect(() => { // initial load; the empty dependency list means this runs on mount only
+    loadPaperHistory();
+  }, []);
+
+  const loadPaperHistory = async () => { // (re)load papers, sessions and Stage 3 answers into state
+    try {
+      setLoading(true);
+      setError(null);
+      // Start all three requests together; allSettled lets each outcome be handled on its own.
+      const [papersResult, sessionsResult, finalAnswersResult] = await Promise.allSettled([
+        autonomousAPI.getPaperHistory(),
+        autonomousAPI.getSessions(),
+        fetch('/api/auto-research/final-answer-library').then(async (response) => {
+          if (!response.ok) {
+            throw new Error('Failed to load Stage 3 final answer history');
+          }
+          return response.json();
+        }),
+      ]);
+      // The paper list is required: its failure is rethrown into the catch block below.
+      if (papersResult.status !== 'fulfilled') {
+        throw papersResult.reason;
+      }
+
+      setPapers(papersResult.value.papers || []);
+      // Session metadata is optional: on failure it is cleared and a warning is logged.
+      if (sessionsResult.status === 'fulfilled') {
+        setSessionsResponse(sessionsResult.value);
+      } else {
+        setSessionsResponse(null);
+        console.warn('Stage 2 history: failed to load sessions metadata', sessionsResult.reason);
+      }
+      // Stage 3 answers are optional too; a fulfilled response without a truthy `success` is treated as empty.
+      if (finalAnswersResult.status === 'fulfilled' && finalAnswersResult.value.success) {
+        setFinalAnswers(finalAnswersResult.value.final_answers || []);
+      } else {
+        setFinalAnswers([]);
+        if (finalAnswersResult.status === 'rejected') {
+          console.warn('Stage 2 history: failed to load Stage 3 final answer metadata', finalAnswersResult.reason);
+        }
+      }
+    } catch (err) {
+      setError(`Error loading Stage 2 history: ${err.message}`);
+      console.error('Failed to load Stage 2 paper history:', err);
+    } finally {
+      setLoading(false); // always leave the loading state, on success or failure
+    }
+  };
+
+  const runGroups = useMemo(() => ( // recomputed only when one of the three inputs below changes
+    buildResearchRunGroups({ // NOTE(review): presumably groups papers/answers per session - confirm in researchRunHistory
+      sessionsResponse,
+      stage2Papers: papers,
+      stage3Answers: finalAnswers,
+    })
+  ), [sessionsResponse, papers, finalAnswers]);
+
+  // Run groups narrowed by the search box; groups with no matching Stage 2 paper are dropped.
+  const visibleRunGroups = useMemo(() => {
+    const needle = searchTerm.trim().toLowerCase();
+    // A paper matches when any searchable field, or its joined brainstorm ids, contains the needle.
+    const matchesPaper = (paper) => {
+      const sourceText = (paper.source_brainstorm_ids || []).join(' ').toLowerCase();
+      const textFields = [
+        paper.title,
+        paper.abstract,
+        paper.user_prompt,
+        paper.paper_id,
+        paper.session_id,
+      ];
+      return textFields.some((field) => field?.toLowerCase().includes(needle)) || sourceText.includes(needle);
+    };
+
+    // An empty needle keeps every paper; the per-paper filter only runs for a real search.
+    const withVisiblePapers = runGroups.map((group) => {
+      const visibleStage2Papers = needle ? group.stage2Papers.filter(matchesPaper) : group.stage2Papers;
+      return { ...group, visibleStage2Papers };
+    });
+    return withVisiblePapers.filter((group) => group.visibleStage2Papers.length > 0);
+  }, [runGroups, searchTerm]);
+
+  // Id of the newest expand request; lets a slow response for another card be discarded.
+  const latestExpandRequestRef = React.useRef(null);
+  // Toggle a card. Expanding fetches the paper body; only the latest request may update state.
+  const handleCardClick = async (paper) => {
+    const historyId = paper.history_id;
+    if (expandedId === historyId) {
+      latestExpandRequestRef.current = null; // collapsing also invalidates any in-flight fetch
+      setExpandedId(null);
+      setExpandedContent(null);
+      setLoadingContentId(null);
+      return;
+    }
+    latestExpandRequestRef.current = historyId;
+    setExpandedId(historyId);
+    setExpandedContent(null);
+    setLoadingContentId(historyId);
+    let loaded;
+    try {
+      loaded = await autonomousAPI.getHistoryPaper(paper.session_id, paper.paper_id);
+    } catch (err) {
+      console.error('Failed to load history paper content:', err);
+      loaded = { history_id: historyId, content: 'Failed to load content', outline: '', title: paper.title };
+    }
+    if (latestExpandRequestRef.current !== historyId) return; // superseded by a newer click: drop it
+    setExpandedContent(loaded);
+    setLoadingContentId(null);
+  };
+
+  // Save the currently expanded paper as raw text; the click must not toggle the card.
+  const handleDownloadRaw = (e, paper) => {
+    e.stopPropagation();
+    if (expandedId !== paper.history_id || !expandedContent) {
+      alert('Please expand the paper first.');
+      return;
+    }
+    const filename = sanitizeFilename(`${paper.session_id}_${paper.paper_id}_${paper.title}`);
+    downloadRawText(
+      expandedContent.content || '',
+      filename,
+      expandedContent.outline || '',
+      'paper', // same content-type tag the live paper views pass to this helper
+    );
+  };
+
+  // Render the expanded paper to PDF through the backend, flagging which card is generating.
+  const handleDownloadPDF = async (e, paper) => {
+    e.stopPropagation(); // the click must not toggle the card
+    if (expandedId !== paper.history_id || !expandedContent) {
+      alert('Please expand the paper first.');
+      return;
+    }
+    const filename = sanitizeFilename(`${paper.session_id}_${paper.paper_id}_${paper.title}`);
+    const metadata = {
+      title: expandedContent.title || paper.title,
+      wordCount: paper.word_count,
+      date: paper.created_at ? new Date(paper.created_at).toLocaleDateString() : new Date().toLocaleDateString(),
+      models: paper.model_usage ? Object.keys(paper.model_usage).join(', ') : null,
+    };
+
+    await downloadPDFViaBackend(
+      expandedContent.content || '',
+      metadata,
+      filename,
+      expandedContent.outline || null,
+      () => setGeneratingPdfId(paper.history_id),
+      () => setGeneratingPdfId(null),
+      (downloadError) => {
+        setGeneratingPdfId(null);
+        console.error('PDF generation error:', downloadError);
+        alert(`PDF generation failed: ${downloadError.message}`);
+      },
+      'paper', // same trailing content-type tag the live paper views pass
+    );
+  };
+
+  const handleOpenCritique = (e, paper) => { // open the critique modal for this paper
+    e.stopPropagation(); // keep the click from reaching the card's own onClick
+    setCritiquePaper(paper);
+    setCritiqueModalOpen(true);
+  };
+
+  const handleDeleteClick = (e, paper) => { // first step of delete: show the inline confirmation
+    e.stopPropagation(); // keep the click from reaching the card's own onClick
+    setDeleteConfirmId(paper.history_id);
+  };
+
+  const handleDeleteCancel = (e) => { // dismiss the inline delete confirmation
+    e.stopPropagation(); // keep the click from reaching the card's own onClick
+    setDeleteConfirmId(null);
+  };
+
+  const handleDeleteConfirm = async (paper) => { // delete the paper, then resync local and parent state
+    setDeletingId(paper.history_id); // disables the confirm/cancel buttons while the request runs
+    try {
+      await autonomousAPI.deleteHistoryPaper(paper.session_id, paper.paper_id);
+      if (expandedId === paper.history_id) { // the deleted paper was the expanded card
+        setExpandedId(null);
+        setExpandedContent(null);
+      }
+      if (critiquePaper?.history_id === paper.history_id) { // close a critique modal that targets it
+        setCritiqueModalOpen(false);
+        setCritiquePaper(null);
+      }
+      setDeleteConfirmId(null);
+      await loadPaperHistory(); // refetch so the list reflects the deletion
+      if (onCurrentSessionDataChanged) { // optional callback prop supplied by the parent
+        await onCurrentSessionDataChanged();
+      }
+    } catch (err) {
+      console.error('Failed to delete history paper:', err);
+      alert(`Failed to delete paper: ${err.message}`);
+    } finally {
+      setDeletingId(null); // re-enable the buttons whether or not the delete succeeded
+    }
+  };
+
+  if (loading) {
+    return (
+      <div className="final-answer-library stage2-paper-history">
+        <div className="library-header">
+          <h2>Stage 2 Final Answer History</h2>
+          <p>Loading completed Stage 2 papers from all sessions...</p>
+        </div>
+        <div className="loading-spinner">⟳ Loading...</div>
+      </div>
+    );
+  }
+
+  if (error) {
+    return (
+      <div className="final-answer-library stage2-paper-history">
+        <div className="library-header">
+          <h2>Stage 2 Final Answer History</h2>
+        </div>
+        <div className="error-message">
+          <span>⚠</span>
+          <p>{error}</p>
+          <button onClick={loadPaperHistory} className="retry-button">
+            Retry
+          </button>
+        </div>
+      </div>
+    );
+  }
+
+  return (
+    <div className="final-answer-library stage2-paper-history">
+      <div className="library-header">
+        <h2>Stage 2 Final Answer History</h2>
+        <p>Browse completed Stage 2 papers from all autonomous research sessions. This history excludes pruned and archived papers.</p>
+        <div className="library-stats">
+          <span className="stat-badge">
+            {papers.length} {papers.length === 1 ? 'Paper' : 'Papers'}
+          </span>
+          <span className="stat-badge">
+            {runGroups.length} {runGroups.length === 1 ? 'Research Run' : 'Research Runs'}
+          </span>
+          <span className="stat-badge">
+            {runGroups.filter((runGroup) => runGroup.hasStage3Answer).length} Runs With Stage 3 Answer
+          </span>
+        </div>
+      </div>
+
+      <div className="library-controls">
+        <input
+          type="text"
+          placeholder="Search by title, prompt, session, paper ID, or source brainstorm..."
+          value={searchTerm}
+          onChange={(e) => setSearchTerm(e.target.value)}
+          className="search-input"
+        />
+      </div>
+
+      {visibleRunGroups.length === 0 ? (
+        <div className="fal-empty-state">
+          <span className="empty-icon">📭</span>
+          <h3>No Stage 2 history papers found</h3>
+          <p>
+            {searchTerm
+              ? 'Try adjusting your search.'
+              : 'Completed non-archived Stage 2 papers will appear here.'}
+          </p>
+        </div>
+      ) : (
+        <div className="run-history-groups">
+          {visibleRunGroups.map((runGroup) => (
+            <section key={runGroup.sessionId} className="run-history-group">
+              <div className="run-history-group-header">
+                <div className="run-history-group-heading">
+                  <h3 className="run-history-group-title">{runGroup.userPrompt}</h3>
+                  <p className="run-history-group-subtitle">
+                    Research Run: {runGroup.displaySessionId}
+                  </p>
+                  {runGroup.createdAt && (
+                    <p className="run-history-group-subtitle">
+                      Started: {formatDate(runGroup.createdAt)}
+                    </p>
+                  )}
+                </div>
+                <div className="run-history-group-badges">
+                  {runGroup.isCurrent && (
+                    <span className="run-history-group-badge run-history-group-badge--current">
+                      Current Run
+                    </span>
+                  )}
+                  <span className="run-history-group-badge">
+                    Stage 2 Papers: {runGroup.stage2PaperCount}
+                  </span>
+                  <span
+                    className={`run-history-group-badge ${runGroup.hasStage3Answer ? 'run-history-group-badge--linked' : ''}`}
+                  >
+                    {runGroup.hasStage3Answer ? 'Stage 3 Final Answer Available' : 'No Stage 3 Final Answer Yet'}
+                  </span>
+                  {runGroup.brainstormCount !== null && runGroup.brainstormCount !== undefined && (
+                    <span className="run-history-group-badge">
+                      Brainstorms: {runGroup.brainstormCount}
+                    </span>
+                  )}
+                </div>
+              </div>
+
+              <div className="run-history-group-body">
+                <div className="paper-grid">
+                  {runGroup.visibleStage2Papers.map((paper) => (
+                    <div
+                      key={paper.history_id}
+                      className={`paper-card stage2-history-card ${expandedId === paper.history_id ? 'expanded' : ''}`}
+                      onClick={() => handleCardClick(paper)}
+                    >
+                      <div className="paper-card-header">
+                        <div className="stage2-history-card-identifiers">
+                          <span className="paper-card-id">{paper.paper_id}</span>
+                          <span className="stage2-history-session-badge">
+                            {paper.session_id === 'legacy' ? 'Legacy' : paper.session_id}
+                          </span>
+                        </div>
+                        <span className="paper-word-count">{paper.word_count?.toLocaleString()} words</span>
+                      </div>
+
+                      <div className="paper-card-title">
+                        {paper.title}
+                        {paper.critique_avg !== null && paper.critique_avg !== undefined && (
+                          <span
+                            className="stage2-history-critique-badge"
+                            style={{ backgroundColor: getCritiqueColor(paper.critique_avg) }}
+                            title={`Critique rating: ${paper.critique_avg}/10`}
+                          >
+                            ⭐ {paper.critique_avg}
+                          </span>
+                        )}
+                      </div>
+
+                      <div className="paper-card-abstract">
+                        {truncateAbstract(paper.abstract)}
+                      </div>
+
+                      <div className="stage2-history-prompt">
+                        <strong>Research Question:</strong> {paper.user_prompt}
+                      </div>
+
+                      <div className="paper-card-meta">
+                        <span>Source: {paper.source_brainstorm_ids?.join(', ') || 'N/A'}</span>
+                        <span>{formatDate(paper.created_at)}</span>
+                      </div>
+
+                      {paper.referenced_papers?.length > 0 && (
+                        <div className="paper-references">
+                          References: {paper.referenced_papers.join(', ')}
+                        </div>
+                      )}
+
+                      {expandedId === paper.history_id && (
+                        <>
+                          <div className="paper-actions">
+                            <button
+                              className="btn-download"
+                              onClick={(e) => handleDownloadPDF(e, paper)}
+                              disabled={generatingPdfId === paper.history_id || !expandedContent}
+                              title="Download as PDF"
+                            >
+                              {generatingPdfId === paper.history_id ? 'Preparing PDF...' : 'Download PDF'}
+                            </button>
+
+                            <button
+                              className="btn-download"
+                              onClick={(e) => handleDownloadRaw(e, paper)}
+                              disabled={!expandedContent}
+                              title="Download as raw text"
+                            >
+                              Download Raw
+                            </button>
+
+                            <button
+                              className="btn-critique"
+                              onClick={(e) => handleOpenCritique(e, paper)}
+                              title="Ask validator to critique this paper"
+                              style={{
+                                background: 'linear-gradient(135deg, #1eff1c 0%, #0fcc0d 100%)',
+                                border: 'none',
+                                color: '#0b2e0b',
+                                padding: '0.35rem 0.7rem',
+                                borderRadius: '4px',
+                                cursor: 'pointer',
+                                fontWeight: '500',
+                                fontSize: '0.75rem',
+                              }}
+                            >
+                              ⭐ Critique
+                            </button>
+
+                            {deleteConfirmId === paper.history_id ? (
+                              <div className="delete-confirm-inline" onClick={(e) => e.stopPropagation()}>
+                                <span>Delete this paper?</span>
+                                <button
+                                  className="btn-delete-confirm"
+                                  onClick={() => handleDeleteConfirm(paper)}
+                                  disabled={deletingId === paper.history_id}
+                                >
+                                  {deletingId === paper.history_id ? 'Deleting...' : 'Yes'}
+                                </button>
+                                <button
+                                  className="btn-delete-cancel"
+                                  onClick={handleDeleteCancel}
+                                  disabled={deletingId === paper.history_id}
+                                >
+                                  Cancel
+                                </button>
+                              </div>
+                            ) : (
+                              <button
+                                className="btn-delete-paper"
+                                onClick={(e) => handleDeleteClick(e, paper)}
+                                title="Delete this paper"
+                              >
+                                Delete
+                              </button>
+                            )}
+                          </div>
+
+                          <div className="paper-full-content">
+                            {loadingContentId === paper.history_id ? (
+                              <div className="loading">Loading content...</div>
+                            ) : expandedContent && expandedContent.history_id === paper.history_id ? (
+                              <div className="paper-section">
+                                <h4>Paper Content</h4>
+                                <LatexRenderer
+                                  content={
+                                    expandedContent.outline
+                                      ? `${expandedContent.outline}\n\n${'='.repeat(80)}\n\n${expandedContent.content || 'No content available'}`
+                                      : expandedContent.content || 'No content available'
+                                  }
+                                  className="paper-content-renderer"
+                                  showToggle={true}
+                                  defaultRaw={false}
+                                />
+                              </div>
+                            ) : (
+                              <div className="loading">Loading content...</div>
+                            )}
+                          </div>
+                        </>
+                      )}
+                    </div>
+                  ))}
+                </div>
+              </div>
+            </section>
+          ))}
+        </div>
+      )}
+
+      <div className="library-footer">
+        <button onClick={loadPaperHistory} className="refresh-button">
+          Refresh History
+        </button>
+      </div>
+
+      <PaperCritiqueModal
+        isOpen={critiqueModalOpen}
+        onClose={() => {
+          setCritiqueModalOpen(false);
+          setCritiquePaper(null);
+        }}
+        paperType="autonomous_paper"
+        paperId={critiquePaper?.paper_id}
+        paperTitle={critiquePaper?.title}
+        onGenerateCritique={async (customPrompt, validatorConfig) => {
+          const result = await autonomousAPI.generateHistoryPaperCritique(
+            critiquePaper?.session_id,
+            critiquePaper?.paper_id,
+            customPrompt,
+            validatorConfig
+          );
+          await loadPaperHistory();
+          if (onCurrentSessionDataChanged) {
+            await onCurrentSessionDataChanged();
+          }
+          return result;
+        }}
+        onGetCritiques={() =>
+          autonomousAPI.getHistoryPaperCritiques(
+            critiquePaper?.session_id,
+            critiquePaper?.paper_id
+          )
+        }
+      />
+    </div>
+  );
+}
diff --git a/frontend/src/components/autonomous/index.js b/frontend/src/components/autonomous/index.js
index 8a0a31e..ff55385 100644
--- a/frontend/src/components/autonomous/index.js
+++ b/frontend/src/components/autonomous/index.js
@@ -4,6 +4,7 @@
 export { default as AutonomousResearchInterface } from './AutonomousResearchInterface';
 export { default as BrainstormList } from './BrainstormList';
 export { default as PaperLibrary } from './PaperLibrary';
+export { default as Stage2PaperHistory } from './Stage2PaperHistory';
 export { default as AutonomousResearchSettings } from './AutonomousResearchSettings';
 export { default as AutonomousResearchLogs } from './AutonomousResearchLogs';
 export { default as FinalAnswerView } from './FinalAnswerView';
diff --git a/frontend/src/components/compiler/CompilerInterface.jsx b/frontend/src/components/compiler/CompilerInterface.jsx
index b532c88..604921f 100644
--- a/frontend/src/components/compiler/CompilerInterface.jsx
+++ b/frontend/src/components/compiler/CompilerInterface.jsx
@@ -3,7 +3,7 @@ import { compilerAPI } from '../../services/api';
 import { websocket } from '../../services/websocket';
 import TextFileUploader from '../TextFileUploader';
 
-function CompilerInterface({ activeTab }) {
+function CompilerInterface({ activeTab, anyWorkflowRunning = false }) {
   const [compilerPrompt, setCompilerPrompt] = useState('');
   const [status, setStatus] = useState({ is_running: false });
   const [isStarting, setIsStarting] = useState(false);
@@ -119,6 +119,15 @@ function CompilerInterface({ activeTab }) {
   };
 
   const handleStart = async () => {
+    if (anyWorkflowRunning && !status.is_running) {
+      setError({
+        error: 'workflow_conflict',
+        reason: 'Another workflow is already running. Stop it before starting the Compiler.',
+        suggestion: 'Only one workflow mode may be active at a time.'
+      });
+      return;
+    }
+
     if (!compilerPrompt.trim()) {
       alert('Please enter a compiler-directing prompt');
       return;
@@ -174,6 +183,12 @@ function CompilerInterface({ activeTab }) {
       // Handle structured error response
       if (err.details && typeof err.details === 'object') {
         setError(err.details);
+      } else if (typeof err.details === 'string' && err.details.trim()) {
+        setError({
+          error: 'workflow_conflict',
+          reason: err.details,
+          suggestion: 'Stop the active workflow and try again.'
+        });
       } else {
         setError({
           error: 'unknown',
@@ -239,7 +254,7 @@ function CompilerInterface({ activeTab }) {
       {status.is_running && (
         <div className="critique-phase-banner" style={{
           backgroundColor: critiquePhaseActive ? '#2a2a2a' : '#1a1a1a',
-          border: critiquePhaseActive ? '2px solid #ffd700' : '2px solid #666',
+          border: critiquePhaseActive ? '2px solid #1eff1c' : '2px solid #666',
           borderRadius: '8px',
           padding: '1rem',
           marginTop: '1rem',
@@ -251,7 +266,7 @@ function CompilerInterface({ activeTab }) {
             {critiquePhaseActive ? '◎' : '▬'}
           </span>
           <div style={{ flex: 1 }}>
-            <strong style={{ color: critiquePhaseActive ? '#ffd700' : '#ccc', fontSize: '1.1rem' }}>
+            <strong style={{ color: critiquePhaseActive ? '#1eff1c' : '#ccc', fontSize: '1.1rem' }}>
               {critiquePhaseActive ? `Critique Phase (Version ${paperVersion})` : 'Paper Writing in Progress'}
             </strong>
             {critiquePhaseActive ? (
@@ -260,7 +275,7 @@ function CompilerInterface({ activeTab }) {
                   {critiqueAcceptances} / 10 critiques accepted
                 </p>
                 <p style={{ margin: '0.25rem 0 0 0', fontSize: '0.85rem', color: '#888' }}>
-                  Collecting peer review feedback on body section...
+                  Collecting peer review feedback on the body section...
                 </p>
               </>
             ) : (
@@ -340,7 +355,7 @@ function CompilerInterface({ activeTab }) {
           <button 
             onClick={handleStart} 
             className="btn btn-primary"
-            disabled={isStarting}
+            disabled={isStarting || (anyWorkflowRunning && !status.is_running)}
           >
             {isStarting ? 'Starting...' : 'Start Compiler'}
           </button>
diff --git a/frontend/src/components/compiler/CompilerLogs.jsx b/frontend/src/components/compiler/CompilerLogs.jsx
index f61c3c1..ca7bb79 100644
--- a/frontend/src/components/compiler/CompilerLogs.jsx
+++ b/frontend/src/components/compiler/CompilerLogs.jsx
@@ -8,7 +8,7 @@ function CompilerLogs() {
     rigor: { acceptances: 0, rejections: 0, declines: 0, acceptance_rate: 0 },
     outline: { acceptances: 0, rejections: 0, declines: 0 },
     review: { acceptances: 0, rejections: 0, declines: 0 },
-    miniscule_edit_count: 0,
+    minuscule_edit_count: 0,
     paper_word_count: 0,
     total_submissions: 0
   });
@@ -381,16 +381,16 @@ function CompilerLogs() {
       {/* Recovery Alert */}
       {recoveryStatus && recoveryStatus.in_recovery && (
         <div style={{ 
-          backgroundColor: '#fff3cd', 
-          border: '2px solid #ffc107',
+          backgroundColor: 'rgba(30, 255, 28, 0.1)', 
+          border: '2px solid #1eff1c',
           borderRadius: '8px',
           padding: '1rem',
           margin: '1rem 0'
         }}>
-          <h2 style={{ color: '#856404', margin: '0 0 0.5rem 0' }}>
+          <h2 style={{ color: '#1eff1c', margin: '0 0 0.5rem 0' }}>
             Model Recovery in Progress
           </h2>
-          <div style={{ color: '#856404' }}>
+          <div style={{ color: '#c6ffc5' }}>
             <div><strong>Model:</strong> {recoveryStatus.recovering_model}</div>
             <div><strong>Stage:</strong> {recoveryStatus.recovery_stage}</div>
             <div style={{ marginTop: '0.5rem', fontSize: '0.9rem' }}>
@@ -410,8 +410,8 @@ function CompilerLogs() {
         <>
           <div className="current-mode">
             <h3>Current Mode: <span className="mode-highlight">{status.current_mode}</span></h3>
-            {error && <span className="status-badge status-error">Error</span>}
-            {warning && !error && <span className="status-badge status-warning">Stalled</span>}
+            {error && <span className="compiler-status-badge status-error">Error</span>}
+            {warning && !error && <span className="compiler-status-badge status-warning">Stalled</span>}
           </div>
 
           <div className="metrics-grid">
@@ -448,8 +448,8 @@ function CompilerLogs() {
             </div>
 
             <div className="metric-card">
-              <h3>Miniscule Edits</h3>
-              <div className="metric-value">{metrics.miniscule_edit_count}</div>
+              <h3>Minuscule Edits</h3>
+              <div className="metric-value">{metrics.minuscule_edit_count}</div>
               <div className="metric-label">Convergence indicator</div>
             </div>
 
@@ -461,11 +461,11 @@ function CompilerLogs() {
 
             {/* Critique Phase Stats - Show when in critique mode or has activity */}
             {(status.current_mode === 'critique' || critiqueStats.total > 0) && (
-              <div className="metric-card" style={{ borderColor: '#ffc107', borderWidth: '2px' }}>
+              <div className="metric-card" style={{ borderColor: '#1eff1c', borderWidth: '2px' }}>
                 <h3>Critique Phase (v{critiqueStats.version})</h3>
                 <div className="metric-value">{critiqueStats.accepted} / {critiqueStats.rejected} / {critiqueStats.total}</div>
                 <div className="metric-label">Accept / Reject / Total Attempts</div>
-                <div className="metric-rate" style={{ color: '#ffc107' }}>Target: 5 attempts</div>
+                <div className="metric-rate" style={{ color: '#1eff1c' }}>Target: 5 attempts</div>
               </div>
             )}
           </div>
@@ -501,9 +501,9 @@ function CompilerLogs() {
             <h4>Convergence Indicators</h4>
             <p>The paper is approaching completion when:</p>
             <ul>
-              <li>Construction <strong>declines</strong> increase (guide already covers all topics)</li>
+              <li>Construction <strong>declines</strong> increase (paper already covers all topics)</li>
               <li>Construction rejection rate increases (no more novel content to add)</li>
-              <li>Miniscule edit count increases (only tiny improvements found)</li>
+              <li>Minuscule edit count increases (only tiny improvements found)</li>
               <li>Review <strong>declines</strong> increase (paper is already clean)</li>
               <li>Rigor <strong>declines</strong> increase (rigor already adequate)</li>
             </ul>
diff --git a/frontend/src/components/compiler/CompilerSettings.jsx b/frontend/src/components/compiler/CompilerSettings.jsx
index ed1d860..fb7f411 100644
--- a/frontend/src/components/compiler/CompilerSettings.jsx
+++ b/frontend/src/components/compiler/CompilerSettings.jsx
@@ -1,5 +1,6 @@
 import React, { useState, useEffect } from 'react';
-import { openRouterAPI, api, aggregatorAPI } from '../../services/api';
+import { openRouterAPI, api, aggregatorAPI, compilerAPI } from '../../services/api';
+import '../settings-common.css';
 
 const SETTINGS_KEY = 'compiler_settings';
 
@@ -118,7 +119,6 @@ function CompilerSettings() {
           if (settings.critiqueSubmitterMaxOutput) setCritiqueSubmitterMaxOutput(settings.critiqueSubmitterMaxOutput);
           // Wolfram Alpha
           if (settings.wolframEnabled !== undefined) setWolframEnabled(settings.wolframEnabled);
-          // wolframApiKey not loaded from localStorage (sensitive data - must re-enter per session)
           // Free-only toggle
           if (settings.freeOnly !== undefined) setFreeOnly(settings.freeOnly);
           if (settings.freeModelLooping !== undefined) setFreeModelLooping(settings.freeModelLooping);
@@ -129,19 +129,24 @@ function CompilerSettings() {
         }
       }
       
-      // Load Wolfram Alpha status from backend
-      const loadWolframStatus = async () => {
-        try {
-          const response = await api.getWolframStatus();
-          if (response.enabled) {
-            setWolframEnabled(true);
+      // Restore Wolfram Alpha key from localStorage
+      const storedWolframKey = localStorage.getItem('wolfram_alpha_api_key');
+      if (storedWolframKey) {
+        setWolframApiKey(storedWolframKey);
+        setWolframEnabled(true);
+      } else {
+        const loadWolframStatus = async () => {
+          try {
+            const response = await api.getWolframStatus();
+            if (response.enabled) {
+              setWolframEnabled(true);
+            }
+          } catch (err) {
+            console.error('Failed to load Wolfram Alpha status:', err);
           }
-        } catch (err) {
-          console.error('Failed to load Wolfram Alpha status:', err);
-        }
-      };
-      
-      loadWolframStatus();
+        };
+        loadWolframStatus();
+      }
       
       setIsLoaded(true);
       setLoadingModels(false);
@@ -238,7 +243,6 @@ function CompilerSettings() {
     // Fetch default prompt from backend
     const fetchDefaultPrompt = async () => {
       try {
-        const { compilerAPI } = await import('../../services/api');
         const response = await compilerAPI.getDefaultCritiquePrompt();
         if (response.data?.prompt) {
           setDefaultCritiquePrompt(response.data.prompt);
@@ -312,8 +316,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       
       if (response.success) {
         setWolframTestResult(`✓ Success! Result: ${response.result}`);
-        // Save the key to backend
         await api.setWolframApiKey(wolframApiKey);
+        localStorage.setItem('wolfram_alpha_api_key', wolframApiKey);
         setWolframEnabled(true);
       } else {
         setWolframTestResult('✗ Failed: ' + response.message);
@@ -329,6 +333,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   const handleClearWolframKey = async () => {
     try {
       await api.clearWolframApiKey();
+      localStorage.removeItem('wolfram_alpha_api_key');
       setWolframApiKey('');
       setWolframEnabled(false);
       setWolframTestResult('Key cleared');
@@ -392,26 +397,20 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     const providers = model && provider === 'openrouter' ? (modelProviders[model] || []) : [];
 
     return (
-      <div style={{
-        marginBottom: '2rem',
-        padding: '1.5rem',
-        background: provider === 'openrouter' ? '#1a1a2e' : '#1a1a24',
-        border: `2px solid ${provider === 'openrouter' ? '#6c5ce7' : borderColor}`,
-        borderRadius: '8px'
-      }}>
-        <h3 style={{ 
-          margin: '0 0 0.5rem 0', 
-          color: provider === 'openrouter' ? '#a29bfe' : borderColor 
-        }}>
+      <div
+        className={`role-config-card role-config-card--highlight${provider === 'openrouter' ? ' role-config-card--openrouter' : ''}`}
+        style={{ borderColor: provider === 'openrouter' ? undefined : borderColor, padding: '1.5rem' }}
+      >
+        <h3 style={{ margin: '0 0 0.5rem 0', color: provider === 'openrouter' ? '#a29bfe' : borderColor }}>
           {title}
-          {provider === 'openrouter' && <span style={{ fontWeight: 'normal', marginLeft: '0.5rem' }}>[OpenRouter]</span>}
+          {provider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
         </h3>
-        <small style={{ color: '#888', display: 'block', marginBottom: '1rem' }}>{description}</small>
+        <small className="role-description">{description}</small>
 
         {/* Provider Toggle */}
         <div className="form-group">
           <label>Provider</label>
-          <div style={{ display: 'flex', gap: '0.5rem' }}>
+          <div className="provider-toggle-group">
             <button
               type="button"
               onClick={() => {
@@ -420,15 +419,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 setOpenrouterProv(null);
                 setFallback(null);
               }}
-              style={{
-                flex: 1,
-                padding: '0.5rem',
-                backgroundColor: provider === 'lm_studio' ? '#4CAF50' : '#333',
-                border: 'none',
-                borderRadius: '4px',
-                color: '#fff',
-                cursor: 'pointer'
-              }}
+              className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
             >
               LM Studio
             </button>
@@ -443,15 +434,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 }
               }}
               disabled={!hasOpenRouterKey}
-              style={{
-                flex: 1,
-                padding: '0.5rem',
-                backgroundColor: provider === 'openrouter' ? '#6c5ce7' : '#333',
-                border: 'none',
-                borderRadius: '4px',
-                color: hasOpenRouterKey ? '#fff' : '#666',
-                cursor: hasOpenRouterKey ? 'pointer' : 'not-allowed'
-              }}
+              className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
               title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
             >
               OpenRouter
@@ -508,7 +491,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         {/* LM Studio Fallback (if OpenRouter) */}
         {provider === 'openrouter' && (
           <div className="form-group">
-            <label style={{ color: '#888' }}>LM Studio Fallback (optional)</label>
+            <label className="label--muted">LM Studio Fallback (optional)</label>
             <select
               value={fallback || ''}
               onChange={(e) => setFallback(e.target.value || null)}
@@ -522,8 +505,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           </div>
         )}
 
-        <div style={{ display: 'grid', gridTemplateColumns: '1fr 1fr', gap: '1rem' }}>
-          <div className="form-group" style={{ margin: 0 }}>
+        <div className="config-grid config-grid--2col">
+          <div className="form-group form-group--compact">
             <label>Context Window (tokens)</label>
             <input
               type="number"
@@ -538,7 +521,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             />
           </div>
 
-          <div className="form-group" style={{ margin: 0 }}>
+          <div className="form-group form-group--compact">
             <label>Max Output Tokens</label>
             <input
               type="number"
@@ -566,28 +549,22 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       <h2>Compiler Settings</h2>
 
       {saveStatus && (
-        <div className="save-status" style={{ color: '#4CAF50', marginBottom: '1rem' }}>
+        <div className="save-message" style={{ marginBottom: '1rem' }}>
           {saveStatus}
         </div>
       )}
 
       {/* OpenRouter Status Banner */}
       {!hasOpenRouterKey && (
-        <div style={{
-          backgroundColor: 'rgba(108, 92, 231, 0.1)',
-          border: '1px solid #6c5ce7',
-          borderRadius: '8px',
-          padding: '1rem',
-          marginBottom: '1.5rem'
-        }}>
-          <p style={{ color: '#a29bfe', margin: 0 }}>
+        <div className="openrouter-banner">
+          <p className="openrouter-banner__text">
             <strong>💡 OpenRouter Available:</strong> Set your OpenRouter API key in the header to enable cloud model selection for any role.
           </p>
         </div>
       )}
 
       <div className="settings-section">
-        <h3 style={{ borderBottom: '1px solid #333', paddingBottom: '0.5rem' }}>Model Configuration</h3>
+        <h3 className="section-heading--bordered">Model Configuration</h3>
         
         <RoleConfig
           title="Validator"
@@ -615,8 +592,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
         <RoleConfig
           title="High-Parameter Model"
-          description="Rigor enhancement mode: adds citations, strengthens methodology, clarifies assumptions."
-          borderColor="#f1c40f"
+          description="Rigor enhancement mode: adds citations, strengthens methodology, and clarifies assumptions."
+          borderColor="#1eff1c"
           provider={highParamProvider} setProvider={setHighParamProvider}
           model={highParamModel} setModel={setHighParamModel}
           openrouterProv={highParamOpenrouterProvider} setOpenrouterProv={setHighParamOpenrouterProvider}
@@ -639,17 +616,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       </div>
 
       {/* Model Refresh Controls */}
-      <div style={{ marginBottom: '2rem', padding: '1rem', background: '#1a1a24', borderRadius: '8px' }}>
+      <div className="settings-panel settings-panel--blue">
         <h3 style={{ marginBottom: '1rem' }}>Model Management</h3>
-        <div style={{ display: 'flex', alignItems: 'center', gap: '1rem', flexWrap: 'wrap' }}>
+        <div className="model-refresh-controls">
           <button 
             onClick={handleUseAggregatorModels}
-            className="secondary"
-            style={{
-              backgroundColor: '#2196F3',
-              border: 'none',
-              color: '#fff'
-            }}
+            className="secondary btn-primary-blue"
           >
             Use Aggregator Models
           </button>
@@ -667,17 +639,16 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary">
                 Refresh OpenRouter Models
               </button>
-              <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
+              <label className="settings-checkbox-label">
                 <input
                   type="checkbox"
                   checked={freeOnly}
                   onChange={(e) => setFreeOnly(e.target.checked)}
-                  style={{ marginRight: '0.5rem' }}
                 />
                 Show only free models
               </label>
-              <div style={{ display: 'flex', flexDirection: 'column', gap: '0.4rem', marginTop: '0.5rem' }}>
-                <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
+              <div className="checkbox-group-col">
+                <label className="settings-checkbox-label">
                   <input
                     type="checkbox"
                     checked={freeModelLooping}
@@ -685,15 +656,14 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                       setFreeModelLooping(e.target.checked);
                       openRouterAPI.setFreeModelSettings(e.target.checked, freeModelAutoSelector).catch(() => {});
                     }}
-                    style={{ marginRight: '0.5rem' }}
                   />
                   Enable Free Model Looping
                   <span
                     title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits."
-                    style={{ marginLeft: '0.4rem', cursor: 'help', color: '#888', fontSize: '0.85rem' }}
+                    className="help-hint"
                   >(?)</span>
                 </label>
-                <label style={{ display: 'inline-flex', alignItems: 'center', fontSize: '0.9rem' }}>
+                <label className="settings-checkbox-label">
                   <input
                     type="checkbox"
                     checked={freeModelAutoSelector}
@@ -701,19 +671,18 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                       setFreeModelAutoSelector(e.target.checked);
                       openRouterAPI.setFreeModelSettings(freeModelLooping, e.target.checked).catch(() => {});
                     }}
-                    style={{ marginRight: '0.5rem' }}
                   />
                   Use OpenRouter Free Models Auto-Selector as Backup
                   <span
                     title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping."
-                    style={{ marginLeft: '0.4rem', cursor: 'help', color: '#888', fontSize: '0.85rem' }}
+                    className="help-hint"
                   >(?)</span>
                 </label>
               </div>
             </>
           )}
         </div>
-        <small style={{ color: '#888', display: 'block', marginTop: '0.75rem' }}>
+        <small className="hint-text" style={{ marginTop: '0.75rem' }}>
           "Use Aggregator Models" copies your aggregator's model selection to all compiler roles.
         </small>
       </div>
@@ -721,32 +690,29 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       {/* Wolfram Alpha Integration */}
       <div className="settings-section">
         <h3>Wolfram Alpha Integration (Optional)</h3>
-        <small style={{ color: '#888', display: 'block', marginBottom: '1rem' }}>
+        <small className="hint-text" style={{ marginBottom: '1rem' }}>
           Enable Wolfram Alpha API for computational verification in rigor mode. 
           Get your API key from <a href="https://products.wolframalpha.com/api" target="_blank" rel="noopener noreferrer">developer.wolframalpha.com</a>
         </small>
         
-        <label style={{ display: 'flex', alignItems: 'center', marginBottom: '1rem' }}>
+        <label className="settings-checkbox-label" style={{ marginBottom: '1rem' }}>
           <input
             type="checkbox"
             checked={wolframEnabled}
             onChange={async (e) => {
               const checked = e.target.checked;
               if (!checked) {
-                // Unchecking - clear key from backend
                 await handleClearWolframKey();
               } else {
-                // Checking - just show UI (key will be saved on Test Connection)
                 setWolframEnabled(true);
               }
             }}
-            style={{ marginRight: '0.75rem' }}
           />
-          <span style={{ fontWeight: '500' }}>Enable Wolfram Alpha Verification in Rigor Mode</span>
+          <span className="label-medium">Enable Wolfram Alpha Verification in Rigor Mode</span>
         </label>
         
         {wolframEnabled && (
-          <div style={{ marginLeft: '1.75rem' }}>
+          <div className="indented-section">
             <div className="form-group">
               <label>Wolfram Alpha API Key:</label>
               <input
@@ -754,28 +720,17 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 value={wolframApiKey}
                 onChange={(e) => setWolframApiKey(e.target.value)}
                 placeholder="Enter your Wolfram Alpha App ID"
-                style={{
-                  padding: '0.5rem',
-                  backgroundColor: '#2a2a2a',
-                  border: '1px solid #444',
-                  borderRadius: '4px',
-                  color: '#fff',
-                  width: '100%',
-                  marginBottom: '0.5rem'
-                }}
+                className="input-dark"
+                style={{ marginBottom: '0.5rem' }}
               />
             </div>
             
-            <div style={{ display: 'flex', gap: '0.5rem', marginTop: '0.75rem' }}>
+            <div className="provider-toggle-group" style={{ marginTop: '0.75rem' }}>
               <button 
                 onClick={handleTestWolframConnection}
                 disabled={testingWolfram}
+                className="btn-success-sm"
                 style={{
-                  padding: '0.5rem 1rem',
-                  backgroundColor: '#4CAF50',
-                  border: 'none',
-                  borderRadius: '4px',
-                  color: '#fff',
                   cursor: testingWolfram ? 'wait' : 'pointer',
                   opacity: testingWolfram ? 0.6 : 1
                 }}
@@ -785,33 +740,19 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               
               <button 
                 onClick={handleClearWolframKey}
-                style={{
-                  padding: '0.5rem 1rem',
-                  backgroundColor: 'transparent',
-                  border: '1px solid #666',
-                  borderRadius: '4px',
-                  color: '#888',
-                  cursor: 'pointer'
-                }}
+                className="btn-ghost"
               >
                 Clear Key
               </button>
             </div>
             
             {wolframTestResult && (
-              <div style={{ 
-                marginTop: '0.75rem', 
-                padding: '0.5rem', 
-                borderRadius: '4px',
-                backgroundColor: wolframTestResult.includes('✓') ? '#1a3a1a' : '#3a1a1a',
-                color: wolframTestResult.includes('✓') ? '#4CAF50' : '#ff6b6b',
-                fontSize: '0.85rem'
-              }}>
+              <div className={`test-result-banner ${wolframTestResult.includes('✓') ? 'test-result-banner--success' : 'test-result-banner--error'}`}>
                 {wolframTestResult}
               </div>
             )}
             
-            <small style={{ color: '#888', display: 'block', marginTop: '1rem' }}>
+            <small className="hint-text" style={{ marginTop: '1rem' }}>
               In rigor mode, the AI can request Wolfram Alpha verification of mathematical claims. 
               This enables computational checking of theorems, solving equations, and verifying properties.
             </small>
@@ -836,41 +777,25 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       </div>
 
       {/* Validator Critique Prompt Editor */}
-      <div style={{ marginBottom: '2rem', padding: '1rem', background: '#1a1a24', borderRadius: '8px' }}>
+      <div className="settings-panel settings-panel--blue">
         <div 
           onClick={() => setCritiquePromptExpanded(!critiquePromptExpanded)}
-          style={{
-            display: 'flex',
-            alignItems: 'center',
-            justifyContent: 'space-between',
-            cursor: 'pointer',
-            padding: '0.5rem 0'
-          }}
+          className="collapsible-trigger"
+          style={{ padding: '0.5rem 0', background: 'transparent', border: 'none' }}
         >
           <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
             <span style={{ fontSize: '1.1rem' }}>📝</span>
             <h3 style={{ margin: 0 }}>Edit Validator Critique Prompt</h3>
             {isUsingCustomCritiquePrompt && (
-              <span style={{
-                backgroundColor: '#9b59b6',
-                color: '#fff',
-                padding: '2px 8px',
-                borderRadius: '12px',
-                fontSize: '0.7rem',
-                fontWeight: 'bold'
-              }}>CUSTOM</span>
+              <span className="tag-badge tag-badge--purple">CUSTOM</span>
             )}
           </div>
-          <span style={{ 
-            transform: critiquePromptExpanded ? 'rotate(180deg)' : 'rotate(0deg)',
-            transition: 'transform 0.2s',
-            fontSize: '1.2rem'
-          }}>▼</span>
+          <span className={`collapse-chevron${critiquePromptExpanded ? ' collapse-chevron--open' : ''}`}>▼</span>
         </div>
 
         {critiquePromptExpanded && (
           <div style={{ marginTop: '1rem' }}>
-            <p style={{ color: '#888', fontSize: '0.85rem', marginBottom: '1rem' }}>
+            <p className="text-muted-sm">
               Customize the prompt sent to your validator when requesting a paper critique. 
               The JSON output schema is automatically appended and cannot be modified.
             </p>
@@ -878,59 +803,26 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             <textarea
               value={customCritiquePrompt}
               onChange={(e) => setCustomCritiquePrompt(e.target.value)}
-              style={{
-                width: '100%',
-                minHeight: '200px',
-                padding: '0.75rem',
-                backgroundColor: '#2a2a2a',
-                border: '1px solid #444',
-                borderRadius: '4px',
-                color: '#fff',
-                fontFamily: 'monospace',
-                fontSize: '0.85rem',
-                resize: 'vertical',
-                lineHeight: '1.5'
-              }}
+              className="textarea-dark-mono"
               placeholder="Enter your custom critique prompt..."
             />
 
-            <div style={{ 
-              display: 'flex', 
-              justifyContent: 'space-between', 
-              alignItems: 'center',
-              marginTop: '1rem' 
-            }}>
+            <div className="actions-row">
               <button
                 onClick={handleRestoreCritiquePrompt}
-                style={{
-                  padding: '0.5rem 1rem',
-                  backgroundColor: 'transparent',
-                  border: '1px solid #666',
-                  borderRadius: '4px',
-                  color: '#888',
-                  cursor: 'pointer',
-                  fontSize: '0.85rem'
-                }}
+                className="btn-ghost"
+                style={{ fontSize: '0.85rem' }}
               >
                 Restore to Default
               </button>
 
               <div style={{ display: 'flex', alignItems: 'center', gap: '0.75rem' }}>
                 {critiquePromptSaved && (
-                  <span style={{ color: '#4CAF50', fontSize: '0.85rem' }}>✓ Saved!</span>
+                  <span className="status-success-text">✓ Saved!</span>
                 )}
                 <button
                   onClick={handleSaveCritiquePrompt}
-                  style={{
-                    padding: '0.5rem 1.5rem',
-                    backgroundColor: '#9b59b6',
-                    border: 'none',
-                    borderRadius: '4px',
-                    color: '#fff',
-                    cursor: 'pointer',
-                    fontWeight: '500',
-                    fontSize: '0.85rem'
-                  }}
+                  className="btn-accent-purple"
                 >
                   Save Prompt
                 </button>
@@ -941,9 +833,9 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       </div>
 
       {/* Configuration Summary */}
-      <div style={{ marginTop: '2rem', padding: '1rem', background: '#1a1a1a', borderRadius: '6px' }}>
+      <div className="settings-panel" style={{ marginTop: '2rem' }}>
         <h3>Current Configuration Summary</h3>
-        <pre style={{ color: '#4CAF50', fontSize: '0.85rem', overflow: 'auto' }}>
+        <pre className="config-summary-pre">
           {JSON.stringify({
             validator: {
               provider: validatorProvider,
diff --git a/frontend/src/components/compiler/LivePaper.jsx b/frontend/src/components/compiler/LivePaper.jsx
index 95da3e5..b3c4c8a 100644
--- a/frontend/src/components/compiler/LivePaper.jsx
+++ b/frontend/src/components/compiler/LivePaper.jsx
@@ -3,7 +3,9 @@ import { compilerAPI } from '../../services/api';
 import { websocket } from '../../services/websocket';
 import LatexRenderer from '../LatexRenderer';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
+import { prependDisclaimer } from '../../utils/disclaimerHelper';
 import PaperCritiqueModal from '../PaperCritiqueModal';
+import '../settings-common.css';
 
 function LivePaper() {
   const [paper, setPaper] = useState('');
@@ -189,6 +191,7 @@ function LivePaper() {
         console.error('PDF generation error:', error);
         alert('PDF generation failed: ' + error.message);
       },
+      'paper',
     );
   };
 
@@ -199,7 +202,7 @@ function LivePaper() {
     }
     
     const filename = sanitizeFilename('compiler_paper');
-    downloadRawText(paper, filename, outline);
+    downloadRawText(paper, filename, outline, 'paper');
   };
 
   return (
@@ -280,9 +283,9 @@ function LivePaper() {
             disabled={!paper}
             title="Ask validator to critique this paper"
             style={{
-              background: 'linear-gradient(135deg, #9b59b6 0%, #8e44ad 100%)',
+              background: 'linear-gradient(135deg, #1eff1c 0%, #0fcc0d 100%)',
               border: 'none',
-              color: '#fff',
+              color: '#0b2e0b',
               padding: '0.5rem 1rem',
               borderRadius: '4px',
               cursor: 'pointer',
@@ -298,7 +301,7 @@ function LivePaper() {
       <div className="paper-container" ref={paperContainerRef}>
         {paper ? (
           <LatexRenderer 
-            content={paper}
+            content={prependDisclaimer(paper, 'paper')}
             className="paper-content-renderer"
             defaultRaw={!showLatex}
             showToggle={true}
@@ -330,9 +333,9 @@ function LivePaper() {
       {previousVersions.length > 0 && (
         <div className="previous-versions-section">
           <button 
-            className="btn btn-secondary"
+            className="btn btn-secondary mt-1"
             onClick={() => setShowVersions(!showVersions)}
-            style={{ marginTop: '1rem', marginBottom: '0.5rem' }}
+            style={{ marginBottom: '0.5rem' }}
           >
             📜 Previous Versions ({previousVersions.length})
           </button>
@@ -347,7 +350,7 @@ function LivePaper() {
                   marginBottom: '1rem',
                   backgroundColor: '#2a2a2a'
                 }}>
-                  <h3 style={{ color: '#ffd700', marginBottom: '0.5rem' }}>
+                  <h3 style={{ color: '#1eff1c', marginBottom: '0.5rem' }}>
                     Version {v.version}: {v.title}
                   </h3>
                   
diff --git a/frontend/src/components/critique-modal.css b/frontend/src/components/critique-modal.css
new file mode 100644
index 0000000..3c6a656
--- /dev/null
+++ b/frontend/src/components/critique-modal.css
@@ -0,0 +1,496 @@
+/* ============================================
+   PaperCritiqueModal — Extracted from inline styles
+   ============================================ */
+
+/* Overlay */
+.critique-modal-overlay {
+  position: fixed;
+  top: 0;
+  left: 0;
+  right: 0;
+  bottom: 0;
+  background: rgba(0, 0, 0, 0.65);
+  backdrop-filter: blur(4px);
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  z-index: 999999;
+  padding: 20px;
+}
+
+/* Panel */
+.critique-modal-panel {
+  background: var(--surface-2, #1a1a2e);
+  border-radius: var(--radius-lg, 14px);
+  width: 100%;
+  max-width: 1200px;
+  height: 85vh;
+  display: flex;
+  flex-direction: column;
+  box-shadow: 0 24px 48px rgba(0, 0, 0, 0.5), 0 0 0 1px rgba(30, 255, 28, 0.25);
+  border: 1px solid rgba(30, 255, 28, 0.35);
+  overflow: hidden;
+}
+
+/* Header */
+.critique-modal-header {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  padding: 12px 16px;
+  border-bottom: 1px solid var(--border-subtle, rgba(75, 85, 99, 0.5));
+  background: rgba(30, 255, 28, 0.08);
+}
+
+.critique-header-left {
+  display: flex;
+  align-items: center;
+  gap: 10px;
+}
+
+.critique-header-icon {
+  padding: 6px;
+  background: rgba(30, 255, 28, 0.15);
+  border-radius: var(--radius-sm, 6px);
+}
+
+.critique-modal-title {
+  font-size: 14px;
+  font-weight: 600;
+  color: var(--text-primary, #f3f4f6);
+  margin: 0;
+}
+
+.critique-modal-subtitle {
+  font-size: 11px;
+  color: var(--text-secondary, #9ca3af);
+  margin: 0;
+  max-width: 300px;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  white-space: nowrap;
+}
+
+.critique-close-btn {
+  color: var(--text-secondary, #9ca3af);
+  padding: 6px;
+  background: transparent;
+  border: none;
+  border-radius: var(--radius-sm, 6px);
+  cursor: pointer;
+  transition: all 0.2s;
+}
+
+.critique-close-btn:hover {
+  background: rgba(255, 255, 255, 0.06);
+  color: var(--text-primary, #f3f4f6);
+}
+
+/* Body */
+.critique-modal-body {
+  flex: 1;
+  overflow-y: auto;
+  padding: 16px;
+  min-height: 500px;
+}
+
+/* Loading */
+.critique-loading-wrapper {
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  height: 150px;
+}
+
+.critique-loading-inner {
+  text-align: center;
+}
+
+.critique-spinner {
+  width: 28px;
+  height: 28px;
+  border: 2px solid #1eff1c;
+  border-top-color: transparent;
+  border-radius: 50%;
+  margin: 0 auto 10px;
+  animation: critique-spin 1s linear infinite;
+}
+
+.critique-spinner--sm {
+  width: 12px;
+  height: 12px;
+  border: 2px solid white;
+  border-top-color: transparent;
+  border-radius: 50%;
+  animation: critique-spin 1s linear infinite;
+}
+
+@keyframes critique-spin {
+  to { transform: rotate(360deg); }
+}
+
+.critique-loading-text {
+  color: var(--text-secondary, #9ca3af);
+  font-size: 13px;
+}
+
+/* Error */
+.critique-error-box {
+  background: rgba(127, 29, 29, 0.15);
+  border: 1px solid rgba(239, 68, 68, 0.3);
+  border-radius: var(--radius-md, 10px);
+  padding: 12px;
+}
+
+.critique-error-row {
+  display: flex;
+  align-items: flex-start;
+  gap: 10px;
+}
+
+.critique-error-title {
+  color: #f87171;
+  font-weight: 500;
+  margin-bottom: 4px;
+  font-size: 13px;
+}
+
+.critique-error-message {
+  font-size: 12px;
+  color: rgba(252, 165, 165, 0.8);
+}
+
+/* Content layout */
+.critique-content-layout {
+  display: flex;
+  flex-direction: column;
+  gap: 12px;
+  height: 100%;
+}
+
+/* Identity card */
+.critique-identity-card {
+  background: linear-gradient(to right, rgba(20, 83, 45, 0.2), rgba(30, 58, 138, 0.2));
+  border-radius: var(--radius-md, 10px);
+  padding: 10px 12px;
+  border: 1px solid rgba(30, 255, 28, 0.15);
+}
+
+.critique-identity-row {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+}
+
+.critique-identity-label {
+  font-size: 10px;
+  color: var(--text-secondary, #9ca3af);
+  text-transform: uppercase;
+  letter-spacing: 0.05em;
+  margin-bottom: 2px;
+}
+
+.critique-model-name {
+  font-size: 14px;
+  font-weight: 600;
+  color: var(--text-primary, #f3f4f6);
+}
+
+.critique-host-provider {
+  font-size: 11px;
+  color: #6ee7b7;
+}
+
+.critique-date-area {
+  text-align: right;
+}
+
+.critique-date-row {
+  display: flex;
+  align-items: center;
+  gap: 4px;
+  color: var(--text-secondary, #9ca3af);
+  font-size: 11px;
+}
+
+/* Ratings grid */
+.critique-ratings-grid {
+  display: grid;
+  grid-template-columns: repeat(3, 1fr);
+  gap: 8px;
+}
+
+/* Full critique section */
+.critique-full-box {
+  background: rgba(31, 41, 55, 0.4);
+  border-radius: var(--radius-md, 10px);
+  padding: 10px 12px;
+  flex: 1;
+  display: flex;
+  flex-direction: column;
+  min-height: 200px;
+}
+
+.critique-section-label {
+  font-size: 11px;
+  font-weight: 500;
+  color: var(--text-secondary, #d1d5db);
+  margin-bottom: 8px;
+}
+
+.critique-full-text {
+  color: var(--text-secondary, #d1d5db);
+  line-height: 1.5;
+  white-space: pre-wrap;
+  font-size: 12px;
+  flex: 1;
+  overflow-y: auto;
+}
+
+/* History accordion */
+.critique-history-container {
+  border: 1px solid var(--border-subtle, rgba(75, 85, 99, 0.5));
+  border-radius: var(--radius-md, 10px);
+  overflow: hidden;
+}
+
+.critique-history-toggle {
+  width: 100%;
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  padding: 8px 12px;
+  background: rgba(31, 41, 55, 0.25);
+  border: none;
+  cursor: pointer;
+  transition: background-color 0.2s;
+}
+
+.critique-history-toggle:hover {
+  background: rgba(31, 41, 55, 0.4);
+}
+
+.critique-history-label {
+  font-size: 12px;
+  font-weight: 500;
+  color: var(--text-secondary, #d1d5db);
+}
+
+.critique-history-chevron {
+  transition: transform 0.2s;
+}
+
+.critique-history-chevron--open {
+  transform: rotate(180deg);
+}
+
+.critique-history-list {
+  border-top: 1px solid var(--border-subtle, rgba(75, 85, 99, 0.5));
+  max-height: 120px;
+  overflow-y: auto;
+}
+
+.critique-history-item {
+  width: 100%;
+  text-align: left;
+  padding: 8px 12px;
+  background: transparent;
+  border: none;
+  cursor: pointer;
+  transition: background-color 0.2s;
+  border-bottom: 1px solid rgba(75, 85, 99, 0.3);
+}
+
+.critique-history-item:last-child {
+  border-bottom: none;
+}
+
+.critique-history-item:hover {
+  background: rgba(31, 41, 55, 0.3);
+}
+
+.critique-history-item--selected {
+  background: rgba(30, 255, 28, 0.08);
+}
+
+.critique-history-item-row {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+}
+
+.critique-history-model {
+  font-size: 11px;
+  color: var(--text-secondary, #d1d5db);
+}
+
+.critique-history-date {
+  font-size: 10px;
+  color: var(--text-muted, #6b7280);
+}
+
+.critique-history-ratings {
+  display: flex;
+  gap: 8px;
+  margin-top: 2px;
+  font-size: 10px;
+}
+
+/* Empty state */
+.critique-empty-state {
+  display: flex;
+  flex-direction: column;
+  align-items: center;
+  justify-content: center;
+  height: 150px;
+  text-align: center;
+}
+
+.critique-empty-icon {
+  padding: 12px;
+  background: rgba(31, 41, 55, 0.4);
+  border-radius: 50%;
+  margin-bottom: 12px;
+}
+
+.critique-empty-title {
+  font-size: 14px;
+  font-weight: 500;
+  color: var(--text-secondary, #d1d5db);
+  margin-bottom: 6px;
+}
+
+.critique-empty-desc {
+  font-size: 11px;
+  color: var(--text-muted, #6b7280);
+  max-width: 280px;
+}
+
+/* Footer */
+.critique-modal-footer {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  padding: 10px 16px;
+  border-top: 1px solid var(--border-subtle, rgba(75, 85, 99, 0.5));
+  background: rgba(31, 41, 55, 0.25);
+}
+
+.critique-footer-note {
+  font-size: 10px;
+  color: var(--text-muted, #6b7280);
+}
+
+.critique-footer-actions {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+}
+
+.critique-btn-secondary {
+  padding: 6px 12px;
+  font-size: 12px;
+  color: var(--text-secondary, #d1d5db);
+  background: transparent;
+  border: none;
+  cursor: pointer;
+  border-radius: var(--radius-sm, 6px);
+  transition: all 0.2s;
+}
+
+.critique-btn-secondary:hover {
+  background: rgba(255, 255, 255, 0.06);
+}
+
+.critique-btn-primary {
+  display: flex;
+  align-items: center;
+  gap: 6px;
+  padding: 6px 12px;
+  background: #1eff1c;
+  color: #0b2e0b;
+  border: none;
+  border-radius: var(--radius-sm, 6px);
+  font-size: 12px;
+  font-weight: 500;
+  cursor: pointer;
+  transition: background-color 0.2s;
+}
+
+.critique-btn-primary:hover:not(:disabled) {
+  background: #0fcc0d;
+}
+
+.critique-btn-primary:disabled {
+  background: #0d9e0b;
+  cursor: not-allowed;
+  opacity: 0.7;
+}
+
+/* Compact rating card */
+.critique-compact-card {
+  background: rgba(31, 41, 55, 0.4);
+  border-radius: var(--radius-md, 10px);
+  padding: 8px 10px;
+}
+
+.critique-compact-header {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  margin-bottom: 4px;
+}
+
+.critique-compact-label {
+  font-size: 10px;
+  font-weight: 500;
+  color: var(--text-secondary, #d1d5db);
+}
+
+.critique-compact-value {
+  font-size: 14px;
+  font-weight: 700;
+}
+
+.critique-compact-track {
+  height: 4px;
+  background: rgba(55, 65, 81, 1);
+  border-radius: 9999px;
+  overflow: hidden;
+}
+
+.critique-compact-fill {
+  height: 100%;
+  border-radius: 9999px;
+  transition: width 0.5s;
+}
+
+.critique-compact-feedback {
+  font-size: 11px;
+  color: var(--text-secondary, #9ca3af);
+  line-height: 1.5;
+  max-height: 250px;
+  overflow-y: auto;
+}
+
+/* Rating color classes (text) */
+.critique-color--emerald { color: #34d399; }
+.critique-color--blue    { color: #60a5fa; }
+.critique-color--yellow  { color: #facc15; }
+.critique-color--orange  { color: #fb923c; }
+.critique-color--red     { color: #f87171; }
+
+/* Rating color classes (bar fill) */
+.critique-bg--emerald { background-color: #10b981; }
+.critique-bg--blue    { background-color: #3b82f6; }
+.critique-bg--yellow  { background-color: #eab308; }
+.critique-bg--orange  { background-color: #f97316; }
+.critique-bg--red     { background-color: #ef4444; }
+
+/* Icon sizing utilities */
+.critique-icon--sm     { width: 12px; height: 12px; }
+.critique-icon--lg     { width: 32px; height: 32px; }
+.critique-icon--green { color: #1eff1c; }
+.critique-icon--red    { color: #f87171; }
+.critique-icon--muted  { color: var(--text-muted, #6b7280); }
+.critique-icon--close  { width: 16px; height: 16px; }
diff --git a/frontend/src/components/settings-common.css b/frontend/src/components/settings-common.css
new file mode 100644
index 0000000..df7573a
--- /dev/null
+++ b/frontend/src/components/settings-common.css
@@ -0,0 +1,827 @@
+/* ============================================
+   Settings Common — Shared across
+   AggregatorSettings, CompilerSettings,
+   AutonomousResearchSettings
+   ============================================ */
+
+/* Settings wrapper containers */
+.compiler-settings,
+.privacy-warning-modal {
+  display: flex;
+  flex-direction: column;
+  gap: 1.5rem;
+  width: 100%;
+}
+
+/* Provider toggle button group */
+.provider-toggle-group {
+  display: flex;
+  gap: 0.5rem;
+}
+
+.provider-toggle-btn {
+  flex: 1;
+  padding: 0.5rem;
+  border: none;
+  border-radius: var(--radius-sm);
+  color: #fff;
+  cursor: pointer;
+  font-size: 0.8rem;
+  font-weight: 500;
+  transition: all var(--transition-fast);
+  background: var(--surface-4);
+}
+
+.provider-toggle-btn:hover {
+  filter: brightness(1.15);
+}
+
+.provider-toggle-btn.active-lm {
+  background: var(--accent-green);
+}
+
+.provider-toggle-btn.active-or {
+  background: #6c5ce7;
+}
+
+.provider-toggle-btn.active-or-orange {
+  background: #FF6700;
+}
+
+.provider-toggle-btn:disabled {
+  color: var(--text-muted);
+  cursor: not-allowed;
+  opacity: 0.5;
+}
+
+/* Compact form group (margin: 0 override) */
+.form-group--compact {
+  margin: 0;
+}
+
+/* Small labels and inputs */
+.label--sm {
+  font-size: 0.85rem;
+}
+
+.label--muted {
+  color: var(--text-secondary);
+}
+
+.label--lg {
+  font-size: 1.1rem;
+  font-weight: 600;
+}
+
+.select--sm,
+.input--sm {
+  font-size: 0.85rem;
+}
+
+/* Config grid layouts */
+.config-grid {
+  display: grid;
+  gap: 1rem;
+}
+
+.config-grid--2col {
+  grid-template-columns: 1fr 1fr;
+}
+
+.config-grid--3col {
+  grid-template-columns: 1fr 1fr 1fr;
+}
+
+.config-grid--1col {
+  grid-template-columns: 1fr;
+}
+
+/* Hint / help text */
+.hint-text {
+  color: var(--text-secondary);
+  display: block;
+  font-size: 0.85rem;
+  margin-top: 0.5rem;
+  line-height: 1.4;
+}
+
+.hint-text--dim {
+  color: var(--text-muted);
+}
+
+/* Settings section with background */
+.settings-panel {
+  margin-bottom: 2rem;
+  padding: 1rem;
+  background: var(--surface-2);
+  border-radius: var(--radius-md);
+}
+
+.settings-panel--blue {
+  background: rgba(26, 35, 50, 0.8);
+}
+
+.settings-panel--validator {
+  border: 1px solid var(--border-default);
+}
+
+/* Section heading with border */
+.section-heading--bordered {
+  margin-bottom: 1rem;
+  border-bottom: 1px solid var(--border-subtle);
+  padding-bottom: 0.5rem;
+}
+
+/* Settings header row */
+.settings-header-row {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+}
+
+/* Save status message */
+.save-message {
+  color: var(--accent-green);
+  font-size: 0.9rem;
+  font-weight: 500;
+}
+
+/* OpenRouter status banner */
+.openrouter-banner {
+  background: rgba(108, 92, 231, 0.08);
+  border: 1px solid rgba(108, 92, 231, 0.35);
+  border-radius: var(--radius-md);
+  padding: 1rem;
+  margin-bottom: 1.5rem;
+}
+
+.openrouter-banner--orange {
+  background: rgba(255, 103, 0, 0.08);
+  border-color: rgba(255, 103, 0, 0.35);
+}
+
+.openrouter-banner__text {
+  color: #a29bfe;
+  margin: 0;
+}
+
+.openrouter-banner--orange .openrouter-banner__text {
+  color: #FF6700;
+}
+
+/* Submitter / role card */
+.role-config-card {
+  background: var(--surface-2);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-md);
+  padding: 1rem;
+  margin-bottom: 1rem;
+  transition: border-color var(--transition-fast);
+}
+
+.role-config-card--main {
+  border-color: rgba(76, 175, 80, 0.35);
+  background: rgba(26, 36, 40, 0.8);
+}
+
+.role-config-card--openrouter {
+  border-color: rgba(108, 92, 231, 0.35);
+  background: rgba(26, 26, 56, 0.8);
+}
+
+.role-config-card--openrouter-orange {
+  border-color: rgba(255, 103, 0, 0.35);
+  background: rgba(26, 26, 46, 0.8);
+}
+
+.role-config-card--highlight {
+  border-width: 2px;
+}
+
+/* Card header */
+.card-header-row {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  margin-bottom: 1rem;
+}
+
+/* Card title colours */
+.card-title--green { color: var(--accent-green); }
+.card-title--purple { color: #a29bfe; }
+.card-title--orange { color: #FF6700; }
+
+/* Inline provider badge */
+.provider-badge-inline {
+  font-weight: normal;
+  margin-left: 0.5rem;
+}
+
+/* Apply-to-all button */
+.btn-apply-all {
+  font-size: 0.8rem;
+  padding: 0.3rem 0.6rem;
+  background: var(--accent-green);
+  border: none;
+  border-radius: var(--radius-sm);
+  cursor: pointer;
+  color: #fff;
+  transition: all var(--transition-fast);
+}
+
+.btn-apply-all:hover {
+  filter: brightness(1.15);
+}
+
+/* Checkbox label for settings */
+.settings-checkbox-label {
+  display: inline-flex;
+  align-items: center;
+  font-size: 0.9rem;
+  cursor: pointer;
+}
+
+.settings-checkbox-label input[type="checkbox"] {
+  margin-right: 0.5rem;
+  cursor: pointer;
+}
+
+.settings-checkbox-label--stacked {
+  display: grid;
+  grid-template-columns: auto minmax(0, 1fr);
+  width: 100%;
+  align-items: flex-start;
+  gap: 0.75rem;
+}
+
+.settings-checkbox-label--stacked input[type="checkbox"] {
+  margin-right: 0;
+  margin-top: 0.2rem;
+  flex-shrink: 0;
+}
+
+.settings-option-copy {
+  display: block;
+  min-width: 0;
+}
+
+.settings-option-title {
+  display: block;
+  color: var(--text-primary);
+  font-weight: 500;
+  line-height: 1.35;
+}
+
+.settings-option-description {
+  display: block;
+  margin-top: 0.25rem;
+  color: var(--text-secondary);
+  font-size: 0.85rem;
+  line-height: 1.45;
+}
+
+/* Inline info/help icon */
+.help-hint {
+  margin-left: 0.4rem;
+  cursor: help;
+  color: var(--text-secondary);
+  font-size: 0.85rem;
+}
+
+/* Spacing utilities (generic margin helpers) */
+.mr-05 { margin-right: 0.5rem; }
+.ml-05 { margin-left: 0.5rem; }
+.mt-1 { margin-top: 1rem; }
+.mb-2 { margin-bottom: 2rem; }
+
+/* Range slider */
+.range-slider {
+  width: 100%;
+  margin-top: 0.5rem;
+}
+
+.range-labels {
+  display: flex;
+  justify-content: space-between;
+  font-size: 0.8rem;
+  color: var(--text-secondary);
+}
+
+/* Config summary pre */
+.config-summary-pre {
+  color: var(--accent-green);
+  font-size: 0.85rem;
+  overflow: auto;
+}
+
+/* Error text */
+.error-text {
+  color: var(--accent-red);
+}
+
+/* Success text inline */
+.status-success-text {
+  color: var(--accent-green);
+  font-size: 0.85rem;
+}
+
+/* Dark text input */
+.input-dark {
+  padding: 0.5rem;
+  background: var(--surface-3);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-sm);
+  color: var(--text-primary);
+  width: 100%;
+}
+
+.input-dark:focus {
+  outline: none;
+  border-color: var(--gold-dim);
+  box-shadow: 0 0 0 3px var(--gold-glow);
+}
+
+/* Dark textarea (monospace) */
+.textarea-dark-mono {
+  width: 100%;
+  min-height: 200px;
+  padding: 0.75rem;
+  background: var(--surface-3);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-sm);
+  color: var(--text-primary);
+  font-family: monospace;
+  font-size: 0.85rem;
+  resize: vertical;
+  line-height: 1.5;
+}
+
+.textarea-dark-mono:focus {
+  outline: none;
+  border-color: var(--gold-dim);
+  box-shadow: 0 0 0 3px var(--gold-glow);
+}
+
+/* Ghost / outline button */
+.btn-ghost {
+  padding: 0.5rem 1rem;
+  background: transparent;
+  border: 1px solid var(--border-strong);
+  border-radius: var(--radius-sm);
+  color: var(--text-secondary);
+  cursor: pointer;
+  transition: all var(--transition-fast);
+}
+
+.btn-ghost:hover {
+  background: var(--surface-3);
+  color: var(--text-primary);
+}
+
+/* Green primary button (smaller) */
+.btn-success-sm {
+  padding: 0.5rem 1rem;
+  background: var(--accent-green);
+  border: none;
+  border-radius: var(--radius-sm);
+  color: #fff;
+  cursor: pointer;
+  font-weight: 500;
+  transition: all var(--transition-fast);
+}
+
+.btn-success-sm:hover:not(:disabled) {
+  filter: brightness(1.15);
+}
+
+.btn-success-sm:disabled {
+  opacity: 0.5;
+  cursor: not-allowed;
+}
+
+/* Blue primary button */
+.btn-primary-blue {
+  background: var(--accent-blue);
+  border: none;
+  color: #fff;
+  border-radius: var(--radius-sm);
+  cursor: pointer;
+  transition: all var(--transition-fast);
+}
+
+.btn-primary-blue:hover {
+  filter: brightness(1.15);
+}
+
+/* Purple accent button */
+.btn-accent-purple {
+  padding: 0.5rem 1.5rem;
+  background: #9b59b6;
+  border: none;
+  border-radius: var(--radius-sm);
+  color: #fff;
+  cursor: pointer;
+  font-weight: 500;
+  font-size: 0.85rem;
+  transition: all var(--transition-fast);
+}
+
+.btn-accent-purple:hover {
+  filter: brightness(1.15);
+}
+
+/* Test result banner */
+.test-result-banner {
+  margin-top: 0.75rem;
+  padding: 0.5rem 0.75rem;
+  border-radius: var(--radius-sm);
+  font-size: 0.85rem;
+}
+
+.test-result-banner--success {
+  background: rgba(76, 175, 80, 0.1);
+  color: var(--accent-green);
+}
+
+.test-result-banner--error {
+  background: rgba(244, 67, 54, 0.1);
+  color: #ff6b6b;
+}
+
+/* Collapsible / Accordion */
+.collapsible-trigger {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 0.75rem;
+  cursor: pointer;
+  padding: 0.75rem;
+  background: var(--surface-2);
+  border-radius: var(--radius-sm);
+  border: 1px solid var(--border-subtle);
+  width: 100%;
+  max-width: 100%;
+  box-sizing: border-box;
+  transition: background var(--transition-fast);
+}
+
+.collapsible-trigger:hover {
+  background: var(--surface-3);
+}
+
+.collapsible-trigger:focus-visible {
+  outline: 2px solid var(--accent-blue);
+  outline-offset: 2px;
+}
+
+.collapsible-body {
+  padding: 1rem;
+  background: var(--surface-2);
+  border-radius: var(--radius-sm);
+  border: 1px solid var(--border-subtle);
+}
+
+.settings-heading-stack {
+  display: flex;
+  flex: 1;
+  flex-direction: column;
+  gap: 0.3rem;
+  min-width: 0;
+}
+
+.settings-trigger--multiline {
+  align-items: flex-start;
+}
+
+.settings-trigger-copy {
+  display: flex;
+  flex: 1;
+  flex-direction: column;
+  gap: 0.35rem;
+  min-width: 0;
+}
+
+.settings-trigger-title-row {
+  display: flex;
+  align-items: center;
+  flex-wrap: wrap;
+  gap: 0.5rem;
+  min-width: 0;
+}
+
+.settings-trigger-title {
+  margin: 0;
+  line-height: 1.35;
+}
+
+.settings-advanced-content {
+  display: flex;
+  flex-direction: column;
+  gap: 1rem;
+}
+
+.settings-subsection {
+  display: flex;
+  flex-direction: column;
+  gap: 0.85rem;
+  padding: 1rem;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-sm);
+}
+
+.settings-subsection--accent-danger {
+  border-left: 4px solid #ff6b6b;
+}
+
+.settings-subsection-header {
+  display: flex;
+  flex-direction: column;
+  gap: 0.35rem;
+}
+
+.settings-subsection-title {
+  margin: 0;
+  color: var(--text-primary);
+  font-size: 1rem;
+}
+
+.settings-subsection-description {
+  margin: 0;
+  color: var(--text-secondary);
+  font-size: 0.85rem;
+  line-height: 1.45;
+}
+
+.collapse-chevron {
+  transition: transform 0.2s;
+  font-size: 1.2rem;
+  flex-shrink: 0;
+  margin-top: 0.1rem;
+}
+
+.collapse-chevron--open {
+  transform: rotate(180deg);
+}
+
+/* Custom tag badge */
+.tag-badge {
+  padding: 2px 8px;
+  border-radius: var(--radius-pill);
+  font-size: 0.7rem;
+  font-weight: bold;
+}
+
+.tag-badge--purple {
+  background: #9b59b6;
+  color: #fff;
+}
+
+/* Actions row (space-between) */
+.actions-row {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  margin-top: 1rem;
+}
+
+/* Description text below role title */
+.role-description {
+  color: var(--text-secondary);
+  display: block;
+  margin-bottom: 1rem;
+  font-size: 0.85rem;
+}
+
+/* Muted paragraph */
+.text-muted-sm {
+  color: var(--text-secondary);
+  font-size: 0.85rem;
+  margin-bottom: 1rem;
+}
+
+/* Indented sub-section (Wolfram, etc.) */
+.indented-section {
+  margin-left: 1.75rem;
+  margin-top: 1rem;
+}
+
+/* Settings group accent border */
+.settings-group--accent-danger {
+  border-left: 4px solid #ff6b6b;
+  padding-left: 12px;
+}
+
+/* Ranking badges (sidebar medals) */
+.ranking-badge {
+  padding: 2px 8px;
+  border-radius: var(--radius-pill);
+  font-size: 0.7rem;
+  font-weight: bold;
+  color: #000;
+  letter-spacing: 0.03em;
+}
+
+.ranking-badge--gold {
+  background:
+    linear-gradient(120deg, rgba(255, 255, 255, 0.72) 0%, rgba(255, 255, 255, 0.22) 18%, rgba(255, 255, 255, 0.02) 34%),
+    linear-gradient(135deg, #fff7bf 0%, #ffe27a 18%, #ffc93b 46%, #d58d00 100%);
+  color: #2c1700;
+  box-shadow:
+    0 0 0 1px rgba(255, 219, 96, 0.78),
+    0 0 14px rgba(255, 200, 40, 0.38),
+    inset 0 1px 0 rgba(255, 255, 255, 0.55),
+    inset 0 -1px 0 rgba(120, 70, 0, 0.2);
+  text-shadow: 0 1px 0 rgba(255, 255, 255, 0.35);
+}
+
+.ranking-badge--silver {
+  background: linear-gradient(135deg, #c0c0c0, #e0e0e0);
+  box-shadow: 0 0 6px rgba(192, 192, 192, 0.4);
+}
+
+.ranking-badge--bronze {
+  background: linear-gradient(135deg, #cd7f32, #e8a860);
+  color: #120900;
+  box-shadow: 0 0 6px rgba(205, 127, 50, 0.4);
+}
+
+/* Model item ranked card (sidebar) */
+.models-podium {
+  background: linear-gradient(180deg, rgba(255, 215, 96, 0.09) 0%, rgba(201, 133, 0, 0.04) 100%);
+  border: 1px solid rgba(255, 215, 96, 0.18);
+}
+
+.models-podium-label {
+  color: rgba(255, 220, 120, 0.72);
+  text-shadow: 0 0 10px rgba(255, 204, 51, 0.18);
+}
+
+.model-item--ranked {
+  border-radius: var(--radius-sm);
+  box-shadow: var(--shadow-sm);
+  padding-left: 12px;
+}
+
+.model-item--gold {
+  border-left: 5px solid #f4c430;
+  background: linear-gradient(180deg, rgba(255, 214, 92, 0.08) 0%, rgba(255, 194, 57, 0.03) 100%);
+  box-shadow:
+    0 0 0 1px rgba(255, 208, 90, 0.16),
+    var(--shadow-sm);
+}
+
+.model-item--gold:hover {
+  background: linear-gradient(180deg, rgba(255, 220, 110, 0.14) 0%, rgba(255, 194, 57, 0.06) 100%);
+  border-color: rgba(255, 211, 95, 0.45);
+}
+
+.model-item--silver { border-left: 5px solid #c0c0c0; }
+.model-item--bronze { border-left: 5px solid #cd7f32; }
+
+/* Info tooltip button (? circle) */
+.info-tooltip-btn {
+  background: transparent;
+  padding: 0;
+  border-radius: var(--radius-sm);
+  cursor: pointer;
+  font-weight: bold;
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  transition: all var(--transition-fast);
+}
+
+.info-tooltip-btn--orange {
+  border: 2px solid #FF6700;
+  color: #FF6700;
+  font-size: 0.7rem;
+  width: 16px;
+  height: 16px;
+}
+
+.info-tooltip-btn--gold {
+  border: 2px solid #f4c430;
+  color: #ffd54a;
+  box-shadow: 0 0 8px rgba(255, 204, 51, 0.22);
+  font-size: 0.8rem;
+  width: 20px;
+  height: 20px;
+}
+
+.info-tooltip-btn:hover {
+  filter: brightness(1.3);
+}
+
+/* Tooltip popup */
+.tooltip-popup {
+  background: var(--surface-2);
+  border: 2px solid #FF6700;
+  border-radius: var(--radius-sm);
+  padding: 12px 16px;
+  font-size: 0.85rem;
+  color: #FF6700;
+  font-weight: 500;
+  box-shadow: var(--shadow-lg);
+  pointer-events: none;
+  z-index: 1000;
+}
+
+.tooltip-popup--absolute {
+  position: absolute;
+  top: calc(100% + 8px);
+  left: 50%;
+  transform: translateX(-50%);
+}
+
+.tooltip-popup--fixed {
+  position: fixed;
+}
+
+/*
+ * sidebar-escape tooltip: uses position:fixed instead of absolute so it can
+ * break out of the narrow left sidebar without being clipped or squished.
+ * left: 276px is a hard-coded viewport offset meant to clear the sidebar's right edge.
+ * top: 112px aligns it with roughly where the "?" button sits in the sidebar header.
+ * Adjust left/top if the sidebar width or header height ever changes.
+ */
+.tooltip-popup--sidebar-escape {
+  position: fixed;
+  left: 276px;
+  top: 112px;
+  width: 340px;
+  z-index: 9999;
+}
+
+/* Tooltip anchor wrapper */
+.tooltip-anchor {
+  position: relative;
+  display: inline-block;
+}
+
+/* Modal overlay and content (shared by inline modals) */
+.inline-modal-overlay {
+  position: fixed;
+  top: 0;
+  left: 0;
+  right: 0;
+  bottom: 0;
+  background: rgba(0, 0, 0, 0.65);
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  z-index: 9999;
+  backdrop-filter: blur(4px);
+}
+
+.inline-modal-content {
+  background: var(--surface-2);
+  padding: 2rem;
+  border-radius: var(--radius-md);
+  border: 1px solid var(--border-default);
+  min-width: 400px;
+  box-shadow: var(--shadow-lg);
+}
+
+.inline-modal-content h3 {
+  margin-top: 0;
+}
+
+/* Model refresh controls row */
+.model-refresh-controls {
+  display: flex;
+  flex-wrap: wrap;
+  align-items: center;
+  gap: 0.5rem;
+  margin-bottom: 1rem;
+}
+
+.model-refresh-controls__toggle {
+  white-space: nowrap;
+  font-size: 0.85rem;
+  gap: 0.35rem;
+}
+
+.model-refresh-controls__toggle input[type="checkbox"] {
+  margin-right: 0.35rem !important;
+}
+
+/* Flex column for checkbox groups */
+.checkbox-group-col {
+  display: flex;
+  flex-direction: column;
+  gap: 0.4rem;
+  margin-top: 0.5rem;
+}
+
+/* Flex row utility (generic) */
+.flex-row-center {
+  display: flex;
+  align-items: center;
+  gap: 0.5rem;
+}
+
+/* Medium-weight label text */
+.label-medium {
+  font-weight: 500;
+}
diff --git a/frontend/src/index.css b/frontend/src/index.css
index 890c716..1df006f 100644
--- a/frontend/src/index.css
+++ b/frontend/src/index.css
@@ -1,3 +1,60 @@
+/* ============================================
+   Design Tokens
+   ============================================ */
+:root {
+  /* Surface hierarchy (darkest → lightest) */
+  --surface-0: #0b0b0f;
+  --surface-1: #131318;
+  --surface-2: #1a1a22;
+  --surface-3: #22222c;
+  --surface-4: #2a2a36;
+
+  /* Brand highlight palette (legacy variable names kept for compatibility) */
+  --gold: #1eff1c;
+  --gold-dim: #18cc17;
+  --gold-glow: rgba(30, 255, 28, 0.12);
+
+  /* Semantic accent colours (unchanged hues, new aliases) */
+  --accent-green: #4CAF50;
+  --accent-blue: #2196F3;
+  --accent-purple: #9C27B0;
+  --accent-red: #f44336;
+  --accent-orange: #ff9800;
+
+  /* Text */
+  --text-primary: #e4e4ec;
+  --text-secondary: #9d9db0;
+  --text-muted: #666680;
+
+  /* Borders & dividers */
+  --border-subtle: rgba(255, 255, 255, 0.07);
+  --border-default: rgba(255, 255, 255, 0.10);
+  --border-strong: rgba(255, 255, 255, 0.16);
+
+  /* Radii */
+  --radius-sm: 6px;
+  --radius-md: 10px;
+  --radius-lg: 14px;
+  --radius-pill: 100px;
+
+  /* Shadows (layered for depth) */
+  --shadow-sm: 0 1px 3px rgba(0,0,0,0.4), 0 1px 2px rgba(0,0,0,0.3);
+  --shadow-md: 0 4px 12px rgba(0,0,0,0.45), 0 2px 4px rgba(0,0,0,0.3);
+  --shadow-lg: 0 8px 28px rgba(0,0,0,0.5), 0 4px 8px rgba(0,0,0,0.3);
+  --shadow-gold: 0 4px 16px rgba(30, 255, 28, 0.18);
+
+  /* Transitions */
+  --ease-out: cubic-bezier(0.22, 1, 0.36, 1);
+  --transition-fast: 0.15s var(--ease-out);
+  --transition-normal: 0.25s var(--ease-out);
+
+  /* Legacy compatibility aliases used by AutonomousResearch.css */
+  --bg-primary: var(--surface-2);
+  --bg-secondary: var(--surface-2);
+  --bg-tertiary: var(--surface-3);
+  --border-color: var(--border-default);
+}
+
 * {
   margin: 0;
   padding: 0;
@@ -5,13 +62,14 @@
 }
 
 body {
-  font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', 'Roboto', 'Oxygen',
+  font-family: 'Inter', -apple-system, BlinkMacSystemFont, 'Segoe UI', 'Roboto', 'Oxygen',
     'Ubuntu', 'Cantarell', 'Fira Sans', 'Droid Sans', 'Helvetica Neue',
     sans-serif;
   -webkit-font-smoothing: antialiased;
   -moz-osx-font-smoothing: grayscale;
-  background: #0f0f0f;
-  color: #e0e0e0;
+  background: var(--surface-0);
+  color: var(--text-primary);
+  line-height: 1.5;
 }
 
 code {
@@ -34,12 +92,14 @@ code {
    Banner & Logo Section
    ============================================ */
 .app-banner {
-  background: linear-gradient(135deg, #1a1a1a 0%, #2a2a2a 50%, #1a1a1a 100%);
-  border-bottom: 2px solid #ffd700;
-  padding: 1.25rem 2rem;
+  background: linear-gradient(160deg, var(--surface-1) 0%, var(--surface-3) 50%, var(--surface-1) 100%);
+  border-bottom: 1px solid var(--gold-dim);
+  box-shadow: 0 2px 20px rgba(30, 255, 28, 0.08);
+  padding: 1.5rem 2rem;
   text-align: center;
   position: relative;
   overflow: hidden;
+  isolation: isolate;
 }
 
 /* Subtle animated gradient shimmer effect */
@@ -53,9 +113,9 @@ code {
   background: linear-gradient(
     90deg,
     transparent 0%,
-    rgba(255, 215, 0, 0.03) 25%,
-    rgba(255, 215, 0, 0.06) 50%,
-    rgba(255, 215, 0, 0.03) 75%,
+    rgba(30, 255, 28, 0.03) 25%,
+    rgba(30, 255, 28, 0.06) 50%,
+    rgba(30, 255, 28, 0.03) 75%,
     transparent 100%
   );
   animation: banner-shimmer 8s ease-in-out infinite;
@@ -80,6 +140,8 @@ code {
 .banner-content {
   position: relative;
   z-index: 1;
+  transform: translateZ(0);
+  backface-visibility: hidden;
 }
 
 .banner-title {
@@ -95,32 +157,37 @@ code {
 }
 
 .banner-moto {
-  color: #ffd700;
+  color: var(--gold); /* brand highlight token defined in :root */
   text-shadow: 
-    0 0 10px rgba(255, 215, 0, 0.4),
-    0 0 20px rgba(255, 215, 0, 0.2);
+    0 0 10px rgba(30, 255, 28, 0.4),
+    0 0 20px rgba(30, 255, 28, 0.2);
   letter-spacing: 3px;
   font-weight: 800;
 }
 
 .banner-subtitle {
-  color: #e0e0e0;
+  color: var(--gold); /* brand highlight token defined in :root */
+  text-shadow:
+    0 0 10px rgba(30, 255, 28, 0.4),
+    0 0 20px rgba(30, 255, 28, 0.2);
   font-weight: 500;
 }
 
 .banner-variant {
   color: #ffa726;
   font-size: 0.95rem;
-  margin: 0.25rem 0 0.5rem 0;
+  margin: 0.85rem 0 0 0;
   font-weight: 500;
   letter-spacing: 0.5px;
   font-style: italic;
+  transform: translateZ(0);
+  backface-visibility: hidden;
 }
 
 .banner-company {
-  color: #888;
+  color: #ffffff;
   font-size: 0.85rem;
-  margin: 0;
+  margin: 0.1rem 0 0;
   letter-spacing: 1px;
   font-weight: 400;
 }
@@ -142,6 +209,7 @@ code {
   
   .banner-variant {
     font-size: 0.85rem;
+    margin-top: 0.65rem;
   }
   
   .banner-company {
@@ -159,6 +227,7 @@ code {
   gap: 6px;
   align-items: flex-end;
   transition: right 0.15s ease; /* Fast slide animation - matches panel speed */
+  transform: translateZ(0);
 }
 
 /* When workflow panel is collapsed, slide buttons to the right edge */
@@ -166,69 +235,116 @@ code {
   right: 60px; /* Positioned next to collapsed panel (50px + 10px margin) */
 }
 
+.mode-switch-control {
+  min-width: 250px;
+  padding: 0.7rem 0.8rem 0.8rem;
+  background: rgba(11, 11, 15, 0.92);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-md);
+  box-shadow: var(--shadow-md);
+  backdrop-filter: blur(8px);
+}
+
+.mode-switch-label {
+  display: block;
+  margin-bottom: 0.45rem;
+  color: var(--text-secondary);
+  font-size: 0.72rem;
+  font-weight: 700;
+  letter-spacing: 0.08em;
+  text-transform: uppercase;
+}
+
+.mode-switch-select {
+  min-width: 0;
+  padding: 0.6rem 0.8rem;
+  background: linear-gradient(180deg, var(--surface-2), var(--surface-1));
+  border: 1px solid var(--border-strong);
+  color: var(--text-primary);
+  font-size: 0.9rem;
+  font-weight: 600;
+  cursor: pointer;
+  box-shadow: inset 0 1px 0 rgba(255, 255, 255, 0.04);
+}
+
+.mode-switch-select:hover {
+  border-color: rgba(30, 255, 28, 0.28);
+}
+
+.mode-switch-select option {
+  color: #000;
+  background: #fff;
+}
+
 .boost-btn {
-  background: linear-gradient(135deg, #ffd700 0%, #ffed4e 100%);
+  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
   color: #000;
   border: none;
   padding: 0.5rem 1rem;
-  border-radius: 6px;
+  border-radius: var(--radius-sm);
   font-size: 0.9rem;
   font-weight: 700;
   cursor: pointer;
-  box-shadow: 0 4px 12px rgba(255, 215, 0, 0.3);
-  transition: all 0.2s ease;
+  box-shadow: var(--shadow-gold);
+  transition: all var(--transition-fast);
   white-space: nowrap;
 }
 
 .boost-btn:hover {
   transform: translateY(-2px);
-  box-shadow: 0 6px 16px rgba(255, 215, 0, 0.4);
+  box-shadow: 0 6px 20px rgba(30, 255, 28, 0.35);
 }
 
 .boost-logs-btn {
-  background: linear-gradient(135deg, #ff9800 0%, #ffb74d 100%);
+  background: linear-gradient(135deg, var(--accent-orange) 0%, #ffb74d 100%);
   color: #000;
   border: none;
   padding: 0.4rem 0.8rem;
-  border-radius: 6px;
+  border-radius: var(--radius-sm);
   font-size: 0.85rem;
   font-weight: 600;
   cursor: pointer;
-  box-shadow: 0 3px 10px rgba(255, 152, 0, 0.3);
-  transition: all 0.2s ease;
+  box-shadow: 0 3px 10px rgba(255, 152, 0, 0.25);
+  transition: all var(--transition-fast);
   white-space: nowrap;
   width: fit-content;
 }
 
 .boost-logs-btn:hover {
   transform: translateY(-2px);
-  box-shadow: 0 5px 14px rgba(255, 152, 0, 0.4);
+  box-shadow: 0 5px 14px rgba(255, 152, 0, 0.35);
 }
 
 .tabs {
   display: flex;
-  gap: 1px;
-  background: #1a1a1a;
-  padding: 1rem;
-  padding-right: 150px; /* Leave room for API Boost button */
-  border-bottom: 2px solid #333;
-  flex-wrap: nowrap; /* Changed from wrap to nowrap */
+  gap: 4px;
+  background: var(--surface-1);
+  padding: 0.75rem 1rem;
+  padding-right: 150px;
+  border-bottom: 1px solid var(--border-subtle);
+  flex-wrap: nowrap;
+}
+
+.tabs.tabs-manual {
+  flex-wrap: wrap;
+  row-gap: 0.5rem;
 }
 
 .tab {
-  padding: 0.75rem 1.5rem;
-  background: #2a2a2a;
-  border: none;
-  color: #999;
+  padding: 0.65rem 1.25rem;
+  background: var(--surface-3);
+  border: 1px solid transparent;
+  color: var(--text-secondary);
   cursor: pointer;
-  font-size: 0.95rem;
-  transition: all 0.2s;
+  font-size: 0.9rem;
+  border-radius: var(--radius-sm);
+  transition: all var(--transition-fast);
 }
 
 /* Tab with subtext - increase height to accommodate two lines */
 .tab-with-subtext {
-  padding: 0.5rem 1.5rem;
-  min-height: 60px;
+  padding: 0.45rem 1.25rem;
+  min-height: 56px;
   display: flex;
   align-items: center;
 }
@@ -241,31 +357,33 @@ code {
 }
 
 .tab-main-label {
-  font-size: 0.95rem;
+  font-size: 0.9rem;
   line-height: 1.2;
 }
 
 .tab-subtext {
   font-size: 0.65rem;
-  color: #ff4444;
+  color: var(--accent-red);
   font-weight: 500;
   line-height: 1;
   white-space: nowrap;
 }
 
 .tab-subtext.green {
-  color: #44bb44;
+  color: var(--accent-green);
 }
 
 .tab:hover {
-  background: #333;
-  color: #fff;
+  background: var(--surface-4);
+  color: var(--text-primary);
+  border-color: var(--border-subtle);
 }
 
 .tab.active {
-  background: #0f0f0f;
-  color: #4CAF50;
-  border-bottom: 2px solid #4CAF50;
+  background: var(--surface-0);
+  color: var(--accent-green);
+  border-color: var(--accent-green);
+  box-shadow: inset 0 -2px 0 var(--accent-green);
 }
 
 .tab-content {
@@ -300,18 +418,26 @@ h2 {
 label {
   display: block;
   margin-bottom: 0.5rem;
-  color: #ccc;
+  color: var(--text-secondary);
   font-weight: 500;
+  font-size: 0.9rem;
 }
 
 input, textarea, select {
   width: 100%;
-  padding: 0.75rem;
-  background: #1a1a1a;
-  border: 1px solid #333;
-  color: #e0e0e0;
-  border-radius: 4px;
+  padding: 0.7rem 0.85rem;
+  background: var(--surface-1);
+  border: 1px solid var(--border-default);
+  color: var(--text-primary);
+  border-radius: var(--radius-sm);
   font-size: 0.95rem;
+  transition: border-color var(--transition-fast), box-shadow var(--transition-fast);
+}
+
+input:focus, textarea:focus, select:focus {
+  outline: none;
+  border-color: var(--gold-dim);
+  box-shadow: 0 0 0 3px var(--gold-glow);
 }
 
 textarea {
@@ -321,84 +447,102 @@ textarea {
 }
 
 button {
-  padding: 0.75rem 1.5rem;
-  background: #4CAF50;
+  padding: 0.65rem 1.35rem;
+  background: var(--accent-green);
   color: white;
   border: none;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   cursor: pointer;
   font-size: 0.95rem;
   font-weight: 600;
-  transition: background 0.2s;
+  transition: all var(--transition-fast);
 }
 
 button:hover {
-  background: #45a049;
+  filter: brightness(1.1);
+  transform: translateY(-1px);
+}
+
+button:active {
+  transform: translateY(0);
 }
 
 button:disabled {
-  background: #555;
+  background: var(--surface-4);
   cursor: not-allowed;
+  transform: none;
+  filter: none;
+  opacity: 0.6;
 }
 
 button.secondary {
-  background: #666;
+  background: var(--surface-4);
 }
 
 button.secondary:hover {
-  background: #777;
+  background: var(--surface-3);
+  filter: brightness(1.2);
 }
 
 button.danger {
-  background: #f44336;
+  background: var(--accent-red);
 }
 
 button.danger:hover {
-  background: #da190b;
+  filter: brightness(1.15);
 }
 
 .status-badge {
   display: inline-block;
   padding: 0.25rem 0.75rem;
-  border-radius: 12px;
+  border-radius: var(--radius-pill);
   font-size: 0.85rem;
   font-weight: 600;
 }
 
 .status-running {
-  background: #4CAF50;
-  color: white;
+  background: rgba(76, 175, 80, 0.15);
+  color: var(--accent-green);
+  box-shadow: 0 0 8px rgba(76, 175, 80, 0.2);
 }
 
 .status-stopped {
-  background: #666;
-  color: white;
+  background: var(--surface-4);
+  color: var(--text-secondary);
 }
 
 .metric-card {
-  background: #1a1a1a;
+  background: var(--surface-2);
   padding: 1.25rem;
-  border-radius: 6px;
-  border: 1px solid #333;
+  border-radius: var(--radius-md);
+  border: 1px solid var(--border-subtle);
   margin-bottom: 1rem;
+  box-shadow: var(--shadow-sm);
+  transition: border-color var(--transition-fast), box-shadow var(--transition-fast);
+}
+
+.metric-card:hover {
+  border-color: var(--border-default);
 }
 
 .metric-label {
-  color: #999;
-  font-size: 0.85rem;
-  margin-bottom: 0.25rem;
+  color: var(--text-muted);
+  font-size: 0.8rem;
+  margin-bottom: 0.35rem;
+  text-transform: uppercase;
+  letter-spacing: 0.5px;
 }
 
 .metric-value {
-  color: #fff;
+  color: var(--text-primary);
   font-size: 1.5rem;
   font-weight: 700;
 }
 
 .event-log {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1rem;
   max-height: 400px;
   overflow-y: auto;
@@ -407,9 +551,10 @@ button.danger:hover {
 }
 
 .event-item {
-  padding: 0.5rem;
-  border-bottom: 1px solid #222;
-  margin-bottom: 0.5rem;
+  padding: 0.5rem 0.65rem;
+  border-bottom: 1px solid var(--border-subtle);
+  margin-bottom: 0.25rem;
+  border-radius: var(--radius-sm);
 }
 
 .event-item:last-child {
@@ -417,59 +562,63 @@ button.danger:hover {
 }
 
 .event-time {
-  color: #666;
+  color: var(--text-muted);
   font-size: 0.75rem;
 }
 
 .event-accept {
-  color: #4CAF50;
+  color: var(--accent-green);
 }
 
 .event-reject {
-  color: #f44336;
+  color: var(--accent-red);
 }
 
 /* Event styling classes for compiler logs */
 .event-success {
-  background: rgba(76, 175, 80, 0.1);
-  border-left: 3px solid #4CAF50;
+  background: rgba(76, 175, 80, 0.08);
+  border-left: 3px solid var(--accent-green);
+  border-radius: var(--radius-sm);
 }
 
 .event-success .event-type {
-  color: #4CAF50;
+  color: var(--accent-green);
 }
 
 .event-error {
-  background: rgba(244, 67, 54, 0.1);
-  border-left: 3px solid #f44336;
+  background: rgba(244, 67, 54, 0.08);
+  border-left: 3px solid var(--accent-red);
+  border-radius: var(--radius-sm);
 }
 
 .event-error .event-type {
-  color: #f44336;
+  color: var(--accent-red);
 }
 
 .event-info {
-  background: rgba(33, 150, 243, 0.1);
-  border-left: 3px solid #2196F3;
+  background: rgba(33, 150, 243, 0.08);
+  border-left: 3px solid var(--accent-blue);
+  border-radius: var(--radius-sm);
 }
 
 .event-info .event-type {
-  color: #2196F3;
+  color: var(--accent-blue);
 }
 
 .event-warning {
-  background: rgba(255, 152, 0, 0.1);
-  border-left: 3px solid #ff9800;
+  background: rgba(255, 152, 0, 0.08);
+  border-left: 3px solid var(--accent-orange);
+  border-radius: var(--radius-sm);
 }
 
 .event-warning .event-type {
-  color: #ff9800;
+  color: var(--accent-orange);
 }
 
 .results-container {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1.5rem;
   min-height: 500px;
   max-height: 700px;
@@ -478,6 +627,7 @@ button.danger:hover {
   font-size: 0.9rem;
   white-space: pre-wrap;
   line-height: 1.6;
+  box-shadow: var(--shadow-sm);
 }
 
 .button-group {
@@ -511,10 +661,9 @@ button.danger:hover {
     font-size: 0.85rem;
     padding: 0.5rem 1rem;
   }
-  
-  .expandable-content {
-    flex-direction: column;
-    gap: 1rem;
+
+  .mode-switch-control {
+    min-width: 220px;
   }
   
   .app-header {
@@ -535,15 +684,15 @@ button.danger:hover {
 }
 
 .current-mode {
-  background: #1a1a1a;
+  background: var(--surface-2);
   padding: 1rem;
-  border-radius: 6px;
-  border: 1px solid #333;
+  border-radius: var(--radius-md);
+  border: 1px solid var(--border-subtle);
   margin-bottom: 1.5rem;
 }
 
 .mode-highlight {
-  color: #4CAF50;
+  color: var(--accent-green);
   font-weight: 700;
   text-transform: uppercase;
 }
@@ -556,7 +705,7 @@ button.danger:hover {
 }
 
 .metric-rate {
-  color: #4CAF50;
+  color: var(--accent-green);
   font-size: 1rem;
   font-weight: 600;
   margin-top: 0.5rem;
@@ -567,23 +716,23 @@ button.danger:hover {
 }
 
 .events-list {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1rem;
   max-height: 500px;
   overflow-y: auto;
 }
 
 .no-events {
-  color: #666;
+  color: var(--text-muted);
   text-align: center;
   padding: 2rem;
   font-style: italic;
 }
 
 .event-data {
-  color: #999;
+  color: var(--text-secondary);
   font-size: 0.85rem;
   margin-left: 1rem;
   white-space: pre-wrap;
@@ -591,33 +740,33 @@ button.danger:hover {
 }
 
 .event-type {
-  color: #4CAF50;
+  color: var(--accent-green);
   font-weight: 600;
   margin-left: 0.5rem;
 }
 
 .info-section {
-  background: #1a1a1a;
+  background: var(--surface-2);
   padding: 1.5rem;
-  border-radius: 6px;
-  border: 1px solid #333;
+  border-radius: var(--radius-md);
+  border: 1px solid var(--border-subtle);
   margin-top: 2rem;
 }
 
 .info-section h4 {
-  color: #fff;
+  color: var(--text-primary);
   margin-bottom: 0.75rem;
   font-size: 1.1rem;
 }
 
 .info-section p {
-  color: #ccc;
+  color: var(--text-secondary);
   margin-bottom: 0.5rem;
   line-height: 1.6;
 }
 
 .info-section ul {
-  color: #ccc;
+  color: var(--text-secondary);
   margin-left: 1.5rem;
   line-height: 1.8;
 }
@@ -627,7 +776,7 @@ button.danger:hover {
 }
 
 .info-text {
-  color: #999;
+  color: var(--text-secondary);
   font-size: 0.9rem;
   line-height: 1.6;
 }
@@ -639,7 +788,7 @@ button.danger:hover {
   align-items: center;
   margin-bottom: 1rem;
   padding-bottom: 1rem;
-  border-bottom: 2px solid #333;
+  border-bottom: 1px solid var(--border-default);
 }
 
 .paper-meta {
@@ -649,18 +798,18 @@ button.danger:hover {
 }
 
 .word-count {
-  color: #4CAF50;
+  color: var(--accent-green);
   font-weight: 700;
   font-size: 1.1rem;
 }
 
 .version {
-  color: #999;
+  color: var(--text-secondary);
   font-size: 0.9rem;
-  background: #1a1a1a;
+  background: var(--surface-2);
   padding: 0.25rem 0.75rem;
-  border-radius: 4px;
-  border: 1px solid #333;
+  border-radius: var(--radius-sm);
+  border: 1px solid var(--border-subtle);
 }
 
 .paper-controls {
@@ -668,17 +817,17 @@ button.danger:hover {
   justify-content: space-between;
   align-items: center;
   margin-bottom: 1rem;
-  padding: 1rem;
-  background: #1a1a1a;
-  border-radius: 6px;
-  border: 1px solid #333;
+  padding: 0.85rem 1rem;
+  background: var(--surface-2);
+  border-radius: var(--radius-md);
+  border: 1px solid var(--border-subtle);
 }
 
 .checkbox-label {
   display: flex;
   align-items: center;
   gap: 0.5rem;
-  color: #ccc;
+  color: var(--text-secondary);
   cursor: pointer;
   user-select: none;
 }
@@ -689,52 +838,57 @@ button.danger:hover {
 }
 
 .btn {
-  padding: 0.75rem 1.5rem;
+  padding: 0.65rem 1.35rem;
   border: none;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   cursor: pointer;
   font-size: 0.95rem;
   font-weight: 600;
-  transition: background 0.2s;
+  transition: all var(--transition-fast);
 }
 
 .btn-primary {
-  background: #4CAF50;
+  background: var(--accent-green);
   color: white;
 }
 
 .btn-primary:hover {
-  background: #45a049;
+  filter: brightness(1.1);
+  transform: translateY(-1px);
 }
 
 .btn-secondary {
-  background: #666;
+  background: var(--surface-4);
   color: white;
 }
 
 .btn-secondary:hover {
-  background: #777;
+  background: var(--surface-3);
+  filter: brightness(1.2);
 }
 
 .btn:disabled {
-  background: #444;
+  background: var(--surface-3);
   cursor: not-allowed;
   opacity: 0.5;
+  transform: none;
+  filter: none;
 }
 
 .paper-container {
   flex: 1;
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 2rem;
   overflow-y: auto;
   min-height: 400px;
   max-height: calc(100vh - 400px);
+  box-shadow: var(--shadow-sm);
 }
 
 .paper-content {
-  color: #e0e0e0;
+  color: var(--text-primary);
   line-height: 1.8;
 }
 
@@ -751,7 +905,7 @@ button.danger:hover {
   align-items: center;
   justify-content: center;
   min-height: 300px;
-  color: #666;
+  color: var(--text-muted);
   text-align: center;
 }
 
@@ -764,16 +918,17 @@ button.danger:hover {
 .paper-footer {
   margin-top: 1rem;
   padding-top: 1rem;
-  border-top: 1px solid #333;
+  border-top: 1px solid var(--border-subtle);
 }
 
 /* Error Display Styles */
 .error-box {
-  background: #2a1515;
-  border: 2px solid #ff4444;
-  border-radius: 6px;
+  background: rgba(244, 67, 54, 0.06);
+  border: 1px solid rgba(244, 67, 54, 0.35);
+  border-radius: var(--radius-md);
   padding: 1.5rem;
   margin: 1.5rem 0;
+  box-shadow: 0 4px 16px rgba(244, 67, 54, 0.1);
 }
 
 .error-header {
@@ -820,9 +975,9 @@ button.danger:hover {
 }
 
 .error-suggestion {
-  background: #1a2a1a;
-  border: 1px solid #4CAF50;
-  border-radius: 4px;
+  background: rgba(76, 175, 80, 0.06);
+  border: 1px solid rgba(76, 175, 80, 0.25);
+  border-radius: var(--radius-sm);
   padding: 1rem;
   margin-top: 1rem;
 }
@@ -835,26 +990,26 @@ button.danger:hover {
 
 /* Model Test Results Styles */
 .model-test-results {
-  background: #1a1a1a;
-  border: 2px solid #666;
-  border-radius: 6px;
+  background: var(--surface-2);
+  border: 1px solid var(--border-default);
+  border-radius: var(--radius-md);
   padding: 1.5rem;
   margin: 1.5rem 0;
 }
 
 .model-test-results.all-passed {
-  border-color: #4CAF50;
-  background: #1a2a1a;
+  border-color: rgba(76, 175, 80, 0.4);
+  background: rgba(76, 175, 80, 0.05);
 }
 
 .model-test-results.some-failed {
-  border-color: #ff9800;
-  background: #2a2015;
+  border-color: rgba(255, 152, 0, 0.4);
+  background: rgba(255, 152, 0, 0.05);
 }
 
 .model-test-results h3 {
   margin: 0 0 1rem 0;
-  color: #fff;
+  color: var(--text-primary);
 }
 
 .test-results-grid {
@@ -865,19 +1020,19 @@ button.danger:hover {
 }
 
 .test-result-item {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 4px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-sm);
   padding: 1rem;
 }
 
 .test-result-item.passed {
-  border-color: #4CAF50;
+  border-color: rgba(76, 175, 80, 0.4);
 }
 
 .test-result-item.failed {
-  border-color: #ff4444;
-  background: #1a0a0a;
+  border-color: rgba(244, 67, 54, 0.4);
+  background: rgba(244, 67, 54, 0.04);
 }
 
 .test-result-header {
@@ -907,17 +1062,17 @@ button.danger:hover {
 .test-result-error {
   color: #ff8888;
   font-size: 0.85rem;
-  background: #1a0a0a;
+  background: rgba(244, 67, 54, 0.06);
   padding: 0.5rem;
-  border-radius: 3px;
+  border-radius: var(--radius-sm);
   margin-top: 0.5rem;
   line-height: 1.4;
 }
 
 .test-suggestion {
-  background: #2a2015;
-  border: 1px solid #ff9800;
-  border-radius: 4px;
+  background: rgba(255, 152, 0, 0.06);
+  border: 1px solid rgba(255, 152, 0, 0.25);
+  border-radius: var(--radius-sm);
   padding: 0.75rem;
   color: #ffcc80;
   font-size: 0.9rem;
@@ -940,27 +1095,27 @@ button.danger:hover {
 }
 
 .status-badge.running {
-  background: #4CAF50;
-  color: white;
+  background: rgba(76, 175, 80, 0.15);
+  color: var(--accent-green);
   padding: 0.5rem 1rem;
-  border-radius: 4px;
+  border-radius: var(--radius-pill);
   font-weight: 600;
 }
 
 .status-badge.stopped {
-  background: #666;
-  color: white;
+  background: var(--surface-4);
+  color: var(--text-secondary);
   padding: 0.5rem 1rem;
-  border-radius: 4px;
+  border-radius: var(--radius-pill);
   font-weight: 600;
 }
 
 .mode-badge {
-  background: #1a1a1a;
-  border: 1px solid #4CAF50;
-  color: #4CAF50;
+  background: var(--surface-2);
+  border: 1px solid rgba(76, 175, 80, 0.3);
+  color: var(--accent-green);
   padding: 0.5rem 1rem;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   font-size: 0.9rem;
 }
 
@@ -983,16 +1138,16 @@ button.danger:hover {
 }
 
 .btn-danger {
-  background: #f44336;
+  background: var(--accent-red);
   color: white;
 }
 
 .btn-danger:hover {
-  background: #da190b;
+  filter: brightness(1.15);
 }
 
 .btn-danger:disabled {
-  background: #555;
+  background: var(--surface-4);
   cursor: not-allowed;
   opacity: 0.5;
 }
@@ -1001,20 +1156,20 @@ button.danger:hover {
 .empty-state {
   text-align: center;
   padding: 4rem 2rem;
-  background: #1a1a1a;
-  border-radius: 6px;
-  border: 1px solid #333;
+  background: var(--surface-2);
+  border-radius: var(--radius-lg);
+  border: 1px solid var(--border-subtle);
   margin: 2rem 0;
 }
 
 .empty-state h3 {
-  color: #fff;
+  color: var(--text-primary);
   font-size: 1.5rem;
   margin-bottom: 1rem;
 }
 
 .empty-state p {
-  color: #999;
+  color: var(--text-secondary);
   font-size: 1rem;
   line-height: 1.6;
   max-width: 600px;
@@ -1022,25 +1177,25 @@ button.danger:hover {
 }
 
 .empty-state strong {
-  color: #4CAF50;
+  color: var(--accent-green);
 }
 
 /* Compiler Alerts */
 .alert {
   margin: 1rem 0;
   padding: 1.5rem;
-  border-radius: 8px;
+  border-radius: var(--radius-md);
   border-left: 4px solid;
 }
 
 .alert-error {
-  background: rgba(244, 67, 54, 0.1);
-  border-left-color: #f44336;
+  background: rgba(244, 67, 54, 0.06);
+  border-left-color: var(--accent-red);
 }
 
 .alert-warning {
-  background: rgba(255, 152, 0, 0.1);
-  border-left-color: #ff9800;
+  background: rgba(255, 152, 0, 0.06);
+  border-left-color: var(--accent-orange);
 }
 
 .alert h3 {
@@ -1072,64 +1227,64 @@ button.danger:hover {
 }
 
 .traceback {
-  background: #1a1a1a;
+  background: var(--surface-2);
   padding: 1rem;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   overflow-x: auto;
   font-size: 0.85rem;
   margin-top: 0.5rem;
-  border: 1px solid #333;
+  border: 1px solid var(--border-subtle);
 }
 
 .dismiss-btn {
   margin-top: 1rem;
   padding: 0.5rem 1rem;
-  background: #333;
-  border: 1px solid #555;
-  color: #e0e0e0;
+  background: var(--surface-3);
+  border: 1px solid var(--border-default);
+  color: var(--text-primary);
   cursor: pointer;
-  border-radius: 4px;
-  transition: all 0.2s;
+  border-radius: var(--radius-sm);
+  transition: all var(--transition-fast);
 }
 
 .dismiss-btn:hover {
-  background: #444;
-  border-color: #666;
+  background: var(--surface-4);
+  border-color: var(--border-strong);
 }
 
-.status-badge {
+.compiler-status-badge {
   display: inline-block;
   padding: 0.25rem 0.75rem;
-  border-radius: 12px;
+  border-radius: var(--radius-pill);
   font-size: 0.75rem;
   font-weight: 600;
   margin-left: 1rem;
 }
 
 .status-error {
-  background: rgba(244, 67, 54, 0.2);
-  color: #f44336;
-  border: 1px solid #f44336;
+  background: rgba(244, 67, 54, 0.12);
+  color: var(--accent-red);
+  border: 1px solid rgba(244, 67, 54, 0.3);
 }
 
 .status-warning {
-  background: rgba(255, 152, 0, 0.2);
-  color: #ff9800;
-  border: 1px solid #ff9800;
+  background: rgba(255, 152, 0, 0.12);
+  color: var(--accent-orange);
+  border: 1px solid rgba(255, 152, 0, 0.3);
 }
 
 /* Tab Group Separator */
 .tab-separator {
-  width: 2px;
-  height: 30px;
-  background: #444;
+  width: 1px;
+  height: 28px;
+  background: var(--border-default);
   margin: 0 0.5rem;
   align-self: center;
 }
 
 /* Large Tab Group Spacer - ~3/4 inch separation for isolated groups */
 .tab-group-spacer-large {
-  width: 84px; /* ~3/4 inch at 72dpi */
+  width: 84px;
   height: 100%;
 }
 
@@ -1150,8 +1305,8 @@ button.danger:hover {
 }
 
 .tab-boost.active {
-  color: #ffd700;
-  border-bottom-color: #ffd700;
+  color: var(--gold); /* brand highlight token defined in :root */
+  border-bottom-color: var(--gold);
 }
 
 /* Tier 3 Final Answer Tab Special Styling */
@@ -1173,111 +1328,6 @@ button.danger:hover {
   50% { opacity: 0.7; }
 }
 
-/* Expandable Section Styles */
-.expandable-section {
-  background: #1a1a1a;
-  border-bottom: 2px solid #333;
-}
-
-.expandable-trigger {
-  width: 100%;
-  background: #2a2a2a;
-  border: none;
-  border-top: 1px solid #333;
-  padding: 0.75rem 2rem;
-  display: flex;
-  align-items: center;
-  gap: 0.75rem;
-  cursor: pointer;
-  transition: all 0.2s ease;
-  color: #999;
-  font-size: 0.95rem;
-}
-
-.expandable-trigger:hover {
-  background: #333;
-  color: #fff;
-}
-
-.expandable-trigger.expanded {
-  background: #1a1a1a;
-  border-bottom: 1px solid #444;
-}
-
-.expand-icon {
-  font-size: 0.8rem;
-  transition: transform 0.2s ease;
-  color: #4CAF50;
-}
-
-.section-title {
-  font-weight: 700;
-  text-transform: uppercase;
-  letter-spacing: 0.5px;
-  color: #2196F3;
-}
-
-.section-subtitle {
-  font-size: 0.85rem;
-  color: #666;
-  font-style: italic;
-}
-
-.expandable-content {
-  background: #0f0f0f;
-  padding: 1rem 2rem;
-  display: flex;
-  gap: 2rem;
-  border-bottom: 1px solid #333;
-}
-
-.subsection {
-  flex: 1;
-}
-
-.subsection-header {
-  color: #999;
-  font-size: 0.8rem;
-  font-weight: 600;
-  text-transform: uppercase;
-  letter-spacing: 1px;
-  margin-bottom: 0.75rem;
-  padding-bottom: 0.5rem;
-  border-bottom: 1px solid #333;
-}
-
-.subsection-tabs {
-  display: flex;
-  flex-direction: column;
-  gap: 0.5rem;
-}
-
-.subtab {
-  padding: 0.5rem 1rem;
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-left: 3px solid transparent;
-  color: #999;
-  cursor: pointer;
-  font-size: 0.9rem;
-  text-align: left;
-  transition: all 0.2s;
-  border-radius: 4px;
-}
-
-.subtab:hover {
-  background: #2a2a2a;
-  color: #fff;
-  border-left-color: #666;
-}
-
-.subtab.active {
-  background: #2a2a2a;
-  color: #2196F3;
-  border-left-color: #2196F3;
-  font-weight: 600;
-}
-
 /* Autonomous Research Styles */
 .autonomous-research {
   padding: 1rem;
@@ -1289,15 +1339,16 @@ button.danger:hover {
   align-items: center;
   margin-bottom: 2rem;
   padding-bottom: 1rem;
-  border-bottom: 2px solid #333;
+  border-bottom: 1px solid var(--border-default);
 }
 
 .autonomous-status-panel {
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 8px;
+  background: var(--surface-2);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1.5rem;
   margin-bottom: 1.5rem;
+  box-shadow: var(--shadow-sm);
 }
 
 .autonomous-tier-indicator {
@@ -1305,28 +1356,28 @@ button.danger:hover {
   align-items: center;
   gap: 1rem;
   padding: 0.75rem 1.25rem;
-  background: #0a0a0a;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border-radius: var(--radius-sm);
   margin-bottom: 1rem;
 }
 
 .tier-label {
-  color: #999;
+  color: var(--text-secondary);
   font-size: 0.9rem;
 }
 
 .tier-value {
-  color: #9C27B0;
+  color: var(--accent-purple);
   font-weight: 700;
   font-size: 1.1rem;
 }
 
 .tier-1-active {
-  color: #FF9800;
+  color: var(--accent-orange);
 }
 
 .tier-2-active {
-  color: #4CAF50;
+  color: var(--accent-green);
 }
 
 .autonomous-progress {
@@ -1337,28 +1388,31 @@ button.danger:hover {
 }
 
 .progress-card {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1rem;
+  box-shadow: var(--shadow-sm);
 }
 
 .progress-card-label {
-  color: #999;
-  font-size: 0.85rem;
-  margin-bottom: 0.25rem;
+  color: var(--text-muted);
+  font-size: 0.8rem;
+  margin-bottom: 0.35rem;
+  text-transform: uppercase;
+  letter-spacing: 0.5px;
 }
 
 .progress-card-value {
-  color: #fff;
+  color: var(--text-primary);
   font-size: 1.4rem;
   font-weight: 700;
 }
 
 .autonomous-activity {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1rem;
   max-height: 400px;
   overflow-y: auto;
@@ -1367,8 +1421,9 @@ button.danger:hover {
 .activity-item {
   display: flex;
   gap: 0.75rem;
-  padding: 0.75rem;
-  border-bottom: 1px solid #1a1a1a;
+  padding: 0.6rem 0.5rem;
+  border-bottom: 1px solid var(--border-subtle);
+  border-radius: var(--radius-sm);
 }
 
 .activity-item:last-child {
@@ -1382,28 +1437,28 @@ button.danger:hover {
   display: flex;
   align-items: center;
   justify-content: center;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   font-size: 0.85rem;
 }
 
 .activity-icon.accept {
-  background: rgba(76, 175, 80, 0.2);
-  color: #4CAF50;
+  background: rgba(76, 175, 80, 0.12);
+  color: var(--accent-green);
 }
 
 .activity-icon.reject {
-  background: rgba(244, 67, 54, 0.2);
-  color: #f44336;
+  background: rgba(244, 67, 54, 0.12);
+  color: var(--accent-red);
 }
 
 .activity-icon.topic {
-  background: rgba(156, 39, 176, 0.2);
-  color: #9C27B0;
+  background: rgba(156, 39, 176, 0.12);
+  color: var(--accent-purple);
 }
 
 .activity-icon.paper {
-  background: rgba(33, 150, 243, 0.2);
-  color: #2196F3;
+  background: rgba(33, 150, 243, 0.12);
+  color: var(--accent-blue);
 }
 
 .activity-content {
@@ -1411,13 +1466,13 @@ button.danger:hover {
 }
 
 .activity-title {
-  color: #e0e0e0;
+  color: var(--text-primary);
   font-size: 0.9rem;
   margin-bottom: 0.25rem;
 }
 
 .activity-time {
-  color: #666;
+  color: var(--text-muted);
   font-size: 0.75rem;
 }
 
@@ -1427,16 +1482,18 @@ button.danger:hover {
 }
 
 .brainstorm-card {
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 8px;
+  background: var(--surface-2);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1.25rem;
   margin-bottom: 1rem;
-  transition: border-color 0.2s;
+  transition: border-color var(--transition-fast), box-shadow var(--transition-fast);
+  box-shadow: var(--shadow-sm);
 }
 
 .brainstorm-card:hover {
-  border-color: #444;
+  border-color: var(--border-strong);
+  box-shadow: var(--shadow-md);
 }
 
 .brainstorm-card-header {
@@ -1455,21 +1512,21 @@ button.danger:hover {
 .brainstorm-status {
   display: inline-block;
   padding: 0.25rem 0.75rem;
-  border-radius: 12px;
+  border-radius: var(--radius-pill);
   font-size: 0.75rem;
   font-weight: 600;
 }
 
 .brainstorm-status.in-progress {
-  background: rgba(255, 152, 0, 0.2);
-  color: #FF9800;
-  border: 1px solid #FF9800;
+  background: rgba(255, 152, 0, 0.12);
+  color: var(--accent-orange);
+  border: 1px solid rgba(255, 152, 0, 0.3);
 }
 
 .brainstorm-status.complete {
-  background: rgba(76, 175, 80, 0.2);
-  color: #4CAF50;
-  border: 1px solid #4CAF50;
+  background: rgba(76, 175, 80, 0.12);
+  color: var(--accent-green);
+  border: 1px solid rgba(76, 175, 80, 0.3);
 }
 
 .brainstorm-prompt {
@@ -1521,20 +1578,22 @@ button.danger:hover {
 }
 
 .paper-card {
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 8px;
+  background: var(--surface-2);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1.5rem;
-  transition: border-color 0.2s, transform 0.2s;
+  transition: border-color var(--transition-fast), transform var(--transition-fast), box-shadow var(--transition-fast);
+  box-shadow: var(--shadow-sm);
 }
 
 .paper-card:hover {
-  border-color: #2196F3;
-  transform: translateY(-2px);
+  border-color: rgba(33, 150, 243, 0.35);
+  transform: translateY(-3px);
+  box-shadow: var(--shadow-md);
 }
 
 .paper-card-title {
-  color: #fff;
+  color: var(--text-primary);
   font-size: 1.1rem;
   font-weight: 600;
   margin-bottom: 0.75rem;
@@ -1542,7 +1601,7 @@ button.danger:hover {
 }
 
 .paper-card-abstract {
-  color: #ccc;
+  color: var(--text-secondary);
   font-size: 0.9rem;
   line-height: 1.5;
   margin-bottom: 1rem;
@@ -1557,17 +1616,17 @@ button.danger:hover {
   justify-content: space-between;
   align-items: center;
   padding-top: 0.75rem;
-  border-top: 1px solid #333;
+  border-top: 1px solid var(--border-subtle);
 }
 
 .paper-word-count {
-  color: #4CAF50;
+  color: var(--accent-green);
   font-size: 0.85rem;
   font-weight: 600;
 }
 
 .paper-source {
-  color: #999;
+  color: var(--text-muted);
   font-size: 0.8rem;
 }
 
@@ -1580,29 +1639,29 @@ button.danger:hover {
 .paper-btn {
   padding: 0.5rem 1rem;
   font-size: 0.85rem;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   border: none;
   cursor: pointer;
-  transition: background 0.2s;
+  transition: all var(--transition-fast);
 }
 
 .paper-btn-view {
-  background: #2196F3;
+  background: var(--accent-blue);
   color: white;
 }
 
 .paper-btn-view:hover {
-  background: #1976D2;
+  filter: brightness(1.15);
 }
 
 .paper-btn-download {
-  background: #333;
-  color: #e0e0e0;
-  border: 1px solid #444;
+  background: var(--surface-3);
+  color: var(--text-primary);
+  border: 1px solid var(--border-default);
 }
 
 .paper-btn-download:hover {
-  background: #444;
+  background: var(--surface-4);
 }
 
 /* Tier 3 Reset Button */
@@ -1634,20 +1693,21 @@ button.danger:hover {
 }
 
 .settings-section {
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 8px;
+  background: var(--surface-2);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1.5rem;
   margin-bottom: 1.5rem;
+  box-shadow: var(--shadow-sm);
 }
 
 .settings-section-title {
-  color: #fff;
+  color: var(--text-primary);
   font-size: 1.1rem;
   font-weight: 600;
   margin-bottom: 1rem;
   padding-bottom: 0.5rem;
-  border-bottom: 1px solid #333;
+  border-bottom: 1px solid var(--border-subtle);
 }
 
 .model-config-grid {
@@ -1657,14 +1717,14 @@ button.danger:hover {
 }
 
 .model-config-card {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-sm);
   padding: 1rem;
 }
 
 .model-config-label {
-  color: #9C27B0;
+  color: var(--accent-purple);
   font-size: 0.85rem;
   font-weight: 600;
   margin-bottom: 0.75rem;
@@ -1683,18 +1743,18 @@ button.danger:hover {
 }
 
 .log-chart-container {
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 8px;
+  background: var(--surface-2);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1.5rem;
   margin-bottom: 1.5rem;
   min-height: 300px;
 }
 
 .event-log-container {
-  background: #0a0a0a;
-  border: 1px solid #333;
-  border-radius: 8px;
+  background: var(--surface-1);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-md);
   padding: 1rem;
   max-height: 600px;
   overflow-y: auto;
@@ -1704,7 +1764,7 @@ button.danger:hover {
   display: flex;
   gap: 1rem;
   padding: 0.75rem;
-  border-bottom: 1px solid #1a1a1a;
+  border-bottom: 1px solid var(--border-subtle);
   font-family: 'Courier New', monospace;
   font-size: 0.85rem;
 }
@@ -1714,7 +1774,7 @@ button.danger:hover {
 }
 
 .log-timestamp {
-  color: #666;
+  color: var(--text-muted);
   flex-shrink: 0;
 }
 
@@ -1725,31 +1785,31 @@ button.danger:hover {
 }
 
 .log-level.info {
-  color: #2196F3;
+  color: var(--accent-blue);
 }
 
 .log-level.success {
-  color: #4CAF50;
+  color: var(--accent-green);
 }
 
 .log-level.warning {
-  color: #FF9800;
+  color: var(--accent-orange);
 }
 
 .log-level.error {
-  color: #f44336;
+  color: var(--accent-red);
 }
 
 .log-message {
-  color: #e0e0e0;
+  color: var(--text-primary);
   flex: 1;
 }
 
 /* Per-submitter config styles (used in aggregator settings) */
 .submitter-config-section {
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 6px;
+  background: var(--surface-2);
+  border: 1px solid var(--border-subtle);
+  border-radius: var(--radius-sm);
   padding: 1rem;
   margin-bottom: 1rem;
 }
@@ -1760,43 +1820,43 @@ button.danger:hover {
 
 .submitter-config-section h5 {
   margin: 0 0 0.75rem 0;
-  color: #fff;
+  color: var(--text-primary);
   font-size: 0.95rem;
   font-weight: 600;
 }
 
 .settings-info {
-  color: #999;
+  color: var(--text-secondary);
   font-size: 0.85rem;
   margin-bottom: 1rem;
   line-height: 1.4;
 }
 
 .settings-notice {
-  background: rgba(255, 152, 0, 0.1);
-  border: 1px solid rgba(255, 152, 0, 0.3);
-  border-radius: 6px;
+  background: rgba(255, 152, 0, 0.08);
+  border: 1px solid rgba(255, 152, 0, 0.25);
+  border-radius: var(--radius-sm);
   padding: 0.75rem 1rem;
-  color: #ff9800;
+  color: var(--accent-orange);
   font-size: 0.9rem;
   text-align: center;
   margin-top: 1rem;
 }
 
 .copy-btn {
-  background: #1a1a1a;
-  color: #4CAF50;
-  border: 1px solid #4CAF50;
+  background: var(--surface-2);
+  color: var(--accent-green);
+  border: 1px solid rgba(76, 175, 80, 0.3);
   padding: 0.35rem 0.75rem;
-  border-radius: 4px;
+  border-radius: var(--radius-sm);
   cursor: pointer;
   font-size: 0.8rem;
-  transition: all 0.2s ease;
+  transition: all var(--transition-fast);
   margin-left: auto;
 }
 
 .copy-btn:hover:not(:disabled) {
-  background: rgba(76, 175, 80, 0.2);
+  background: rgba(76, 175, 80, 0.12);
 }
 
 .copy-btn:disabled {
@@ -1888,14 +1948,14 @@ button.danger:hover {
   top: 50%;
   left: 50%;
   transform: translate(-50%, -50%);
-  background: #1a1a1a;
-  border: 2px solid #f1c40f;
-  border-radius: 12px;
-  padding: 2rem;
-  max-width: 600px;
+  background: var(--surface-2);
+  border: 1px solid var(--gold-dim);
+  border-radius: var(--radius-lg);
+  padding: 2.5rem;
+  max-width: 620px;
   width: 90%;
   z-index: 9999;
-  box-shadow: 0 8px 32px rgba(241, 196, 15, 0.3);
+  box-shadow: 0 16px 48px rgba(0, 0, 0, 0.6), 0 0 40px var(--gold-glow);
 }
 
 .disclaimer-content {
@@ -1905,34 +1965,33 @@ button.danger:hover {
 .disclaimer-content h2 {
   margin-top: 0;
   margin-bottom: 1.5rem;
-  color: #f1c40f;
+  color: var(--gold);
   font-size: 1.5rem;
 }
 
 .disclaimer-content p {
-  font-size: 1.1rem;
+  font-size: 1.05rem;
   line-height: 1.6;
   margin-bottom: 1.5rem;
-  color: #e0e0e0;
+  color: var(--text-primary);
 }
 
 .disclaimer-acknowledge-btn {
-  background: #f1c40f;
+  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
   color: #000;
   border: none;
   padding: 0.75rem 2rem;
-  border-radius: 6px;
+  border-radius: var(--radius-sm);
   font-size: 1rem;
   font-weight: 700;
   cursor: pointer;
-  transition: all 0.2s ease;
-  box-shadow: 0 4px 12px rgba(241, 196, 15, 0.3);
+  transition: all var(--transition-fast);
+  box-shadow: var(--shadow-gold);
 }
 
 .disclaimer-acknowledge-btn:hover {
-  background: #f39c12;
   transform: translateY(-2px);
-  box-shadow: 0 6px 16px rgba(241, 196, 15, 0.4);
+  box-shadow: 0 6px 20px rgba(30, 255, 28, 0.35);
 }
 
 .disclaimer-acknowledge-btn:active {
@@ -1943,8 +2002,8 @@ button.danger:hover {
    Footer Section
    ============================================ */
 .app-footer {
-  background: linear-gradient(135deg, #1a1a1a 0%, #0f0f0f 100%);
-  border-top: 1px solid #333;
+  background: linear-gradient(160deg, var(--surface-1) 0%, var(--surface-0) 100%);
+  border-top: 1px solid var(--border-subtle);
   padding: 1rem 2rem;
   margin-top: auto;
   position: relative;
@@ -1960,9 +2019,9 @@ button.danger:hover {
   background: linear-gradient(
     90deg,
     transparent 0%,
-    rgba(255, 215, 0, 0.3) 20%,
-    rgba(255, 215, 0, 0.5) 50%,
-    rgba(255, 215, 0, 0.3) 80%,
+    rgba(30, 255, 28, 0.25) 20%,
+    rgba(30, 255, 28, 0.4) 50%,
+    rgba(30, 255, 28, 0.25) 80%,
     transparent 100%
   );
 }
@@ -1989,17 +2048,17 @@ button.danger:hover {
 }
 
 .footer-license {
-  color: #888;
+  color: var(--text-muted);
   font-size: 0.85rem;
 }
 
 .footer-divider {
-  color: #444;
+  color: var(--border-strong);
   margin: 0 0.25rem;
 }
 
 .footer-copyright {
-  color: #666;
+  color: var(--text-muted);
 }
 
 .footer-links {
@@ -2008,34 +2067,59 @@ button.danger:hover {
 }
 
 .footer-link {
-  color: #aaa;
+  color: var(--text-secondary);
   text-decoration: none;
   font-size: 0.9rem;
   display: flex;
   align-items: center;
   gap: 0.4rem;
   padding: 0.4rem 0.75rem;
-  border-radius: 4px;
-  transition: all 0.2s ease;
+  border-radius: var(--radius-sm);
+  transition: all var(--transition-fast);
   border: 1px solid transparent;
 }
 
 .footer-link:hover {
-  color: #fff;
-  background: rgba(255, 255, 255, 0.05);
-  border-color: #444;
+  color: var(--text-primary);
+  background: rgba(255, 255, 255, 0.04);
+  border-color: var(--border-subtle);
 }
 
 .footer-link-news {
-  color: #ccc;
-  border: 1px solid #444;
+  color: var(--text-secondary);
+  border: 1px solid var(--border-subtle);
   background: rgba(255, 255, 255, 0.02);
 }
 
 .footer-link-news:hover {
-  color: #ffd700;
-  border-color: rgba(255, 215, 0, 0.4);
-  background: rgba(255, 215, 0, 0.08);
+  color: var(--gold);
+  border-color: rgba(30, 255, 28, 0.3);
+  background: rgba(30, 255, 28, 0.06);
+}
+
+.footer-link-github {
+  color: var(--text-secondary);
+  border: 1px solid var(--border-subtle);
+  background: rgba(255, 255, 255, 0.02);
+}
+
+.footer-link-github:hover {
+  color: #7dff6f;
+  border-color: rgba(30, 255, 28, 0.4);
+  background: rgba(30, 255, 28, 0.06);
+}
+
+.footer-link-purchase {
+  color: #7dff6f;
+  font-weight: 700;
+  border: 1px solid rgba(30, 255, 28, 0.45);
+  background: rgba(30, 255, 28, 0.03);
+}
+
+.footer-link-purchase:hover {
+  color: #a8ff9a;
+  background: rgba(30, 255, 28, 0.06);
+  border-color: rgba(30, 255, 28, 0.72);
 }
 
 
@@ -2063,3 +2147,38 @@ button.danger:hover {
     justify-content: center;
   }
 }
+
+/* ============================================
+   Global Scrollbar Styling
+   ============================================ */
+::-webkit-scrollbar {
+  width: 8px;
+  height: 8px;
+}
+
+::-webkit-scrollbar-track {
+  background: var(--surface-0);
+}
+
+::-webkit-scrollbar-thumb {
+  background: var(--surface-4);
+  border-radius: 4px;
+}
+
+::-webkit-scrollbar-thumb:hover {
+  background: var(--border-strong);
+}
+
+/* Firefox scrollbar */
+* {
+  scrollbar-width: thin;
+  scrollbar-color: var(--surface-4) var(--surface-0);
+}
+
+/* ============================================
+   Global Selection Styling
+   ============================================ */
+::selection {
+  background: rgba(30, 255, 28, 0.2);
+  color: var(--text-primary);
+}
diff --git a/frontend/src/services/api.js b/frontend/src/services/api.js
index 80f2f95..ce8573d 100644
--- a/frontend/src/services/api.js
+++ b/frontend/src/services/api.js
@@ -20,7 +20,12 @@ export const api = {
       headers: { 'Content-Type': 'application/json' },
       body: JSON.stringify(config),
     });
-    if (!response.ok) throw new Error('Failed to start aggregator');
+    if (!response.ok) {
+      const errorData = await response.json();
+      const error = new Error('Failed to start aggregator');
+      error.details = errorData.detail;
+      throw error;
+    }
     return response.json();
   },
 
@@ -363,6 +368,22 @@ export const autonomousAPI = {
     return response.json();
   },
 
+  // Get all Stage 2 history papers across legacy + sessions
+  async getPaperHistory() {
+    const response = await fetch(`${API_BASE}/auto-research/paper-history`);
+    if (!response.ok) throw new Error('Failed to get Stage 2 paper history');
+    return response.json();
+  },
+
+  // Get one Stage 2 history paper by session-aware identifier
+  async getHistoryPaper(sessionId, paperId) {
+    const response = await fetch(
+      `${API_BASE}/auto-research/paper-history/${encodeURIComponent(sessionId)}/${encodeURIComponent(paperId)}`
+    );
+    if (!response.ok) throw new Error(`Failed to get history paper ${sessionId}/${paperId}`);
+    return response.json();
+  },
+
   // Get statistics
   async getStats() {
     const response = await fetch(`${API_BASE}/auto-research/stats`);
@@ -467,6 +488,21 @@ export const autonomousAPI = {
     return response.json();
   },
 
+  // Delete a Stage 2 history paper by session-aware identifier; throws Error (server `detail` when present) on a non-OK response
+  async deleteHistoryPaper(sessionId, paperId) {
+    const response = await fetch(
+      `${API_BASE}/auto-research/paper-history/${encodeURIComponent(sessionId)}/${encodeURIComponent(paperId)}?confirm=true`,
+      {
+        method: 'DELETE',
+      }
+    );
+    if (!response.ok) {
+      const errorData = (await response.json().catch(() => null)) || {}; // error body may be empty or not JSON
+      throw new Error(errorData.detail || `Failed to delete history paper ${sessionId}/${paperId}`);
+    }
+    return response.json();
+  },
+
   // ============================================================
   // Tier 3 - Final Answer API
   // ============================================================
@@ -526,8 +562,10 @@ export const autonomousAPI = {
   // ============================================================
 
   // Get API logs
-  async getApiLogs(limit = 100) {
-    const response = await fetch(`${API_BASE}/auto-research/api-logs?limit=${limit}`);
+  async getApiLogs(limit = 100, options = {}) {
+    const response = await fetch(`${API_BASE}/auto-research/api-logs?limit=${limit}`, {
+      signal: options.signal,
+    });
     if (!response.ok) throw new Error('Failed to get API logs');
     return response.json();
   },
@@ -598,6 +636,45 @@ export const autonomousAPI = {
     return response.json();
   },
 
+  // Generate a critique for a Stage 2 history paper; throws Error (server `detail` when present) on a non-OK response
+  async generateHistoryPaperCritique(sessionId, paperId, customPrompt = null, validatorConfig = null) {
+    const body = {};
+    if (customPrompt) body.custom_prompt = customPrompt; // left out of the payload when null/empty
+
+    if (validatorConfig && validatorConfig.validator_model) { // validator fields are sent only when a model is set
+      body.validator_model = validatorConfig.validator_model;
+      body.validator_context_window = validatorConfig.validator_context_window;
+      body.validator_max_tokens = validatorConfig.validator_max_tokens;
+      body.validator_provider = validatorConfig.validator_provider;
+      body.validator_openrouter_provider = validatorConfig.validator_openrouter_provider;
+    }
+
+    const response = await fetch(
+      `${API_BASE}/auto-research/paper-history/${encodeURIComponent(sessionId)}/${encodeURIComponent(paperId)}/critique`,
+      {
+        method: 'POST',
+        headers: {
+          'Content-Type': 'application/json',
+        },
+        body: JSON.stringify(body),
+      }
+    );
+    if (!response.ok) {
+      const errorData = (await response.json().catch(() => null)) || {}; // error body may be empty or not JSON
+      throw new Error(errorData.detail || 'Failed to generate history paper critique');
+    }
+    return response.json();
+  },
+
+  // Get all critiques for a Stage 2 history paper
+  async getHistoryPaperCritiques(sessionId, paperId) {
+    const response = await fetch(
+      `${API_BASE}/auto-research/paper-history/${encodeURIComponent(sessionId)}/${encodeURIComponent(paperId)}/critiques`
+    );
+    if (!response.ok) throw new Error('Failed to get history paper critiques');
+    return response.json();
+  },
+
   // Generate a critique for a final answer
   // validatorConfig is optional - if not provided, will try to use coordinator's stored config
   async generateFinalAnswerCritique(answerId, customPrompt = null, validatorConfig = null) {
@@ -816,6 +893,13 @@ export const workflowAPI = {
     if (!response.ok) throw new Error('Failed to get workflow history');
     return response.json();
   },
+
+  // Get cumulative token usage stats and elapsed time
+  async getTokenStats() {
+    const response = await fetch(`${API_BASE}/token-stats`);
+    if (!response.ok) throw new Error('Failed to get token stats');
+    return response.json();
+  },
 };
 
 // OpenRouter API (for per-role model selection)
@@ -923,6 +1007,17 @@ export const openRouterAPI = {
     }
     return response.json();
   },
+
+  async resetCreditExhaustion() { // POSTs to /openrouter/reset-exhaustion and returns the parsed JSON response
+    const response = await fetch(`${API_BASE}/openrouter/reset-exhaustion`, {
+      method: 'POST',
+    });
+    if (!response.ok) {
+      const errorData = (await response.json().catch(() => null)) || {}; // error body may be empty or not JSON
+      throw new Error(errorData.detail || 'Failed to reset credit exhaustion');
+    }
+    return response.json();
+  },
 };
 
 // Add helper methods to main api object
diff --git a/frontend/src/utils/autonomousProfiles.js b/frontend/src/utils/autonomousProfiles.js
new file mode 100644
index 0000000..d626853
--- /dev/null
+++ b/frontend/src/utils/autonomousProfiles.js
@@ -0,0 +1,424 @@
+import { loadModelCache, getModelApiId } from './modelCache';
+
+export const AUTONOMOUS_SETTINGS_STORAGE_KEY = 'autonomous_research_settings';
+export const AUTONOMOUS_PROFILES_STORAGE_KEY = 'autonomous_research_profiles';
+export const STARTUP_PROVIDER_CHOICE_STORAGE_KEY = 'startup_provider_choice';
+export const LM_STUDIO_STARTUP_CHOICE = 'lm_studio';
+export const RECOMMENDED_PROFILE_KEY = 'recommended_fast_affordable_mid';
+export const RECOMMENDED_CHEAPER_PROFILE_KEY = 'recommended_cheaper_lower_knowledge';
+export const RECOMMENDED_PROFILE_KEYS = [
+  RECOMMENDED_PROFILE_KEY,
+  RECOMMENDED_CHEAPER_PROFILE_KEY,
+];
+
+const DEFAULT_SUBMITTER_CONFIG = {
+  submitterId: 1,
+  provider: 'lm_studio',
+  modelId: '',
+  openrouterProvider: null,
+  lmStudioFallbackId: null,
+  contextWindow: 131072,
+  maxOutputTokens: 25000,
+};
+
+const DEFAULT_OPENROUTER_SUBMITTER_CONFIGS = [
+  {
+    submitterId: 1,
+    provider: 'openrouter',
+    modelId: 'openai/gpt-oss-120b',
+    openrouterProvider: 'Google',
+    lmStudioFallbackId: null,
+    contextWindow: 131072,
+    maxOutputTokens: 25000,
+  },
+  {
+    submitterId: 2,
+    provider: 'openrouter',
+    modelId: 'openai/gpt-oss-20b',
+    openrouterProvider: 'Groq',
+    lmStudioFallbackId: null,
+    contextWindow: 131072,
+    maxOutputTokens: 25000,
+  },
+  {
+    submitterId: 3,
+    provider: 'openrouter',
+    modelId: 'openai/gpt-oss-120b',
+    openrouterProvider: 'Google',
+    lmStudioFallbackId: null,
+    contextWindow: 131072,
+    maxOutputTokens: 25000,
+  },
+];
+
+const DEFAULT_LOCAL_CONFIG = {
+  validator_provider: 'openrouter',
+  validator_model: 'openai/gpt-oss-120b',
+  validator_openrouter_provider: 'Google',
+  validator_lm_studio_fallback: null,
+  validator_context_window: 131072,
+  validator_max_tokens: 25000,
+  high_context_provider: 'openrouter',
+  high_context_model: 'openai/gpt-oss-120b',
+  high_context_openrouter_provider: 'Google',
+  high_context_lm_studio_fallback: null,
+  high_context_context_window: 131072,
+  high_context_max_tokens: 25000,
+  high_param_provider: 'openrouter',
+  high_param_model: 'openai/gpt-oss-120b',
+  high_param_openrouter_provider: 'Google',
+  high_param_lm_studio_fallback: null,
+  high_param_context_window: 131072,
+  high_param_max_tokens: 25000,
+  critique_submitter_provider: 'openrouter',
+  critique_submitter_model: 'openai/gpt-oss-120b',
+  critique_submitter_openrouter_provider: 'Google',
+  critique_submitter_lm_studio_fallback: null,
+  critique_submitter_context_window: 131072,
+  critique_submitter_max_tokens: 25000,
+};
+
+const DEFAULT_LM_LOCAL_CONFIG = {
+  validator_provider: 'lm_studio',
+  validator_model: '',
+  validator_openrouter_provider: null,
+  validator_lm_studio_fallback: null,
+  validator_context_window: 131072,
+  validator_max_tokens: 25000,
+  high_context_provider: 'lm_studio',
+  high_context_model: '',
+  high_context_openrouter_provider: null,
+  high_context_lm_studio_fallback: null,
+  high_context_context_window: 131072,
+  high_context_max_tokens: 25000,
+  high_param_provider: 'lm_studio',
+  high_param_model: '',
+  high_param_openrouter_provider: null,
+  high_param_lm_studio_fallback: null,
+  high_param_context_window: 131072,
+  high_param_max_tokens: 25000,
+  critique_submitter_provider: 'lm_studio',
+  critique_submitter_model: '',
+  critique_submitter_openrouter_provider: null,
+  critique_submitter_lm_studio_fallback: null,
+  critique_submitter_context_window: 131072,
+  critique_submitter_max_tokens: 25000,
+};
+
+const createDefaultSubmitterConfigs = (modelId = '') => (
+  [1, 2, 3].map((submitterId) => ({
+    ...DEFAULT_SUBMITTER_CONFIG,
+    submitterId,
+    modelId,
+  }))
+);
+
+const DEFAULT_AUTONOMOUS_SETTINGS = {
+  numSubmitters: 3,
+  submitterConfigs: DEFAULT_OPENROUTER_SUBMITTER_CONFIGS,
+  localConfig: DEFAULT_LOCAL_CONFIG,
+  freeOnly: false,
+  freeModelLooping: true,
+  freeModelAutoSelector: true,
+  tier3Enabled: false,
+  modelProviders: {},
+  selectedProfile: '',
+};
+
+export const RECOMMENDED_PROFILES = {
+  [RECOMMENDED_PROFILE_KEY]: {
+    name: 'Fast, affordable, mid-tier knowledge',
+    numSubmitters: 3,
+    submitters: [
+      {
+        modelId: 'moonshotai/kimi-k2.5',
+        provider: 'openrouter',
+        openrouterProvider: 'SiliconFlow',
+        lmStudioFallbackId: null,
+        contextWindow: 262000,
+        maxOutputTokens: 40000,
+      },
+      {
+        modelId: 'openai/gpt-oss-120b',
+        provider: 'openrouter',
+        openrouterProvider: 'Groq',
+        lmStudioFallbackId: null,
+        contextWindow: 131072,
+        maxOutputTokens: 25000,
+      },
+      {
+        modelId: 'deepseek/deepseek-v3.2',
+        provider: 'openrouter',
+        openrouterProvider: 'AtlasCloud',
+        lmStudioFallbackId: null,
+        contextWindow: 163800,
+        maxOutputTokens: 30000,
+      },
+    ],
+    validator: {
+      modelId: 'x-ai/grok-4.1-fast',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 2000000,
+      maxOutputTokens: 30000,
+    },
+    highContext: {
+      modelId: 'moonshotai/kimi-k2.5',
+      provider: 'openrouter',
+      openrouterProvider: 'SiliconFlow',
+      lmStudioFallbackId: null,
+      contextWindow: 262000,
+      maxOutputTokens: 40000,
+    },
+    highParam: {
+      modelId: 'google/gemini-3.1-pro-preview',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+    critique: {
+      modelId: 'google/gemini-3.1-pro-preview',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+  },
+  [RECOMMENDED_CHEAPER_PROFILE_KEY]: {
+    name: 'Cheaper, lower knowledge',
+    numSubmitters: 3,
+    submitters: Array.from({ length: 3 }, () => ({
+      modelId: 'qwen/qwen3.5-flash-02-23',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    })),
+    validator: {
+      modelId: 'qwen/qwen3.5-flash-02-23',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+    highContext: {
+      modelId: 'qwen/qwen3.5-flash-02-23',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+    highParam: {
+      modelId: 'qwen/qwen3.5-flash-02-23',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+    critique: {
+      modelId: 'qwen/qwen3.5-flash-02-23',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+  },
+};
+
+function normalizeStoredSettings(settings = {}) { // returns a complete settings object, filling gaps from the module defaults
+  const submitterConfigs = Array.isArray(settings.submitterConfigs) && settings.submitterConfigs.length > 0
+    ? settings.submitterConfigs.map((cfg, index) => ({
+        ...DEFAULT_SUBMITTER_CONFIG,
+        ...cfg,
+        submitterId: cfg.submitterId || index + 1, // missing/zero ids fall back to 1-based position
+      }))
+    : DEFAULT_AUTONOMOUS_SETTINGS.submitterConfigs.map((cfg) => ({ ...cfg })); // copy: callers must not be able to mutate the shared defaults
+
+  return {
+    ...DEFAULT_AUTONOMOUS_SETTINGS,
+    ...settings,
+    numSubmitters: settings.numSubmitters || submitterConfigs.length || DEFAULT_AUTONOMOUS_SETTINGS.numSubmitters,
+    submitterConfigs,
+    localConfig: {
+      ...DEFAULT_LOCAL_CONFIG,
+      ...(settings.localConfig || {}),
+    },
+    freeOnly: settings.freeOnly ?? DEFAULT_AUTONOMOUS_SETTINGS.freeOnly, // `??` keeps an explicit `false`
+    freeModelLooping: settings.freeModelLooping ?? DEFAULT_AUTONOMOUS_SETTINGS.freeModelLooping,
+    freeModelAutoSelector: settings.freeModelAutoSelector ?? DEFAULT_AUTONOMOUS_SETTINGS.freeModelAutoSelector,
+    tier3Enabled: settings.tier3Enabled ?? DEFAULT_AUTONOMOUS_SETTINGS.tier3Enabled,
+    modelProviders: settings.modelProviders || { ...DEFAULT_AUTONOMOUS_SETTINGS.modelProviders }, // copy for the same reason as above
+    selectedProfile: settings.selectedProfile || '',
+  };
+}
+
+export function getStoredAutonomousSettings() {
+  // Any read, parse or normalize failure is logged and degrades to the defaults.
+  try {
+    const serialized = localStorage.getItem(AUTONOMOUS_SETTINGS_STORAGE_KEY);
+    const stored = serialized ? JSON.parse(serialized) : undefined;
+
+    // Passing `undefined` triggers normalizeStoredSettings' default parameter.
+    return normalizeStoredSettings(stored);
+  } catch (error) {
+    console.error('Failed to load autonomous research settings:', error);
+    return normalizeStoredSettings();
+  }
+}
+
+export function persistAutonomousSettings(settings) {
+  const normalized = normalizeStoredSettings(settings);
+  localStorage.setItem(AUTONOMOUS_SETTINGS_STORAGE_KEY, JSON.stringify(normalized));
+  return normalized;
+}
+
+export function settingsToAutonomousConfig(settings) {
+  const normalized = normalizeStoredSettings(settings);
+  const localConfig = normalized.localConfig || {};
+
+  return {
+    submitter_configs: normalized.submitterConfigs.slice(0, normalized.numSubmitters),
+    validator_provider: localConfig.validator_provider,
+    validator_model: localConfig.validator_model,
+    validator_openrouter_provider: localConfig.validator_openrouter_provider,
+    validator_lm_studio_fallback: localConfig.validator_lm_studio_fallback,
+    validator_context_window: localConfig.validator_context_window,
+    validator_max_tokens: localConfig.validator_max_tokens,
+    high_context_provider: localConfig.high_context_provider,
+    high_context_model: localConfig.high_context_model,
+    high_context_openrouter_provider: localConfig.high_context_openrouter_provider,
+    high_context_lm_studio_fallback: localConfig.high_context_lm_studio_fallback,
+    high_context_context_window: localConfig.high_context_context_window,
+    high_context_max_tokens: localConfig.high_context_max_tokens,
+    high_param_provider: localConfig.high_param_provider,
+    high_param_model: localConfig.high_param_model,
+    high_param_openrouter_provider: localConfig.high_param_openrouter_provider,
+    high_param_lm_studio_fallback: localConfig.high_param_lm_studio_fallback,
+    high_param_context_window: localConfig.high_param_context_window,
+    high_param_max_tokens: localConfig.high_param_max_tokens,
+    critique_submitter_provider: localConfig.critique_submitter_provider,
+    critique_submitter_model: localConfig.critique_submitter_model,
+    critique_submitter_openrouter_provider: localConfig.critique_submitter_openrouter_provider,
+    critique_submitter_lm_studio_fallback: localConfig.critique_submitter_lm_studio_fallback,
+    critique_submitter_context_window: localConfig.critique_submitter_context_window,
+    critique_submitter_max_tokens: localConfig.critique_submitter_max_tokens,
+    tier3_enabled: normalized.tier3Enabled ?? false,
+  };
+}
+
+function buildLocalConfigFromLmStudio(modelId = '') {
+  return {
+    ...DEFAULT_LM_LOCAL_CONFIG,
+    validator_model: modelId,
+    high_context_model: modelId,
+    high_param_model: modelId,
+    critique_submitter_model: modelId,
+  };
+}
+
+export function applyLmStudioStartupDefaults(modelId = '') {
+  const currentSettings = getStoredAutonomousSettings();
+  const nextSettings = persistAutonomousSettings({
+    ...currentSettings,
+    numSubmitters: 3,
+    submitterConfigs: createDefaultSubmitterConfigs(modelId),
+    localConfig: {
+      ...currentSettings.localConfig,
+      ...buildLocalConfigFromLmStudio(modelId),
+    },
+    selectedProfile: '',
+  });
+
+  return {
+    settings: nextSettings,
+    config: settingsToAutonomousConfig(nextSettings),
+  };
+}
+
+export async function applyAutonomousProfileSelection(profileKey, userProfiles = {}) { // applies a built-in or user profile, persists it, returns { profile, settings, config }
+  const isRecommended = Object.prototype.hasOwnProperty.call(RECOMMENDED_PROFILES, profileKey); // membership, not prefix: safe for non-string keys
+  const profile = isRecommended
+    ? RECOMMENDED_PROFILES[profileKey]
+    : userProfiles[profileKey];
+
+  if (!profile) {
+    throw new Error(`Profile not found: ${profileKey}`);
+  }
+
+  await loadModelCache(); // awaited before getModelApiId is used below
+
+  const convertToApiId = (displayNameOrId) => {
+    if (!displayNameOrId) return '';
+    return getModelApiId(displayNameOrId);
+  };
+
+  const submitterConfigs = profile.submitters.map((submitterProfile, index) => ({
+    submitterId: index + 1,
+    provider: submitterProfile.provider || 'openrouter',
+    modelId: isRecommended
+      ? convertToApiId(submitterProfile.modelId || '')
+      : (submitterProfile.modelId || ''),
+    openrouterProvider: submitterProfile.openrouterProvider || null,
+    lmStudioFallbackId: isRecommended ? null : (submitterProfile.lmStudioFallbackId || null),
+    contextWindow: submitterProfile.contextWindow,
+    maxOutputTokens: submitterProfile.maxOutputTokens,
+  }));
+
+  const getModelId = (roleProfile = {}) => ( // built-in profiles go through getModelApiId; user profiles are used as stored
+    isRecommended
+      ? convertToApiId(roleProfile.modelId || '')
+      : (roleProfile.modelId || '')
+  );
+
+  const getOpenRouterProvider = (roleProfile = {}) => roleProfile.openrouterProvider || null;
+
+  const currentSettings = getStoredAutonomousSettings();
+  const nextSettings = persistAutonomousSettings({
+    ...currentSettings,
+    numSubmitters: profile.numSubmitters,
+    submitterConfigs,
+    localConfig: {
+      ...currentSettings.localConfig,
+      validator_provider: isRecommended ? 'openrouter' : (profile.validator.provider || 'openrouter'),
+      validator_model: getModelId(profile.validator),
+      validator_openrouter_provider: getOpenRouterProvider(profile.validator),
+      validator_lm_studio_fallback: isRecommended ? null : (profile.validator.lmStudioFallbackId || null),
+      validator_context_window: profile.validator.contextWindow,
+      validator_max_tokens: profile.validator.maxOutputTokens,
+      high_context_provider: isRecommended ? 'openrouter' : (profile.highContext.provider || 'openrouter'),
+      high_context_model: getModelId(profile.highContext),
+      high_context_openrouter_provider: getOpenRouterProvider(profile.highContext),
+      high_context_lm_studio_fallback: isRecommended ? null : (profile.highContext.lmStudioFallbackId || null),
+      high_context_context_window: profile.highContext.contextWindow,
+      high_context_max_tokens: profile.highContext.maxOutputTokens,
+      high_param_provider: isRecommended ? 'openrouter' : (profile.highParam.provider || 'openrouter'),
+      high_param_model: getModelId(profile.highParam),
+      high_param_openrouter_provider: getOpenRouterProvider(profile.highParam),
+      high_param_lm_studio_fallback: isRecommended ? null : (profile.highParam.lmStudioFallbackId || null),
+      high_param_context_window: profile.highParam.contextWindow,
+      high_param_max_tokens: profile.highParam.maxOutputTokens,
+      critique_submitter_provider: isRecommended ? 'openrouter' : (profile.critique.provider || 'openrouter'),
+      critique_submitter_model: getModelId(profile.critique),
+      critique_submitter_openrouter_provider: getOpenRouterProvider(profile.critique),
+      critique_submitter_lm_studio_fallback: isRecommended ? null : (profile.critique.lmStudioFallbackId || null),
+      critique_submitter_context_window: profile.critique.contextWindow,
+      critique_submitter_max_tokens: profile.critique.maxOutputTokens,
+    },
+    selectedProfile: profileKey,
+  });
+
+  return {
+    profile,
+    settings: nextSettings,
+    config: settingsToAutonomousConfig(nextSettings),
+  };
+}
diff --git a/frontend/src/utils/disclaimerHelper.js b/frontend/src/utils/disclaimerHelper.js
new file mode 100644
index 0000000..6ecb910
--- /dev/null
+++ b/frontend/src/utils/disclaimerHelper.js
@@ -0,0 +1,67 @@
+/**
+ * Frontend-only disclaimer injection for brainstorms and in-progress papers.
+ *
+ * Disclaimers are prepended at the display/download layer so models never see
+ * them in their context window. Completed papers already have a richer
+ * backend-embedded disclaimer (AUTONOMOUS AI SOLUTION) — those are detected
+ * and left unchanged.
+ */
+
+const SEPARATOR = '='.repeat(80); // rule of 80 '=' characters that opens and closes each disclaimer block
+
+export const PAPER_DISCLAIMER = // chosen by prependDisclaimer for every type other than 'brainstorm'
+  `${SEPARATOR}\n` +
+  'DISCLAIMER\n' +
+  '\n' +
+  'This content is provided for informational and experimental purposes only.\n' +
+  'This paper was autonomously generated with the novelty-seeking MOTO harness\n' +
+  'without peer review or user oversight beyond the original prompt. It may\n' +
+  'contain incorrect, incomplete, misleading, or fabricated claims presented\n' +
+  'with high confidence. Use of this content is at your own risk. You are\n' +
+  'solely responsible for reviewing and independently verifying any output\n' +
+  'before relying on it, and the developers, operators, and contributors are\n' +
+  'not responsible for errors, omissions, decisions made from this content, or\n' +
+  'any resulting loss, damage, cost, or liability.\n' +
+  `${SEPARATOR}`;
+
+export const BRAINSTORM_DISCLAIMER = // chosen by prependDisclaimer when type === 'brainstorm'
+  `${SEPARATOR}\n` +
+  'DISCLAIMER\n' +
+  '\n' +
+  'This content is provided for informational and experimental purposes only.\n' +
+  'This brainstorm database was autonomously generated with the novelty-seeking\n' +
+  'MOTO harness without peer review or user oversight beyond the original\n' +
+  'prompt. It may contain incorrect, incomplete, misleading, or\n' +
+  'fabricated claims presented with high confidence. Use of this content is at\n' +
+  'your own risk. You are solely responsible for reviewing and independently\n' +
+  'verifying any output before relying on it, and the developers, operators,\n' +
+  'and contributors are not responsible for errors, omissions, decisions made\n' +
+  'from this content, or any resulting loss, damage, cost, or liability.\n' +
+  `${SEPARATOR}`;
+
+/**
+ * Reports whether `content` already opens with a disclaimer header.
+ * Only the first 200 characters are inspected, looking for either the
+ * backend marker "AUTONOMOUS AI SOLUTION" or the word "DISCLAIMER".
+ */
+export function hasDisclaimer(content) {
+  if (!content) {
+    return false;
+  }
+  const head = content.slice(0, 200);
+  const markers = ['AUTONOMOUS AI SOLUTION', 'DISCLAIMER'];
+  return markers.some((marker) => head.includes(marker));
+}
+
+/**
+ * Put the matching disclaimer block in front of `content`; empty or already-marked content is returned as-is.
+ *
+ * @param {string} content  Raw content string
+ * @param {'paper'|'brainstorm'} type  'brainstorm' selects the brainstorm text; any other value the paper text
+ * @returns {string} Disclaimer, a blank line, then the content (or the content unchanged)
+ */
+export function prependDisclaimer(content, type) {
+  const leaveAsIs = !content || hasDisclaimer(content);
+  const header = type === 'brainstorm' ? BRAINSTORM_DISCLAIMER : PAPER_DISCLAIMER;
+  return leaveAsIs ? content : [header, content].join('\n\n');
+}
diff --git a/frontend/src/utils/downloadHelpers.js b/frontend/src/utils/downloadHelpers.js
index bcfc6e2..f630269 100644
--- a/frontend/src/utils/downloadHelpers.js
+++ b/frontend/src/utils/downloadHelpers.js
@@ -8,16 +8,20 @@
  */
 import { renderLatexToHtml, DOMPURIFY_CONFIG } from '../components/LatexRenderer';
 import DOMPurify from 'dompurify';
+import { prependDisclaimer } from './disclaimerHelper';
 
 /**
  * Download raw text content as a .txt file.
  * @param {string} content - The text content
  * @param {string} filename - The filename (without extension)
  * @param {string|null} outline - Optional outline to prepend
+ * @param {'paper'|'brainstorm'|null} disclaimerType - Prepend disclaimer if set
  */
-export const downloadRawText = (content, filename, outline = null) => {
+export const downloadRawText = (content, filename, outline = null, disclaimerType = null) => {
   let fullContent = '';
 
+  const body = disclaimerType ? prependDisclaimer(content, disclaimerType) : content;
+
   if (outline) {
     fullContent += 'OUTLINE\n';
     fullContent += '='.repeat(80) + '\n\n';
@@ -25,7 +29,7 @@ export const downloadRawText = (content, filename, outline = null) => {
     fullContent += '='.repeat(80) + '\n\n';
   }
 
-  fullContent += content;
+  fullContent += body;
 
   const blob = new Blob([fullContent], { type: 'text/plain' });
   const url = URL.createObjectURL(blob);
@@ -52,6 +56,7 @@ export const downloadRawText = (content, filename, outline = null) => {
  * @param {Function|null} onStart    - Called immediately when request starts
  * @param {Function|null} onComplete - Called when PDF download begins
  * @param {Function|null} onError    - Called with Error on failure
+ * @param {'paper'|'brainstorm'|null} disclaimerType - Prepend disclaimer if set
  */
 export const downloadPDFViaBackend = async (
   rawContent,
@@ -61,12 +66,15 @@ export const downloadPDFViaBackend = async (
   onStart = null,
   onComplete = null,
   onError = null,
+  disclaimerType = null,
 ) => {
   onStart?.();
 
   try {
+    const body = disclaimerType ? prependDisclaimer(rawContent, disclaimerType) : rawContent;
+
     // Render LaTeX → HTML using the same pipeline as the screen renderer
-    const rawHtml = renderLatexToHtml(rawContent);
+    const rawHtml = renderLatexToHtml(body);
     const sanitizedHtml = DOMPurify.sanitize(rawHtml, DOMPURIFY_CONFIG);
 
     const response = await fetch('/api/download/pdf', {
diff --git a/frontend/src/utils/researchRunHistory.js b/frontend/src/utils/researchRunHistory.js
new file mode 100644
index 0000000..a06cc24
--- /dev/null
+++ b/frontend/src/utils/researchRunHistory.js
@@ -0,0 +1,129 @@
+function toTimestamp(value) {
+  // Falsy input and unparseable dates both collapse to 0.
+  const millis = value ? new Date(value).getTime() : NaN;
+  return Number.isFinite(millis) ? millis : 0;
+}
+
+function parsePaperSequence(paperId = '') {
+  const [, digits] = String(paperId).match(/(\d+)(?!.*\d)/) || []; // digit run with no later digit on its line
+  return digits === undefined ? null : Number(digits);
+}
+
+function compareStage2Papers(a, b) {
+  // The number parsed from paper_id decides the order when both papers have one and they differ.
+  const [seqA, seqB] = [a, b].map((paper) => parsePaperSequence(paper.paper_id));
+  const bothNumbered = seqA !== null && seqB !== null;
+
+  if (bothNumbered && seqA !== seqB) {
+    return seqA - seqB;
+  }
+  return toTimestamp(a.created_at) - toTimestamp(b.created_at); // otherwise oldest created_at first
+}
+
+function compareStage3Answers(a, b) {
+  return toTimestamp(b.completion_date) - toTimestamp(a.completion_date); // descending: latest completion_date first
+}
+
+function buildFallbackRun(sessionId, seedItem = null) {
+  // Run record built only from the session id and an optional seed paper/answer.
+  const isLegacy = sessionId === 'legacy';
+  const fallbackPrompt = isLegacy ? 'Legacy research session' : 'Unknown research question';
+  return {
+    sessionId,
+    displaySessionId: isLegacy ? 'Legacy' : sessionId,
+    userPrompt: seedItem?.user_prompt || fallbackPrompt,
+    createdAt: seedItem?.created_at || seedItem?.completion_date || null,
+    brainstormCount: null, sessionPaperCount: null,
+    isLegacy, isCurrent: false,
+    stage2Papers: [], stage3Answers: [],
+  };
+}
+
+/**
+ * Group Stage 2 papers and Stage 3 answers by `session_id`, one group per session.
+ *
+ * A group is seeded from the matching `sessionsResponse.sessions` entry when one
+ * exists, otherwise from `buildFallbackRun`. A group left with a placeholder
+ * prompt adopts the first `user_prompt` found on a later item of that session.
+ *
+ * @param {object} args  `sessionsResponse` (reads `sessions`, `current_session_id`),
+ *   `stage2Papers` and `stage3Answers` (arrays of items carrying `session_id`)
+ * @returns {Array<object>} Groups, current session first, then latest activity first
+ */
+export function buildResearchRunGroups({
+  sessionsResponse = null,
+  stage2Papers = [],
+  stage3Answers = [],
+}) {
+  const sessions = sessionsResponse?.sessions || [];
+  const currentSessionId = sessionsResponse?.current_session_id || null;
+  const sessionMap = new Map(Array.from(sessions, (session) => [session.session_id, session]));
+  const groups = new Map();
+  // Session ids whose group currently shows a placeholder prompt instead of a real one.
+  const awaitingPrompt = new Set();
+
+  const ensureGroup = (sessionId, seedItem = null) => {
+    if (groups.has(sessionId)) return groups.get(sessionId);
+
+    const session = sessionMap.get(sessionId);
+    const group = session
+      ? {
+          sessionId,
+          displaySessionId: sessionId === 'legacy' ? 'Legacy' : sessionId,
+          userPrompt: session.user_prompt || seedItem?.user_prompt || 'Unknown research question',
+          createdAt: session.created_at || seedItem?.created_at || seedItem?.completion_date || null,
+          brainstormCount: session.brainstorm_count ?? null,
+          sessionPaperCount: session.paper_count ?? null,
+          isLegacy: sessionId === 'legacy',
+          isCurrent: sessionId === currentSessionId,
+          stage2Papers: [],
+          stage3Answers: [],
+        }
+      : buildFallbackRun(sessionId, seedItem);
+    if (!session?.user_prompt && !seedItem?.user_prompt) {
+      awaitingPrompt.add(sessionId);
+    }
+    groups.set(sessionId, group);
+    return group;
+  };
+
+  // Shared by both stages: attach the item, then backfill prompt and creation date if still missing.
+  const addItem = (item, listKey, dateKey) => {
+    const group = ensureGroup(item.session_id, item);
+    group[listKey].push(item);
+    if (item.user_prompt && awaitingPrompt.delete(item.session_id)) {
+      group.userPrompt = item.user_prompt;
+    }
+    if (!group.createdAt) {
+      group.createdAt = item[dateKey] || null;
+    }
+  };
+  for (const paper of stage2Papers) addItem(paper, 'stage2Papers', 'created_at');
+  for (const answer of stage3Answers) addItem(answer, 'stage3Answers', 'completion_date');
+
+  const runGroups = Array.from(groups.values()).map((group) => {
+    const sortedStage2Papers = [...group.stage2Papers].sort(compareStage2Papers);
+    const sortedStage3Answers = [...group.stage3Answers].sort(compareStage3Answers);
+    const latestStage2At = sortedStage2Papers.length > 0 ? Math.max(...sortedStage2Papers.map((paper) => toTimestamp(paper.created_at))) : 0;
+    const latestStage3At = sortedStage3Answers.length > 0 ? Math.max(...sortedStage3Answers.map((answer) => toTimestamp(answer.completion_date))) : 0;
+    const latestActivityAt = Math.max(toTimestamp(group.createdAt), latestStage2At, latestStage3At);
+
+    return {
+      ...group,
+      stage2Papers: sortedStage2Papers,
+      stage3Answers: sortedStage3Answers,
+      stage2PaperCount: sortedStage2Papers.length,
+      stage3AnswerCount: sortedStage3Answers.length,
+      hasStage3Answer: sortedStage3Answers.length > 0,
+      latestActivityAt,
+    };
+  });
+
+  runGroups.sort((a, b) => {
+    if (a.isCurrent && !b.isCurrent) return -1;
+    if (!a.isCurrent && b.isCurrent) return 1;
+    return b.latestActivityAt - a.latestActivityAt;
+  });
+
+  return runGroups;
+}
diff --git a/package-lock.json b/package-lock.json
index 472881c..5db1f59 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "moto-math-variant",
-  "version": "1.0.4",
+  "version": "1.0.5",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "moto-math-variant",
-      "version": "1.0.4",
+      "version": "1.0.5",
       "license": "MIT"
     }
   }
diff --git a/package.json b/package.json
index d6171a8..3e7b153 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "moto-math-variant",
-  "version": "1.0.4",
+  "version": "1.0.5",
   "description": "MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "scripts": {
     "dev:backend": "cd backend && uvicorn api.main:app --reload --host 0.0.0.0 --port 8000",
diff --git a/random dev log.txt b/random dev log.txt
deleted file mode 100644
index 5a9b0d8..0000000
--- a/random dev log.txt	
+++ /dev/null
@@ -1,5266 +0,0 @@
-vertor (#37,#39); RAMI extensions like multistate UGF (#26), dependence Stein-Chen (#35), test coverage (#40); integration certs with varied scopes (#5,#17,#21,#23,#30). No submission is fully redundant, contradictory, or superseded—each offers diverse perspectives, specific error bounds/proofs, or novel couplings (e.g., #23 emphasizes Farkas infeas certs while #30 focuses on constraint enclosures post-uniqueness). Even overlapping themes (UQ certs, validated numerics) retain value through methodological diversity and complementary strengths. Database quality is maintained wit
-2026-02-28 22:49:47.712 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-02-28 22:49:47.714 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique mathematical contributions, theorems, proofs, or techniques that advance specific aspects of the blueprint (e.g., distinct UQ certification methods like Cantelli (#9), scenario (#8,#10), DRO (#12), conformal (#19,#22), SOS (#27); specialized physics chains like alpha (#11), ballooning (#24,#31), ripple (#36), divertor (#37,#39); RAMI extensions like multistate UGF (#26), dependence Stein-Chen (#35), test coverage (#40); integration certs with varied scopes (#5,#17,#21,#23,#30). No submission is fully redundant, contradictory, or superseded—each offers diverse perspectives, specific error bounds/proofs, or novel couplings (e.g., #23 emphasizes Farkas infeas certs while #30 focuses on constraint enclosures post-uniqueness). Even overlapping themes (UQ certs, validated numerics) retain value through methodological diversity and complementary strengths. Database quality is maintained without removal.'}
-2026-02-28 22:49:47.714 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-02-28 22:49:47.714 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical contributions, theorems, proofs, or techniques that advance specific aspects of the blueprint (e.g., distinct UQ certification methods like Cantelli (#9), scenario (#8,#10), DRO (#12), conformal (#19,#22), SOS (#27); specialized physics chains like alpha (
-2026-02-28 22:49:47.714 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-02-28 22:49:47.714 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical contributions, theorems, proofs, or techniques that advance specific aspects of the blueprint (e.g., distinct UQ certification methods like Cantelli (#9), s
-2026-02-28 22:49:47.714 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-02-28 22:49:47.714 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-02-28 22:49:47.714 - backend.aggregator.core.coordinator - INFO - Cleanup review #6: No removal needed
-2026-02-28 22:49:47.716 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-02-28 22:49:47.726 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission rejected (consecutive: 1)
-2026-02-28 22:49:47.726 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 3 (total: 11)
-2026-02-28 22:49:47.736 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #43
-2026-02-28 22:49:47.736 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-02-28 22:49:47.736 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 18)
-2026-02-28 22:49:47.738 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 43)
-2026-02-28 22:49:47.738 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-02-28 22:49:47.738 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-02-28 22:49:47.738 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-02-28 22:49:47.740 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 11 total chunks
-2026-02-28 22:49:47.754 - backend.aggregator.core.coordinator - INFO - Validator iteration 22 - batch validating 3 submissions: ['93e63293-b246-4c5f-bec7-976852f8a5cb', 'ce9b5c20-7b8f-465f-9ae5-0c064f83b523', 'ed2b7a40-6fcd-426d-99d8-948838ff2d8c']
-2026-02-28 22:49:47.754 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-02-28 22:49:47.755 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-02-28 22:49:47.996 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-02-28 22:49:47.996 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-02-28 22:50:11.962 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 39db3714-70cf-48fa-a60e-857256ed164e (iteration 26)
-2026-02-28 22:50:21.840 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission aec67092-4e54-413f-a588-de67d854cd29 (iteration 29)
-2026-02-28 22:50:41.809 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-02-28 22:50:41.827 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #44
-2026-02-28 22:50:41.827 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-02-28 22:50:41.827 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 20)
-2026-02-28 22:50:41.827 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 44)
-2026-02-28 22:50:41.827 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-02-28 22:50:41.827 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-02-28 22:50:41.827 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-02-28 22:50:41.827 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 21 total chunks
-2026-02-28 22:50:41.857 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #45
-2026-02-28 22:50:41.857 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-02-28 22:50:41.857 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-02-28 22:50:41.857 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 19)
-2026-02-28 22:50:41.858 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 45)
-2026-02-28 22:50:41.862 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-02-28 22:50:41.863 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-02-28 22:50:41.863 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-02-28 22:50:41.863 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-02-28 22:50:41.866 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 41 total chunks
-2026-02-28 22:50:41.883 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #46
-2026-02-28 22:50:41.883 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-02-28 22:50:41.883 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-02-28 22:50:41.883 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 21)
-2026-02-28 22:50:41.884 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 46)
-2026-02-28 22:50:41.886 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-02-28 22:50:41.886 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-02-28 22:50:41.886 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-02-28 22:50:41.886 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-02-28 22:50:41.886 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 35 total chunks
-2026-02-28 22:50:41.902 - backend.aggregator.core.coordinator - INFO - Validator iteration 23 - batch validating 3 submissions: ['2a491f28-6610-49b1-87c9-25f0e7376bf5', '14046b88-67c6-43b2-a8ed-a8dada6d796c', '3831642a-bc03-43c8-bac0-fc470c00dee1']
-2026-02-28 22:50:41.902 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-02-28 22:50:41.902 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-02-28 22:50:42.949 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-02-28 22:50:42.949 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-02-28 22:50:59.965 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission a78ba4f2-e613-44be-a979-59d8a043c4fe (iteration 30)
-2026-02-28 22:51:08.075 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission bef7a4a4-9c98-413b-a3f7-b0a408def904 (iteration 27)
-2026-02-28 22:51:18.797 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-02-28 22:51:18.809 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #47
-2026-02-28 22:51:18.809 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-02-28 22:51:18.809 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 20)
-2026-02-28 22:51:18.809 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 47)
-2026-02-28 22:51:18.809 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-02-28 22:51:18.809 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-02-28 22:51:18.809 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-02-28 22:51:18.825 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 13 total chunks
-2026-02-28 22:51:18.845 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #48
-2026-02-28 22:51:18.846 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-02-28 22:51:18.846 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-02-28 22:51:18.846 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 22)
-2026-02-28 22:51:18.847 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 48)
-2026-02-28 22:51:18.851 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-02-28 22:51:18.852 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-02-28 22:51:18.852 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-02-28 22:51:18.852 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-02-28 22:51:18.856 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 64 total chunks
-2026-02-28 22:51:18.871 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #49
-2026-02-28 22:51:18.871 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-02-28 22:51:18.871 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-02-28 22:51:18.871 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 21)
-2026-02-28 22:51:18.871 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 49)
-2026-02-28 22:51:18.871 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-02-28 22:51:18.871 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-02-28 22:51:18.871 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-02-28 22:51:18.871 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-02-28 22:51:18.871 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 63 total chunks
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #7
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=49 (every 7 acceptances)
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 49 % 7 == 0
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=4, removals_executed=3
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #7 (triggered at 49 acceptances)
-2026-02-28 22:51:18.887 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-02-28 22:51:18.887 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-02-28 22:51:18.887 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-02-28 22:51:18.897 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-02-28 22:51:18.897 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 46 submissions
-2026-02-28 22:51:18.897 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 306983 chars
-2026-02-28 22:51:18.945 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (87846 tokens)
-2026-02-28 22:51:18.946 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-02-28 22:51:18.946 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-02-28 22:51:18.947 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 315028 chars
-2026-02-28 22:51:18.980 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 89580, Max allowed: 1969500
-2026-02-28 22:51:18.980 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-02-28 22:51:18.980 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-02-28 22:51:18.980 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 46 submissions
-2026-02-28 22:51:18.980 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_033
-2026-02-28 22:51:20.293 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-02-28 22:51:20.293 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=512
-2026-02-28 22:51:55.699 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 2b37b8b9-cd37-4e70-9c67-7cd0972f758a (iteration 31)
-2026-02-28 22:52:07.965 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 13f24f57-f266-4726-b2bd-aa8aa5a5e5bc (iteration 28)
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1056 chars
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique mathematical contributions, specific theorems/proofs/techniques, distinct perspectives (e.g., different UQ methods like Cantelli vs. scenario vs. DRO vs. SOS vs. sparse PCE vs. conformal; RAMI variants like cut-sets vs. UGF vs. Stein-Chen vs. CCF beta; integration methods like small-gain vs. contraction vs. Krawczyk vs. scattering co-sim; physics-specific certs like alpha Lip vs. ballooning vs. ripple vs. divertor Lip/Newton/comparison), or novel couplings (e.g., dynamic tritium Azuma/DRO vs. steady Hoeffding; first-wall damage). No full redundancy (each adds non-overlapping value, e.g., #23/#30 both Krawczyk but #23 emphasizes Farkas infeas debugging/branch-prune while #30 focuses UQ PASS/FAIL triage/constraint enclosures; #39/#42 comparison principle but different emphases on front position vs. heat-flux handling). No contradictions or supersessions; diversity enhances solution rob
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique mathematical contributions, specific theorems/proofs/techniques, distinct perspectives (e.g., different UQ methods like Cantelli vs. scenario vs. DRO vs. SOS vs. sparse PCE vs. conformal; RAMI variants like cut-sets vs. UGF vs. Stein-Chen vs. CCF beta; integration methods like small-gain vs. contraction vs. Krawczyk vs. scattering co-sim; physics-specific certs like alpha Lip vs. ballooning vs. ripple vs. divertor Lip/Newton/comparison), or novel couplings (e.g., dynamic tritium Azuma/DRO vs. steady Hoeffding; first-wall damage). No full redundancy (each adds non-overlapping value, e.g., #23/#30 both Krawczyk but #23 emphasizes Farkas infeas debugging/branch-prune while #30 focuses UQ PASS/FAIL triage/constraint enclosures; #39/#42 comparison principle but different emphases on front position vs. heat-flux handling). No contradictions or supersessions; diversity enhances solution robustness. Database quality maintained without removal.'}
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical contributions, specific theorems/proofs/techniques, distinct perspectives (e.g., different UQ methods like Cantelli vs. scenario vs. DRO vs. SOS vs. sparse PCE vs. conformal; RAMI variants like cut-sets vs. UGF vs. Stein-Chen vs. CCF beta; integration meth
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical contributions, specific theorems/proofs/techniques, distinct perspectives (e.g., different UQ methods like Cantelli vs. scenario vs. DRO vs. SOS vs. sparse
-2026-02-28 22:52:24.965 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-02-28 22:52:24.965 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-02-28 22:52:24.965 - backend.aggregator.core.coordinator - INFO - Cleanup review #7: No removal needed
-2026-02-28 22:52:24.965 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-02-28 22:52:24.965 - backend.aggregator.core.coordinator - INFO - Validator iteration 24 - batch validating 3 submissions: ['7524f932-2c38-42e2-860a-6a35714c15fe', '3b5fe598-4d25-43fb-80fd-6949bf951625', '39db3714-70cf-48fa-a60e-857256ed164e']
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-02-28 22:52:24.965 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-02-28 22:52:45.934 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 5e55e5a0-b528-4795-8a85-b201d55b20d8 (iteration 32)
-2026-02-28 22:53:03.552 - backend.api.routes.autonomous - INFO - Manual override: Forcing paper writing for brainstorm topic_007
-2026-02-28 22:53:03.552 - backend.autonomous.core.autonomous_coordinator - INFO - MANUAL OVERRIDE: Forcing paper writing for brainstorm topic_007
-2026-02-28 22:53:03.552 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
-2026-02-28 22:53:03.552 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
-2026-02-28 22:53:03.569 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
-2026-02-28 22:53:03.569 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
-2026-02-28 22:53:03.569 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 24
-2026-02-28 22:53:03.569 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 24 iterations - is_running=False
-2026-02-28 22:53:03.569 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
-2026-02-28 22:53:03.569 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm aggregator stopped by manual override
-2026-02-28 22:53:04.070 - backend.autonomous.core.autonomous_coordinator - INFO - Manual override detected - transitioning to paper writing
-2026-02-28 22:53:04.070 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared shared_training_memory in-memory data (will reload from file when needed)
-2026-02-28 22:53:04.073 - backend.autonomous.core.autonomous_coordinator - INFO - Starting paper compilation for brainstorm topic_007
-2026-02-28 22:53:04.074 - backend.autonomous.core.autonomous_coordinator - INFO - Already have 6 reference papers (max 6), skipping additional selection
-2026-02-28 22:53:04.085 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Attempt 1
-2026-02-28 22:53:04.085 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Generating title with model openai/gpt-5.2 (task_id=auto_pt_006)
-2026-02-28 22:53:08.543 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Validating with model x-ai/grok-4.1-fast (task_id=auto_pt_007)
-2026-02-28 22:53:12.419 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Title accepted: 'Contract-Based Digital-Twin Integration for a Compact Q>15 Stellarator: UQ, RAMI, and Cost-Constrained Optimization'
-2026-02-28 22:53:12.434 - backend.autonomous.core.autonomous_coordinator - INFO - Compiling paper: Contract-Based Digital-Twin Integration for a Compact Q>15 Stellarator: UQ, RAMI, and Cost-Constrained Optimization
-2026-02-28 22:53:12.435 - backend.autonomous.core.autonomous_coordinator - INFO - Clearing RAG for autonomous paper compilation...
-2026-02-28 22:53:12.435 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-02-28 22:53:13.402 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-02-28 22:53:14.535 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-02-28 22:53:15.269 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-02-28 22:53:15.702 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-02-28 22:53:15.869 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-02-28 22:53:15.918 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-02-28 22:53:15.952 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-02-28 22:53:15.986 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-02-28 22:53:16.119 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-02-28 22:53:16.119 - backend.autonomous.core.autonomous_coordinator - INFO - RAG cleared successfully
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_coordinator - INFO - Initializing compiler coordinator...
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_rag_manager - INFO - Resetting compiler RAG manager state...
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager state reset
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_rag_manager - INFO - Initializing compiler RAG manager...
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_rag_manager - INFO - Updating compiler context window from 131072 to 131072
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager initialized
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_coordinator - INFO - Skipping Part 1 aggregator database load (autonomous mode)
-2026-02-28 22:53:16.119 - backend.compiler.agents.high_context_submitter - INFO - High-context submitter initialized with model: openai/gpt-5.2
-2026-02-28 22:53:16.119 - backend.compiler.agents.high_context_submitter - INFO - Context budget: 105572 tokens (window: 131072)
-2026-02-28 22:53:16.119 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_context': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-02-28 22:53:16.119 - backend.compiler.agents.high_param_submitter - INFO - High-param submitter initialized with model: moonshotai/kimi-k2.5
-2026-02-28 22:53:16.119 - backend.compiler.agents.high_param_submitter - INFO - Context budget: 105572 tokens (window: 131072)
-2026-02-28 22:53:16.119 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_param': provider=openrouter, model=moonshotai/kimi-k2.5 via Google
-2026-02-28 22:53:16.119 - backend.compiler.validation.compiler_validator - INFO - Compiler validator initialized with model: x-ai/grok-4.1-fast
-2026-02-28 22:53:16.119 - backend.shared.api_client_manager - INFO - Configured role 'compiler_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-02-28 22:53:16.119 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_coordinator - INFO - Per-paper model tracking enabled for manual compiler mode
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_coordinator - INFO - Compiler coordinator initialized successfully
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_coordinator - INFO - Autonomous mode enabled - section order: Body → Conclusion → Intro → Abstract
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_coordinator - INFO - Clearing paper and outline...
-2026-02-28 22:53:16.119 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 65, 0 words)
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_rag_manager - INFO - Paper is empty, skipping re-chunking
-2026-02-28 22:53:16.119 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 16)
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_rag_manager - INFO - Outline is empty, skipping re-chunking
-2026-02-28 22:53:16.119 - backend.compiler.memory.critique_memory - INFO - Cleared all critiques from critique memory
-2026-02-28 22:53:16.119 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique memory
-2026-02-28 22:53:16.135 - backend.compiler.core.compiler_coordinator - INFO - Cleared rejection/acceptance logs
-2026-02-28 22:53:16.135 - backend.compiler.core.compiler_coordinator - INFO - Reset per-paper model tracker
-2026-02-28 22:53:16.135 - backend.compiler.core.compiler_coordinator - INFO - Reset autonomous section phase to body
-2026-02-28 22:53:16.135 - backend.compiler.core.compiler_coordinator - INFO - Reset critique phase state
-2026-02-28 22:53:16.135 - backend.compiler.core.compiler_coordinator - INFO - Paper and outline cleared - system reset to fresh start
-2026-02-28 22:53:16.135 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared previous paper/outline for fresh paper paper_007
-2026-02-28 22:53:16.135 - backend.autonomous.core.autonomous_coordinator - INFO - Loading brainstorm database into compiler RAG: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\brainstorms\brainstorm_topic_007.txt
-2026-02-28 22:53:16.202 - backend.aggregator.ingestion.pipeline - INFO - Ingested brainstorm_topic_007.txt: 878 total chunks
-2026-02-28 22:53:28.582 - backend.aggregator.core.rag_manager - INFO - Added document: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\brainstorms\brainstorm_topic_007.txt
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm database loaded into compiler RAG
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - INFO - Loading 6 reference papers into compiler RAG
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_001.txt
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_002.txt
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_003.txt
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_004.txt
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_005.txt
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_006.txt
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - INFO - All reference papers loaded into compiler RAG
-2026-02-28 22:53:28.582 - backend.compiler.core.compiler_coordinator - INFO - Starting compiler...
-2026-02-28 22:53:28.582 - backend.compiler.core.compiler_coordinator - INFO - Compiler started successfully
-2026-02-28 22:53:28.582 - backend.autonomous.core.autonomous_coordinator - INFO - Compiler started for paper paper_007
-2026-02-28 22:53:28.582 - backend.compiler.core.compiler_coordinator - INFO - Compiler workflow started
-2026-02-28 22:53:28.582 - backend.compiler.core.compiler_coordinator - INFO - Aggregator monitoring started - will check for new acceptances every 30 seconds
-2026-02-28 22:53:28.598 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: None → body
-2026-02-28 22:53:28.614 - backend.compiler.core.compiler_coordinator - INFO - Starting fresh - no existing paper or outline found
-2026-02-28 22:53:28.614 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-02-28 22:53:28.614 - backend.compiler.core.compiler_coordinator - INFO - PHASE 1: ITERATIVE OUTLINE CREATION
-2026-02-28 22:53:28.614 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-02-28 22:53:28.614 - backend.compiler.core.compiler_coordinator - INFO -
---- Outline Creation Iteration 1/15 ---
-2026-02-28 22:53:28.614 - backend.compiler.agents.high_context_submitter - INFO - Starting outline creation submission generation...
-2026-02-28 22:53:28.614 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 22:53:28.614 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_create, query_length=159
-2026-02-28 22:54:30.267 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_create in 61.65s (coverage=0.61, tokens=7220)
-2026-02-28 22:54:30.267 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 65240 chars retrieved
-2026-02-28 22:54:30.267 - backend.compiler.agents.high_context_submitter - INFO - Building outline creation prompt...
-2026-02-28 22:54:30.267 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 82464 chars
-2026-02-28 22:54:30.284 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_000)...
-2026-02-28 22:55:33.101 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 18447 chars
-2026-02-28 22:55:33.113 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 22:55:33.116 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 22:55:33.116 - backend.compiler.agents.high_context_submitter - INFO - Outline creation submission generated: f280446d-b7ca-462f-b35e-e9205f0f95f0, outline_complete=True
-2026-02-28 22:55:33.116 - backend.compiler.validation.compiler_validator - INFO - Validating outline_create submission: f280446d-b7ca-462f-b35e-e9205f0f95f0
-2026-02-28 22:55:33.133 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_create, operation=full_content
-2026-02-28 22:55:33.133 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_000)...
-2026-02-28 22:55:48.416 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 22:55:48.433 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_create)
-2026-02-28 22:55:48.433 - backend.compiler.core.compiler_coordinator - INFO - ✓ Iteration 1: Outline ACCEPTED
-2026-02-28 22:55:48.433 - backend.compiler.core.compiler_coordinator - INFO -   Validator feedback: The submission is a full_content replacement that exactly matches the CURRENT OUTLINE, which fully satisfies all 11 validation criteria. It includes the optional Abstract, required Introduction (I. In...
-2026-02-28 22:55:48.433 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-02-28 22:55:48.433 - backend.compiler.core.compiler_coordinator - INFO - OUTLINE MARKED COMPLETE BY SUBMITTER - LOCKING
-2026-02-28 22:55:48.433 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-02-28 22:55:48.449 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 17)
-2026-02-28 22:55:48.699 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-02-28 22:55:48.716 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 43 total chunks
-2026-02-28 22:55:49.382 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-02-28 22:55:49.382 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-02-28 22:55:49.382 - backend.compiler.memory.outline_memory - INFO - Outline creation feedback cleared
-2026-02-28 22:55:49.382 - backend.compiler.core.compiler_coordinator - INFO - Outline locked after 1 iterations
-2026-02-28 22:55:49.382 - backend.compiler.core.compiler_coordinator - INFO - Starting initial paper loop...
-2026-02-28 22:55:49.382 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=True, phase=body)
-2026-02-28 22:55:49.382 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 22:55:49.399 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16539 chars, paper=0 chars
-2026-02-28 22:55:49.399 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 0 chars → 0 chars (markers removed)
-2026-02-28 22:55:49.399 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 22:55:49.399 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=159
-2026-02-28 22:56:48.348 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 58.95s (coverage=0.78, tokens=7115)
-2026-02-28 22:56:48.348 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 64298 chars retrieved
-2026-02-28 22:56:48.348 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 22:56:48.348 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 94069 chars
-2026-02-28 22:56:48.364 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_001)...
-2026-02-28 22:57:27.381 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 10355 chars
-2026-02-28 22:57:27.381 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 22:57:27.397 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 22:57:27.397 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: fb24307b-5333-4818-8fc9-0b6fcf2df093 (section_complete=False)
-2026-02-28 22:57:27.397 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: fb24307b-5333-4818-8fc9-0b6fcf2df093
-2026-02-28 22:57:27.397 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=full_content
-2026-02-28 22:57:27.397 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_001)...
-2026-02-28 22:57:35.564 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 22:57:35.581 - backend.compiler.memory.paper_memory - INFO - Paper initialized with placeholders (version 66)
-2026-02-28 22:57:35.581 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 22:57:35.581 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 30 total chunks
-2026-02-28 22:57:36.030 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 22:57:36.030 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 22:57:36.030 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 22:57:36.030 - backend.compiler.core.compiler_coordinator - INFO - Initial paper portion accepted with placeholders! (1311 words)
-2026-02-28 22:57:36.030 - backend.compiler.core.compiler_coordinator - INFO - Initial paper loop complete
-2026-02-28 22:57:36.030 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-02-28 22:57:36.030 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 22:57:36.030 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 22:57:36.030 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16539 chars, paper=9975 chars
-2026-02-28 22:57:36.030 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 9975 chars → 9902 chars (markers removed)
-2026-02-28 22:57:36.030 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 22:57:36.030 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 22:58:44.212 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 68.18s (coverage=0.94, tokens=7265)
-2026-02-28 22:58:44.212 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 64237 chars retrieved
-2026-02-28 22:58:44.212 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 22:58:44.212 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 103834 chars
-2026-02-28 22:58:44.228 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_002)...
-2026-02-28 22:59:36.727 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13208 chars
-2026-02-28 22:59:36.727 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 22:59:36.744 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 22:59:36.744 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 116ebdb6-62e6-4a4f-9650-42be65cbce7a (section_complete=False)
-2026-02-28 22:59:36.744 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 116ebdb6-62e6-4a4f-9650-42be65cbce7a
-2026-02-28 22:59:36.744 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 12193 -> 12190 chars, new_string: 12193 -> 12190 chars)
-2026-02-28 22:59:36.760 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 22:59:36.760 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'This completes the formal problem setup used by the contract-based integration, stability analysis, '...
-2026-02-28 22:59:36.760 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 9619
-2026-02-28 22:59:36.761 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_002)...
-2026-02-28 22:59:52.961 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 22:59:52.976 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=179, new_string_len=12190
-2026-02-28 22:59:52.976 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 12190 chars (conclusion boundary preserved)
-2026-02-28 22:59:52.985 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 67, 2963 words)
-2026-02-28 22:59:53.194 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 22:59:53.194 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 66 total chunks
-2026-02-28 22:59:54.027 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 22:59:54.027 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 22:59:54.027 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 22:59:54.027 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (2963 words)
-2026-02-28 22:59:54.027 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 22:59:54.027 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 22:59:54.027 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16539 chars, paper=22167 chars
-2026-02-28 22:59:54.027 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 22167 chars → 22094 chars (markers removed)
-2026-02-28 22:59:54.027 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 22:59:54.027 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:01:01.325 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 67.30s (coverage=0.92, tokens=7195)
-2026-02-28 23:01:01.325 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 62911 chars retrieved
-2026-02-28 23:01:01.325 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:01:01.325 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 114700 chars
-2026-02-28 23:01:01.342 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_003)...
-2026-02-28 23:02:21.906 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 17909 chars
-2026-02-28 23:02:21.907 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:02:21.923 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:02:21.923 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 0d98df8b-6b1a-4a4b-803f-e513f04f8564 (section_complete=False)
-2026-02-28 23:02:21.924 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 0d98df8b-6b1a-4a4b-803f-e513f04f8564
-2026-02-28 23:02:21.924 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 16428 -> 16425 chars, new_string: 16428 -> 16425 chars)
-2026-02-28 23:02:21.924 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:02:21.924 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The remaining sections build on this spine: stability/well-posedness conditions (Section IV) and ver'...
-2026-02-28 23:02:21.924 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 21609
-2026-02-28 23:02:21.940 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_003)...
-2026-02-28 23:02:32.457 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:02:32.457 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=381, new_string_len=16425
-2026-02-28 23:02:32.457 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 16425 chars (conclusion boundary preserved)
-2026-02-28 23:02:32.473 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 68, 5172 words)
-2026-02-28 23:02:32.695 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:02:32.706 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 115 total chunks
-2026-02-28 23:02:34.124 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:02:34.124 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:02:34.124 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:02:34.140 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (5172 words)
-2026-02-28 23:02:34.140 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 23:02:34.140 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:02:34.140 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16539 chars, paper=38594 chars
-2026-02-28 23:02:34.140 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 38594 chars → 38521 chars (markers removed)
-2026-02-28 23:02:34.140 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:02:34.140 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:03:39.988 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 65.85s (coverage=0.92, tokens=7269)
-2026-02-28 23:03:39.988 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 62983 chars retrieved
-2026-02-28 23:03:39.988 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:03:39.988 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 131199 chars
-2026-02-28 23:03:40.005 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_004)...
-2026-02-28 23:04:37.954 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13001 chars
-2026-02-28 23:04:37.954 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:04:37.971 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:04:37.971 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: f95ad310-164b-40af-b2cb-0b69853f35ef (section_complete=False)
-2026-02-28 23:04:37.987 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: f95ad310-164b-40af-b2cb-0b69853f35ef
-2026-02-28 23:04:37.987 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11745 -> 11743 chars, new_string: 11745 -> 11743 chars)
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'With these caveats, Section IV provides a contract-compatible systems-theory layer: it ties together'...
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=368 | first20='With these caveats, ' | last20='zation (Section X).\n'
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=38594 | double_spaces=51 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'With these caveats, Section IV provides a contract-compatible systems-theory layer: it ties together physically meaningful interface constraints (Section III) with execution-level stability checks and'
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'ution-level stability checks and explicit error-amplification bounds that are later consumed by verified numerics (Section V), UQ/certification layers (Sections VI–VII), and optimization (Section X).\n'
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'timization (Section X).\n\n[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 38045
-2026-02-28 23:04:38.004 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'With these caveats, Section IV provides a contract-compatible systems-theory layer: it ties together'
-2026-02-28 23:04:38.021 - backend.compiler.validation.compiler_validator - WARNING - CONSECUTIVE_MATCH_FALLBACK: Exact match failed but found unique consecutive match (consecutive=88.6%) at position 38050
-2026-02-28 23:04:38.021 - backend.compiler.validation.compiler_validator - WARNING -   Model provided: 'With these caveats, Section IV provides a contract-compatible systems-theory layer: it ties together'...
-2026-02-28 23:04:38.021 - backend.compiler.validation.compiler_validator - WARNING -   Document actual: 'these caveats, Section IV provides a contract-compatible systems-theory layer: it ties together phys'...
-2026-02-28 23:04:38.021 - backend.compiler.validation.compiler_validator - WARNING -   Using consecutive match to proceed. This indicates a model escaping quirk.
-2026-02-28 23:04:38.021 - backend.compiler.validation.compiler_validator - INFO - Consecutive fuzzy match correction applied - updating old_string to actual document text
-2026-02-28 23:04:38.021 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 38050
-2026-02-28 23:04:38.037 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_004)...
-2026-02-28 23:04:46.487 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:04:46.487 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=367, new_string_len=11743
-2026-02-28 23:04:46.487 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 11743 chars (conclusion boundary preserved)
-2026-02-28 23:04:46.507 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 69, 6776 words)
-2026-02-28 23:04:46.737 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:04:46.754 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 153 total chunks
-2026-02-28 23:04:48.654 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:04:48.654 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:04:48.654 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:04:48.671 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (6776 words)
-2026-02-28 23:04:48.671 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 23:04:48.671 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:04:48.674 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16539 chars, paper=50339 chars
-2026-02-28 23:04:48.674 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 50339 chars → 50266 chars (markers removed)
-2026-02-28 23:04:48.675 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:04:48.675 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:05:59.402 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 70.73s (coverage=0.94, tokens=7290)
-2026-02-28 23:05:59.402 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 63951 chars retrieved
-2026-02-28 23:05:59.402 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:05:59.402 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 143912 chars
-2026-02-28 23:05:59.419 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_005)...
-2026-02-28 23:07:19.250 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 17403 chars
-2026-02-28 23:07:19.250 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:07:19.267 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:07:19.267 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 1f408fe0-354a-4db7-bfa3-d13d4dc47f0f (section_complete=False)
-2026-02-28 23:07:19.283 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 1f408fe0-354a-4db7-bfa3-d13d4dc47f0f
-2026-02-28 23:07:19.283 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 15741 -> 15739 chars, new_string: 15741 -> 15739 chars)
-2026-02-28 23:07:19.284 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:07:19.284 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'This verified-numerics layer is intentionally orthogonal to any particular physics module: it only r'...
-2026-02-28 23:07:19.284 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 49794
-2026-02-28 23:07:19.300 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_005)...
-2026-02-28 23:07:35.433 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:07:35.449 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=368, new_string_len=15739
-2026-02-28 23:07:35.449 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 15739 chars (conclusion boundary preserved)
-2026-02-28 23:07:35.466 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 70, 8739 words)
-2026-02-28 23:07:35.717 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:07:35.733 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 201 total chunks
-2026-02-28 23:07:38.283 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:07:38.283 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:07:38.283 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:07:38.283 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (8739 words)
-2026-02-28 23:07:38.283 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
-2026-02-28 23:07:38.283 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:07:38.283 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16539 chars, paper=66080 chars
-2026-02-28 23:07:38.283 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 66080 chars → 66007 chars (markers removed)
-2026-02-28 23:07:38.283 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:07:38.283 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=159
-2026-02-28 23:08:36.249 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 57.97s (coverage=0.72, tokens=6882)
-2026-02-28 23:08:36.249 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 61333 chars retrieved
-2026-02-28 23:08:36.249 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
-2026-02-28 23:08:36.249 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 156488 chars
-2026-02-28 23:08:36.265 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_006)...
-2026-02-28 23:09:05.182 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 3453 chars
-2026-02-28 23:09:05.182 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:09:05.182 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:09:05.182 - backend.compiler.agents.high_context_submitter - INFO - Outline update submission generated: 3336064f-222e-42ce-87dd-8ebc8fdcaa8a
-2026-02-28 23:09:05.198 - backend.compiler.validation.compiler_validator - INFO - Validating outline_update submission: 3336064f-222e-42ce-87dd-8ebc8fdcaa8a
-2026-02-28 23:09:05.198 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 0 -> 0 chars, new_string: 1571 -> 1569 chars)
-2026-02-28 23:09:05.215 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_update, operation=insert_after
-2026-02-28 23:09:05.215 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'XII. Implementation Workflow and Auditability Requirements\n   A. Data/metadata requirements for cont'...
-2026-02-28 23:09:05.215 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 15025
-2026-02-28 23:09:05.215 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_006)...
-2026-02-28 23:09:18.364 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:09:18.364 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit_to_outline: operation=insert_after, mode=outline_update
-2026-02-28 23:09:18.364 - backend.compiler.core.compiler_coordinator - INFO - Outline insert after: inserted 1569 chars
-2026-02-28 23:09:18.364 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 18)
-2026-02-28 23:09:18.613 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-02-28 23:09:18.614 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 47 total chunks
-2026-02-28 23:09:19.314 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-02-28 23:09:19.314 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-02-28 23:09:19.314 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_update)
-2026-02-28 23:09:19.314 - backend.compiler.core.compiler_coordinator - INFO - Outline update accepted
-2026-02-28 23:09:19.314 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-02-28 23:09:19.314 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:09:19.314 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18108 chars, paper=66080 chars
-2026-02-28 23:09:19.314 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 66080 chars → 66007 chars (markers removed)
-2026-02-28 23:09:19.314 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-02-28 23:09:19.314 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 92765 chars
-2026-02-28 23:09:19.331 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_007)...
-2026-02-28 23:10:21.863 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 10819 chars
-2026-02-28 23:10:21.863 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:10:21.863 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:10:21.863 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: df319e73-2060-449d-89c6-54530c7f6b2d (miniscule=False)
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: df319e73-2060-449d-89c6-54530c7f6b2d
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 4896 -> 4895 chars, new_string: 4896 -> 4895 chars)
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'V.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\['...
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=4899 | double_spaces=8 | first20='V.B.1. Interval vect' | last20='aints at (d,y,\\xi).\n'
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=66080 | double_spaces=84 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\\\underline x,\\overline x] := \\{x\\in\\mathbb{R}^n : \\\\\\underline x_i \\le x_i \\le \\overline x'
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'herwise, constraint status is UNKNOWN; one may refine X or tighten the constraint evaluation.\n\nThis produces a solver-independent feasibility statement for the coupled plant constraints at (d,y,\\xi).\n'
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'nd safety certificates.\n\n[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 40733
-2026-02-28 23:10:21.880 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'V.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\['
-2026-02-28 23:10:27.296 - backend.compiler.validation.compiler_validator - WARNING - CONSECUTIVE_MATCH_FALLBACK: Exact match failed but found unique consecutive match (consecutive=87.7%) at position 40724
-2026-02-28 23:10:27.296 - backend.compiler.validation.compiler_validator - WARNING -   Model provided: 'V.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\['...
-2026-02-28 23:10:27.296 - backend.compiler.validation.compiler_validator - WARNING -   Document actual: 'ibility\n\nV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is w'...
-2026-02-28 23:10:27.296 - backend.compiler.validation.compiler_validator - WARNING -   Using consecutive match to proceed. This indicates a model escaping quirk.
-2026-02-28 23:10:27.296 - backend.compiler.validation.compiler_validator - INFO - Consecutive fuzzy match correction applied - updating old_string to actual document text
-2026-02-28 23:10:27.296 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 40724
-2026-02-28 23:10:27.313 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_007)...
-2026-02-28 23:10:35.529 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:10:35.529 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=4898, new_string_len=4895
-2026-02-28 23:10:35.529 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 4898 chars with 4895 chars
-2026-02-28 23:10:35.545 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 71, 8740 words)
-2026-02-28 23:10:35.746 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:10:35.763 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 201 total chunks
-2026-02-28 23:10:38.229 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:10:38.229 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:10:38.229 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: review)
-2026-02-28 23:10:38.229 - backend.compiler.core.compiler_coordinator - INFO - Review edit accepted (8740 words)
-2026-02-28 23:10:38.229 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-02-28 23:10:38.229 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:10:38.242 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18108 chars, paper=66077 chars
-2026-02-28 23:10:38.242 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 66077 chars → 66004 chars (markers removed)
-2026-02-28 23:10:38.242 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-02-28 23:10:38.242 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 92762 chars
-2026-02-28 23:10:38.246 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_008)...
-2026-02-28 23:11:00.712 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1791 chars
-2026-02-28 23:11:00.712 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:11:00.712 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:11:00.712 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 7cfc8e2c-3b39-4f64-b602-8f0f5befb504 (miniscule=False)
-2026-02-28 23:11:00.712 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 7cfc8e2c-3b39-4f64-b602-8f0f5befb504
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'...
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=604 | double_spaces=2 | first20='V.B. Interval prelim' | last20='aranteed enclosures.'
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=66077 | double_spaces=84 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\\\underline x,\\overline x] := \\{x\\in\\mathbb{'
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'uch that\n\\[\n  \\varphi(X) := \\{\\varphi(x): x\\in X\\} \\subseteq [\\varphi](X).\n\\]\nIn practice, \\([\\varphi](X)\\) is computed by interval arithmetic (with outward rounding) and yields guaranteed enclosures.'
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'nd safety certificates.\n\n[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 40677
-2026-02-28 23:11:00.729 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=604 | double_spaces=2 | first20='V.B. Interval prelim' | last20='aranteed enclosures.'
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=18108 | double_spaces=427 | first20='Abstract\n\nI. Introdu' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\\\underline x,\\overline x] := \\{x\\in\\mathbb{'
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'uch that\n\\[\n  \\varphi(X) := \\{\\varphi(x): x\\in X\\} \\subseteq [\\varphi](X).\n\\]\nIn practice, \\([\\varphi](X)\\) is computed by interval arithmetic (with outward rounding) and yields guaranteed enclosures.'
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): 'Abstract\n\nI. Introduction\n   A. Motivation: compact Q>15 stellarator digital twin as a system-of-systems under cost (<$5B) and schedule (<=2030) constraints\n   B. Integration problem statement: coupli'
-2026-02-28 23:11:00.798 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'ms can be treated as engineering evidence\n\n[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]\n[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:11:00.811 - backend.compiler.validation.compiler_validator - WARNING -    NO_MATCH_FOUND: Text does not exist in document, even with whitespace/line-ending normalization
-2026-02-28 23:11:00.811 - backend.compiler.validation.compiler_validator - WARNING -    This suggests the model is referencing text that was never written or was from a different document version
-2026-02-28 23:11:00.811 - backend.compiler.validation.compiler_validator - WARNING -    Common causes: (1) Model hallucinated content, (2) Model referenced outline text instead of paper text, (3) Content was removed in prior edit
-2026-02-28 23:11:00.811 - backend.compiler.validation.compiler_validator - WARNING - Pre-validation failed: old_string not found in document
-2026-02-28 23:11:00.811 - backend.compiler.validation.compiler_validator - INFO - Pre-validation rejected: old_string not found in document (pre-validation)
-2026-02-28 23:11:00.812 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-02-28 23:11:00.812 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-02-28 23:11:00.812 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-02-28 23:11:00.812 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
-2026-02-28 23:11:00.812 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-02-28 23:11:00.812 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-02-28 23:11:00.812 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=18108 chars, paper=66077 chars
-2026-02-28 23:11:00.812 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-02-28 23:11:00.812 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1160
-2026-02-28 23:12:15.844 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 75.03s (coverage=0.97, tokens=7417)
-2026-02-28 23:12:15.844 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 65196 chars
-2026-02-28 23:12:15.844 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-02-28 23:12:15.844 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_000)...
-2026-02-28 23:15:26.772 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1018 chars
-2026-02-28 23:15:26.773 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-02-28 23:15:26.773 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=standard_enhancement, target_section_len=287
-2026-02-28 23:15:26.773 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: standard_enhancement execution...
-2026-02-28 23:15:26.773 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-02-28 23:15:26.788 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1160
-2026-02-28 23:16:41.771 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 74.98s (coverage=0.97, tokens=7417)
-2026-02-28 23:16:41.787 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-02-28 23:16:41.787 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_001)...
-2026-02-28 23:19:19.584 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 2453 chars
-2026-02-28 23:19:19.584 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Rigor enhancement submission generated - 71caedd5-22d1-4ff4-9ca0-9d1b99991a6f
-2026-02-28 23:19:19.601 - backend.compiler.validation.compiler_validator - INFO - Validating rigor submission: 71caedd5-22d1-4ff4-9ca0-9d1b99991a6f
-2026-02-28 23:19:19.601 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 692 -> 690 chars, new_string: 692 -> 690 chars)
-2026-02-28 23:19:19.601 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=rigor, operation=insert_after
-2026-02-28 23:19:19.601 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Let \\(g_j(\\xi)\\) denote the true (expensive) constraint function evaluation produced by the coupled '...
-2026-02-28 23:19:19.601 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 52596
-2026-02-28 23:19:19.618 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_008)...
-2026-02-28 23:19:25.917 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:19:25.917 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=220, new_string_len=690
-2026-02-28 23:19:25.917 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 690 chars (conclusion boundary preserved)
-2026-02-28 23:19:25.934 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 72, 8836 words)
-2026-02-28 23:19:26.218 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:19:26.234 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 204 total chunks
-2026-02-28 23:19:28.651 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:19:28.651 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:19:28.667 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: rigor)
-2026-02-28 23:19:28.667 - backend.compiler.core.compiler_coordinator - INFO - Rigor enhancement accepted (8836 words)
-2026-02-28 23:19:28.671 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-02-28 23:19:28.671 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-02-28 23:19:28.671 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=18108 chars, paper=66770 chars
-2026-02-28 23:19:28.671 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-02-28 23:19:28.671 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1160
-2026-02-28 23:20:43.549 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 74.88s (coverage=0.97, tokens=7332)
-2026-02-28 23:20:43.549 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 64566 chars
-2026-02-28 23:20:43.549 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-02-28 23:20:43.566 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_002)...
-2026-02-28 23:24:44.977 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1214 chars
-2026-02-28 23:24:44.977 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-02-28 23:24:44.977 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=standard_enhancement, target_section_len=368
-2026-02-28 23:24:44.977 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: standard_enhancement execution...
-2026-02-28 23:24:44.994 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-02-28 23:24:44.994 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1160
-2026-02-28 23:25:59.936 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 74.94s (coverage=0.97, tokens=7332)
-2026-02-28 23:25:59.937 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-02-28 23:25:59.949 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_003)...
-2026-02-28 23:27:31.123 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 925 chars
-2026-02-28 23:27:31.123 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM refused (Step 1 made mistake)
-2026-02-28 23:27:31.123 - backend.compiler.core.compiler_coordinator - INFO - No rigor enhancement needed
-2026-02-28 23:27:31.123 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: rigor)
-2026-02-28 23:27:31.123 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (first rejection)
-2026-02-28 23:27:31.123 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
-2026-02-28 23:27:31.123 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-02-28 23:27:31.123 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 23:27:31.123 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:27:31.140 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18108 chars, paper=66770 chars
-2026-02-28 23:27:31.140 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 66770 chars → 66697 chars (markers removed)
-2026-02-28 23:27:31.140 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:27:31.140 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:28:43.388 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 72.25s (coverage=0.94, tokens=7199)
-2026-02-28 23:28:43.388 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 63918 chars retrieved
-2026-02-28 23:28:43.388 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:28:43.388 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 163766 chars
-2026-02-28 23:28:43.422 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_009)...
-2026-02-28 23:30:20.608 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 18109 chars
-2026-02-28 23:30:20.609 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:30:20.620 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:30:20.620 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: bbce9c0b-530e-4293-b2ad-80ed64285256 (section_complete=False)
-2026-02-28 23:30:20.636 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: bbce9c0b-530e-4293-b2ad-80ed64285256
-2026-02-28 23:30:20.636 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 16432 -> 16430 chars, new_string: 16432 -> 16430 chars)
-2026-02-28 23:30:20.654 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:30:20.654 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'With these interfaces, Section VI supplies the computational machinery used later in Section VII (pr'...
-2026-02-28 23:30:20.654 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 66265
-2026-02-28 23:30:20.670 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_009)...
-2026-02-28 23:30:28.904 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:30:28.904 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=328, new_string_len=16430
-2026-02-28 23:30:28.905 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 16430 chars (conclusion boundary preserved)
-2026-02-28 23:30:28.922 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 73, 10895 words)
-2026-02-28 23:30:29.303 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:30:29.320 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 257 total chunks
-2026-02-28 23:30:32.421 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:30:32.421 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:30:32.421 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:30:32.435 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (10895 words)
-2026-02-28 23:30:32.435 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 23:30:32.436 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:30:32.436 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18108 chars, paper=83202 chars
-2026-02-28 23:30:32.436 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 83202 chars → 83129 chars (markers removed)
-2026-02-28 23:30:32.436 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:30:32.436 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:31:43.250 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 70.81s (coverage=0.87, tokens=6955)
-2026-02-28 23:31:43.250 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 62121 chars retrieved
-2026-02-28 23:31:43.250 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:31:43.266 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 178401 chars
-2026-02-28 23:31:43.284 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_010)...
-2026-02-28 23:33:21.880 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 19385 chars
-2026-02-28 23:33:21.880 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:33:21.897 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:33:21.898 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 3e01629e-ca55-432b-b446-38237b7dccf0 (section_complete=False)
-2026-02-28 23:33:21.902 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 3e01629e-ca55-432b-b446-38237b7dccf0
-2026-02-28 23:33:21.902 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 17557 -> 17555 chars, new_string: 17557 -> 17555 chars)
-2026-02-28 23:33:21.907 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:33:21.907 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'These rules ensure that probability lower bounds remain conservative at the expense of potentially l'...
-2026-02-28 23:33:21.907 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 82507
-2026-02-28 23:33:21.926 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_010)...
-2026-02-28 23:33:42.831 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:33:42.831 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=518, new_string_len=17555
-2026-02-28 23:33:42.831 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 17555 chars (conclusion boundary preserved)
-2026-02-28 23:33:42.848 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 74, 13144 words)
-2026-02-28 23:33:43.164 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:33:43.181 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 310 total chunks
-2026-02-28 23:33:46.969 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:33:46.969 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:33:46.981 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:33:46.981 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (13144 words)
-2026-02-28 23:33:46.981 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 23:33:46.981 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:33:47.006 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18108 chars, paper=100759 chars
-2026-02-28 23:33:47.006 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 100759 chars → 100686 chars (markers removed)
-2026-02-28 23:33:47.006 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:33:47.006 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:34:52.399 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 65.39s (coverage=0.92, tokens=6868)
-2026-02-28 23:34:52.399 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 60900 chars retrieved
-2026-02-28 23:34:52.399 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:34:52.399 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 194737 chars
-2026-02-28 23:34:52.429 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_011)...
-2026-02-28 23:36:03.113 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 15901 chars
-2026-02-28 23:36:03.113 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:36:03.129 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:36:03.129 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 6e1e7f93-83fd-44f8-90f6-ee90ac06bcd9 (section_complete=False)
-2026-02-28 23:36:03.146 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 6e1e7f93-83fd-44f8-90f6-ee90ac06bcd9
-2026-02-28 23:36:03.146 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 14439 -> 14437 chars, new_string: 14439 -> 14437 chars)
-2026-02-28 23:36:03.146 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:36:03.146 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The next sections build on this RAMI layer: Section IX discusses component-level physics and risk mo'...
-2026-02-28 23:36:03.146 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 100300
-2026-02-28 23:36:03.179 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_011)...
-2026-02-28 23:36:14.981 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:36:14.981 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=282, new_string_len=14437
-2026-02-28 23:36:14.981 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 14437 chars (conclusion boundary preserved)
-2026-02-28 23:36:14.998 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 75, 14923 words)
-2026-02-28 23:36:15.448 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:36:15.481 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 354 total chunks
-2026-02-28 23:36:19.698 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:36:19.698 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:36:19.698 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:36:19.698 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (14923 words)
-2026-02-28 23:36:19.698 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 23:36:19.698 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:36:19.698 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18108 chars, paper=115198 chars
-2026-02-28 23:36:19.698 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 115198 chars → 115125 chars (markers removed)
-2026-02-28 23:36:19.698 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:36:19.698 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:37:29.894 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 70.20s (coverage=0.82, tokens=6846)
-2026-02-28 23:37:29.895 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 61028 chars retrieved
-2026-02-28 23:37:29.895 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:37:29.895 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 209304 chars
-2026-02-28 23:37:29.924 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_012)...
-2026-02-28 23:38:37.016 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 16236 chars
-2026-02-28 23:38:37.016 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:38:37.016 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:38:37.031 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 99d4b6d5-8de4-4a2a-816f-6d118908bb56 (section_complete=False)
-2026-02-28 23:38:37.033 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 99d4b6d5-8de4-4a2a-816f-6d118908bb56
-2026-02-28 23:38:37.033 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 14931 -> 14929 chars, new_string: 14931 -> 14929 chars)
-2026-02-28 23:38:37.033 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:38:37.033 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The next section (Section X) shows how these contract-consumable outputs are assembled into a unifie'...
-2026-02-28 23:38:37.033 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 114696
-2026-02-28 23:38:37.066 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_012)...
-2026-02-28 23:38:46.662 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:38:46.662 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=325, new_string_len=14929
-2026-02-28 23:38:46.662 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 14929 chars (conclusion boundary preserved)
-2026-02-28 23:38:46.667 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 76, 16836 words)
-2026-02-28 23:38:46.934 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:38:46.967 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 402 total chunks
-2026-02-28 23:38:51.985 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:38:51.985 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:38:52.001 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:38:52.001 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (16836 words)
-2026-02-28 23:38:52.001 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
-2026-02-28 23:38:52.001 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:38:52.001 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18108 chars, paper=130129 chars
-2026-02-28 23:38:52.001 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 130129 chars → 130056 chars (markers removed)
-2026-02-28 23:38:52.001 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:38:52.001 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=159
-2026-02-28 23:39:58.526 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 66.53s (coverage=0.78, tokens=6663)
-2026-02-28 23:39:58.526 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 59722 chars retrieved
-2026-02-28 23:39:58.526 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
-2026-02-28 23:39:58.526 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 222358 chars
-2026-02-28 23:39:58.560 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_013)...
-2026-02-28 23:40:37.548 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 2201 chars
-2026-02-28 23:40:37.548 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:40:37.548 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:40:37.548 - backend.compiler.agents.high_context_submitter - INFO - Outline update submission generated: b32e10ee-2094-49cf-b2d4-7510658362b1
-2026-02-28 23:40:37.548 - backend.compiler.validation.compiler_validator - INFO - Validating outline_update submission: b32e10ee-2094-49cf-b2d4-7510658362b1
-2026-02-28 23:40:37.548 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 0 -> 0 chars, new_string: 1032 -> 1028 chars)
-2026-02-28 23:40:37.565 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_update, operation=insert_after
-2026-02-28 23:40:37.565 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '   E. Database test artifacts to include (as outline placeholders, not yet validated)\n      1. Multi'...
-2026-02-28 23:40:37.566 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 6035
-2026-02-28 23:40:37.582 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_013)...
-2026-02-28 23:40:51.283 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:40:51.283 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit_to_outline: operation=insert_after, mode=outline_update
-2026-02-28 23:40:51.283 - backend.compiler.core.compiler_coordinator - INFO - Outline insert after: inserted 1028 chars
-2026-02-28 23:40:51.300 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 19)
-2026-02-28 23:40:51.517 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-02-28 23:40:51.517 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 50 total chunks
-2026-02-28 23:40:52.130 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-02-28 23:40:52.130 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-02-28 23:40:52.133 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_update)
-2026-02-28 23:40:52.133 - backend.compiler.core.compiler_coordinator - INFO - Outline update accepted
-2026-02-28 23:40:52.133 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-02-28 23:40:52.133 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:40:52.133 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=19136 chars, paper=130129 chars
-2026-02-28 23:40:52.133 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 130129 chars → 130056 chars (markers removed)
-2026-02-28 23:40:52.133 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-02-28 23:40:52.133 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 159705 chars
-2026-02-28 23:40:52.151 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_014)...
-2026-02-28 23:41:22.571 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 2137 chars
-2026-02-28 23:41:22.571 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:41:22.571 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:41:22.571 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 8da8a02a-0a20-41b4-b37a-078ea58a316c (miniscule=False)
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 8da8a02a-0a20-41b4-b37a-078ea58a316c
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'...
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=604 | double_spaces=2 | first20='V.B. Interval prelim' | last20='aranteed enclosures.'
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=130129 | double_spaces=175 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\\\underline x,\\overline x] := \\{x\\in\\mathbb{'
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'uch that\n\\[\n  \\varphi(X) := \\{\\varphi(x): x\\in X\\} \\subseteq [\\varphi](X).\n\\]\nIn practice, \\([\\varphi](X)\\) is computed by interval arithmetic (with outward rounding) and yields guaranteed enclosures.'
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-02-28 23:41:22.587 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'e feasibility and cost.\n\n[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:41:22.604 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 40677
-2026-02-28 23:41:22.604 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=604 | double_spaces=2 | first20='V.B. Interval prelim' | last20='aranteed enclosures.'
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=19136 | double_spaces=446 | first20='Abstract\n\nI. Introdu' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\\\underline x,\\overline x] := \\{x\\in\\mathbb{'
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'uch that\n\\[\n  \\varphi(X) := \\{\\varphi(x): x\\in X\\} \\subseteq [\\varphi](X).\n\\]\nIn practice, \\([\\varphi](X)\\) is computed by interval arithmetic (with outward rounding) and yields guaranteed enclosures.'
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): 'Abstract\n\nI. Introduction\n   A. Motivation: compact Q>15 stellarator digital twin as a system-of-systems under cost (<$5B) and schedule (<=2030) constraints\n   B. Integration problem statement: coupli'
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'ms can be treated as engineering evidence\n\n[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]\n[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    NO_MATCH_FOUND: Text does not exist in document, even with whitespace/line-ending normalization
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    This suggests the model is referencing text that was never written or was from a different document version
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING -    Common causes: (1) Model hallucinated content, (2) Model referenced outline text instead of paper text, (3) Content was removed in prior edit
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - WARNING - Pre-validation failed: old_string not found in document
-2026-02-28 23:41:22.671 - backend.compiler.validation.compiler_validator - INFO - Pre-validation rejected: old_string not found in document (pre-validation)
-2026-02-28 23:41:22.671 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-02-28 23:41:22.671 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-02-28 23:41:22.671 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-02-28 23:41:22.671 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:41:22.671 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=19136 chars, paper=130129 chars
-2026-02-28 23:41:22.671 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 130129 chars → 130056 chars (markers removed)
-2026-02-28 23:41:22.671 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-02-28 23:41:22.671 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 161484 chars
-2026-02-28 23:41:22.704 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_015)...
-2026-02-28 23:41:48.707 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 2398 chars
-2026-02-28 23:41:48.707 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:41:48.724 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:41:48.724 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: df4b749a-5164-4736-9fdd-258d50c29fd1 (miniscule=False)
-2026-02-28 23:41:48.724 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: df4b749a-5164-4736-9fdd-258d50c29fd1
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'...
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=604 | double_spaces=2 | first20='V.B. Interval prelim' | last20='aranteed enclosures.'
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=130129 | double_spaces=175 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\\\underline x,\\overline x] := \\{x\\in\\mathbb{'
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'uch that\n\\[\n  \\varphi(X) := \\{\\varphi(x): x\\in X\\} \\subseteq [\\varphi](X).\n\\]\nIn practice, \\([\\varphi](X)\\) is computed by interval arithmetic (with outward rounding) and yields guaranteed enclosures.'
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'e feasibility and cost.\n\n[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 40677
-2026-02-28 23:41:48.741 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=604 | double_spaces=2 | first20='V.B. Interval prelim' | last20='aranteed enclosures.'
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=19136 | double_spaces=446 | first20='Abstract\n\nI. Introdu' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\\\underline x,\\overline x] := \\{x\\in\\mathbb{'
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'uch that\n\\[\n  \\varphi(X) := \\{\\varphi(x): x\\in X\\} \\subseteq [\\varphi](X).\n\\]\nIn practice, \\([\\varphi](X)\\) is computed by interval arithmetic (with outward rounding) and yields guaranteed enclosures.'
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): 'Abstract\n\nI. Introduction\n   A. Motivation: compact Q>15 stellarator digital twin as a system-of-systems under cost (<$5B) and schedule (<=2030) constraints\n   B. Integration problem statement: coupli'
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'ms can be treated as engineering evidence\n\n[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]\n[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    NO_MATCH_FOUND: Text does not exist in document, even with whitespace/line-ending normalization
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    This suggests the model is referencing text that was never written or was from a different document version
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING -    Common causes: (1) Model hallucinated content, (2) Model referenced outline text instead of paper text, (3) Content was removed in prior edit
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - WARNING - Pre-validation failed: old_string not found in document
-2026-02-28 23:41:48.824 - backend.compiler.validation.compiler_validator - INFO - Pre-validation rejected: old_string not found in document (pre-validation)
-2026-02-28 23:41:48.824 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-02-28 23:41:48.824 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-02-28 23:41:48.824 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-02-28 23:41:48.824 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
-2026-02-28 23:41:48.824 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-02-28 23:41:48.824 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-02-28 23:41:48.841 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=19136 chars, paper=130129 chars
-2026-02-28 23:41:48.841 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-02-28 23:41:48.841 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1160
-2026-02-28 23:43:00.333 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 71.49s (coverage=0.96, tokens=7051)
-2026-02-28 23:43:00.333 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 62516 chars
-2026-02-28 23:43:00.333 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-02-28 23:43:00.350 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_004)...
-2026-02-28 23:45:20.985 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1471 chars
-2026-02-28 23:45:21.001 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-02-28 23:45:21.001 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=rewrite_focus, target_section_len=483
-2026-02-28 23:45:21.001 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: rewrite_focus execution...
-2026-02-28 23:45:21.001 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-02-28 23:45:21.001 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1160
-2026-02-28 23:46:32.577 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 71.58s (coverage=0.96, tokens=7051)
-2026-02-28 23:46:32.577 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-02-28 23:46:32.594 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_005)...
-2026-02-28 23:50:36.925 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 4388 chars
-2026-02-28 23:50:36.942 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Rigor enhancement submission generated - 335e328c-fc31-420f-bcf9-4257ac019ec4
-2026-02-28 23:50:36.949 - backend.compiler.validation.compiler_validator - INFO - Validating rigor submission: 335e328c-fc31-420f-bcf9-4257ac019ec4
-2026-02-28 23:50:36.959 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=rigor, operation=replace
-2026-02-28 23:50:36.959 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'...
-2026-02-28 23:50:36.959 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:50:36.959 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=481 | double_spaces=1 | first20='V.B. Interval prelim' | last20='for all \\(x \\in X\\).'
-2026-02-28 23:50:36.960 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=130129 | double_spaces=175 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:50:36.962 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:50:36.963 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\underline x,\\overline x] := \\{x\\in\\mathbb{R'
-2026-02-28 23:50:36.963 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'xtension of a function \\(f: \\mathbb{R}^n \\to \\mathbb{R}^m\\) is an interval-valued function \\([f]: \\mathbb{I}\\mathbb{R}^n \\to \\mathbb{I}\\mathbb{R}^m\\) such that \\(f(x) \\in [f](X)\\) for all \\(x \\in X\\).'
-2026-02-28 23:50:36.963 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-02-28 23:50:36.963 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'e feasibility and cost.\n\n[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:50:36.965 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 40677
-2026-02-28 23:50:36.965 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn i'
-2026-02-28 23:50:36.966 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-02-28 23:50:36.966 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=481 | double_spaces=1 | first20='V.B. Interval prelim' | last20='for all \\(x \\in X\\).'
-2026-02-28 23:50:36.966 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=19136 | double_spaces=446 | first20='Abstract\n\nI. Introdu' | last20=' BE ABOVE THIS LINE]'
-2026-02-28 23:50:36.966 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-02-28 23:50:36.967 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'V.B. Interval preliminaries and contract compatV.B.1. Interval vectors and interval extensions\n\nAn interval (box) in \\(\\mathbb{R}^n\\) is written\n\\[\n  X = [\\\\underline x,\\overline x] := \\{x\\in\\mathbb{R'
-2026-02-28 23:50:36.967 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'xtension of a function \\(f: \\mathbb{R}^n \\to \\mathbb{R}^m\\) is an interval-valued function \\([f]: \\mathbb{I}\\mathbb{R}^n \\to \\mathbb{I}\\mathbb{R}^m\\) such that \\(f(x) \\in [f](X)\\) for all \\(x \\in X\\).'
-2026-02-28 23:50:36.967 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): 'Abstract\n\nI. Introduction\n   A. Motivation: compact Q>15 stellarator digital twin as a system-of-systems under cost (<$5B) and schedule (<=2030) constraints\n   B. Integration problem statement: coupli'
-2026-02-28 23:50:36.967 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'ms can be treated as engineering evidence\n\n[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]\n[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-02-28 23:50:36.967 - backend.compiler.validation.compiler_validator - WARNING -    NO_MATCH_FOUND: Text does not exist in document, even with whitespace/line-ending normalization
-2026-02-28 23:50:36.967 - backend.compiler.validation.compiler_validator - WARNING -    This suggests the model is referencing text that was never written or was from a different document version
-2026-02-28 23:50:36.968 - backend.compiler.validation.compiler_validator - WARNING -    Common causes: (1) Model hallucinated content, (2) Model referenced outline text instead of paper text, (3) Content was removed in prior edit
-2026-02-28 23:50:36.968 - backend.compiler.validation.compiler_validator - WARNING - Pre-validation failed: old_string not found in document
-2026-02-28 23:50:36.968 - backend.compiler.validation.compiler_validator - INFO - Pre-validation rejected: old_string not found in document (pre-validation)
-2026-02-28 23:50:36.974 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: rigor)
-2026-02-28 23:50:36.975 - backend.compiler.core.compiler_coordinator - INFO - Rigor enhancement rejected
-2026-02-28 23:50:36.975 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (first rejection)
-2026-02-28 23:50:36.975 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
-2026-02-28 23:50:36.976 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-02-28 23:50:36.976 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-02-28 23:50:36.976 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-02-28 23:50:36.981 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=19136 chars, paper=130129 chars
-2026-02-28 23:50:36.982 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 130129 chars → 130056 chars (markers removed)
-2026-02-28 23:50:36.982 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-02-28 23:50:36.982 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-02-28 23:51:47.951 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 70.97s (coverage=0.93, tokens=6889)
-2026-02-28 23:51:47.951 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 61017 chars retrieved
-2026-02-28 23:51:47.951 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-02-28 23:51:47.951 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 230588 chars
-2026-02-28 23:51:47.968 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_016)...
-2026-02-28 23:53:16.812 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 23428 chars
-2026-02-28 23:53:16.812 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-02-28 23:53:16.840 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-02-28 23:53:16.840 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 71275059-3af1-4ab3-bc75-8b4952fba0f9 (section_complete=True)
-2026-02-28 23:53:16.845 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 71275059-3af1-4ab3-bc75-8b4952fba0f9
-2026-02-28 23:53:16.845 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 21939 -> 21937 chars, new_string: 21939 -> 21937 chars)
-2026-02-28 23:53:16.845 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-02-28 23:53:16.845 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The next section (Section XI) uses these artifacts to plan 12–18 month V\\&V programs: selecting fals'...
-2026-02-28 23:53:16.845 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 129700
-2026-02-28 23:53:16.879 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_014)...
-2026-02-28 23:53:30.614 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-02-28 23:53:30.614 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=252, new_string_len=21937
-2026-02-28 23:53:30.614 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 21937 chars (conclusion boundary preserved)
-2026-02-28 23:53:30.643 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 77, 19599 words)
-2026-02-28 23:53:31.015 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-02-28 23:53:31.064 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 471 total chunks
-2026-02-28 23:53:36.750 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-02-28 23:53:36.750 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-02-28 23:53:36.750 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-02-28 23:53:36.750 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=body, paper_words=19599
-2026-02-28 23:53:36.750 - backend.compiler.core.compiler_coordinator - INFO - Body section complete - transitioning to CRITIQUE PHASE
-2026-02-28 23:53:36.750 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-02-28 23:53:36.762 - backend.compiler.core.compiler_coordinator - INFO - STARTING CRITIQUE PHASE
-2026-02-28 23:53:36.762 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-02-28 23:53:36.763 - backend.compiler.core.compiler_coordinator - INFO - Snapshot pre-critique paper: 152068 chars
-2026-02-28 23:53:36.763 - backend.compiler.memory.critique_memory - INFO - Initialized critique memory for paper_v1 at backend\data\critique_feedback_paper_v1.txt
-2026-02-28 23:53:36.763 - backend.compiler.memory.critique_memory - INFO - Cleared all critiques from critique memory
-2026-02-28 23:53:36.763 - backend.compiler.memory.critique_memory - INFO - Critique file is empty
-2026-02-28 23:53:36.763 - backend.compiler.core.compiler_coordinator - INFO - Critique memory initialized for paper_v1
-2026-02-28 23:53:36.763 - backend.compiler.agents.critique_submitter - INFO - Critique submitter initialized with model google/gemini-3.1-pro-preview
-2026-02-28 23:53:36.763 - backend.compiler.memory.critique_rejection_memory - INFO - Loaded 0 critique rejections
-2026-02-28 23:53:36.763 - backend.compiler.agents.critique_submitter - INFO - Critique submitter rejection memory initialized
-2026-02-28 23:53:36.763 - backend.compiler.memory.critique_rejection_memory - INFO - Reset critique rejection log
-2026-02-28 23:53:36.763 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique rejection feedback for fresh start
-2026-02-28 23:53:36.763 - backend.compiler.core.compiler_coordinator - INFO - Critique submitter created with model: google/gemini-3.1-pro-preview
-2026-02-28 23:53:36.763 - backend.shared.api_client_manager - INFO - Configured role 'compiler_critique_submitter': provider=openrouter, model=google/gemini-3.1-pro-preview via Google
-2026-02-28 23:53:36.763 - backend.shared.api_client_manager - INFO - Configured role 'critique_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-02-28 23:53:36.763 - backend.shared.api_client_manager - INFO - Configured role 'critique_cleanup': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-02-28 23:53:36.763 - backend.compiler.core.compiler_coordinator - INFO - Starting critique aggregation loop (target: 5 total attempts, accepted OR rejected)
-2026-02-28 23:53:36.763 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 0/5, accepted: 0, rejected: 0)
-2026-02-28 23:53:57.432 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #1
-2026-02-28 23:53:57.432 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: 0b3199f4-aca7-4a98-884f-a429ba5eefd4
-2026-02-28 23:54:10.033 - backend.compiler.memory.critique_memory - INFO - Added critique #1 to critique memory
-2026-02-28 23:54:10.033 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (1/5): 0b3199f4-aca7-4a98-884f-a429ba5eefd4
-2026-02-28 23:54:13.029 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 1/5, accepted: 1, rejected: 0)
-2026-02-28 23:55:42.591 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #2
-2026-02-28 23:55:42.591 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: b2bf6b38-e571-4ab4-bb29-2e7205c3c966
-2026-02-28 23:55:55.576 - backend.compiler.memory.critique_memory - INFO - Added critique #2 to critique memory
-2026-02-28 23:55:55.576 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (2/5): b2bf6b38-e571-4ab4-bb29-2e7205c3c966
-2026-02-28 23:55:58.576 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 2/5, accepted: 2, rejected: 0)
-2026-02-28 23:57:28.383 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #3
-2026-02-28 23:57:28.383 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: e412836f-d72b-4e7a-8807-aeab039ff4df
-2026-02-28 23:57:49.836 - backend.compiler.memory.critique_memory - INFO - Added critique #3 to critique memory
-2026-02-28 23:57:49.836 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (3/5): e412836f-d72b-4e7a-8807-aeab039ff4df
-2026-02-28 23:57:52.836 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 3/5, accepted: 3, rejected: 0)
-2026-02-28 23:59:35.768 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #4
-2026-02-28 23:59:35.768 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: 9fd82e24-edf2-4e61-b198-6f5d196d46dd
-2026-02-28 23:59:44.580 - backend.compiler.memory.critique_memory - INFO - Added critique #4 to critique memory
-2026-02-28 23:59:44.580 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (4/5): 9fd82e24-edf2-4e61-b198-6f5d196d46dd
-2026-02-28 23:59:47.581 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 4/5, accepted: 4, rejected: 0)
-2026-03-01 00:02:11.960 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #5
-2026-03-01 00:02:11.960 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: c552d9e2-3c19-4028-96a0-7965377da5b7
-2026-03-01 00:02:24.643 - backend.compiler.memory.critique_memory - INFO - Added critique #5 to critique memory
-2026-03-01 00:02:24.643 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (5/5): c552d9e2-3c19-4028-96a0-7965377da5b7
-2026-03-01 00:02:27.644 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete: 5 total attempts (5 accepted, 0 rejected)
-2026-03-01 00:02:27.644 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 00:02:27.644 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete (5 total attempts) - triggering rewrite decision (attempt 1)
-2026-03-01 00:02:27.644 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 00:02:27.644 - backend.compiler.core.compiler_coordinator - INFO - Critique submitter generating rewrite decision...
-2026-03-01 00:02:40.479 - backend.compiler.agents.critique_submitter - INFO - Rewrite decision generated: partial_revision
-2026-03-01 00:02:40.479 - backend.compiler.core.compiler_coordinator - INFO - Rewrite decision: partial_revision
-2026-03-01 00:02:40.479 - backend.compiler.core.compiler_coordinator - INFO - Validator reviewing rewrite decision...
-2026-03-01 00:02:40.479 - backend.compiler.validation.compiler_validator - INFO - Validating rewrite decision...
-2026-03-01 00:02:48.030 - backend.compiler.validation.compiler_validator - INFO - Rewrite decision VALIDATED: The decision to use PARTIAL_REVISION is justified. All five accepted critiques identify specific, localized issues: (1) missing subsections V.F/V.G, textual duplication in VI.A.3, and a heading format...
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - Rewrite decision validated - executing
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - Decision: PARTIAL REVISION (iterative targeted edits)
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - EXECUTING PARTIAL REVISION (ITERATIVE EDITS)
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - Partial revision initiated (pending successful completion, max: 1)
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - Paper title unchanged
-2026-03-01 00:02:48.030 - backend.compiler.core.compiler_coordinator - INFO - Starting iterative edit loop...
-2026-03-01 00:02:48.046 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 00:02:56.847 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 00:02:56.847 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified a malformed heading in Section V.B due to a merging error. Splitting it into ...
-2026-03-01 00:02:56.847 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 00:03:02.343 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit directly addresses the formatting error in Section V.B identified in Critique #1, where the heading is malformed as 'V.B. Interval preliminar...
-2026-03-01 00:03:02.343 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 00:03:02.348 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 00:03:09.763 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 00:03:09.764 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified a malformed heading in Section V.B due to a merging error. Splitting it into ...
-2026-03-01 00:03:09.764 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 00:03:14.715 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit directly addresses the formatting error in Section V.B identified in Critique #1, where the heading is malformed as 'V.B. Interval preliminar...
-2026-03-01 00:03:14.715 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 00:03:14.732 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 00:03:22.799 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 00:03:22.799 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified a malformed heading in Section V.B due to a merging error. Splitting it into ...
-2026-03-01 00:03:22.799 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 00:03:27.377 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit directly addresses the formatting error in Section V.B identified in Critique #1, where the heading is malformed as 'V.B. Interval preliminar...
-2026-03-01 00:03:27.377 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 00:03:27.377 - backend.compiler.core.compiler_coordinator - ERROR - Max consecutive failures (3) reached - stopping iterative loop
-2026-03-01 00:03:27.377 - backend.compiler.core.compiler_coordinator - INFO - Iterative edit loop complete: 0 successful, 3 failed
-2026-03-01 00:03:27.377 - backend.compiler.core.compiler_coordinator - INFO - Ending critique phase (rewrite=False)
-2026-03-01 00:03:27.377 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete - transitioning to CONCLUSION phase
-2026-03-01 00:03:27.384 - backend.compiler.core.compiler_coordinator - INFO - Title unchanged - continuing to conclusion
-2026-03-01 00:03:27.384 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 00:03:27.384 - backend.compiler.core.compiler_coordinator - INFO - PARTIAL REVISION COMPLETE - Continuing to CONCLUSION
-2026-03-01 00:03:27.384 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 00:03:27.384 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (19599 words)
-2026-03-01 00:03:27.384 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: body → conclusion
-2026-03-01 00:03:27.399 - backend.compiler.memory.paper_memory - INFO - Placeholders check: All sections either have placeholders or actual content
-2026-03-01 00:03:27.399 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=conclusion)
-2026-03-01 00:03:27.399 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:03:27.400 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=19136 chars, paper=152068 chars
-2026-03-01 00:03:27.400 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 152068 chars → 151995 chars (markers removed)
-2026-03-01 00:03:27.400 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:03:27.400 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-03-01 00:04:36.739 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 69.34s (coverage=0.92, tokens=6847)
-2026-03-01 00:04:36.740 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 61458 chars retrieved
-2026-03-01 00:04:36.740 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: conclusion...
-2026-03-01 00:04:36.741 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 252729 chars
-2026-03-01 00:04:36.773 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_017)...
-2026-03-01 00:05:05.642 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 8820 chars
-2026-03-01 00:05:05.642 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:05:05.657 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:05:05.657 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: b6420faa-6daa-4f93-af47-1121bdd8f125 (section_complete=True)
-2026-03-01 00:05:05.675 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: b6420faa-6daa-4f93-af47-1121bdd8f125
-2026-03-01 00:05:05.675 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 00:05:05.690 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLET'...
-2026-03-01 00:05:05.690 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 151893
-2026-03-01 00:05:05.708 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_019)...
-2026-03-01 00:05:18.042 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:05:18.059 - backend.compiler.memory.paper_memory - INFO - Placeholder replaced (version 78)
-2026-03-01 00:05:18.629 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:05:18.660 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 498 total chunks
-2026-03-01 00:05:24.528 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:05:24.528 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:05:24.528 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:05:24.543 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=conclusion, paper_words=20564
-2026-03-01 00:05:24.543 - backend.compiler.core.compiler_coordinator - INFO - Phase transition: conclusion → introduction (explicit section_complete)
-2026-03-01 00:05:24.543 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (20564 words)
-2026-03-01 00:05:24.560 - backend.compiler.memory.paper_memory - INFO - Placeholders check: All sections either have placeholders or actual content
-2026-03-01 00:05:24.560 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=introduction)
-2026-03-01 00:05:24.560 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:05:24.560 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=19136 chars, paper=160095 chars
-2026-03-01 00:05:24.560 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 160095 chars → 160022 chars (markers removed)
-2026-03-01 00:05:24.560 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:05:24.560 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-03-01 00:06:32.474 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 67.91s (coverage=0.92, tokens=6610)
-2026-03-01 00:06:32.476 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 58806 chars retrieved
-2026-03-01 00:06:32.476 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: introduction...
-2026-03-01 00:06:32.476 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 258607 chars
-2026-03-01 00:06:32.499 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_018)...
-2026-03-01 00:06:32.521 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: conclusion → introduction
-2026-03-01 00:06:57.385 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 8280 chars
-2026-03-01 00:06:57.385 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:06:57.385 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:06:57.385 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 6f35b7a1-5173-4973-a389-97ae2b7ba195 (section_complete=True)
-2026-03-01 00:06:57.402 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 6f35b7a1-5173-4973-a389-97ae2b7ba195
-2026-03-01 00:06:57.403 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 00:06:57.403 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS COM'...
-2026-03-01 00:06:57.403 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 102
-2026-03-01 00:06:57.435 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_020)...
-2026-03-01 00:07:04.385 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:07:04.401 - backend.compiler.memory.paper_memory - INFO - Placeholder replaced (version 79)
-2026-03-01 00:07:04.834 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:07:04.878 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 523 total chunks
-2026-03-01 00:07:11.336 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:07:11.336 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:07:11.353 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:07:11.370 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=introduction, paper_words=21464
-2026-03-01 00:07:11.386 - backend.compiler.core.compiler_coordinator - INFO - Phase transition: introduction → abstract (explicit section_complete)
-2026-03-01 00:07:11.386 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (21464 words)
-2026-03-01 00:07:11.386 - backend.compiler.memory.paper_memory - INFO - Placeholders check: All sections either have placeholders or actual content
-2026-03-01 00:07:11.386 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=abstract)
-2026-03-01 00:07:11.386 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:07:11.403 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=19136 chars, paper=167596 chars
-2026-03-01 00:07:11.403 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 167596 chars → 167523 chars (markers removed)
-2026-03-01 00:07:11.403 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:07:11.403 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=660
-2026-03-01 00:08:17.275 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 65.87s (coverage=0.92, tokens=6652)
-2026-03-01 00:08:17.275 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 59202 chars retrieved
-2026-03-01 00:08:17.275 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: abstract...
-2026-03-01 00:08:17.275 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 266147 chars
-2026-03-01 00:08:17.308 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_019)...
-2026-03-01 00:08:17.325 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: introduction → abstract
-2026-03-01 00:08:28.910 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 2633 chars
-2026-03-01 00:08:28.910 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:08:28.910 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:08:28.910 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 9de51ee9-1af5-4b48-9c9b-f1902a94d1c2 (section_complete=True)
-2026-03-01 00:08:28.925 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 9de51ee9-1af5-4b48-9c9b-f1902a94d1c2
-2026-03-01 00:08:28.926 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 00:08:28.926 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]'
-2026-03-01 00:08:28.926 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 0
-2026-03-01 00:08:28.962 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_021)...
-2026-03-01 00:08:36.744 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:08:36.761 - backend.compiler.memory.paper_memory - INFO - Placeholder replaced (version 80)
-2026-03-01 00:08:37.160 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:08:37.211 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 529 total chunks
-2026-03-01 00:08:38.347 - backend.autonomous.core.autonomous_coordinator - INFO - Abstract detected - paper compilation complete
-2026-03-01 00:08:38.347 - backend.compiler.core.compiler_coordinator - INFO - Stopping compiler...
-2026-03-01 00:08:38.351 - backend.compiler.core.compiler_coordinator - INFO - Compiler workflow cancelled
-2026-03-01 00:08:38.353 - backend.compiler.core.compiler_coordinator - INFO - Aggregator monitoring stopped
-2026-03-01 00:08:38.353 - backend.compiler.core.compiler_coordinator - INFO - Compiler stopped
-2026-03-01 00:08:38.363 - backend.autonomous.core.autonomous_coordinator - INFO - Paper paper_007: tracked 3 models, 105 API calls, 0 Wolfram calls
-2026-03-01 00:08:38.364 - backend.autonomous.core.autonomous_coordinator - INFO - Added author attribution and model credits to paper
-2026-03-01 00:08:38.370 - backend.autonomous.memory.paper_library - INFO - Paper saved: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_007.txt
-2026-03-01 00:08:38.373 - backend.autonomous.memory.paper_library - INFO - Outline saved: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_007_outline.txt
-2026-03-01 00:08:38.376 - backend.autonomous.memory.paper_library - INFO - Abstract saved: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_007_abstract.txt
-2026-03-01 00:08:38.380 - backend.autonomous.memory.paper_library - INFO - Saved paper paper_007: 'Contract-Based Digital-Twin Integration for a Compact Q>15 Stellarator: UQ, RAMI, and Cost-Constrained Optimization' (21873 words, 3 models tracked)
-2026-03-01 00:08:38.399 - backend.autonomous.core.autonomous_coordinator - INFO - Auto-generating critique for paper paper_007: Contract-Based Digital-Twin Integration for a Compact Q>15 Stellarator: UQ, RAMI, and Cost-Constrained Optimization
-2026-03-01 00:08:38.403 - backend.autonomous.core.autonomous_coordinator - INFO - Paper completed: paper_007 (21873 words)
-2026-03-01 00:08:38.403 - backend.autonomous.core.autonomous_coordinator - INFO - Running paper redundancy check
-2026-03-01 00:08:38.432 - backend.shared.api_client_manager - INFO - Configured role 'paper_critic': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 00:08:38.545 - backend.autonomous.validation.paper_redundancy_checker - INFO - PaperRedundancyChecker: Checking redundancy with model x-ai/grok-4.1-fast (task_id=auto_prc_001)
-2026-03-01 00:08:58.028 - backend.shared.critique_memory - INFO - Saved critique 3c5703e8-4bad-48ba-9541-4aa59d6b50d0 for autonomous_paper paper_id=paper_007 at backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_007_critiques.json
-2026-03-01 00:08:58.028 - backend.autonomous.core.autonomous_coordinator - INFO - Auto-critique saved for paper paper_007: avg=8.0 (N=7, C=9, I=8)
-2026-03-01 00:08:58.028 - backend.autonomous.core.autonomous_coordinator - INFO - High-score critique notification sent for paper paper_007 (avg=8.0)
-2026-03-01 00:09:12.763 - backend.autonomous.validation.paper_redundancy_checker - INFO - PaperRedundancyChecker: Recommending removal of paper_003
-2026-03-01 00:09:12.788 - backend.autonomous.memory.paper_library - INFO - Paper paper_003 archived successfully
-2026-03-01 00:09:12.795 - backend.autonomous.validation.paper_redundancy_checker - INFO - PaperRedundancyChecker: Successfully archived paper paper_003
-2026-03-01 00:09:12.797 - backend.autonomous.core.autonomous_coordinator - INFO - Paper complete, returning to topic selection
-2026-03-01 00:09:12.797 - backend.autonomous.core.autonomous_coordinator - INFO - Topic selection attempt 1/3
-2026-03-01 00:09:12.864 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generating topic selection with model openai/gpt-5.2 (prompt=4388t, task_id=auto_ts_121)
-2026-03-01 00:09:21.514 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generated submission - action=continue_existing
-2026-03-01 00:09:21.514 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Validating topic selection with model x-ai/grok-4.1-fast (prompt=4290t, task_id=auto_tv_004)
-2026-03-01 00:09:28.982 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Decision=accept
-2026-03-01 00:09:28.982 - backend.autonomous.core.autonomous_coordinator - INFO - Continuing brainstorm: topic_003
-2026-03-01 00:09:29.081 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Starting selection (max 6 papers, 6 available, 0 already selected)
-2026-03-01 00:09:29.098 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector: Requesting expansion with model openai/gpt-5.2 (prompt=22973t, task_id=auto_rs_012)
-2026-03-01 00:09:46.250 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Papers (232415 tokens) exceed budget (128000). Using RAG for relevant sections.
-2026-03-01 00:09:46.383 - backend.autonomous.core.autonomous_rag_manager - INFO - Reference papers: Using RAG (232415 tokens > 128000 max)
-2026-03-01 00:09:46.510 - backend.aggregator.ingestion.pipeline - INFO - Ingested reference_paper_paper_007: 2024 total chunks
-2026-03-01 00:10:13.458 - backend.aggregator.core.rag_manager - INFO - Added text: reference_paper_paper_007
-2026-03-01 00:10:13.568 - backend.aggregator.ingestion.pipeline - INFO - Ingested reference_paper_paper_006: 1717 total chunks
-2026-03-01 00:10:35.358 - backend.aggregator.core.rag_manager - INFO - Added text: reference_paper_paper_006
-2026-03-01 00:10:35.434 - backend.aggregator.ingestion.pipeline - INFO - Ingested reference_paper_paper_004: 1267 total chunks
-2026-03-01 00:10:51.824 - backend.aggregator.core.rag_manager - INFO - Added text: reference_paper_paper_004
-2026-03-01 00:10:51.937 - backend.aggregator.ingestion.pipeline - INFO - Ingested reference_paper_paper_001: 1824 total chunks
-2026-03-01 00:11:23.322 - backend.aggregator.core.rag_manager - INFO - Added text: reference_paper_paper_001
-2026-03-01 00:11:23.424 - backend.aggregator.ingestion.pipeline - INFO - Ingested reference_paper_paper_005: 1313 total chunks
-2026-03-01 00:11:41.128 - backend.aggregator.core.rag_manager - INFO - Added text: reference_paper_paper_005
-2026-03-01 00:11:41.259 - backend.aggregator.ingestion.pipeline - INFO - Ingested reference_paper_paper_002: 2053 total chunks
-2026-03-01 00:12:09.692 - backend.aggregator.core.rag_manager - INFO - Added text: reference_paper_paper_002
-2026-03-01 00:13:08.579 - backend.autonomous.core.autonomous_rag_manager - INFO - Reference papers RAG: Retrieved 105 evidence chunks
-2026-03-01 00:13:08.589 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Making final selection with model openai/gpt-5.2 (prompt=15574t, max=6 papers, task_id=auto_rs_013)
-2026-03-01 00:13:24.412 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Selected 6 reference papers
-2026-03-01 00:13:24.427 - backend.autonomous.core.autonomous_coordinator - INFO - Pre-brainstorm reference selection: selected 6 papers
-2026-03-01 00:13:24.427 - backend.autonomous.core.autonomous_coordinator - INFO - Selected 6 reference papers for brainstorm
-2026-03-01 00:13:24.429 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-03-01 00:13:24.429 - backend.autonomous.core.autonomous_coordinator - INFO - Per-paper model tracking enabled for brainstorm topic_003
-2026-03-01 00:13:24.446 - backend.aggregator.memory.shared_training - INFO - Reloaded 39 insights from backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\brainstorms\brainstorm_topic_003.txt (submission count: 39)
-2026-03-01 00:13:24.446 - backend.autonomous.core.autonomous_coordinator - INFO - Reloaded 39 existing submissions from brainstorm database
-2026-03-01 00:13:24.446 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_007.txt
-2026-03-01 00:13:24.446 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_001.txt
-2026-03-01 00:13:24.446 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_004.txt
-2026-03-01 00:13:24.446 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_006.txt
-2026-03-01 00:13:24.446 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_005.txt
-2026-03-01 00:13:24.446 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_002.txt
-2026-03-01 00:13:24.446 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
-2026-03-01 00:13:24.446 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 400000, Validator: 2000000
-2026-03-01 00:13:24.446 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 3 submitters with models ['openai/gpt-5.2', 'moonshotai/kimi-k2.5', 'x-ai/grok-4.1-fast'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
-2026-03-01 00:13:25.110 - backend.aggregator.core.coordinator - INFO - Currently loaded models: ['text-embedding-nomic-embed-text-v1.5']
-2026-03-01 00:13:25.111 - backend.aggregator.core.coordinator - INFO - Context window configuration:
-  - Submitter 1: 400000 tokens (model: openai/gpt-5.2)
-  - Submitter 2: 262000 tokens (model: moonshotai/kimi-k2.5)
-  - Submitter 3: 2000000 tokens (model: x-ai/grok-4.1-fast)
-  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
-2026-03-01 00:13:25.124 - backend.aggregator.memory.shared_training - INFO - Loaded 39 existing insights from shared training (submission count: 39)
-2026-03-01 00:13:25.124 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
-2026-03-01 00:13:25.139 - backend.aggregator.memory.event_log - INFO - Loaded 1740 events from event log
-2026-03-01 00:13:25.140 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 1
-2026-03-01 00:13:25.140 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model openai/gpt-5.2
-2026-03-01 00:13:25.140 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 00:13:25.140 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=openai/gpt-5.2, provider=openrouter, context=400000
-2026-03-01 00:13:25.140 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 2
-2026-03-01 00:13:25.145 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model moonshotai/kimi-k2.5
-2026-03-01 00:13:25.145 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=moonshotai/kimi-k2.5 via Groq
-2026-03-01 00:13:25.145 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=moonshotai/kimi-k2.5, provider=openrouter, context=262000
-2026-03-01 00:13:25.146 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 3
-2026-03-01 00:13:25.146 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model x-ai/grok-4.1-fast
-2026-03-01 00:13:25.146 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=x-ai/grok-4.1-fast via Google
-2026-03-01 00:13:25.146 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=x-ai/grok-4.1-fast, provider=openrouter, context=2000000
-2026-03-01 00:13:25.146 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
-2026-03-01 00:13:25.146 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 00:13:25.146 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
-2026-03-01 00:13:25.146 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 3 submitters
-2026-03-01 00:13:25.146 - backend.autonomous.core.autonomous_coordinator - INFO - Re-ingesting 39 existing submissions into RAG...
-2026-03-01 00:13:25.513 - backend.aggregator.ingestion.pipeline - INFO - Ingested brainstorm_topic_003.tmp: 2806 total chunks
-2026-03-01 00:14:05.065 - backend.aggregator.core.rag_manager - INFO - Added document: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\brainstorms\brainstorm_topic_003.tmp
-2026-03-01 00:14:05.065 - backend.autonomous.core.autonomous_coordinator - INFO - Successfully re-ingested 39 submissions into RAG
-2026-03-01 00:14:05.065 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
-2026-03-01 00:14:05.065 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
-2026-03-01 00:14:05.065 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
-2026-03-01 00:14:05.065 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
-2026-03-01 00:14:05.065 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
-2026-03-01 00:14:05.065 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
-2026-03-01 00:14:05.065 - backend.autonomous.core.autonomous_coordinator - INFO - Aggregator started for brainstorm topic_003
-2026-03-01 00:14:05.065 - backend.autonomous.core.autonomous_coordinator - INFO - Resuming brainstorm with 39 acceptances, 24 rejections from workflow state
-2026-03-01 00:14:05.065 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
-2026-03-01 00:14:05.165 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
-2026-03-01 00:14:05.252 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
-2026-03-01 00:14:05.353 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
-2026-03-01 00:14:05.353 - backend.aggregator.core.coordinator - INFO - Validator iteration 1 - batch validating 3 submissions: ['aec67092-4e54-413f-a588-de67d854cd29', 'a78ba4f2-e613-44be-a979-59d8a043c4fe', 'bef7a4a4-9c98-413b-a3f7-b0a408def904']
-2026-03-01 00:14:05.354 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 00:14:05.355 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 00:14:18.717 - backend.api.routes.autonomous - INFO - Manual override: Forcing paper writing for brainstorm topic_003
-2026-03-01 00:14:18.717 - backend.autonomous.core.autonomous_coordinator - INFO - MANUAL OVERRIDE: Forcing paper writing for brainstorm topic_003
-2026-03-01 00:14:18.717 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
-2026-03-01 00:14:18.717 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
-2026-03-01 00:14:18.733 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
-2026-03-01 00:14:18.733 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
-2026-03-01 00:14:18.733 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 1
-2026-03-01 00:14:18.733 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 1 iterations - is_running=False
-2026-03-01 00:14:18.733 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
-2026-03-01 00:14:18.733 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm aggregator stopped by manual override
-2026-03-01 00:14:19.057 - backend.autonomous.core.autonomous_coordinator - INFO - Manual override detected - transitioning to paper writing
-2026-03-01 00:14:19.058 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared shared_training_memory in-memory data (will reload from file when needed)
-2026-03-01 00:14:19.061 - backend.autonomous.core.autonomous_coordinator - INFO - Starting paper compilation for brainstorm topic_003
-2026-03-01 00:14:19.061 - backend.autonomous.core.autonomous_coordinator - INFO - Already have 6 reference papers (max 6), skipping additional selection
-2026-03-01 00:14:19.072 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Attempt 1
-2026-03-01 00:14:19.073 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Generating title with model openai/gpt-5.2 (task_id=auto_pt_008)
-2026-03-01 00:14:24.255 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Validating with model x-ai/grok-4.1-fast (task_id=auto_pt_009)
-2026-03-01 00:14:29.239 - backend.shared.json_parser - ERROR - parse_json: Expecting property name enclosed in double quotes: line 2 column 3 (char 4)
-2026-03-01 00:14:29.239 - backend.autonomous.agents.paper_title_selector - ERROR - PaperTitleSelector: Error validating title: Expecting property name enclosed in double quotes: line 2 column 3 (char 4)
-2026-03-01 00:14:29.239 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Title rejected (attempt 1): Validation error: Expecting property name enclosed in double quotes: line 2 column 3 (char 4)
-2026-03-01 00:14:31.249 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Attempt 2
-2026-03-01 00:14:31.251 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Generating title with model openai/gpt-5.2 (task_id=auto_pt_010)
-2026-03-01 00:14:36.295 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Validating with model x-ai/grok-4.1-fast (task_id=auto_pt_011)
-2026-03-01 00:14:41.191 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Title accepted: 'Certified 3D Neutron Transport for Stellarator Blankets: Adjoint Sensitivity and Multilevel Uncertainty Quantification'
-2026-03-01 00:14:41.211 - backend.autonomous.core.autonomous_coordinator - INFO - Compiling paper: Certified 3D Neutron Transport for Stellarator Blankets: Adjoint Sensitivity and Multilevel Uncertainty Quantification
-2026-03-01 00:14:41.211 - backend.autonomous.core.autonomous_coordinator - INFO - Clearing RAG for autonomous paper compilation...
-2026-03-01 00:14:41.211 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-03-01 00:14:42.442 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-03-01 00:14:43.923 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-03-01 00:14:44.569 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-03-01 00:14:45.101 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-03-01 00:14:45.264 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-03-01 00:14:45.323 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-03-01 00:14:45.361 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-03-01 00:14:45.404 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-03-01 00:14:45.537 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-03-01 00:14:45.537 - backend.autonomous.core.autonomous_coordinator - INFO - RAG cleared successfully
-2026-03-01 00:14:45.537 - backend.compiler.core.compiler_coordinator - INFO - Initializing compiler coordinator...
-2026-03-01 00:14:45.537 - backend.compiler.core.compiler_rag_manager - INFO - Resetting compiler RAG manager state...
-2026-03-01 00:14:45.537 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager state reset
-2026-03-01 00:14:45.537 - backend.compiler.core.compiler_rag_manager - INFO - Initializing compiler RAG manager...
-2026-03-01 00:14:45.537 - backend.compiler.core.compiler_rag_manager - INFO - Updating compiler context window from 131072 to 131072
-2026-03-01 00:14:45.537 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager initialized
-2026-03-01 00:14:45.537 - backend.compiler.core.compiler_coordinator - INFO - Skipping Part 1 aggregator database load (autonomous mode)
-2026-03-01 00:14:45.553 - backend.compiler.agents.high_context_submitter - INFO - High-context submitter initialized with model: openai/gpt-5.2
-2026-03-01 00:14:45.553 - backend.compiler.agents.high_context_submitter - INFO - Context budget: 105572 tokens (window: 131072)
-2026-03-01 00:14:45.553 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_context': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 00:14:45.553 - backend.compiler.agents.high_param_submitter - INFO - High-param submitter initialized with model: moonshotai/kimi-k2.5
-2026-03-01 00:14:45.553 - backend.compiler.agents.high_param_submitter - INFO - Context budget: 105572 tokens (window: 131072)
-2026-03-01 00:14:45.553 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_param': provider=openrouter, model=moonshotai/kimi-k2.5 via Google
-2026-03-01 00:14:45.553 - backend.compiler.validation.compiler_validator - INFO - Compiler validator initialized with model: x-ai/grok-4.1-fast
-2026-03-01 00:14:45.553 - backend.shared.api_client_manager - INFO - Configured role 'compiler_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 00:14:45.553 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Per-paper model tracking enabled for manual compiler mode
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Compiler coordinator initialized successfully
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Autonomous mode enabled - section order: Body → Conclusion → Intro → Abstract
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Clearing paper and outline...
-2026-03-01 00:14:45.553 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 81, 0 words)
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_rag_manager - INFO - Paper is empty, skipping re-chunking
-2026-03-01 00:14:45.553 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 20)
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_rag_manager - INFO - Outline is empty, skipping re-chunking
-2026-03-01 00:14:45.553 - backend.compiler.memory.critique_memory - INFO - Cleared all critiques from critique memory
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique memory
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Cleared rejection/acceptance logs
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Reset per-paper model tracker
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Reset autonomous section phase to body
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Reset critique phase state
-2026-03-01 00:14:45.553 - backend.compiler.core.compiler_coordinator - INFO - Paper and outline cleared - system reset to fresh start
-2026-03-01 00:14:45.553 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared previous paper/outline for fresh paper paper_008
-2026-03-01 00:14:45.553 - backend.autonomous.core.autonomous_coordinator - INFO - Loading brainstorm database into compiler RAG: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\brainstorms\brainstorm_topic_003.txt
-2026-03-01 00:14:45.638 - backend.aggregator.ingestion.pipeline - INFO - Ingested brainstorm_topic_003.txt: 783 total chunks
-2026-03-01 00:14:56.688 - backend.aggregator.core.rag_manager - INFO - Added document: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\brainstorms\brainstorm_topic_003.txt
-2026-03-01 00:14:56.688 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm database loaded into compiler RAG
-2026-03-01 00:14:56.688 - backend.autonomous.core.autonomous_coordinator - INFO - Loading 6 reference papers into compiler RAG
-2026-03-01 00:14:56.688 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_007.txt
-2026-03-01 00:14:56.688 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_001.txt
-2026-03-01 00:14:56.689 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_004.txt
-2026-03-01 00:14:56.689 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_006.txt
-2026-03-01 00:14:56.689 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_005.txt
-2026-03-01 00:14:56.689 - backend.autonomous.core.autonomous_coordinator - WARNING - Reference paper not found: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_reference_paper_paper_002.txt
-2026-03-01 00:14:56.689 - backend.autonomous.core.autonomous_coordinator - INFO - All reference papers loaded into compiler RAG
-2026-03-01 00:14:56.690 - backend.compiler.core.compiler_coordinator - INFO - Starting compiler...
-2026-03-01 00:14:56.690 - backend.compiler.core.compiler_coordinator - INFO - Compiler started successfully
-2026-03-01 00:14:56.691 - backend.autonomous.core.autonomous_coordinator - INFO - Compiler started for paper paper_008
-2026-03-01 00:14:56.691 - backend.compiler.core.compiler_coordinator - INFO - Compiler workflow started
-2026-03-01 00:14:56.691 - backend.compiler.core.compiler_coordinator - INFO - Aggregator monitoring started - will check for new acceptances every 30 seconds
-2026-03-01 00:14:56.694 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: None → body
-2026-03-01 00:14:56.697 - backend.compiler.core.compiler_coordinator - INFO - Starting fresh - no existing paper or outline found
-2026-03-01 00:14:56.698 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 00:14:56.698 - backend.compiler.core.compiler_coordinator - INFO - PHASE 1: ITERATIVE OUTLINE CREATION
-2026-03-01 00:14:56.698 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 00:14:56.698 - backend.compiler.core.compiler_coordinator - INFO -
---- Outline Creation Iteration 1/15 ---
-2026-03-01 00:14:56.698 - backend.compiler.agents.high_context_submitter - INFO - Starting outline creation submission generation...
-2026-03-01 00:14:56.698 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:14:56.698 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_create, query_length=162
-2026-03-01 00:15:50.488 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_create in 53.79s (coverage=0.84, tokens=6724)
-2026-03-01 00:15:50.488 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 58988 chars retrieved
-2026-03-01 00:15:50.488 - backend.compiler.agents.high_context_submitter - INFO - Building outline creation prompt...
-2026-03-01 00:15:50.488 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 76215 chars
-2026-03-01 00:15:50.504 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_000)...
-2026-03-01 00:16:49.656 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 16964 chars
-2026-03-01 00:16:49.656 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:16:49.658 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:16:49.658 - backend.compiler.agents.high_context_submitter - INFO - Outline creation submission generated: 127edc0f-a2a3-46f5-b4a1-dcae3744b856, outline_complete=True
-2026-03-01 00:16:49.658 - backend.compiler.validation.compiler_validator - INFO - Validating outline_create submission: 127edc0f-a2a3-46f5-b4a1-dcae3744b856
-2026-03-01 00:16:49.674 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_create, operation=full_content
-2026-03-01 00:16:49.674 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_000)...
-2026-03-01 00:17:03.042 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:17:03.074 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_create)
-2026-03-01 00:17:03.075 - backend.compiler.core.compiler_coordinator - INFO - ✓ Iteration 1: Outline ACCEPTED
-2026-03-01 00:17:03.075 - backend.compiler.core.compiler_coordinator - INFO -   Validator feedback: The submission is a complete outline that fully meets all validation criteria. It includes the optional Abstract, required Introduction (I. Introduction), multiple body sections (II through XVI), and ...
-2026-03-01 00:17:03.075 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 00:17:03.075 - backend.compiler.core.compiler_coordinator - INFO - OUTLINE MARKED COMPLETE BY SUBMITTER - LOCKING
-2026-03-01 00:17:03.075 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 00:17:03.080 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 21)
-2026-03-01 00:17:03.325 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-03-01 00:17:03.342 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 40 total chunks
-2026-03-01 00:17:03.992 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-03-01 00:17:03.992 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-03-01 00:17:03.992 - backend.compiler.memory.outline_memory - INFO - Outline creation feedback cleared
-2026-03-01 00:17:03.992 - backend.compiler.core.compiler_coordinator - INFO - Outline locked after 1 iterations
-2026-03-01 00:17:03.992 - backend.compiler.core.compiler_coordinator - INFO - Starting initial paper loop...
-2026-03-01 00:17:03.992 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=True, phase=body)
-2026-03-01 00:17:03.992 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:17:03.992 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14928 chars, paper=0 chars
-2026-03-01 00:17:03.992 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 0 chars → 0 chars (markers removed)
-2026-03-01 00:17:03.992 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:17:03.992 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=162
-2026-03-01 00:17:54.845 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 50.85s (coverage=0.84, tokens=6121)
-2026-03-01 00:17:54.845 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 53789 chars retrieved
-2026-03-01 00:17:54.845 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:17:54.845 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 81952 chars
-2026-03-01 00:17:54.862 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_001)...
-2026-03-01 00:18:37.681 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 11673 chars
-2026-03-01 00:18:37.685 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:18:37.685 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:18:37.685 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: cb45e3aa-da99-4d0b-83c2-93e044e0e928 (section_complete=False)
-2026-03-01 00:18:37.697 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: cb45e3aa-da99-4d0b-83c2-93e044e0e928
-2026-03-01 00:18:37.697 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 10627 -> 10626 chars, new_string: 10627 -> 10626 chars)
-2026-03-01 00:18:37.697 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=full_content
-2026-03-01 00:18:37.697 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_001)...
-2026-03-01 00:18:47.582 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:18:47.583 - backend.compiler.memory.paper_memory - INFO - Paper initialized with placeholders (version 82)
-2026-03-01 00:18:47.598 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:18:47.598 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 34 total chunks
-2026-03-01 00:18:48.094 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:18:48.094 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:18:48.097 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:18:48.099 - backend.compiler.core.compiler_coordinator - INFO - Initial paper portion accepted with placeholders! (1367 words)
-2026-03-01 00:18:48.099 - backend.compiler.core.compiler_coordinator - INFO - Initial paper loop complete
-2026-03-01 00:18:48.099 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-03-01 00:18:48.100 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 00:18:48.100 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:18:48.103 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14928 chars, paper=11013 chars
-2026-03-01 00:18:48.103 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 11013 chars → 10940 chars (markers removed)
-2026-03-01 00:18:48.103 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:18:48.103 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:19:51.869 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 63.77s (coverage=0.96, tokens=6571)
-2026-03-01 00:19:51.869 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 56803 chars retrieved
-2026-03-01 00:19:51.869 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:19:51.869 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 95830 chars
-2026-03-01 00:19:51.885 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_002)...
-2026-03-01 00:20:37.077 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 10119 chars
-2026-03-01 00:20:37.077 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:20:37.088 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:20:37.088 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: b9364f33-a2eb-4a57-8a8b-dffae00bfa16 (section_complete=False)
-2026-03-01 00:20:37.088 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: b9364f33-a2eb-4a57-8a8b-dffae00bfa16
-2026-03-01 00:20:37.088 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 8825 -> 8823 chars, new_string: 8825 -> 8823 chars)
-2026-03-01 00:20:37.088 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:20:37.088 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '3. Damage metrics must specify any time normalization (e.g., dpa per FPY) as a deterministic scaling'...
-2026-03-01 00:20:37.088 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 10534
-2026-03-01 00:20:37.110 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_002)...
-2026-03-01 00:20:48.855 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:20:48.855 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=302, new_string_len=8823
-2026-03-01 00:20:48.855 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 8823 chars (conclusion boundary preserved)
-2026-03-01 00:20:48.880 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 83, 2329 words)
-2026-03-01 00:20:49.092 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:20:49.097 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 63 total chunks
-2026-03-01 00:20:49.872 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:20:49.872 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:20:49.872 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:20:49.889 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (2329 words)
-2026-03-01 00:20:49.889 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 00:20:49.889 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:20:49.889 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14928 chars, paper=19838 chars
-2026-03-01 00:20:49.889 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 19838 chars → 19765 chars (markers removed)
-2026-03-01 00:20:49.889 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:20:49.889 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:21:59.109 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 69.22s (coverage=0.89, tokens=6679)
-2026-03-01 00:21:59.109 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 57532 chars retrieved
-2026-03-01 00:21:59.109 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:21:59.109 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 105384 chars
-2026-03-01 00:21:59.126 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_003)...
-2026-03-01 00:22:54.881 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 15180 chars
-2026-03-01 00:22:54.881 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:22:54.897 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:22:54.897 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 05939ecb-ce8d-4b30-ac82-46a499542381 (section_complete=False)
-2026-03-01 00:22:54.897 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 05939ecb-ce8d-4b30-ac82-46a499542381
-2026-03-01 00:22:54.897 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 13564 -> 13563 chars, new_string: 13564 -> 13563 chars)
-2026-03-01 00:22:54.897 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:22:54.897 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The subsequent sections build adjoint sensitivity formulas, variance-reduction constructions, and mu'...
-2026-03-01 00:22:54.897 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 19385
-2026-03-01 00:22:54.914 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_003)...
-2026-03-01 00:23:05.932 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:23:05.932 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=380, new_string_len=13563
-2026-03-01 00:23:05.932 - backend.compiler.core.compiler_coordinator - WARNING - AUTO-CORRECTING BOUNDARY VIOLATION: insert_after anchor is after CONCLUSION_PLACEHOLDER. Relocating insertion to just before the placeholder. Original anchor position: 19765, Conclusion placeholder position: 19663
-2026-03-01 00:23:05.932 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 13563 chars (conclusion boundary preserved)
-2026-03-01 00:23:05.956 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 84, 3874 words)
-2026-03-01 00:23:06.181 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:23:06.181 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 105 total chunks
-2026-03-01 00:23:07.515 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:23:07.515 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:23:07.515 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:23:07.515 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (3874 words)
-2026-03-01 00:23:07.515 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 00:23:07.515 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:23:07.515 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14928 chars, paper=33403 chars
-2026-03-01 00:23:07.515 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 33403 chars → 33330 chars (markers removed)
-2026-03-01 00:23:07.515 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:23:07.515 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:24:22.584 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 75.07s (coverage=0.95, tokens=6825)
-2026-03-01 00:24:22.585 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 58750 chars retrieved
-2026-03-01 00:24:22.585 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:24:22.585 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 120167 chars
-2026-03-01 00:24:22.601 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_004)...
-2026-03-01 00:25:20.223 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 12756 chars
-2026-03-01 00:25:20.223 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:25:20.237 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:25:20.237 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 961e6e4c-356c-4d3c-bdf9-639c6e4e663b (section_complete=False)
-2026-03-01 00:25:20.239 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 961e6e4c-356c-4d3c-bdf9-639c6e4e663b
-2026-03-01 00:25:20.239 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11715 -> 11713 chars, new_string: 11715 -> 11713 chars)
-2026-03-01 00:25:20.264 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:25:20.264 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'These checks are “gaps” in the sense that their exact thresholds depend on the concrete solver and g'...
-2026-03-01 00:25:20.264 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 33029
-2026-03-01 00:25:20.272 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_004)...
-2026-03-01 00:25:42.124 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=True, rigor=True, placement=True)
-2026-03-01 00:25:42.124 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: construction)
-2026-03-01 00:25:42.124 - backend.compiler.core.compiler_coordinator - INFO - Construction rejected
-2026-03-01 00:25:42.124 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body, retry with feedback)
-2026-03-01 00:25:42.139 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:25:42.155 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14928 chars, paper=33403 chars
-2026-03-01 00:25:42.156 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 33403 chars → 33330 chars (markers removed)
-2026-03-01 00:25:42.156 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:25:42.156 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:26:58.195 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 76.04s (coverage=0.95, tokens=6825)
-2026-03-01 00:26:58.195 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 58750 chars retrieved
-2026-03-01 00:26:58.195 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:26:58.195 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 124537 chars
-2026-03-01 00:26:58.212 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_005)...
-2026-03-01 00:28:08.004 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 14524 chars
-2026-03-01 00:28:08.004 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:28:08.021 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:28:08.021 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 6a2e3571-7ca9-42ff-9ce4-ce3914803def (section_complete=False)
-2026-03-01 00:28:08.030 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 6a2e3571-7ca9-42ff-9ce4-ce3914803def
-2026-03-01 00:28:08.031 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 13494 -> 13492 chars, new_string: 13494 -> 13492 chars)
-2026-03-01 00:28:08.036 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:28:08.036 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'These checks are “gaps” in the sense that their exact thresholds depend on the concrete solver and g'...
-2026-03-01 00:28:08.036 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 33029
-2026-03-01 00:28:08.052 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_005)...
-2026-03-01 00:28:16.198 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:28:16.198 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=197, new_string_len=13492
-2026-03-01 00:28:16.198 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 13492 chars (conclusion boundary preserved)
-2026-03-01 00:28:16.215 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 85, 5616 words)
-2026-03-01 00:28:16.463 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:28:16.475 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 152 total chunks
-2026-03-01 00:28:18.366 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:28:18.367 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:28:18.369 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:28:18.371 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (5616 words)
-2026-03-01 00:28:18.371 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
-2026-03-01 00:28:18.371 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:28:18.371 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14928 chars, paper=46897 chars
-2026-03-01 00:28:18.371 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 46897 chars → 46824 chars (markers removed)
-2026-03-01 00:28:18.371 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:28:18.371 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=162
-2026-03-01 00:29:11.150 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 52.78s (coverage=0.84, tokens=6237)
-2026-03-01 00:29:11.150 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 54322 chars retrieved
-2026-03-01 00:29:11.150 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
-2026-03-01 00:29:11.150 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 131486 chars
-2026-03-01 00:29:11.168 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_006)...
-2026-03-01 00:29:28.510 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1563 chars
-2026-03-01 00:29:28.511 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:29:28.512 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:29:28.512 - backend.compiler.agents.high_context_submitter - INFO - Outline update submission generated: e51c73a8-247f-4f43-a1ed-a8bc1c3130ab
-2026-03-01 00:29:28.518 - backend.compiler.validation.compiler_validator - INFO - Validating outline_update submission: e51c73a8-247f-4f43-a1ed-a8bc1c3130ab
-2026-03-01 00:29:28.518 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 0 -> 0 chars, new_string: 696 -> 692 chars)
-2026-03-01 00:29:28.518 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_update, operation=insert_after
-2026-03-01 00:29:28.518 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '      2. Consistency/unit checks for coupled gradients'
-2026-03-01 00:29:28.518 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 10881
-2026-03-01 00:29:28.534 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_006)...
-2026-03-01 00:29:43.602 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:29:43.602 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit_to_outline: operation=insert_after, mode=outline_update
-2026-03-01 00:29:43.602 - backend.compiler.core.compiler_coordinator - INFO - Outline insert after: inserted 692 chars
-2026-03-01 00:29:43.618 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 22)
-2026-03-01 00:29:43.752 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-03-01 00:29:43.752 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 42 total chunks
-2026-03-01 00:29:44.302 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-03-01 00:29:44.302 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-03-01 00:29:44.318 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_update)
-2026-03-01 00:29:44.319 - backend.compiler.core.compiler_coordinator - INFO - Outline update accepted
-2026-03-01 00:29:44.319 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 00:29:44.319 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:29:44.322 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=15620 chars, paper=46897 chars
-2026-03-01 00:29:44.322 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 46897 chars → 46824 chars (markers removed)
-2026-03-01 00:29:44.322 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 00:29:44.322 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 73897 chars
-2026-03-01 00:29:44.333 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_007)...
-2026-03-01 00:30:31.770 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1889 chars
-2026-03-01 00:30:31.770 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:30:31.770 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:30:31.770 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 1a6ecf7a-8749-4b92-a08e-41e2fda7c792 (miniscule=False)
-2026-03-01 00:30:31.786 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 1a6ecf7a-8749-4b92-a08e-41e2fda7c792
-2026-03-01 00:30:31.786 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 00:30:31.786 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Assumption 3.1 (Forward solve is well-defined). For each admissible \\(\\mathbf{p}\\), there exists a u'...
-2026-03-01 00:30:31.786 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 13921
-2026-03-01 00:30:31.801 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_007)...
-2026-03-01 00:30:40.769 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:30:40.769 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=606, new_string_len=683
-2026-03-01 00:30:40.769 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 606 chars with 683 chars
-2026-03-01 00:30:40.769 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 86, 5626 words)
-2026-03-01 00:30:40.959 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:30:40.959 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 152 total chunks
-2026-03-01 00:30:42.987 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:30:42.987 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:30:42.987 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: review)
-2026-03-01 00:30:42.987 - backend.compiler.core.compiler_coordinator - INFO - Review edit accepted (5626 words)
-2026-03-01 00:30:42.987 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 00:30:42.987 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:30:43.003 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=15620 chars, paper=46974 chars
-2026-03-01 00:30:43.003 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 46974 chars → 46901 chars (markers removed)
-2026-03-01 00:30:43.003 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 00:30:43.003 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 73974 chars
-2026-03-01 00:30:43.003 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_008)...
-2026-03-01 00:31:15.724 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 895 chars
-2026-03-01 00:31:15.724 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:31:15.740 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:31:15.740 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 77fd5799-a1f8-41eb-a26d-cbd79537a714 (miniscule=False)
-2026-03-01 00:31:15.756 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 77fd5799-a1f8-41eb-a26d-cbd79537a714
-2026-03-01 00:31:15.756 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 00:31:15.772 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The subsequent sections will formalize these QoIs as linear functionals in an operator framework sui'...
-2026-03-01 00:31:15.772 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 10637
-2026-03-01 00:31:15.772 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_008)...
-2026-03-01 00:31:24.342 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:31:24.342 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=199, new_string_len=178
-2026-03-01 00:31:24.342 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 199 chars with 178 chars
-2026-03-01 00:31:24.358 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 87, 5624 words)
-2026-03-01 00:31:24.661 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:31:24.677 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 152 total chunks
-2026-03-01 00:31:26.523 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:31:26.523 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:31:26.523 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: review)
-2026-03-01 00:31:26.523 - backend.compiler.core.compiler_coordinator - INFO - Review edit accepted (5624 words)
-2026-03-01 00:31:26.523 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-03-01 00:31:26.523 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
-2026-03-01 00:31:26.523 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-03-01 00:31:26.523 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-03-01 00:31:26.538 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=15620 chars, paper=46953 chars
-2026-03-01 00:31:26.538 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-03-01 00:31:26.538 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1163
-2026-03-01 00:32:35.313 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 68.77s (coverage=0.96, tokens=6626)
-2026-03-01 00:32:35.313 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 56365 chars
-2026-03-01 00:32:35.313 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-03-01 00:32:35.321 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_000)...
-2026-03-01 00:34:38.612 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1394 chars
-2026-03-01 00:34:38.612 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-03-01 00:34:38.612 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=standard_enhancement, target_section_len=355
-2026-03-01 00:34:38.612 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: standard_enhancement execution...
-2026-03-01 00:34:38.645 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-03-01 00:34:38.645 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1163
-2026-03-01 00:35:46.031 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 67.39s (coverage=0.96, tokens=6626)
-2026-03-01 00:35:46.031 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-03-01 00:35:46.047 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_001)...
-2026-03-01 00:37:25.518 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 865 chars
-2026-03-01 00:37:25.518 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM refused (Step 1 made mistake)
-2026-03-01 00:37:25.518 - backend.compiler.core.compiler_coordinator - INFO - No rigor enhancement needed
-2026-03-01 00:37:25.518 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: rigor)
-2026-03-01 00:37:25.518 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (first rejection)
-2026-03-01 00:37:25.518 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
-2026-03-01 00:37:25.534 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-03-01 00:37:25.534 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 00:37:25.534 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:37:25.535 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=15620 chars, paper=46953 chars
-2026-03-01 00:37:25.535 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 46953 chars → 46880 chars (markers removed)
-2026-03-01 00:37:25.535 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:37:25.535 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:38:35.190 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 69.65s (coverage=0.91, tokens=6541)
-2026-03-01 00:38:35.191 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 55638 chars retrieved
-2026-03-01 00:38:35.191 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:38:35.191 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 134121 chars
-2026-03-01 00:38:35.210 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_009)...
-2026-03-01 00:39:34.856 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 14271 chars
-2026-03-01 00:39:34.856 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:39:34.873 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:39:34.888 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 9c16b1e8-9025-413b-a222-2d6338c4dce6 (section_complete=False)
-2026-03-01 00:39:34.889 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 9c16b1e8-9025-413b-a222-2d6338c4dce6
-2026-03-01 00:39:34.889 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 12959 -> 12957 chars, new_string: 12959 -> 12957 chars)
-2026-03-01 00:39:34.889 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:39:34.889 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'In summary: adjoint-based biasing is mathematically justified by change-of-measure identities and th'...
-2026-03-01 00:39:34.889 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 46465
-2026-03-01 00:39:34.906 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_009)...
-2026-03-01 00:39:47.606 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:39:47.606 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=311, new_string_len=12957
-2026-03-01 00:39:47.606 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 12957 chars (conclusion boundary preserved)
-2026-03-01 00:39:47.638 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 88, 7196 words)
-2026-03-01 00:39:47.940 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:39:47.956 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 192 total chunks
-2026-03-01 00:39:50.591 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:39:50.591 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:39:50.606 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:39:50.606 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (7196 words)
-2026-03-01 00:39:50.606 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 00:39:50.606 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:39:50.623 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=15620 chars, paper=59912 chars
-2026-03-01 00:39:50.623 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 59912 chars → 59839 chars (markers removed)
-2026-03-01 00:39:50.623 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:39:50.623 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:41:07.084 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 76.46s (coverage=0.93, tokens=6325)
-2026-03-01 00:41:07.084 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 54624 chars retrieved
-2026-03-01 00:41:07.084 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:41:07.084 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 146066 chars
-2026-03-01 00:41:07.108 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_010)...
-2026-03-01 00:42:14.145 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 16077 chars
-2026-03-01 00:42:14.145 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:42:14.162 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:42:14.162 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: e997c0ae-7d85-4abf-bc34-1898504097c1 (section_complete=False)
-2026-03-01 00:42:14.178 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: e997c0ae-7d85-4abf-bc34-1898504097c1
-2026-03-01 00:42:14.178 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 14637 -> 14635 chars, new_string: 14637 -> 14635 chars)
-2026-03-01 00:42:14.211 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:42:14.212 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'These diagnostics do not guarantee correctness, but they convert the fidelity-hierarchy adequacy que'...
-2026-03-01 00:42:14.212 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 59517
-2026-03-01 00:42:14.212 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_010)...
-2026-03-01 00:42:23.896 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:42:23.896 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=218, new_string_len=14635
-2026-03-01 00:42:23.896 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 14635 chars (conclusion boundary preserved)
-2026-03-01 00:42:23.912 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 89, 9002 words)
-2026-03-01 00:42:24.212 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:42:24.245 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 240 total chunks
-2026-03-01 00:42:27.779 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:42:27.779 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:42:27.783 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:42:27.789 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (9002 words)
-2026-03-01 00:42:27.789 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 00:42:27.789 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:42:27.790 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=15620 chars, paper=74549 chars
-2026-03-01 00:42:27.790 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 74549 chars → 74476 chars (markers removed)
-2026-03-01 00:42:27.790 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:42:27.790 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:43:44.599 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 76.81s (coverage=0.93, tokens=6474)
-2026-03-01 00:43:44.599 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 55965 chars retrieved
-2026-03-01 00:43:44.599 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:43:44.599 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 162044 chars
-2026-03-01 00:43:44.631 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_011)...
-2026-03-01 00:44:38.684 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13689 chars
-2026-03-01 00:44:38.684 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:44:38.699 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:44:38.699 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 6faae179-4175-4791-bfa5-81019671fd89 (section_complete=False)
-2026-03-01 00:44:38.700 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 6faae179-4175-4791-bfa5-81019671fd89
-2026-03-01 00:44:38.700 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11964 -> 11963 chars, new_string: 11964 -> 11963 chars)
-2026-03-01 00:44:38.734 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:44:38.734 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'For certification, such updates remain valid only if the module-local certificates are updated along'...
-2026-03-01 00:44:38.734 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 73811
-2026-03-01 00:44:38.750 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_011)...
-2026-03-01 00:44:44.850 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:44:44.850 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=561, new_string_len=11963
-2026-03-01 00:44:44.850 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 11963 chars (conclusion boundary preserved)
-2026-03-01 00:44:44.883 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 90, 10616 words)
-2026-03-01 00:44:45.400 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:44:45.434 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 277 total chunks
-2026-03-01 00:44:48.986 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:44:48.986 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:44:49.000 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:44:49.000 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (10616 words)
-2026-03-01 00:44:49.000 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 00:44:49.000 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:44:49.000 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=15620 chars, paper=86514 chars
-2026-03-01 00:44:49.000 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 86514 chars → 86441 chars (markers removed)
-2026-03-01 00:44:49.000 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:44:49.000 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 00:46:02.519 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 73.52s (coverage=0.93, tokens=6574)
-2026-03-01 00:46:02.519 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 55753 chars retrieved
-2026-03-01 00:46:02.519 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 00:46:02.519 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 173797 chars
-2026-03-01 00:46:02.552 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_012)...
-2026-03-01 00:47:20.537 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 14051 chars
-2026-03-01 00:47:20.537 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:47:20.554 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:47:20.554 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 1d09d3e0-dd7f-4c48-81b4-3ae6b1349e6e (section_complete=False)
-2026-03-01 00:47:20.570 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 1d09d3e0-dd7f-4c48-81b4-3ae6b1349e6e
-2026-03-01 00:47:20.586 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 12572 -> 12571 chars, new_string: 12572 -> 12571 chars)
-2026-03-01 00:47:20.595 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 00:47:20.595 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'These artifacts are sufficient for an independent reviewer to reproduce the bias-bar computation and'...
-2026-03-01 00:47:20.595 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 86170
-2026-03-01 00:47:20.621 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_012)...
-2026-03-01 00:47:32.871 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:47:32.871 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=271, new_string_len=12571
-2026-03-01 00:47:32.871 - backend.compiler.core.compiler_coordinator - WARNING - AUTO-CORRECTING BOUNDARY VIOLATION: insert_after anchor is after CONCLUSION_PLACEHOLDER. Relocating insertion to just before the placeholder. Original anchor position: 86441, Conclusion placeholder position: 86339
-2026-03-01 00:47:32.871 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 12571 chars (conclusion boundary preserved)
-2026-03-01 00:47:32.887 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 91, 12236 words)
-2026-03-01 00:47:33.220 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 00:47:33.237 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 315 total chunks
-2026-03-01 00:47:37.188 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 00:47:37.188 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 00:47:37.188 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 00:47:37.188 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (12236 words)
-2026-03-01 00:47:37.188 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
-2026-03-01 00:47:37.188 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:47:37.188 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=15620 chars, paper=99087 chars
-2026-03-01 00:47:37.203 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 99087 chars → 99014 chars (markers removed)
-2026-03-01 00:47:37.204 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 00:47:37.204 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=162
-2026-03-01 00:48:32.705 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 55.50s (coverage=0.84, tokens=6237)
-2026-03-01 00:48:32.705 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 54347 chars retrieved
-2026-03-01 00:48:32.705 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
-2026-03-01 00:48:32.705 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 184393 chars
-2026-03-01 00:48:32.722 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_013)...
-2026-03-01 00:48:54.973 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1787 chars
-2026-03-01 00:48:54.973 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:48:54.973 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:48:54.973 - backend.compiler.agents.high_context_submitter - INFO - Outline update submission generated: 32f221eb-7e9a-4337-bfa4-f91bf75ac6f1
-2026-03-01 00:48:54.973 - backend.compiler.validation.compiler_validator - INFO - Validating outline_update submission: 32f221eb-7e9a-4337-bfa4-f91bf75ac6f1
-2026-03-01 00:48:54.973 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 0 -> 0 chars, new_string: 798 -> 791 chars)
-2026-03-01 00:48:54.989 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_update, operation=insert_after
-2026-03-01 00:48:54.989 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '      2. Unit and normalization checks (TBR dimensionless, dpa/FPY scaling applied deterministically'...
-2026-03-01 00:48:54.989 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 7302
-2026-03-01 00:48:55.006 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_013)...
-2026-03-01 00:49:10.890 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 00:49:10.890 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit_to_outline: operation=insert_after, mode=outline_update
-2026-03-01 00:49:10.890 - backend.compiler.core.compiler_coordinator - INFO - Outline insert after: inserted 791 chars
-2026-03-01 00:49:10.906 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 23)
-2026-03-01 00:49:11.140 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-03-01 00:49:11.156 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 44 total chunks
-2026-03-01 00:49:11.790 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-03-01 00:49:11.790 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-03-01 00:49:11.790 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_update)
-2026-03-01 00:49:11.790 - backend.compiler.core.compiler_coordinator - INFO - Outline update accepted
-2026-03-01 00:49:11.790 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 00:49:11.790 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:49:11.790 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=99087 chars
-2026-03-01 00:49:11.790 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 99087 chars → 99014 chars (markers removed)
-2026-03-01 00:49:11.790 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 00:49:11.790 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 126878 chars
-2026-03-01 00:49:11.806 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_014)...
-2026-03-01 00:49:31.874 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 867 chars
-2026-03-01 00:49:31.874 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:49:31.874 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:49:31.874 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 43c07d3a-1a49-46f3-bbd1-6b4bb30db2e2 (miniscule=False)
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 43c07d3a-1a49-46f3-bbd1-6b4bb30db2e2
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\big'...
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=226 | first20='\\mathbb{E}\\bigl[(\\wi' | last20='statistical error}}.'
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=99087 | double_spaces=7 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - WARNING - BACKSLASH_NORMALIZED_MATCH: Exact/hyphen/whitespace match failed but found unique backslash-normalized match at pos 51259. This indicates a model over-escaping quirk.
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - WARNING -   Model provided (normalized): '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr)'...
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - WARNING -   Document actual: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr'...
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - INFO - Unicode hyphen normalization applied - updating old_string to actual document text
-2026-03-01 00:49:31.891 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 51259
-2026-03-01 00:49:31.907 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_014)...
-2026-03-01 00:49:42.644 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=True, rigor=True, placement=True)
-2026-03-01 00:49:42.653 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-03-01 00:49:42.655 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-03-01 00:49:42.655 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 00:49:42.655 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 00:49:42.658 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=99087 chars
-2026-03-01 00:49:42.658 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 99087 chars → 99014 chars (markers removed)
-2026-03-01 00:49:42.658 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 00:49:42.658 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 128663 chars
-2026-03-01 00:49:42.674 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_015)...
-2026-03-01 00:49:57.174 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 911 chars
-2026-03-01 00:49:57.174 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 00:49:57.174 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 00:49:57.174 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: b6449429-6ed5-411d-8c60-fa7c6083f4b6 (miniscule=False)
-2026-03-01 00:49:57.198 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: b6449429-6ed5-411d-8c60-fa7c6083f4b6
-2026-03-01 00:49:57.218 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 00:49:57.218 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\big'...
-2026-03-01 00:49:57.218 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-03-01 00:49:57.218 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=226 | first20='\\mathbb{E}\\bigl[(\\wi' | last20='statistical error}}.'
-2026-03-01 00:49:57.218 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=99087 | double_spaces=7 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-03-01 00:49:57.224 - backend.compiler.validation.compiler_validator - WARNING - BACKSLASH_NORMALIZED_MATCH: Exact/hyphen/whitespace match failed but found unique backslash-normalized match at pos 51259. This indicates a model over-escaping quirk.
-2026-03-01 00:49:57.224 - backend.compiler.validation.compiler_validator - WARNING -   Model provided (normalized): '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr)'...
-2026-03-01 00:49:57.224 - backend.compiler.validation.compiler_validator - WARNING -   Document actual: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr'...
-2026-03-01 00:49:57.224 - backend.compiler.validation.compiler_validator - INFO - Unicode hyphen normalization applied - updating old_string to actual document text
-2026-03-01 00:49:57.224 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 51259
-2026-03-01 00:49:57.241 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_015)...
-2026-03-01 00:50:08.774 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=True, rigor=True, placement=False)
-2026-03-01 00:50:08.776 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-03-01 00:50:08.776 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-03-01 00:50:08.776 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-03-01 00:50:08.808 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
-2026-03-01 00:50:08.808 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-03-01 00:50:08.808 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-03-01 00:50:08.825 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=16411 chars, paper=99087 chars
-2026-03-01 00:50:08.825 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-03-01 00:50:08.825 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1163
-2026-03-01 00:51:32.593 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 83.77s (coverage=0.97, tokens=6721)
-2026-03-01 00:51:32.593 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 56214 chars
-2026-03-01 00:51:32.593 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-03-01 00:51:32.593 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_002)...
-2026-03-01 00:53:11.099 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1512 chars
-2026-03-01 00:53:11.099 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-03-01 00:53:11.099 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=standard_enhancement, target_section_len=494
-2026-03-01 00:53:11.099 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: standard_enhancement execution...
-2026-03-01 00:53:11.099 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-03-01 00:53:11.099 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1163
-2026-03-01 00:54:34.581 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 83.48s (coverage=0.97, tokens=6721)
-2026-03-01 00:54:34.581 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-03-01 00:54:34.608 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_003)...
-2026-03-01 01:08:49.891 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 88247 chars
-2026-03-01 01:08:49.891 - backend.shared.json_parser - ERROR - parse_json: Expecting property name enclosed in double quotes: line 1 column 2 (char 1)
-2026-03-01 01:08:49.891 - backend.compiler.agents.high_param_submitter - INFO - Compiler high-param submitter (rigor): Initial JSON parse failed, attempting retry
-2026-03-01 01:15:50.467 - backend.compiler.agents.high_param_submitter - INFO - Compiler high-param submitter (rigor): Retry succeeded!
-2026-03-01 01:15:50.467 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Rigor enhancement submission generated - 10b1d7e1-c1fc-4ff8-a35d-0b9c7c250b62
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - INFO - Validating rigor submission: 10b1d7e1-c1fc-4ff8-a35d-0b9c7c250b62
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=rigor, operation=replace
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'This section addresses two related certification obstacles that arise in true-3D shielding and blank'...
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=480 | first20='This section address' | last20='nts and multiplicity'
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=99087 | double_spaces=7 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'This section addresses two related certification obstacles that arise in true-3D shielding and blanket design: (i) many constraints depend on maxima (hotspots) of spatial fields rather than on spatial'
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'actions), so naive per-tally confidence intervals do not control the probability of a false-feasibility claim across the full tally set.\n\nIX.A. Problem statement: max-type constraints and multiplicity'
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'into the error control.\n\n[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 86417
-2026-03-01 01:15:50.483 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'This section addresses two related certification obstacles that arise in true-3D shielding and blank'
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=480 | first20='This section address' | last20='nts and multiplicity'
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=16411 | double_spaces=341 | first20='Abstract\n\nI. Introdu' | last20=' BE ABOVE THIS LINE]'
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars): 'This section addresses two related certification obstacles that arise in true-3D shielding and blanket design: (i) many constraints depend on maxima (hotspots) of spatial fields rather than on spatial'
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars): 'actions), so naive per-tally confidence intervals do not control the probability of a false-feasibility claim across the full tally set.\n\nIX.A. Problem statement: max-type constraints and multiplicity'
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): 'Abstract\n\nI. Introduction\n   A. Motivation: certified true-3D neutronics for non-axisymmetric stellarator blankets (TBR, coil damage, dose, heating)\n   B. Problem statement: compute responses and grad'
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'fication tasks required before deployment\n\n[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]\n[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    NO_MATCH_FOUND: Text does not exist in document, even with whitespace/line-ending normalization
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    This suggests the model is referencing text that was never written or was from a different document version
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING -    Common causes: (1) Model hallucinated content, (2) Model referenced outline text instead of paper text, (3) Content was removed in prior edit
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - WARNING - Pre-validation failed: old_string not found in document
-2026-03-01 01:15:50.537 - backend.compiler.validation.compiler_validator - INFO - Pre-validation rejected: old_string not found in document (pre-validation)
-2026-03-01 01:15:50.546 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: rigor)
-2026-03-01 01:15:50.546 - backend.compiler.core.compiler_coordinator - INFO - Rigor enhancement rejected
-2026-03-01 01:15:50.546 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (first rejection)
-2026-03-01 01:15:50.546 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
-2026-03-01 01:15:50.546 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-03-01 01:15:50.546 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 01:15:50.546 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:15:50.546 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=99087 chars
-2026-03-01 01:15:50.546 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 99087 chars → 99014 chars (markers removed)
-2026-03-01 01:15:50.546 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 01:15:50.546 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 01:17:12.501 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 81.95s (coverage=0.96, tokens=6801)
-2026-03-01 01:17:12.501 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 56936 chars retrieved
-2026-03-01 01:17:12.501 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 01:17:12.501 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 194478 chars
-2026-03-01 01:17:12.516 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_016)...
-2026-03-01 01:18:27.373 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13672 chars
-2026-03-01 01:18:27.373 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:18:27.386 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:18:27.386 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 46d4f45c-db41-43d8-abbc-97238a49362d (section_complete=False)
-2026-03-01 01:18:27.402 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 46d4f45c-db41-43d8-abbc-97238a49362d
-2026-03-01 01:18:27.402 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 12095 -> 12093 chars, new_string: 12095 -> 12093 chars)
-2026-03-01 01:18:27.417 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 01:18:27.417 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '4. Many-tally scope. The definition of the tally family \\(\\{1,\\dots,J\\}\\) must be fixed before exami'...
-2026-03-01 01:18:27.417 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 98556
-2026-03-01 01:18:27.433 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_016)...
-2026-03-01 01:18:38.601 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 01:18:38.601 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=354, new_string_len=12093
-2026-03-01 01:18:38.605 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 12093 chars (conclusion boundary preserved)
-2026-03-01 01:18:38.621 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 92, 13584 words)
-2026-03-01 01:18:39.116 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 01:18:39.148 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 353 total chunks
-2026-03-01 01:18:43.326 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 01:18:43.326 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 01:18:43.336 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 01:18:43.336 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (13584 words)
-2026-03-01 01:18:43.336 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 01:18:43.336 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:18:43.351 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=111182 chars
-2026-03-01 01:18:43.351 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 111182 chars → 111109 chars (markers removed)
-2026-03-01 01:18:43.351 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 01:18:43.351 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 01:20:00.453 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 77.10s (coverage=0.93, tokens=6551)
-2026-03-01 01:20:00.453 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 56314 chars retrieved
-2026-03-01 01:20:00.453 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 01:20:00.453 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 205951 chars
-2026-03-01 01:20:00.485 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_017)...
-2026-03-01 01:20:54.940 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13309 chars
-2026-03-01 01:20:54.940 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:20:54.956 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:20:54.956 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: f62170e6-789d-4bce-99a2-2d0636c975f4 (section_complete=False)
-2026-03-01 01:20:54.956 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: f62170e6-789d-4bce-99a2-2d0636c975f4
-2026-03-01 01:20:54.956 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11951 -> 11949 chars, new_string: 11951 -> 11949 chars)
-2026-03-01 01:20:54.972 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 01:20:54.972 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '3. Moment inputs and inflation. Any covariance inflation (to account for unknown correlations, trunc'...
-2026-03-01 01:20:54.972 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 110745
-2026-03-01 01:20:54.988 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_017)...
-2026-03-01 01:21:01.271 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 01:21:01.271 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=260, new_string_len=11949
-2026-03-01 01:21:01.271 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 11949 chars (conclusion boundary preserved)
-2026-03-01 01:21:01.287 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 93, 15043 words)
-2026-03-01 01:21:01.667 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 01:21:01.699 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 391 total chunks
-2026-03-01 01:21:06.392 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 01:21:06.392 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 01:21:06.392 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 01:21:06.392 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (15043 words)
-2026-03-01 01:21:06.392 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 01:21:06.392 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:21:06.408 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=123133 chars
-2026-03-01 01:21:06.408 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 123133 chars → 123060 chars (markers removed)
-2026-03-01 01:21:06.408 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 01:21:06.408 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 01:22:22.387 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 75.98s (coverage=0.93, tokens=6563)
-2026-03-01 01:22:22.387 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 56181 chars retrieved
-2026-03-01 01:22:22.387 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 01:22:22.387 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 217769 chars
-2026-03-01 01:22:22.421 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_018)...
-2026-03-01 01:23:28.572 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 15210 chars
-2026-03-01 01:23:28.572 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:23:28.588 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:23:28.588 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 4474c0f3-d918-4974-8e03-35bf945fc41c (section_complete=False)
-2026-03-01 01:23:28.588 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 4474c0f3-d918-4974-8e03-35bf945fc41c
-2026-03-01 01:23:28.588 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 13829 -> 13827 chars, new_string: 13829 -> 13827 chars)
-2026-03-01 01:23:28.605 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 01:23:28.605 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'These records are necessary to interpret a tolerance margin as an auditable, falsifiable statement r'...
-2026-03-01 01:23:28.605 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 122809
-2026-03-01 01:23:28.638 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_018)...
-2026-03-01 01:23:38.688 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 01:23:38.688 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=147, new_string_len=13827
-2026-03-01 01:23:38.688 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 13827 chars (conclusion boundary preserved)
-2026-03-01 01:23:38.704 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 94, 16588 words)
-2026-03-01 01:23:39.071 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 01:23:39.104 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 432 total chunks
-2026-03-01 01:23:44.161 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 01:23:44.161 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 01:23:44.161 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 01:23:44.161 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (16588 words)
-2026-03-01 01:23:44.161 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 01:23:44.161 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:23:44.177 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=136962 chars
-2026-03-01 01:23:44.177 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 136962 chars → 136889 chars (markers removed)
-2026-03-01 01:23:44.177 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 01:23:44.177 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 01:24:58.822 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 74.64s (coverage=0.96, tokens=6705)
-2026-03-01 01:24:58.822 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 57157 chars retrieved
-2026-03-01 01:24:58.822 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 01:24:58.822 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 232574 chars
-2026-03-01 01:24:58.853 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_019)...
-2026-03-01 01:26:55.999 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 23501 chars
-2026-03-01 01:26:55.999 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:26:56.015 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:26:56.031 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: d8cc5ccf-1def-4311-b7d7-61115c08ff34 (section_complete=True)
-2026-03-01 01:26:56.031 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: d8cc5ccf-1def-4311-b7d7-61115c08ff34
-2026-03-01 01:26:56.031 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 21783 -> 21782 chars, new_string: 21783 -> 21782 chars)
-2026-03-01 01:26:56.031 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 01:26:56.031 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '4. Finite-difference spot checks contradict coupled-adjoint derivatives beyond tolerance (Section XI'...
-2026-03-01 01:26:56.031 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 136678
-2026-03-01 01:26:56.067 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_019)...
-2026-03-01 01:27:07.434 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 01:27:07.434 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=107, new_string_len=21782
-2026-03-01 01:27:07.450 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 21782 chars (conclusion boundary preserved)
-2026-03-01 01:27:07.466 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 95, 19213 words)
-2026-03-01 01:27:08.008 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 01:27:08.038 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 497 total chunks
-2026-03-01 01:27:13.903 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 01:27:13.911 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 01:27:13.911 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 01:27:13.927 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=body, paper_words=19213
-2026-03-01 01:27:13.927 - backend.compiler.core.compiler_coordinator - INFO - Body section complete - transitioning to CRITIQUE PHASE
-2026-03-01 01:27:13.927 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:27:13.927 - backend.compiler.core.compiler_coordinator - INFO - STARTING CRITIQUE PHASE
-2026-03-01 01:27:13.927 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:27:13.927 - backend.compiler.core.compiler_coordinator - INFO - Snapshot pre-critique paper: 158746 chars
-2026-03-01 01:27:13.927 - backend.compiler.memory.critique_memory - INFO - Initialized critique memory for paper_v1 at backend\data\critique_feedback_paper_v1.txt
-2026-03-01 01:27:13.927 - backend.compiler.memory.critique_memory - INFO - Cleared all critiques from critique memory
-2026-03-01 01:27:13.927 - backend.compiler.memory.critique_memory - INFO - Critique file is empty
-2026-03-01 01:27:13.927 - backend.compiler.core.compiler_coordinator - INFO - Critique memory initialized for paper_v1
-2026-03-01 01:27:13.927 - backend.compiler.agents.critique_submitter - INFO - Critique submitter initialized with model google/gemini-3.1-pro-preview
-2026-03-01 01:27:13.943 - backend.compiler.memory.critique_rejection_memory - INFO - Loaded 0 critique rejections
-2026-03-01 01:27:13.943 - backend.compiler.agents.critique_submitter - INFO - Critique submitter rejection memory initialized
-2026-03-01 01:27:13.943 - backend.compiler.memory.critique_rejection_memory - INFO - Reset critique rejection log
-2026-03-01 01:27:13.943 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique rejection feedback for fresh start
-2026-03-01 01:27:13.943 - backend.compiler.core.compiler_coordinator - INFO - Critique submitter created with model: google/gemini-3.1-pro-preview
-2026-03-01 01:27:13.943 - backend.shared.api_client_manager - INFO - Configured role 'compiler_critique_submitter': provider=openrouter, model=google/gemini-3.1-pro-preview via Google
-2026-03-01 01:27:13.943 - backend.shared.api_client_manager - INFO - Configured role 'critique_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 01:27:13.943 - backend.shared.api_client_manager - INFO - Configured role 'critique_cleanup': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 01:27:13.943 - backend.compiler.core.compiler_coordinator - INFO - Starting critique aggregation loop (target: 5 total attempts, accepted OR rejected)
-2026-03-01 01:27:13.943 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 0/5, accepted: 0, rejected: 0)
-2026-03-01 01:27:56.791 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #1
-2026-03-01 01:27:56.791 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: b9757fd1-4095-44bb-a80e-5f6ca39f9649
-2026-03-01 01:28:08.291 - backend.compiler.memory.critique_memory - INFO - Added critique #1 to critique memory
-2026-03-01 01:28:08.294 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (1/5): b9757fd1-4095-44bb-a80e-5f6ca39f9649
-2026-03-01 01:28:11.291 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 1/5, accepted: 1, rejected: 0)
-2026-03-01 01:30:04.587 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #2
-2026-03-01 01:30:04.588 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: e1b5fc14-4971-4136-b39d-1668e783b342
-2026-03-01 01:30:18.406 - backend.compiler.memory.critique_memory - INFO - Added critique #2 to critique memory
-2026-03-01 01:30:18.406 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (2/5): e1b5fc14-4971-4136-b39d-1668e783b342
-2026-03-01 01:30:21.422 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 2/5, accepted: 2, rejected: 0)
-2026-03-01 01:30:57.473 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #3
-2026-03-01 01:30:57.473 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: 7490bda1-e4e7-4a12-94a6-68a95f3172ba
-2026-03-01 01:31:13.856 - backend.compiler.memory.critique_memory - INFO - Added critique #3 to critique memory
-2026-03-01 01:31:13.856 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (3/5): 7490bda1-e4e7-4a12-94a6-68a95f3172ba
-2026-03-01 01:31:16.854 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 3/5, accepted: 3, rejected: 0)
-2026-03-01 01:32:21.774 - backend.compiler.agents.critique_submitter - INFO - Critique submitter declined to critique (assessment #4)
-2026-03-01 01:32:21.774 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: 544790ca-e1d7-410d-9725-97de41463396
-2026-03-01 01:32:46.506 - backend.compiler.core.compiler_coordinator - INFO - Decline REJECTED - validator found issues: This is a decline assessment (critique_needed=false) claiming the body section is academically acceptable. However, the body contains substantive issues identified in existing accepted critiques, which remain unaddressed: (1) Missing required outline content in VIII.C.3 (covariance pushforward \(\mathbf{C}_R \approx J \mathbf{C}_p J^T\), validity conditions, Cantelli/Chebyshev bounds) and XIII.E gap note on convex relaxations vs. heuristics; these are explicit outline gaps affecting completeness and rigor. (2) Mathematical error in Theorem 10.1 proof (Section X.C): the inequality derivation yields \(\mathbb{E}[L] + \frac{1}{1-\beta} \sqrt{\mathrm{Var}(L)}\) not the claimed tighter \(\mathbb{E}[L] + \sqrt{\frac{\beta}{1-\beta}} \sqrt{\mathrm{Var}(L)}\), invalidating the SOC representability claim without correction. (3) Error in Proposition 14.1 (XIV.E.2): greedy approximation guarantee \((1-1/e)\) misapplied to non-normalized \(\mathcal{U}(S)\) where \(\mathcal{U}(\emptyset) \neq 0\); correct form applies to gain \(\mathcal{U}(S) - \mathcal{U}(\emptyset)\). These are genuine mathematical errors and structural omissions impacting correctness, auditability, and alignment with outline. No evidence these are resolved, so body not acceptable; decline incorrect.
-2026-03-01 01:32:49.507 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 4/5, accepted: 3, rejected: 1)
-2026-03-01 01:34:02.428 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #5
-2026-03-01 01:34:02.428 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: 16fe31ec-4281-4cd4-8f65-6d1b91058bf1
-2026-03-01 01:34:13.825 - backend.compiler.memory.critique_memory - INFO - Added critique #4 to critique memory
-2026-03-01 01:34:13.825 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (4/5): 16fe31ec-4281-4cd4-8f65-6d1b91058bf1
-2026-03-01 01:34:16.823 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete: 5 total attempts (4 accepted, 1 rejected)
-2026-03-01 01:34:16.823 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:34:16.823 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete (5 total attempts) - triggering rewrite decision (attempt 1)
-2026-03-01 01:34:16.823 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:34:16.823 - backend.compiler.core.compiler_coordinator - INFO - Critique submitter generating rewrite decision...
-2026-03-01 01:34:26.290 - backend.compiler.agents.critique_submitter - INFO - Rewrite decision generated: partial_revision
-2026-03-01 01:34:26.290 - backend.compiler.core.compiler_coordinator - INFO - Rewrite decision: partial_revision
-2026-03-01 01:34:26.290 - backend.compiler.core.compiler_coordinator - INFO - Validator reviewing rewrite decision...
-2026-03-01 01:34:26.290 - backend.compiler.validation.compiler_validator - INFO - Validating rewrite decision...
-2026-03-01 01:34:36.390 - backend.compiler.validation.compiler_validator - INFO - Rewrite decision VALIDATED: The partial_revision decision is justified. All four accepted critiques identify specific, localized issues: (1) missing subsections/content in VIII.C.3 (covariance propagation with GPT Jacobians, Can...
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - Rewrite decision validated - executing
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - Decision: PARTIAL REVISION (iterative targeted edits)
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - EXECUTING PARTIAL REVISION (ITERATIVE EDITS)
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - Partial revision initiated (pending successful completion, max: 1)
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - Paper title unchanged
-2026-03-01 01:34:36.390 - backend.compiler.core.compiler_coordinator - INFO - Starting iterative edit loop...
-2026-03-01 01:34:36.407 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 01:34:59.973 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 01:34:59.973 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified that Section VIII.C was missing the required subsection on covariance-based p...
-2026-03-01 01:34:59.989 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 01:35:13.690 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit addresses Critique #1, which identified the omission of the required subsection VIII.C.3 on 'Covariance-based parametric uncertainty propagat...
-2026-03-01 01:35:13.690 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 01:35:13.690 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 01:35:39.124 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 01:35:39.124 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified that Section VIII.C was missing the required subsection on covariance-based p...
-2026-03-01 01:35:39.124 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 01:35:52.390 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit addresses Critique #1, which identified the omission of the required subsection VIII.C.3 on covariance-based parametric uncertainty propagati...
-2026-03-01 01:35:52.390 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 01:35:52.390 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 01:36:14.990 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 01:36:14.990 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified that Section VIII.C was missing the detailed mathematical formulation for cov...
-2026-03-01 01:36:14.990 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 01:36:25.308 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit directly addresses Critique #1 by expanding Section VIII.C to include the required mathematical formulation for covariance-based parametric u...
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - ERROR - Max consecutive failures (3) reached - stopping iterative loop
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - Iterative edit loop complete: 0 successful, 3 failed
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - Ending critique phase (rewrite=False)
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete - transitioning to CONCLUSION phase
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - Title unchanged - continuing to conclusion
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - PARTIAL REVISION COMPLETE - Continuing to CONCLUSION
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 01:36:25.308 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (19213 words)
-2026-03-01 01:36:25.342 - backend.compiler.core.compiler_coordinator - INFO - Skipping outline update - body construction complete
-2026-03-01 01:36:25.342 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 01:36:25.342 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:36:25.348 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=158746 chars
-2026-03-01 01:36:25.349 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 158746 chars → 158673 chars (markers removed)
-2026-03-01 01:36:25.349 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 01:36:25.350 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 192671 chars
-2026-03-01 01:36:25.376 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_020)...
-2026-03-01 01:36:27.059 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: body → conclusion
-2026-03-01 01:36:47.975 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 931 chars
-2026-03-01 01:36:47.975 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:36:47.975 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:36:47.975 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: c8bdf363-d426-4c81-950c-a385d6e8d8ab (miniscule=False)
-2026-03-01 01:36:47.992 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: c8bdf363-d426-4c81-950c-a385d6e8d8ab
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\big'...
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=226 | first20='\\mathbb{E}\\bigl[(\\wi' | last20='statistical error}}.'
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=158746 | double_spaces=20 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - WARNING - BACKSLASH_NORMALIZED_MATCH: Exact/hyphen/whitespace match failed but found unique backslash-normalized match at pos 51259. This indicates a model over-escaping quirk.
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - WARNING -   Model provided (normalized): '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr)'...
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - WARNING -   Document actual: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr'...
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - INFO - Unicode hyphen normalization applied - updating old_string to actual document text
-2026-03-01 01:36:48.009 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 51259
-2026-03-01 01:36:48.042 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_024)...
-2026-03-01 01:36:55.575 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=True, rigor=True, placement=False)
-2026-03-01 01:36:55.575 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-03-01 01:36:55.575 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-03-01 01:36:55.575 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 01:36:55.575 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:36:55.592 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=158746 chars
-2026-03-01 01:36:55.592 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 158746 chars → 158673 chars (markers removed)
-2026-03-01 01:36:55.592 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 01:36:55.592 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 194996 chars
-2026-03-01 01:36:55.625 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_021)...
-2026-03-01 01:37:14.342 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1037 chars
-2026-03-01 01:37:14.342 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:37:14.356 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:37:14.357 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 99746d50-3623-4e54-8d93-21c45c972b9f (miniscule=False)
-2026-03-01 01:37:14.358 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 99746d50-3623-4e54-8d93-21c45c972b9f
-2026-03-01 01:37:14.375 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 01:37:14.375 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\big'...
-2026-03-01 01:37:14.375 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-03-01 01:37:14.375 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=226 | first20='\\mathbb{E}\\bigl[(\\wi' | last20='statistical error}}.'
-2026-03-01 01:37:14.375 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=158746 | double_spaces=20 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-03-01 01:37:14.392 - backend.compiler.validation.compiler_validator - WARNING - BACKSLASH_NORMALIZED_MATCH: Exact/hyphen/whitespace match failed but found unique backslash-normalized match at pos 51259. This indicates a model over-escaping quirk.
-2026-03-01 01:37:14.392 - backend.compiler.validation.compiler_validator - WARNING -   Model provided (normalized): '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr)'...
-2026-03-01 01:37:14.392 - backend.compiler.validation.compiler_validator - WARNING -   Document actual: '\\mathbb{E}\\bigl[(\\widehat R_{\\mathrm{ML}}-R_*)^2\\bigr]\n= \\\\underbrace{\\bigl(\\mathbb{E}[Y_L]-R_*\\bigr'...
-2026-03-01 01:37:14.392 - backend.compiler.validation.compiler_validator - INFO - Unicode hyphen normalization applied - updating old_string to actual document text
-2026-03-01 01:37:14.392 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 51259
-2026-03-01 01:37:14.408 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_025)...
-2026-03-01 01:37:22.042 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=True, rigor=True, placement=True)
-2026-03-01 01:37:22.042 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-03-01 01:37:22.042 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-03-01 01:37:22.042 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-03-01 01:37:22.057 - backend.compiler.core.compiler_coordinator - INFO - Skipping rigor loop - body construction complete
-2026-03-01 01:37:22.057 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-03-01 01:37:22.058 - backend.compiler.memory.paper_memory - INFO - Placeholders check: All sections either have placeholders or actual content
-2026-03-01 01:37:22.058 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=conclusion)
-2026-03-01 01:37:22.058 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:37:22.058 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=158746 chars
-2026-03-01 01:37:22.058 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 158746 chars → 158673 chars (markers removed)
-2026-03-01 01:37:22.058 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 01:37:22.058 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 01:38:39.875 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 77.82s (coverage=0.92, tokens=6663)
-2026-03-01 01:38:39.875 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 56434 chars retrieved
-2026-03-01 01:38:39.875 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: conclusion...
-2026-03-01 01:38:39.875 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 257554 chars
-2026-03-01 01:38:39.909 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_022)...
-2026-03-01 01:39:12.459 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 8833 chars
-2026-03-01 01:39:12.459 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:39:12.474 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:39:12.475 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 8a93fe68-0bb1-4efe-bdb7-c0ab40e0e294 (section_complete=True)
-2026-03-01 01:39:12.490 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 8a93fe68-0bb1-4efe-bdb7-c0ab40e0e294
-2026-03-01 01:39:12.506 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 01:39:12.506 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLET'...
-2026-03-01 01:39:12.507 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 158571
-2026-03-01 01:39:12.525 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_026)...
-2026-03-01 01:39:19.408 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 01:39:19.425 - backend.compiler.memory.paper_memory - INFO - Placeholder replaced (version 96)
-2026-03-01 01:39:19.794 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 01:39:19.842 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 525 total chunks
-2026-03-01 01:39:26.255 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 01:39:26.256 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 01:39:26.257 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 01:39:26.273 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=conclusion, paper_words=20226
-2026-03-01 01:39:26.273 - backend.compiler.core.compiler_coordinator - INFO - Phase transition: conclusion → introduction (explicit section_complete)
-2026-03-01 01:39:26.273 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (20226 words)
-2026-03-01 01:39:26.291 - backend.compiler.memory.paper_memory - INFO - Placeholders check: All sections either have placeholders or actual content
-2026-03-01 01:39:26.291 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=introduction)
-2026-03-01 01:39:26.291 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:39:26.297 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=167100 chars
-2026-03-01 01:39:26.297 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 167100 chars → 167027 chars (markers removed)
-2026-03-01 01:39:26.297 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 01:39:26.297 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 01:40:28.025 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 61.73s (coverage=0.93, tokens=6346)
-2026-03-01 01:40:28.025 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 54901 chars retrieved
-2026-03-01 01:40:28.025 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: introduction...
-2026-03-01 01:40:28.040 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 264878 chars
-2026-03-01 01:40:28.074 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_023)...
-2026-03-01 01:40:28.092 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: conclusion → introduction
-2026-03-01 01:40:55.423 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 8811 chars
-2026-03-01 01:40:55.424 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:40:55.425 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:40:55.425 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: cfe8dc25-4cf7-4880-93af-ced7e9de32fe (section_complete=True)
-2026-03-01 01:40:55.440 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: cfe8dc25-4cf7-4880-93af-ced7e9de32fe
-2026-03-01 01:40:55.457 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 01:40:55.457 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS COM'...
-2026-03-01 01:40:55.458 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 102
-2026-03-01 01:40:55.475 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_027)...
-2026-03-01 01:41:07.675 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 01:41:07.689 - backend.compiler.memory.paper_memory - INFO - Placeholder replaced (version 97)
-2026-03-01 01:41:08.092 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 01:41:08.139 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 554 total chunks
-2026-03-01 01:41:15.007 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 01:41:15.007 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 01:41:15.023 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 01:41:15.057 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=introduction, paper_words=21233
-2026-03-01 01:41:15.057 - backend.compiler.core.compiler_coordinator - INFO - Phase transition: introduction → abstract (explicit section_complete)
-2026-03-01 01:41:15.057 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (21233 words)
-2026-03-01 01:41:15.073 - backend.compiler.memory.paper_memory - INFO - Placeholders check: All sections either have placeholders or actual content
-2026-03-01 01:41:15.073 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=abstract)
-2026-03-01 01:41:15.073 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 01:41:15.090 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=16411 chars, paper=175328 chars
-2026-03-01 01:41:15.090 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 175328 chars → 175255 chars (markers removed)
-2026-03-01 01:41:15.090 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 01:41:15.090 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=663
-2026-03-01 01:42:16.140 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 61.05s (coverage=0.93, tokens=6183)
-2026-03-01 01:42:16.140 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 53045 chars retrieved
-2026-03-01 01:42:16.140 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: abstract...
-2026-03-01 01:42:16.140 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 270893 chars
-2026-03-01 01:42:16.173 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_024)...
-2026-03-01 01:42:16.207 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: introduction → abstract
-2026-03-01 01:42:30.373 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 2492 chars
-2026-03-01 01:42:30.373 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 01:42:30.373 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 01:42:30.373 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 09b50546-148b-4c5e-b91c-ca918016dded (section_complete=True)
-2026-03-01 01:42:30.390 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 09b50546-148b-4c5e-b91c-ca918016dded
-2026-03-01 01:42:30.407 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 01:42:30.407 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]'
-2026-03-01 01:42:30.407 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 0
-2026-03-01 01:42:30.440 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_028)...
-2026-03-01 01:42:40.323 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 01:42:40.338 - backend.compiler.memory.paper_memory - INFO - Placeholder replaced (version 98)
-2026-03-01 01:42:40.742 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 01:42:40.773 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 560 total chunks
-2026-03-01 01:42:40.798 - backend.autonomous.core.autonomous_coordinator - INFO - Abstract detected - paper compilation complete
-2026-03-01 01:42:40.798 - backend.compiler.core.compiler_coordinator - INFO - Stopping compiler...
-2026-03-01 01:42:40.798 - backend.compiler.core.compiler_coordinator - INFO - Compiler workflow cancelled
-2026-03-01 01:42:40.807 - backend.compiler.core.compiler_coordinator - INFO - Aggregator monitoring stopped
-2026-03-01 01:42:40.807 - backend.compiler.core.compiler_coordinator - INFO - Compiler stopped
-2026-03-01 01:42:40.823 - backend.autonomous.core.autonomous_coordinator - INFO - Paper paper_008: tracked 1 models, 4 API calls, 0 Wolfram calls
-2026-03-01 01:42:40.823 - backend.autonomous.core.autonomous_coordinator - INFO - Added author attribution and model credits to paper
-2026-03-01 01:42:40.842 - backend.autonomous.memory.paper_library - INFO - Paper saved: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_008.txt
-2026-03-01 01:42:40.842 - backend.autonomous.memory.paper_library - INFO - Outline saved: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_008_outline.txt
-2026-03-01 01:42:40.842 - backend.autonomous.memory.paper_library - INFO - Abstract saved: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_008_abstract.txt
-2026-03-01 01:42:40.857 - backend.autonomous.memory.paper_library - INFO - Saved paper paper_008: 'Certified 3D Neutron Transport for Stellarator Blankets: Adjoint Sensitivity and Multilevel Uncertainty Quantification' (21625 words, 1 models tracked)
-2026-03-01 01:42:40.857 - backend.autonomous.core.autonomous_coordinator - INFO - Auto-generating critique for paper paper_008: Certified 3D Neutron Transport for Stellarator Blankets: Adjoint Sensitivity and Multilevel Uncertainty Quantification
-2026-03-01 01:42:40.857 - backend.autonomous.core.autonomous_coordinator - INFO - Paper completed: paper_008 (21625 words)
-2026-03-01 01:42:40.890 - backend.shared.api_client_manager - INFO - Configured role 'paper_critic': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 01:42:40.928 - backend.autonomous.core.autonomous_coordinator - INFO - Tier 3 trigger: Attempting final answer generation
-2026-03-01 01:42:40.928 - backend.autonomous.core.autonomous_coordinator - INFO - ============================================================
-2026-03-01 01:42:40.928 - backend.autonomous.core.autonomous_coordinator - INFO - TIER 3: FINAL ANSWER GENERATION STARTED
-2026-03-01 01:42:40.928 - backend.autonomous.core.autonomous_coordinator - INFO - ============================================================
-2026-03-01 01:42:40.957 - backend.autonomous.memory.final_answer_memory - INFO - Tier 3 Final Answer activated
-2026-03-01 01:42:40.957 - backend.autonomous.memory.final_answer_memory - INFO - Tier 3 status: phase1_assessment
-2026-03-01 01:42:40.973 - backend.autonomous.memory.final_answer_memory - INFO - Model usage tracking initialized for Tier 3
-2026-03-01 01:42:40.973 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-03-01 01:42:40.973 - backend.autonomous.core.autonomous_coordinator - INFO - Tier 3: Model tracking enabled (global + per-paper)
-2026-03-01 01:42:41.056 - backend.autonomous.core.autonomous_coordinator - INFO - Tier 3 Phase 1: Assessing certainty
-2026-03-01 01:42:41.056 - backend.autonomous.memory.final_answer_memory - INFO - Tier 3 status: phase1_assessment
-2026-03-01 01:42:41.056 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Starting assessment with 7 papers
-2026-03-01 01:42:41.079 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Requesting paper expansion (task_id=auto_ca_000)
-2026-03-01 01:42:52.173 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Requested expansion of 7 papers
-2026-03-01 01:42:52.223 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 1/10
-2026-03-01 01:42:52.356 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_001)
-2026-03-01 01:42:55.273 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 1)
-2026-03-01 01:42:55.273 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 2/10
-2026-03-01 01:42:55.422 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_002)
-2026-03-01 01:42:58.456 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 2)
-2026-03-01 01:42:58.456 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 3/10
-2026-03-01 01:42:58.607 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_003)
-2026-03-01 01:43:01.559 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 3)
-2026-03-01 01:43:01.559 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 4/10
-2026-03-01 01:43:01.690 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_004)
-2026-03-01 01:43:03.240 - backend.shared.critique_memory - INFO - Saved critique 64777fc3-dd27-4f96-847f-2c6bd91299df for autonomous_paper paper_id=paper_008 at backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_008_critiques.json
-2026-03-01 01:43:03.240 - backend.autonomous.core.autonomous_coordinator - INFO - Auto-critique saved for paper paper_008: avg=7.0 (N=6, C=8, I=7)
-2026-03-01 01:43:03.240 - backend.autonomous.core.autonomous_coordinator - INFO - High-score critique notification sent for paper paper_008 (avg=7.0)
-2026-03-01 01:43:04.690 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 4)
-2026-03-01 01:43:04.690 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 5/10
-2026-03-01 01:43:04.823 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_005)
-2026-03-01 01:43:08.057 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 5)
-2026-03-01 01:43:08.057 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 6/10
-2026-03-01 01:43:08.207 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_006)
-2026-03-01 01:43:11.790 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 6)
-2026-03-01 01:43:11.790 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 7/10
-2026-03-01 01:43:11.923 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_007)
-2026-03-01 01:43:14.790 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 7)
-2026-03-01 01:43:14.790 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 8/10
-2026-03-01 01:43:14.923 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_008)
-2026-03-01 01:43:18.057 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 8)
-2026-03-01 01:43:18.057 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 9/10
-2026-03-01 01:43:18.190 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_009)
-2026-03-01 01:43:20.988 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 9)
-2026-03-01 01:43:20.988 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Assessment attempt 10/10
-2026-03-01 01:43:21.123 - backend.autonomous.agents.final_answer.certainty_assessor - INFO - CertaintyAssessor: Generating assessment (prompt=279275t, task_id=auto_ca_010)
-2026-03-01 01:43:24.223 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed to generate assessment (attempt 10)
-2026-03-01 01:43:24.223 - backend.autonomous.agents.final_answer.certainty_assessor - ERROR - CertaintyAssessor: Failed after 10 attempts
-2026-03-01 01:43:24.223 - backend.autonomous.core.autonomous_coordinator - ERROR - Tier 3: Certainty assessment failed
-2026-03-01 01:43:24.223 - backend.autonomous.memory.final_answer_memory - INFO - Tier 3 Final Answer deactivated
-2026-03-01 01:43:24.223 - backend.shared.api_client_manager - INFO - Model tracking callback cleared
-2026-03-01 01:43:24.223 - backend.autonomous.core.autonomous_coordinator - INFO - Tier 3: Model tracking disabled
-2026-03-01 01:43:24.238 - backend.autonomous.core.autonomous_coordinator - INFO - Tier 3: More research needed, returning to topic selection
-2026-03-01 01:43:24.238 - backend.autonomous.core.autonomous_coordinator - INFO - Paper complete, returning to topic selection
-2026-03-01 01:43:24.238 - backend.autonomous.core.autonomous_coordinator - INFO - Topic selection attempt 1/3
-2026-03-01 01:43:24.357 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generating topic selection with model openai/gpt-5.2 (prompt=4447t, task_id=auto_ts_122)
-2026-03-01 01:43:45.656 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generated submission - action=new_topic
-2026-03-01 01:43:45.673 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Validating topic selection with model x-ai/grok-4.1-fast (prompt=4705t, task_id=auto_tv_005)
-2026-03-01 01:43:57.574 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Decision=accept
-2026-03-01 01:43:57.590 - backend.autonomous.memory.brainstorm_memory - INFO - Created new brainstorm: topic_008
-2026-03-01 01:43:57.590 - backend.autonomous.core.autonomous_coordinator - INFO - Created new brainstorm: topic_008
-2026-03-01 01:43:57.656 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Starting selection (max 6 papers, 7 available, 0 already selected)
-2026-03-01 01:43:57.674 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector: Requesting expansion with model openai/gpt-5.2 (prompt=27111t, task_id=auto_rs_014)
-2026-03-01 01:44:08.257 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Direct injection for 3 papers (117284 tokens <= 128000 budget)
-2026-03-01 01:44:08.323 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Making final selection with model openai/gpt-5.2 (prompt=130597t, max=6 papers, task_id=auto_rs_015)
-2026-03-01 01:44:22.072 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [initial]: Selected 3 reference papers
-2026-03-01 01:44:22.072 - backend.autonomous.core.autonomous_coordinator - INFO - Pre-brainstorm reference selection: selected 3 papers
-2026-03-01 01:44:22.073 - backend.autonomous.core.autonomous_coordinator - INFO - Selected 3 reference papers for brainstorm
-2026-03-01 01:44:22.073 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-03-01 01:44:22.073 - backend.autonomous.core.autonomous_coordinator - INFO - Per-paper model tracking enabled for brainstorm topic_008
-2026-03-01 01:44:22.073 - backend.aggregator.memory.shared_training - INFO - Reloaded 0 insights from backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\brainstorms\brainstorm_topic_008.txt (submission count: 0)
-2026-03-01 01:44:22.073 - backend.autonomous.core.autonomous_coordinator - INFO - Reloaded 0 existing submissions from brainstorm database
-2026-03-01 01:44:22.073 - backend.autonomous.core.autonomous_coordinator - INFO - Loading 3 reference papers for brainstorm aggregation
-2026-03-01 01:44:22.073 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
-2026-03-01 01:44:22.073 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 400000, Validator: 2000000
-2026-03-01 01:44:22.073 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 3 submitters with models ['openai/gpt-5.2', 'moonshotai/kimi-k2.5', 'x-ai/grok-4.1-fast'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
-2026-03-01 01:44:22.740 - backend.aggregator.core.coordinator - INFO - Currently loaded models: ['text-embedding-nomic-embed-text-v1.5']
-2026-03-01 01:44:22.740 - backend.aggregator.core.coordinator - INFO - Context window configuration:
-  - Submitter 1: 400000 tokens (model: openai/gpt-5.2)
-  - Submitter 2: 262000 tokens (model: moonshotai/kimi-k2.5)
-  - Submitter 3: 2000000 tokens (model: x-ai/grok-4.1-fast)
-  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
-2026-03-01 01:44:22.740 - backend.aggregator.memory.shared_training - INFO - Loaded 0 existing insights from shared training (submission count: 0)
-2026-03-01 01:44:22.740 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
-2026-03-01 01:44:22.756 - backend.aggregator.memory.event_log - INFO - Loaded 1740 events from event log
-2026-03-01 01:44:22.873 - backend.aggregator.ingestion.pipeline - INFO - Ingested paper_paper_007.txt: 2024 total chunks
-2026-03-01 01:44:49.840 - backend.aggregator.core.rag_manager - INFO - Added document: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_007.txt
-2026-03-01 01:44:49.840 - backend.aggregator.core.coordinator - INFO - Loaded user file: paper_paper_007.txt
-2026-03-01 01:44:49.973 - backend.aggregator.ingestion.pipeline - INFO - Ingested paper_paper_008.txt: 2076 total chunks
-2026-03-01 01:45:17.807 - backend.aggregator.core.rag_manager - INFO - Added document: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_008.txt
-2026-03-01 01:45:17.823 - backend.aggregator.core.coordinator - INFO - Loaded user file: paper_paper_008.txt
-2026-03-01 01:45:17.923 - backend.aggregator.ingestion.pipeline - INFO - Ingested paper_paper_005.txt: 1313 total chunks
-2026-03-01 01:45:35.273 - backend.aggregator.core.rag_manager - INFO - Added document: backend\data\auto_sessions\deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21\papers\paper_paper_005.txt
-2026-03-01 01:45:35.273 - backend.aggregator.core.coordinator - INFO - Loaded user file: paper_paper_005.txt
-2026-03-01 01:45:35.273 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 1
-2026-03-01 01:45:35.273 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model openai/gpt-5.2
-2026-03-01 01:45:35.273 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 01:45:35.273 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=openai/gpt-5.2, provider=openrouter, context=400000
-2026-03-01 01:45:35.288 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 2
-2026-03-01 01:45:35.288 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model moonshotai/kimi-k2.5
-2026-03-01 01:45:35.288 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=moonshotai/kimi-k2.5 via Groq
-2026-03-01 01:45:35.288 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=moonshotai/kimi-k2.5, provider=openrouter, context=262000
-2026-03-01 01:45:35.290 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 3
-2026-03-01 01:45:35.290 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model x-ai/grok-4.1-fast
-2026-03-01 01:45:35.290 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=x-ai/grok-4.1-fast via Google
-2026-03-01 01:45:35.290 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=x-ai/grok-4.1-fast, provider=openrouter, context=2000000
-2026-03-01 01:45:35.290 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
-2026-03-01 01:45:35.290 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 01:45:35.290 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
-2026-03-01 01:45:35.290 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 3 submitters
-2026-03-01 01:45:35.290 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
-2026-03-01 01:45:35.290 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
-2026-03-01 01:45:35.290 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
-2026-03-01 01:45:35.290 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
-2026-03-01 01:45:35.290 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
-2026-03-01 01:45:35.290 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
-2026-03-01 01:45:35.290 - backend.autonomous.core.autonomous_coordinator - INFO - Aggregator started for brainstorm topic_008
-2026-03-01 01:45:35.290 - backend.autonomous.core.autonomous_coordinator - INFO - Resuming brainstorm with 0 acceptances, 24 rejections from workflow state
-2026-03-01 01:45:35.290 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
-2026-03-01 01:45:35.423 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
-2026-03-01 01:45:35.556 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
-2026-03-01 01:45:35.690 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
-2026-03-01 01:45:35.690 - backend.aggregator.core.coordinator - INFO - Validator iteration 1 - batch validating 3 submissions: ['2b37b8b9-cd37-4e70-9c67-7cd0972f758a', '13f24f57-f266-4726-b2bd-aa8aa5a5e5bc', '5e55e5a0-b528-4795-8a85-b201d55b20d8']
-2026-03-01 01:45:35.690 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 01:45:35.690 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 01:46:12.123 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 63d3f1e1-5eba-4bc7-b6e5-b3d667f4c9a1 (iteration 1)
-2026-03-01 01:46:25.773 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 01:46:25.790 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
-2026-03-01 01:46:25.790 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 01:46:25.790 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 1)
-2026-03-01 01:46:25.790 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 1)
-2026-03-01 01:46:25.790 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 01:46:25.790 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 01:46:25.790 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 01:46:25.790 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 20 total chunks
-2026-03-01 01:46:25.839 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
-2026-03-01 01:46:25.840 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 01:46:25.840 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 01:46:25.840 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
-2026-03-01 01:46:25.842 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 2)
-2026-03-01 01:46:25.845 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 01:46:25.845 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 01:46:25.845 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 01:46:25.845 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 01:46:25.845 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 41 total chunks
-2026-03-01 01:46:25.875 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
-2026-03-01 01:46:25.875 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 01:46:25.875 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 01:46:25.875 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 2)
-2026-03-01 01:46:25.875 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 3)
-2026-03-01 01:46:25.890 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 01:46:25.892 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 01:46:25.892 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 01:46:25.892 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 01:46:25.892 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 36 total chunks
-2026-03-01 01:46:25.923 - backend.aggregator.core.coordinator - INFO - Validator iteration 2 - batch validating 1 submissions: ['63d3f1e1-5eba-4bc7-b6e5-b3d667f4c9a1']
-2026-03-01 01:46:27.091 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 01:46:27.091 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 01:46:50.140 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 80b79f83-eab3-496c-a5c6-c66f8114e5c2 (iteration 1)
-2026-03-01 01:46:55.756 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 85c68cbd-abc8-4421-b641-2bcf98bb49f9 (iteration 2)
-2026-03-01 01:47:05.529 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
-2026-03-01 01:47:05.529 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 01:47:05.529 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 3)
-2026-03-01 01:47:05.529 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 4)
-2026-03-01 01:47:05.529 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 01:47:05.529 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 01:47:05.529 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 01:47:05.529 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 5 total chunks
-2026-03-01 01:47:05.557 - backend.aggregator.core.coordinator - INFO - Validator iteration 3 - batch validating 2 submissions: ['80b79f83-eab3-496c-a5c6-c66f8114e5c2', '85c68cbd-abc8-4421-b641-2bcf98bb49f9']
-2026-03-01 01:47:05.557 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 2 submissions
-2026-03-01 01:47:05.557 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 2 submissions
-2026-03-01 01:47:05.806 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 01:47:05.806 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-03-01 01:47:24.923 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 45efa201-d5f8-4b78-a5f7-c75c03bbe0bd (iteration 3)
-2026-03-01 01:47:39.390 - backend.aggregator.agents.validator - INFO - Batch validation complete: 2/2 accepted
-2026-03-01 01:47:39.406 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
-2026-03-01 01:47:39.406 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 01:47:39.406 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 2)
-2026-03-01 01:47:39.406 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 5)
-2026-03-01 01:47:39.406 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 01:47:39.406 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 01:47:39.406 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 01:47:39.406 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 47 total chunks
-2026-03-01 01:47:39.456 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #6
-2026-03-01 01:47:39.456 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 01:47:39.456 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 01:47:39.456 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 4)
-2026-03-01 01:47:39.459 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 6)
-2026-03-01 01:47:39.461 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 01:47:39.461 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 01:47:39.461 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 01:47:39.461 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 01:47:39.461 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 40 total chunks
-2026-03-01 01:47:39.490 - backend.aggregator.core.coordinator - INFO - Validator iteration 4 - batch validating 1 submissions: ['45efa201-d5f8-4b78-a5f7-c75c03bbe0bd']
-2026-03-01 01:47:40.459 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 01:47:40.459 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=512
-2026-03-01 01:47:43.755 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 9a5c6904-4da3-46bd-8d7f-a0479bd0f6f9 (iteration 1)
-2026-03-01 01:47:57.856 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 290b0bd7-6503-4bdf-b945-e2476df0933c (iteration 4)
-2026-03-01 01:48:05.072 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 2e1abde5-e890-4e7b-9f0d-3ad03d225b97 (iteration 2)
-2026-03-01 01:48:07.173 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #7
-2026-03-01 01:48:07.173 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 01:48:07.179 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 5)
-2026-03-01 01:48:07.179 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 7)
-2026-03-01 01:48:07.179 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 01:48:07.323 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 01:48:07.323 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 01:48:07.323 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 8 total chunks
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #1
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=7 (every 7 acceptances)
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 7 % 7 == 0
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=0, removals_executed=0
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #1 (triggered at 7 acceptances)
-2026-03-01 01:48:07.340 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 01:48:07.340 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 01:48:07.340 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 01:48:07.340 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 01:48:07.348 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 7 submissions
-2026-03-01 01:48:07.348 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 41554 chars
-2026-03-01 01:48:07.357 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (12135 tokens)
-2026-03-01 01:48:07.407 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 01:48:07.407 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 01:48:07.407 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: User files context length: 463501 chars
-2026-03-01 01:48:07.407 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 512898 chars
-2026-03-01 01:48:07.480 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 131109, Max allowed: 1969500
-2026-03-01 01:48:07.480 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 01:48:07.480 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 01:48:07.480 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 7 submissions
-2026-03-01 01:48:07.480 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_004
-2026-03-01 01:48:07.573 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 01:48:07.573 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
-2026-03-01 01:48:23.390 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 94913303-c721-4e90-8f23-a22d8f4f4409 (iteration 5)
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1057 chars
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions contribute unique value to the stellarator safety blueprint. #1 provides schedule-reliability composition with tail bounds and test allocation, non-redundant with PRA. #2 offers hybrid supermartingale safety certificates for transients, distinct from PRA. #3 delivers certified multi-fidelity MLMC UQ speedup. #4 introduces Cantelli-Union PRA with martingale source-terms and epistemic bounds. #5 uniquely advances source-term/confinement via positive-system LP certificates. #6 and #7 both use scenario-optimized PRA but #6 emphasizes ET/FT feasibility certificates tied to UGF/RAMI, while #7 focuses on BEPU interval enclosures and Gamma/InvGamma MTTR integration with ranked tests—complementary perspectives on PRA diversity without full redundancy or contradiction. No submission is fully covered/superseded; each adds specific theorems, code hooks, and falsifiable tests aligning with blueprint tasks (ii),
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions contribute unique value to the stellarator safety blueprint. #1 provides schedule-reliability composition with tail bounds and test allocation, non-redundant with PRA. #2 offers hybrid supermartingale safety certificates for transients, distinct from PRA. #3 delivers certified multi-fidelity MLMC UQ speedup. #4 introduces Cantelli-Union PRA with martingale source-terms and epistemic bounds. #5 uniquely advances source-term/confinement via positive-system LP certificates. #6 and #7 both use scenario-optimized PRA but #6 emphasizes ET/FT feasibility certificates tied to UGF/RAMI, while #7 focuses on BEPU interval enclosures and Gamma/InvGamma MTTR integration with ranked tests—complementary perspectives on PRA diversity without full redundancy or contradiction. No submission is fully covered/superseded; each adds specific theorems, code hooks, and falsifiable tests aligning with blueprint tasks (ii),(iii),(v),(vii). Database quality maintained with all.'}
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions contribute unique value to the stellarator safety blueprint. #1 provides schedule-reliability composition with tail bounds and test allocation, non-redundant with PRA. #2 offers hybrid supermartingale safety certificates for transients, distinct from PRA. #3 delivers certified multi-
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions contribute unique value to the stellarator safety blueprint. #1 provides schedule-reliability composition with tail bounds and test allocation, non-redundant with PRA. #2 offers hybrid
-2026-03-01 01:48:41.740 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 01:48:41.740 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 01:48:41.740 - backend.aggregator.core.coordinator - INFO - Cleanup review #1: No removal needed
-2026-03-01 01:48:41.740 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 01:48:41.740 - backend.aggregator.core.coordinator - INFO - Validator iteration 5 - batch validating 3 submissions: ['9a5c6904-4da3-46bd-8d7f-a0479bd0f6f9', '290b0bd7-6503-4bdf-b945-e2476df0933c', '2e1abde5-e890-4e7b-9f0d-3ad03d225b97']
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 01:48:41.740 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 01:48:52.673 - backend.autonomous.core.autonomous_coordinator - INFO - Stopping AutonomousCoordinator...
-2026-03-01 01:48:52.673 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
-2026-03-01 01:48:52.673 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
-2026-03-01 01:48:52.690 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
-2026-03-01 01:48:52.708 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
-2026-03-01 01:48:52.728 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 5
-2026-03-01 01:48:52.729 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 5 iterations - is_running=False
-2026-03-01 01:48:52.730 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
-2026-03-01 01:48:52.730 - backend.autonomous.core.autonomous_coordinator - INFO - Stopped brainstorm aggregator
-2026-03-01 01:48:52.730 - backend.autonomous.core.autonomous_coordinator - INFO - Stopped paper compiler
-2026-03-01 01:48:52.730 - backend.shared.api_client_manager - INFO - Autonomous API logger callback cleared
-2026-03-01 01:48:52.730 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous API logging disabled
-2026-03-01 01:48:52.733 - backend.autonomous.core.autonomous_coordinator - INFO - Workflow state saved for resume (tier=tier1_aggregation, topic=topic_008)
-2026-03-01 01:48:52.734 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous research stopped - press Start to resume from last state
-2026-03-01 01:48:53.918 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared shared_training_memory in-memory data (will reload from file when needed)
-2026-03-01 01:48:53.919 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator stopped
-2026-03-01 02:30:56.011 - backend.api.routes.websocket - INFO - WebSocket disconnected. Total connections: 0
-INFO:     connection closed
-INFO:     127.0.0.1:54105 - "WebSocket /ws" [accepted]
-2026-03-01 09:10:43.336 - backend.api.routes.websocket - INFO - WebSocket connected. Total connections: 1
-INFO:     connection open
-2026-03-01 09:11:23.373 - backend.api.routes.websocket - INFO - WebSocket disconnected. Total connections: 0
-INFO:     connection closed
-INFO:     127.0.0.1:50822 - "WebSocket /ws" [accepted]
-2026-03-01 19:17:38.919 - backend.api.routes.websocket - INFO - WebSocket connected. Total connections: 1
-INFO:     connection open
-INFO:     127.0.0.1:51185 - "WebSocket /ws" [accepted]
-2026-03-01 19:17:38.974 - backend.api.routes.websocket - INFO - WebSocket connected. Total connections: 2
-INFO:     connection open
-2026-03-01 19:17:38.978 - backend.api.routes.websocket - INFO - WebSocket disconnected. Total connections: 1
-INFO:     connection closed
-2026-03-01 19:17:39.756 - backend.shared.lm_studio_client - WARNING - 'lms ps' returned code 0
-2026-03-01 19:17:39.756 - backend.shared.lm_studio_client - INFO - LM Studio availability check: 0 models loaded
-2026-03-01 19:17:40.465 - backend.shared.lm_studio_client - WARNING - 'lms ps' returned code 0
-2026-03-01 19:17:40.466 - backend.shared.lm_studio_client - INFO - LM Studio availability check: 0 models loaded
-2026-03-01 19:17:48.128 - backend.api.routes.autonomous - INFO - Starting autonomous research data clear...
-2026-03-01 19:17:48.439 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared workflow state from session: deliver_a_complete_engineering_ready_blueprint_fo_2026-02-28_02-21
-2026-03-01 19:17:48.439 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared all session workflow states
-2026-03-01 19:17:48.439 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared brainstorms directory: backend\data\auto_brainstorms
-2026-03-01 19:17:48.439 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared papers directory: backend\data\auto_papers
-2026-03-01 19:17:48.455 - backend.autonomous.memory.research_metadata - INFO - Research metadata cleared
-2026-03-01 19:17:48.455 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared research metadata and stats
-2026-03-01 19:17:48.455 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared topic rejections file: backend\data\auto_research_topic_rejections.txt
-2026-03-01 19:17:48.455 - backend.autonomous.memory.autonomous_rejection_logs - INFO - Cleared all autonomous rejection logs
-2026-03-01 19:17:48.455 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared autonomous rejection logs
-2026-03-01 19:17:48.961 - backend.autonomous.core.autonomous_rag_manager - INFO - Resetting AutonomousRAGManager tracking state...
-2026-03-01 19:17:48.961 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager state reset
-2026-03-01 19:17:48.961 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-03-01 19:17:50.626 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-03-01 19:17:51.544 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-03-01 19:17:51.897 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-03-01 19:17:52.216 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-03-01 19:17:52.406 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-03-01 19:17:52.454 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-03-01 19:17:52.501 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-03-01 19:17:52.549 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-03-01 19:17:52.629 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-03-01 19:17:52.645 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared RAG state (ChromaDB collections)
-2026-03-01 19:17:52.645 - backend.autonomous.memory.session_manager - INFO - Session manager cleared
-2026-03-01 19:17:52.645 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared session manager state
-2026-03-01 19:17:52.645 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous research data cleared successfully (7 operations completed, 0 non-critical warnings)
-2026-03-01 19:17:52.645 - backend.api.routes.autonomous - INFO - Autonomous research data clear completed successfully
-2026-03-01 19:20:47.856 - backend.api.routes.autonomous - INFO - Starting autonomous research data clear...
-2026-03-01 19:20:48.168 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared all session workflow states
-2026-03-01 19:20:48.168 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared brainstorms directory: backend\data\auto_brainstorms
-2026-03-01 19:20:48.168 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared papers directory: backend\data\auto_papers
-2026-03-01 19:20:48.168 - backend.autonomous.memory.research_metadata - INFO - Research metadata cleared
-2026-03-01 19:20:48.168 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared research metadata and stats
-2026-03-01 19:20:48.168 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared topic rejections file: backend\data\auto_research_topic_rejections.txt
-2026-03-01 19:20:48.168 - backend.autonomous.memory.autonomous_rejection_logs - INFO - Cleared all autonomous rejection logs
-2026-03-01 19:20:48.168 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared autonomous rejection logs
-2026-03-01 19:20:48.679 - backend.autonomous.core.autonomous_rag_manager - INFO - Resetting AutonomousRAGManager tracking state...
-2026-03-01 19:20:48.680 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager state reset
-2026-03-01 19:20:48.680 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-03-01 19:20:48.680 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-03-01 19:20:48.704 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-03-01 19:20:48.711 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-03-01 19:20:48.727 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-03-01 19:20:48.882 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-03-01 19:20:48.930 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-03-01 19:20:48.977 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-03-01 19:20:49.018 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-03-01 19:20:49.018 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-03-01 19:20:49.018 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared RAG state (ChromaDB collections)
-2026-03-01 19:20:49.018 - backend.autonomous.memory.session_manager - INFO - Session manager cleared
-2026-03-01 19:20:49.018 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared session manager state
-2026-03-01 19:20:49.018 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous research data cleared successfully (7 operations completed, 0 non-critical warnings)
-2026-03-01 19:20:49.018 - backend.api.routes.autonomous - INFO - Autonomous research data clear completed successfully
-2026-03-01 19:20:53.422 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 1 (Main Submitter): model=openai/gpt-5.2, context=400000, max_tokens=80000
-2026-03-01 19:20:53.422 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 2 : model=moonshotai/kimi-k2.5, context=262000, max_tokens=68000
-2026-03-01 19:20:53.422 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 3 : model=x-ai/grok-4.1-fast, context=2000000, max_tokens=30000
-2026-03-01 19:20:53.422 - backend.api.routes.autonomous - INFO - Validator: model=x-ai/grok-4.1-fast, context=2000000, max_tokens=30000
-2026-03-01 19:20:53.422 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous coordinator initializing with 3 submitters
-2026-03-01 19:20:53.422 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 1 (Main Submitter): model=openai/gpt-5.2, context=400000
-2026-03-01 19:20:53.422 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 2 : model=moonshotai/kimi-k2.5, context=262000
-2026-03-01 19:20:53.422 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 3 : model=x-ai/grok-4.1-fast, context=2000000
-2026-03-01 19:20:53.435 - backend.autonomous.memory.session_manager - INFO - Session initialized: solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20
-2026-03-01 19:20:53.435 - backend.autonomous.memory.session_manager - INFO - Session path: backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20
-2026-03-01 19:20:53.435 - backend.autonomous.core.autonomous_coordinator - INFO - New session initialized: solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20
-2026-03-01 19:20:53.435 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory using session path: backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\brainstorms
-2026-03-01 19:20:53.435 - backend.autonomous.memory.paper_library - INFO - Paper library using session path: backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\papers
-2026-03-01 19:20:53.435 - backend.autonomous.memory.research_metadata - INFO - Research metadata using session path: backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20
-2026-03-01 19:20:53.435 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory using session path: backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\final_answer
-2026-03-01 19:20:53.435 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\brainstorms
-2026-03-01 19:20:53.435 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\papers
-2026-03-01 19:20:53.435 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'user_research_prompt' to research metadata
-2026-03-01 19:20:53.435 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'brainstorms' to research metadata
-2026-03-01 19:20:53.435 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'papers' to research metadata
-2026-03-01 19:20:53.435 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'next_topic_id' to research metadata
-2026-03-01 19:20:53.435 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'next_paper_id' to research metadata
-2026-03-01 19:20:53.435 - backend.autonomous.memory.research_metadata - INFO - User research prompt updated
-2026-03-01 19:20:53.452 - backend.autonomous.memory.research_metadata - INFO - Research metadata initialized
-2026-03-01 19:20:53.452 - backend.autonomous.memory.autonomous_rejection_logs - INFO - Autonomous rejection logs initialized
-2026-03-01 19:20:53.452 - backend.autonomous.core.autonomous_coordinator - INFO - Resetting RAG state for fresh autonomous research mode...
-2026-03-01 19:20:53.452 - backend.autonomous.core.autonomous_rag_manager - INFO - Resetting AutonomousRAGManager tracking state...
-2026-03-01 19:20:53.452 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager state reset
-2026-03-01 19:20:53.452 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-03-01 19:20:53.469 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-03-01 19:20:53.469 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-03-01 19:20:53.485 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-03-01 19:20:53.502 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-03-01 19:20:53.552 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-03-01 19:20:53.602 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-03-01 19:20:53.635 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-03-01 19:20:53.685 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-03-01 19:20:53.685 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_coordinator - INFO - RAG state reset and cleared for autonomous mode
-2026-03-01 19:20:53.685 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\brainstorms
-2026-03-01 19:20:53.685 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\papers
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager initialized
-2026-03-01 19:20:53.685 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory initialized at backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\final_answer
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_selector': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_completion_reviewer': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_reference_selector': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_title_selector': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_redundancy_checker': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_certainty_assessor': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_format_selector': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_volume_organizer': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_coordinator - INFO - Configured Tier 3 Final Answer agents with api_client_manager
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_coordinator - INFO - No interrupted workflow found - checking for incomplete papers
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator initialized
-2026-03-01 19:20:53.685 - backend.shared.api_client_manager - INFO - Autonomous API logger callback set
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous API logging enabled
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator started
-2026-03-01 19:20:53.685 - backend.autonomous.core.autonomous_coordinator - INFO - Topic selection attempt 1/3
-2026-03-01 19:20:53.685 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generating topic selection with model openai/gpt-5.2 (prompt=1331t, task_id=auto_ts_000)
-2026-03-01 19:21:01.885 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generated submission - action=new_topic
-2026-03-01 19:21:01.885 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Validating topic selection with model x-ai/grok-4.1-fast (prompt=1287t, task_id=auto_tv_000)
-2026-03-01 19:21:09.185 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Decision=accept
-2026-03-01 19:21:09.202 - backend.autonomous.memory.brainstorm_memory - INFO - Created new brainstorm: topic_001
-2026-03-01 19:21:09.218 - backend.autonomous.core.autonomous_coordinator - INFO - Created new brainstorm: topic_001
-2026-03-01 19:21:09.218 - backend.autonomous.core.autonomous_coordinator - INFO - No papers available for pre-brainstorm reference selection
-2026-03-01 19:21:09.218 - backend.autonomous.core.autonomous_coordinator - INFO - Selected 0 reference papers for brainstorm
-2026-03-01 19:21:09.235 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-03-01 19:21:09.235 - backend.autonomous.core.autonomous_coordinator - INFO - Per-paper model tracking enabled for brainstorm topic_001
-2026-03-01 19:21:09.235 - backend.aggregator.memory.shared_training - INFO - Reloaded 0 insights from backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\brainstorms\brainstorm_topic_001.txt (submission count: 0)
-2026-03-01 19:21:09.235 - backend.autonomous.core.autonomous_coordinator - INFO - Reloaded 0 existing submissions from brainstorm database
-2026-03-01 19:21:09.235 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
-2026-03-01 19:21:09.235 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 400000, Validator: 2000000
-2026-03-01 19:21:09.235 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 3 submitters with models ['openai/gpt-5.2', 'moonshotai/kimi-k2.5', 'x-ai/grok-4.1-fast'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
-2026-03-01 19:21:09.869 - backend.shared.lm_studio_client - WARNING - 'lms ps' returned code 0
-2026-03-01 19:21:09.869 - backend.aggregator.core.coordinator - INFO - Currently loaded models: []
-2026-03-01 19:21:09.869 - backend.aggregator.core.coordinator - INFO - Context window configuration:
-  - Submitter 1: 400000 tokens (model: openai/gpt-5.2)
-  - Submitter 2: 262000 tokens (model: moonshotai/kimi-k2.5)
-  - Submitter 3: 2000000 tokens (model: x-ai/grok-4.1-fast)
-  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
-2026-03-01 19:21:09.869 - backend.aggregator.memory.shared_training - INFO - Loaded 0 existing insights from shared training (submission count: 0)
-2026-03-01 19:21:09.869 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
-2026-03-01 19:21:09.885 - backend.aggregator.memory.event_log - INFO - Loaded 1747 events from event log
-2026-03-01 19:21:09.902 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 1
-2026-03-01 19:21:09.902 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model openai/gpt-5.2
-2026-03-01 19:21:09.902 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=openai/gpt-5.2, provider=openrouter, context=400000
-2026-03-01 19:21:09.902 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 2
-2026-03-01 19:21:09.902 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model moonshotai/kimi-k2.5
-2026-03-01 19:21:09.902 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=moonshotai/kimi-k2.5 via Groq
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=moonshotai/kimi-k2.5, provider=openrouter, context=262000
-2026-03-01 19:21:09.902 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 3
-2026-03-01 19:21:09.902 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model x-ai/grok-4.1-fast
-2026-03-01 19:21:09.902 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=x-ai/grok-4.1-fast via Google
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=x-ai/grok-4.1-fast, provider=openrouter, context=2000000
-2026-03-01 19:21:09.902 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
-2026-03-01 19:21:09.902 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 3 submitters
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
-2026-03-01 19:21:09.902 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
-2026-03-01 19:21:09.902 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
-2026-03-01 19:21:09.902 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
-2026-03-01 19:21:09.902 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
-2026-03-01 19:21:09.902 - backend.autonomous.core.autonomous_coordinator - INFO - Aggregator started for brainstorm topic_001
-2026-03-01 19:21:09.902 - backend.autonomous.core.autonomous_coordinator - INFO - Starting fresh brainstorm with 0 acceptances
-2026-03-01 19:21:09.902 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
-2026-03-01 19:21:09.918 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
-2026-03-01 19:21:09.918 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
-2026-03-01 19:21:09.918 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
-2026-03-01 19:21:09.918 - backend.aggregator.core.coordinator - INFO - Validator iteration 1 - batch validating 1 submissions: ['94913303-c721-4e90-8f23-a22d8f4f4409']
-2026-03-01 19:21:52.143 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 53203947-eef6-46d0-bb5e-9c061be2c4ae (iteration 1)
-2026-03-01 19:22:02.116 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission rejected (consecutive: 1)
-2026-03-01 19:22:02.116 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 3 (total: 1)
-2026-03-01 19:22:02.131 - backend.aggregator.core.coordinator - INFO - Validator iteration 2 - batch validating 1 submissions: ['53203947-eef6-46d0-bb5e-9c061be2c4ae']
-2026-03-01 19:22:16.191 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 217f70ff-4096-40fb-b5ce-827529840ebc (iteration 1)
-2026-03-01 19:22:34.897 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 7f69307d-80aa-42e7-bb8d-aa60aaeebf2d (iteration 2)
-2026-03-01 19:22:45.725 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
-2026-03-01 19:22:45.725 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:22:45.725 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 1)
-2026-03-01 19:22:45.725 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 1)
-2026-03-01 19:22:45.725 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:22:45.725 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:22:45.725 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:22:45.725 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 18 total chunks
-2026-03-01 19:22:45.741 - backend.aggregator.core.coordinator - INFO - Validator iteration 3 - batch validating 2 submissions: ['217f70ff-4096-40fb-b5ce-827529840ebc', '7f69307d-80aa-42e7-bb8d-aa60aaeebf2d']
-2026-03-01 19:22:45.741 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 2 submissions
-2026-03-01 19:22:45.741 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 2 submissions
-2026-03-01 19:22:50.615 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-03-01 19:22:50.615 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
-2026-03-01 19:23:04.507 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission f105f060-b412-444e-8291-2a70fa8b8526 (iteration 1)
-2026-03-01 19:23:15.621 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission dab53e23-b9ee-4d27-929c-579c6462f063 (iteration 3)
-2026-03-01 19:23:20.710 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission b6425e4d-f1b1-41ed-9a6b-e72c423fa281 (iteration 2)
-2026-03-01 19:23:33.915 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/2 accepted
-2026-03-01 19:23:33.915 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
-2026-03-01 19:23:33.915 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:23:33.915 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
-2026-03-01 19:23:33.915 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 2)
-2026-03-01 19:23:33.915 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:23:33.915 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:23:33.915 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:23:33.915 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 23 total chunks
-2026-03-01 19:23:33.947 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission rejected (consecutive: 1)
-2026-03-01 19:23:33.947 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 3 (total: 2)
-2026-03-01 19:23:33.947 - backend.aggregator.core.coordinator - INFO - Validator iteration 4 - batch validating 3 submissions: ['f105f060-b412-444e-8291-2a70fa8b8526', 'dab53e23-b9ee-4d27-929c-579c6462f063', 'b6425e4d-f1b1-41ed-9a6b-e72c423fa281']
-2026-03-01 19:23:33.947 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:23:33.947 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:23:34.312 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:23:34.312 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-03-01 19:24:17.062 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission f2e2d0d8-448e-49cc-9fd1-527b672251d0 (iteration 4)
-2026-03-01 19:24:28.022 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission f4ce2e47-46a6-4279-af97-9be1902bfb4a (iteration 3)
-2026-03-01 19:24:40.566 - backend.aggregator.agents.validator - INFO - Batch validation complete: 2/3 accepted
-2026-03-01 19:24:40.581 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
-2026-03-01 19:24:40.581 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:24:40.581 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 1)
-2026-03-01 19:24:40.581 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 3)
-2026-03-01 19:24:40.581 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:24:40.581 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:24:40.581 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:24:40.581 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 10 total chunks
-2026-03-01 19:24:40.597 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
-2026-03-01 19:24:40.597 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:24:40.597 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:24:40.597 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 2)
-2026-03-01 19:24:40.597 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 4)
-2026-03-01 19:24:40.613 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:24:40.613 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:24:40.613 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:24:40.613 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:24:40.615 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 14 total chunks
-2026-03-01 19:24:40.629 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission rejected (consecutive: 1)
-2026-03-01 19:24:40.629 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 1 (total: 3)
-2026-03-01 19:24:40.629 - backend.aggregator.core.coordinator - INFO - Validator iteration 5 - batch validating 2 submissions: ['f2e2d0d8-448e-49cc-9fd1-527b672251d0', 'f4ce2e47-46a6-4279-af97-9be1902bfb4a']
-2026-03-01 19:24:40.629 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 2 submissions
-2026-03-01 19:24:40.629 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 2 submissions
-2026-03-01 19:24:41.376 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:24:41.376 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=1024
-2026-03-01 19:25:10.157 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission d912c075-1f55-4c9a-8c8b-4fef07969388 (iteration 5)
-2026-03-01 19:25:24.550 - backend.aggregator.agents.validator - INFO - Batch validation complete: 2/2 accepted
-2026-03-01 19:25:24.558 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
-2026-03-01 19:25:24.558 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:25:24.558 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 3)
-2026-03-01 19:25:24.558 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 5)
-2026-03-01 19:25:24.558 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:25:24.558 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:25:24.558 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:25:24.558 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 17 total chunks
-2026-03-01 19:25:24.566 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #6
-2026-03-01 19:25:24.566 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:25:24.566 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:25:24.566 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 2)
-2026-03-01 19:25:24.582 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 6)
-2026-03-01 19:25:24.582 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:25:24.582 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:25:24.582 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:25:24.582 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:25:24.582 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 35 total chunks
-2026-03-01 19:25:24.598 - backend.aggregator.core.coordinator - INFO - Validator iteration 6 - batch validating 1 submissions: ['d912c075-1f55-4c9a-8c8b-4fef07969388']
-2026-03-01 19:25:25.186 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:25:25.186 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=512
-2026-03-01 19:25:33.845 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 3c7d7c3c-a88e-4b67-83d8-a79a8f99a872 (iteration 4)
-2026-03-01 19:25:57.585 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission f42474aa-23fc-4330-b889-d111e04b06d3 (iteration 2)
-2026-03-01 19:26:23.426 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 78b6a576-2196-453c-9514-46c14928b96c (iteration 5)
-2026-03-01 19:26:38.583 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission d9e492ef-f4fe-4b70-83ae-ad9b68b10735 (iteration 6)
-2026-03-01 19:26:45.224 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #7
-2026-03-01 19:26:45.224 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:26:45.224 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 4)
-2026-03-01 19:26:45.224 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 7)
-2026-03-01 19:26:45.224 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:26:45.224 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:26:45.224 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:26:45.224 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 9 total chunks
-2026-03-01 19:26:45.240 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #1
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=7 (every 7 acceptances)
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 7 % 7 == 0
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=0, removals_executed=0
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #1 (triggered at 7 acceptances)
-2026-03-01 19:26:45.244 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:26:45.244 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:26:45.244 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:26:45.244 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:26:45.244 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 7 submissions
-2026-03-01 19:26:45.244 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 37274 chars
-2026-03-01 19:26:45.253 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (11394 tokens)
-2026-03-01 19:26:45.253 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:26:45.253 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:26:45.253 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 43460 chars
-2026-03-01 19:26:45.260 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 12695, Max allowed: 1969500
-2026-03-01 19:26:45.260 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:26:45.260 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:26:45.260 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 7 submissions
-2026-03-01 19:26:45.260 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_006
-2026-03-01 19:26:45.594 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:26:45.594 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
-2026-03-01 19:27:18.045 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission b4e23d0d-3d5a-4260-9079-9e53fa55b488 (iteration 7)
-2026-03-01 19:27:28.547 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission b15e7351-1ec7-4373-8068-cfe07bf39d09 (iteration 6)
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1215 chars
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique value and contribute to solution diversity without redundancy, contradictions, or supersession. #1 offers foundational DRO planning for design with out-of-sample guarantees. #2 uniquely introduces robust viability/RCI sets and DRO-CVaR risk for operations. #3 provides detailed aquifer recharge dynamics, physics-based models (e.g., osmotic pressure, head-dependent losses), and storage equivalence not covered elsewhere. #4 delivers a distinct concentration inequality (Hoeffding/Azuma) for certifiable storage sizing under bounded uncertainties, a simpler complementary tool absent in advanced DRO/multistage methods. #5 specializes tube-based MPC with probabilistic ISS. #6 advances multistage time-consistent DRO-OC via DR-SDDP for temporal correlations. #7 introduces conformal prediction for adaptive, distribution-free robust MPC handling nonstationarity. No submission is fully covered by
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique value and contribute to solution diversity without redundancy, contradictions, or supersession. #1 offers foundational DRO planning for design with out-of-sample guarantees. #2 uniquely introduces robust viability/RCI sets and DRO-CVaR risk for operations. #3 provides detailed aquifer recharge dynamics, physics-based models (e.g., osmotic pressure, head-dependent losses), and storage equivalence not covered elsewhere. #4 delivers a distinct concentration inequality (Hoeffding/Azuma) for certifiable storage sizing under bounded uncertainties, a simpler complementary tool absent in advanced DRO/multistage methods. #5 specializes tube-based MPC with probabilistic ISS. #6 advances multistage time-consistent DRO-OC via DR-SDDP for temporal correlations. #7 introduces conformal prediction for adaptive, distribution-free robust MPC handling nonstationarity. No submission is fully covered by others; each offers specific theorems, techniques, or perspectives (e.g., robust vs. DRO vs. conformal), enhancing multi-objective UQ and control diversity. Conservative retention preserves high-quality variety.'}
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique value and contribute to solution diversity without redundancy, contradictions, or supersession. #1 offers foundational DRO planning for design with out-of-sample guarantees. #2 uniquely introduces robust viability/RCI sets and DRO-CVaR risk for operations. #3 provides
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique value and contribute to solution diversity without redundancy, contradictions, or supersession. #1 offers foundational DRO planning for design with out-of-sample guarant
-2026-03-01 19:27:31.213 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:27:31.213 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:27:31.213 - backend.aggregator.core.coordinator - INFO - Cleanup review #1: No removal needed
-2026-03-01 19:27:31.213 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:27:31.213 - backend.aggregator.core.coordinator - INFO - Validator iteration 7 - batch validating 3 submissions: ['3c7d7c3c-a88e-4b67-83d8-a79a8f99a872', 'f42474aa-23fc-4330-b889-d111e04b06d3', '78b6a576-2196-453c-9514-46c14928b96c']
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:27:31.213 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:28:00.562 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 65e814cc-c776-47b9-a4a5-03cffea6136d (iteration 8)
-2026-03-01 19:28:24.146 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:28:24.162 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #8
-2026-03-01 19:28:24.162 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:28:24.162 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 3)
-2026-03-01 19:28:24.162 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 8)
-2026-03-01 19:28:24.162 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:28:24.162 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:28:24.162 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:28:24.162 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 11 total chunks
-2026-03-01 19:28:24.178 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #9
-2026-03-01 19:28:24.178 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:28:24.178 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:28:24.178 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 2)
-2026-03-01 19:28:24.178 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 9)
-2026-03-01 19:28:24.178 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:28:24.178 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:28:24.178 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:28:24.178 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:28:24.194 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 50 total chunks
-2026-03-01 19:28:24.210 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #10
-2026-03-01 19:28:24.210 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:28:24.210 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:28:24.210 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 4)
-2026-03-01 19:28:24.210 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 10)
-2026-03-01 19:28:24.210 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:28:24.210 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:28:24.210 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:28:24.210 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:28:24.210 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 54 total chunks
-2026-03-01 19:28:24.230 - backend.aggregator.core.coordinator - INFO - Validator iteration 8 - batch validating 3 submissions: ['d9e492ef-f4fe-4b70-83ae-ad9b68b10735', 'b4e23d0d-3d5a-4260-9079-9e53fa55b488', 'b15e7351-1ec7-4373-8068-cfe07bf39d09']
-2026-03-01 19:28:24.230 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:28:24.230 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:28:25.429 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:28:25.429 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=512
-2026-03-01 19:28:26.177 - backend.autonomous.core.autonomous_coordinator - INFO - Running completion review at 10 acceptances
-2026-03-01 19:28:26.193 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Direct injection of brainstorm (16520 tokens <= 310000 available)
-2026-03-01 19:28:26.209 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Generating assessment with model openai/gpt-5.2 (prompt=17767t, RAG=False, task_id=auto_cr_000)
-2026-03-01 19:28:47.968 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 5b7f8d7d-9fcb-40f2-92fa-f561c8b6da7f (iteration 3)
-2026-03-01 19:28:49.170 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission d3448dd2-c5ad-426c-b494-5f73b75c8ace (iteration 7)
-2026-03-01 19:28:50.404 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 671e3f38-56e7-4734-9dd2-bb4e6e87c1da (iteration 9)
-2026-03-01 19:29:09.084 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:29:09.100 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #11
-2026-03-01 19:29:09.100 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:29:09.100 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 5)
-2026-03-01 19:29:09.100 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 11)
-2026-03-01 19:29:09.100 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:29:09.100 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:29:09.100 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:29:09.100 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 9 total chunks
-2026-03-01 19:29:09.116 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #12
-2026-03-01 19:29:09.116 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:29:09.116 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:29:09.116 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 6)
-2026-03-01 19:29:09.116 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 12)
-2026-03-01 19:29:09.116 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:29:09.116 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:29:09.116 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:29:09.116 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:29:09.116 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 13 total chunks
-2026-03-01 19:29:09.132 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #13
-2026-03-01 19:29:09.132 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:29:09.132 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:29:09.132 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 5)
-2026-03-01 19:29:09.132 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 13)
-2026-03-01 19:29:09.148 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:29:09.148 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:29:09.148 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:29:09.148 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:29:09.148 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 63 total chunks
-2026-03-01 19:29:09.164 - backend.aggregator.core.coordinator - INFO - Validator iteration 9 - batch validating 3 submissions: ['65e814cc-c776-47b9-a4a5-03cffea6136d', '5b7f8d7d-9fcb-40f2-92fa-f561c8b6da7f', 'd3448dd2-c5ad-426c-b494-5f73b75c8ace']
-2026-03-01 19:29:09.164 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:29:09.164 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:29:10.225 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-03-01 19:29:10.225 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=256
-2026-03-01 19:29:20.243 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validating with SAME model openai/gpt-5.2 (prompt=18661t, RAG=False, task_id=auto_cr_001)
-2026-03-01 19:30:08.289 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 8b2180f1-188b-4298-97bc-ea48c27fdb65 (iteration 10)
-2026-03-01 19:30:17.641 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 76a1c832-e4fc-4cbf-8193-2ea08d11a40f (iteration 8)
-2026-03-01 19:30:27.856 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation raw content (first 500 chars): {
-  "validated": true,
-  "reasoning": "The decision \"continue_brainstorm\" is accurate given the current brainstorm database. The accepted submissions heavily emphasize Wasserstein DRO, robust invariance/robust MPC, multistage time-consistent DRO (DR-SDDP), DRMDP framing, conformal prediction sets, and martingale concentration bounds, which indeed cover a substantial but not end-to-end set of mathematical pillars for the stated goal.\n\nThe identified gaps are concrete and not merely \"more cou
-2026-03-01 19:30:27.856 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation result: validated=True
-2026-03-01 19:30:27.856 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation reasoning: The decision "continue_brainstorm" is accurate given the current brainstorm database. The accepted submissions heavily emphasize Wasserstein DRO, robust invariance/robust MPC, multistage time-consistent DRO (DR-SDDP), DRMDP framing, conformal prediction sets, and martingale concentration bounds, whi...
-2026-03-01 19:30:29.156 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:30:29.173 - backend.autonomous.core.autonomous_coordinator - INFO - Completion review: CONTINUE BRAINSTORM
-2026-03-01 19:30:29.173 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #14
-2026-03-01 19:30:29.173 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:30:29.173 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 7)
-2026-03-01 19:30:29.173 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 14)
-2026-03-01 19:30:29.173 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:30:29.173 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:30:29.173 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:30:29.173 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 12 total chunks
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #2
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=14 (every 7 acceptances)
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 14 % 7 == 0
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=0, removals_executed=0
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #2 (triggered at 14 acceptances)
-2026-03-01 19:30:29.205 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:30:29.205 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:30:29.205 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:30:29.205 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:30:29.205 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 14 submissions
-2026-03-01 19:30:29.205 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 75877 chars
-2026-03-01 19:30:29.223 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (22811 tokens)
-2026-03-01 19:30:29.223 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:30:29.223 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:30:29.223 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 82063 chars
-2026-03-01 19:30:29.223 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 24112, Max allowed: 1969500
-2026-03-01 19:30:29.223 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:30:29.223 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:30:29.223 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 14 submissions
-2026-03-01 19:30:29.223 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_010
-2026-03-01 19:30:29.417 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:30:29.417 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-03-01 19:31:01.605 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission eedb68ab-b6bd-49ef-a27b-daf05bdebf55 (iteration 11)
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1002 chars
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All 14 submissions contribute unique value to the knowledge base, offering distinct mathematical frameworks, guarantees, and techniques that enhance solution diversity for the water-renewable optimization problem. Examples include: DRO planning (#1), robust viability/RCI MPC (#2), detailed aquifer/thermo dynamics (#3), Hoeffding storage sizing (#4), DR-tube MPC (#5), multistage DR-SDDP (#6), conformal robust MPC (#7), DRMDP feedback (#8), Port-Hamiltonian passivity (#9), variance-adaptive Freedman CC (#10), decentralized DRO-ADMM (#11), conformal DRO-MPC (#12), min-cut reliability (#13), and Lyapunov OCO regret (#14). No submission is fully redundant, contradicted, superseded, or lacking unique info (e.g., #4's simple bounded concentration complements #10's adaptive martingale; DRO variants differ in scope/stage/tubes/decentralization). Conservative retention preserves comprehensive coverage without quality loss."
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': "All 14 submissions contribute unique value to the knowledge base, offering distinct mathematical frameworks, guarantees, and techniques that enhance solution diversity for the water-renewable optimization problem. Examples include: DRO planning (#1), robust viability/RCI MPC (#2), detailed aquifer/thermo dynamics (#3), Hoeffding storage sizing (#4), DR-tube MPC (#5), multistage DR-SDDP (#6), conformal robust MPC (#7), DRMDP feedback (#8), Port-Hamiltonian passivity (#9), variance-adaptive Freedman CC (#10), decentralized DRO-ADMM (#11), conformal DRO-MPC (#12), min-cut reliability (#13), and Lyapunov OCO regret (#14). No submission is fully redundant, contradicted, superseded, or lacking unique info (e.g., #4's simple bounded concentration complements #10's adaptive martingale; DRO variants differ in scope/stage/tubes/decentralization). Conservative retention preserves comprehensive coverage without quality loss."}
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All 14 submissions contribute unique value to the knowledge base, offering distinct mathematical frameworks, guarantees, and techniques that enhance solution diversity for the water-renewable optimization problem. Examples include: DRO planning (#1), robust viability/RCI MPC (#2), detailed aquifer/t
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:31:14.372 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All 14 submissions contribute unique value to the knowledge base, offering distinct mathematical frameworks, guarantees, and techniques that enhance solution diversity for the water-renewable optimiza
-2026-03-01 19:31:14.372 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:31:14.372 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:31:14.372 - backend.aggregator.core.coordinator - INFO - Cleanup review #2: No removal needed
-2026-03-01 19:31:14.372 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:31:14.389 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #15
-2026-03-01 19:31:14.389 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:31:14.389 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 3)
-2026-03-01 19:31:14.389 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 15)
-2026-03-01 19:31:14.389 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:31:14.389 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:31:14.389 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:31:14.389 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 10 total chunks
-2026-03-01 19:31:14.420 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #16
-2026-03-01 19:31:14.420 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:31:14.420 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:31:14.420 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 6)
-2026-03-01 19:31:14.420 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 16)
-2026-03-01 19:31:14.420 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:31:14.420 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:31:14.420 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:31:14.420 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:31:14.420 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 20 total chunks
-2026-03-01 19:31:14.445 - backend.aggregator.core.coordinator - INFO - Validator iteration 10 - batch validating 3 submissions: ['671e3f38-56e7-4734-9dd2-bb4e6e87c1da', '8b2180f1-188b-4298-97bc-ea48c27fdb65', '76a1c832-e4fc-4cbf-8193-2ea08d11a40f']
-2026-03-01 19:31:14.445 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:31:14.445 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:31:14.928 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:31:14.928 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=1024
-2026-03-01 19:31:21.871 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission c11c9678-04f5-4324-9e88-b713d42dffd3 (iteration 9)
-2026-03-01 19:31:44.787 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission b0ecf83c-24e3-44f4-bdc4-5e529742d29c (iteration 4)
-2026-03-01 19:31:52.560 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 4964cb1e-15e5-4f72-8de3-bd3dafa5ddda (iteration 12)
-2026-03-01 19:32:15.236 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:32:15.253 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #17
-2026-03-01 19:32:15.253 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:32:15.253 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 8)
-2026-03-01 19:32:15.253 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 17)
-2026-03-01 19:32:15.253 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:32:15.253 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:32:15.253 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:32:15.253 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 21 total chunks
-2026-03-01 19:32:15.270 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #18
-2026-03-01 19:32:15.270 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:32:15.270 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:32:15.270 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 9)
-2026-03-01 19:32:15.270 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 18)
-2026-03-01 19:32:15.286 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:32:15.286 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:32:15.286 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:32:15.286 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:32:15.286 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 22 total chunks
-2026-03-01 19:32:15.302 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #19
-2026-03-01 19:32:15.302 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:32:15.302 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:32:15.302 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 7)
-2026-03-01 19:32:15.302 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 19)
-2026-03-01 19:32:15.302 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:32:15.302 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:32:15.302 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:32:15.302 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:32:15.302 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 28 total chunks
-2026-03-01 19:32:15.317 - backend.aggregator.core.coordinator - INFO - Validator iteration 11 - batch validating 3 submissions: ['eedb68ab-b6bd-49ef-a27b-daf05bdebf55', 'c11c9678-04f5-4324-9e88-b713d42dffd3', 'b0ecf83c-24e3-44f4-bdc4-5e529742d29c']
-2026-03-01 19:32:15.317 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:32:15.317 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:32:16.336 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:32:16.336 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 19:32:24.609 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission e935549e-9276-47d5-8da6-79f28129bb46 (iteration 10)
-2026-03-01 19:32:46.770 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 16b17ae4-7e58-4c59-b1a0-8ee7a58335fb (iteration 13)
-2026-03-01 19:32:59.050 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:32:59.062 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #20
-2026-03-01 19:32:59.062 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:32:59.062 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 10)
-2026-03-01 19:32:59.062 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 20)
-2026-03-01 19:32:59.062 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:32:59.062 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:32:59.062 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:32:59.062 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 6 total chunks
-2026-03-01 19:32:59.093 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #21
-2026-03-01 19:32:59.093 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:32:59.093 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:32:59.093 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 8)
-2026-03-01 19:32:59.093 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 21)
-2026-03-01 19:32:59.093 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:32:59.093 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:32:59.093 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:32:59.093 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:32:59.093 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 54 total chunks
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #3
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=21 (every 7 acceptances)
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 21 % 7 == 0
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=0, removals_executed=0
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #3 (triggered at 21 acceptances)
-2026-03-01 19:32:59.109 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:32:59.109 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:32:59.109 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:32:59.109 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:32:59.109 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 21 submissions
-2026-03-01 19:32:59.109 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 116160 chars
-2026-03-01 19:32:59.125 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (34625 tokens)
-2026-03-01 19:32:59.125 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:32:59.125 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:32:59.125 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 122346 chars
-2026-03-01 19:32:59.156 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 35926, Max allowed: 1969500
-2026-03-01 19:32:59.156 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:32:59.156 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:32:59.156 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 21 submissions
-2026-03-01 19:32:59.156 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_013
-2026-03-01 19:32:59.266 - backend.autonomous.core.autonomous_coordinator - INFO - Running completion review at 21 acceptances
-2026-03-01 19:32:59.302 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Direct injection of brainstorm (34625 tokens <= 310000 available)
-2026-03-01 19:32:59.318 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Generating assessment with model openai/gpt-5.2 (prompt=36882t, RAG=False, task_id=auto_cr_002)
-2026-03-01 19:32:59.829 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-03-01 19:32:59.829 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=256
-2026-03-01 19:33:25.802 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 20d5c83b-3e74-44c3-be9b-1eadd357c344 (iteration 14)
-2026-03-01 19:33:44.105 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 0f0e35cf-c6a5-4668-bf0a-64db129b2dfa (iteration 11)
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1298 chars
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": true,
-  "submission_number": 4,
-  "reasoning": "Submission #4 introduces a Hoeffding (Azuma-Hoeffding) concentration inequality for bounding the probability of cumulative storage deficits in integrated water supply networks under bounded uncertainties, leading to a conservative safety margin scaling with B sqrt((T/2) ln(2/eps)) for storage sizing and chance-constrained SOCP embedding. This is now fully superseded by submission #10, which provides a superior variance-adaptive Freedman (Bernstein-style) martingale inequality using predictable quadratic variation V_H (from forecast ensembles), yielding tighter bounds exp(-h^2 / 2(V_H + B h/3)) that automatically shrink with better forecasts, handle temporal dependence without independence assumptions, and embed similarly in SOCP via sqrt(V_H) representability. #4's worst-case B^2 T scaling is recovered as a special case when V_H = O(B^2 T), making #4 marginally useful initially but providing no unique value, perspecti
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': True, 'submission_number': 4, 'reasoning': "Submission #4 introduces a Hoeffding (Azuma-Hoeffding) concentration inequality for bounding the probability of cumulative storage deficits in integrated water supply networks under bounded uncertainties, leading to a conservative safety margin scaling with B sqrt((T/2) ln(2/eps)) for storage sizing and chance-constrained SOCP embedding. This is now fully superseded by submission #10, which provides a superior variance-adaptive Freedman (Bernstein-style) martingale inequality using predictable quadratic variation V_H (from forecast ensembles), yielding tighter bounds exp(-h^2 / 2(V_H + B h/3)) that automatically shrink with better forecasts, handle temporal dependence without independence assumptions, and embed similarly in SOCP via sqrt(V_H) representability. #4's worst-case B^2 T scaling is recovered as a special case when V_H = O(B^2 T), making #4 marginally useful initially but providing no unique value, perspective, or specific details (e.g., network extension via Laplacians is conservatively replicated in #10 via scalar/weighted aggregates) given the current database state. Removing #4 improves quality without loss of diversity, as #10 advances the same reliability certification goal more effectively."}
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=True, submission_number=4
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): Submission #4 introduces a Hoeffding (Azuma-Hoeffding) concentration inequality for bounding the probability of cumulative storage deficits in integrated water supply networks under bounded uncertainties, leading to a conservative safety margin scaling with B sqrt((T/2) ln(2/eps)) for storage sizing
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: REMOVAL PROPOSED - submission #4
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - Cleanup review: Proposing removal of submission #4 - Submission #4 introduces a Hoeffding (Azuma-Hoeffding) concentration inequality for bounding the probability of cumulative storage deficits in integrated water supply networks under bounded uncertaint...
-2026-03-01 19:33:55.635 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal={'submission_number': 4, 'reasoning': "Submission #4 introduces a Hoeffding (Azuma-Hoeffding) concentration inequality for bounding the probability of cumulative storage deficits in integrated water supply networks under bounded uncertainties, leading to a conservative safety margin scaling with B sqrt((T/2) ln(2/eps)) for storage sizing and chance-constrained SOCP embedding. This is now fully superseded by submission #10, which provides a superior variance-adaptive Freedman (Bernstein-style) martingale inequality using predictable quadratic variation V_H (from forecast ensembles), yielding tighter bounds exp(-h^2 / 2(V_H + B h/3)) that automatically shrink with better forecasts, handle temporal dependence without independence assumptions, and embed similarly in SOCP via sqrt(V_H) representability. #4's worst-case B^2 T scaling is recovered as a special case when V_H = O(B^2 T), making #4 marginally useful initially but providing no unique value, perspective, or specific details (e.g., network extension via Laplacians is conservatively replicated in #10 via scalar/weighted aggregates) given the current database state. Removing #4 improves quality without loss of diversity, as #10 advances the same reliability certification goal more effectively."}
-2026-03-01 19:33:55.635 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: REMOVAL PROPOSED for submission #4
-2026-03-01 19:33:55.635 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Removal reasoning: Submission #4 introduces a Hoeffding (Azuma-Hoeffding) concentration inequality for bounding the probability of cumulative storage deficits in integrated water supply networks under bounded uncertainties, leading to a conservative safety margin scaling with B sqrt((T/2) ln(2/eps)) for storage sizing...
-2026-03-01 19:33:55.635 - backend.aggregator.core.coordinator - INFO - Cleanup review #3: Removal proposed for submission #4
-2026-03-01 19:33:55.635 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 2: Getting content for submission #4...
-2026-03-01 19:33:55.635 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 2 Complete: Got submission content, length=3437 chars
-2026-03-01 19:33:55.635 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 3: Calling validator.validate_removal()...
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 2: REMOVAL VALIDATION START ==========
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:33:55.635 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Validating removal of submission #4
-2026-03-01 19:33:55.650 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Submission content length: 3437 chars
-2026-03-01 19:33:55.650 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Removal reasoning length: 1226 chars
-2026-03-01 19:33:55.650 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Full database context length: 116160 chars
-2026-03-01 19:33:55.668 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (34625 tokens)
-2026-03-01 19:33:55.668 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:33:55.668 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:33:55.668 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built removal validation prompt with direct injection, length: 125912 chars
-2026-03-01 19:33:55.685 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 37056, Max allowed: 1969500
-2026-03-01 19:33:55.685 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:33:55.685 - backend.aggregator.agents.validator - INFO - Removal validation: Validating proposed removal of submission #4
-2026-03-01 19:33:55.685 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_014
-2026-03-01 19:34:05.001 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:05.034 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:05.035 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:05.040 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:05.040 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:11.035 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validating with SAME model openai/gpt-5.2 (prompt=36935t, RAG=False, task_id=auto_cr_003)
-2026-03-01 19:34:11.135 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:11.154 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:11.168 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:11.218 - backend.shared.openrouter_client - INFO - OpenRouter client closed successfully
-2026-03-01 19:34:59.117 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission c60a6a74-b8aa-432f-b755-53d8b433f145 (iteration 15)
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1756 chars
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "decision": "accept",
-  "reasoning": "The proposed removal is justified. Submission #4 provides a Hoeffding (Azuma-Hoeffding) concentration bound for the probability of storage deficits in aggregate water storage dynamics under bounded uncertainties, yielding a worst-case storage sizing rule scaling as B sqrt((T/2) ln(2/ε)) for chance-constrained SOCP embeddings. This is fully subsumed and superseded by submission #10, which derives a tighter, variance-adaptive Freedman (Bernstein-style) martingale inequality using predictable quadratic variation V_H from forecast ensembles, with bound exp(-h² / 2(V_H + B h/3)). The Hoeffding bound recovers as a special case when V_H = O(B² T), but #10 is strictly superior: less conservative (shrinks with better forecasts), handles temporal dependence via martingale differences (no independence assumption in #4), and embeds analogously in SOCP via tightened nominal trajectories with sqrt(V_H) representability. Specific details in #4 (scalar aggrega
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'decision': 'accept', 'reasoning': 'The proposed removal is justified. Submission #4 provides a Hoeffding (Azuma-Hoeffding) concentration bound for the probability of storage deficits in aggregate water storage dynamics under bounded uncertainties, yielding a worst-case storage sizing rule scaling as B sqrt((T/2) ln(2/ε)) for chance-constrained SOCP embeddings. This is fully subsumed and superseded by submission #10, which derives a tighter, variance-adaptive Freedman (Bernstein-style) martingale inequality using predictable quadratic variation V_H from forecast ensembles, with bound exp(-h² / 2(V_H + B h/3)). The Hoeffding bound recovers as a special case when V_H = O(B² T), but #10 is strictly superior: less conservative (shrinks with better forecasts), handles temporal dependence via martingale differences (no independence assumption in #4), and embeds analogously in SOCP via tightened nominal trajectories with sqrt(V_H) representability. Specific details in #4 (scalar aggregate S_t dynamics with desal efficiency α and ecosystem flows, pseudocode, CAISO Monte Carlo validation, vague network extension via graph Laplacians and ||A||_1 norm) are conservatively replicated or improved in #10 (aggregate serviceable water S_t via weighted sums or epigraph min over districts, forecast-based V_H for renewables/demand/inflow, similar optimization embedding). No unique value, perspective, or actionable content is lost; the database improves in quality by retaining only the advanced, general bound while preserving solution diversity through complementary UQ methods (#1-3 DRO, #7/12 conformal, #13 cuts, etc.). Removal narrows redundancy without reducing coverage of storage reliability certification under renewables uncertainty.'}
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - decision=accept
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): The proposed removal is justified. Submission #4 provides a Hoeffding (Azuma-Hoeffding) concentration bound for the probability of storage deficits in aggregate water storage dynamics under bounded uncertainties, yielding a worst-case storage sizing rule scaling as B sqrt((T/2) ln(2/ε)) for chance-c
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: REMOVAL APPROVED for submission #4
-2026-03-01 19:35:20.665 - backend.aggregator.agents.validator - INFO - Removal validation: APPROVED removal of submission #4 - The proposed removal is justified. Submission #4 provides a Hoeffding (Azuma-Hoeffding) concentration bound for the probability of storage deficits in aggregate water storage dynamics under bounded un...
-2026-03-01 19:35:20.665 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 3 Complete: removal_validated=True
-2026-03-01 19:35:20.665 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 4: Executing removal of submission #4...
-2026-03-01 19:35:20.665 - backend.aggregator.memory.shared_training - INFO - Removed submission #4 from shared training
-2026-03-01 19:35:20.682 - backend.aggregator.memory.shared_training - INFO - Triggering re-chunking callback after removal of submission #4
-2026-03-01 19:35:20.682 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:35:20.682 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 4 Complete: removal_success=True
-2026-03-01 19:35:20.682 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: REMOVAL EXECUTED SUCCESSFULLY for submission #4
-2026-03-01 19:35:20.682 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Total removals executed: 1
-2026-03-01 19:35:20.682 - backend.aggregator.core.coordinator - INFO - Cleanup review #3: Successfully removed submission #4
-2026-03-01 19:35:20.682 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:35:20.682 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: No new submissions to process
-2026-03-01 19:35:20.715 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (Success=True) ==================
-2026-03-01 19:35:20.715 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #22
-2026-03-01 19:35:20.715 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:35:20.715 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 4)
-2026-03-01 19:35:20.715 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 22)
-2026-03-01 19:35:20.715 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:35:20.715 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: No new submissions to process
-2026-03-01 19:35:20.732 - backend.aggregator.core.coordinator - INFO - Validator iteration 12 - batch validating 3 submissions: ['4964cb1e-15e5-4f72-8de3-bd3dafa5ddda', 'e935549e-9276-47d5-8da6-79f28129bb46', '16b17ae4-7e58-4c59-b1a0-8ee7a58335fb']
-2026-03-01 19:35:20.732 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:35:20.732 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:35:30.897 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission d6dd4b18-b15f-409e-9831-5661c5459ceb (iteration 12)
-2026-03-01 19:35:39.813 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation raw content (first 500 chars): {
-  "validated": true,
-  "reasoning": "The continue_brainstorm decision is accurate. The current database is indeed strong on Wasserstein/KL DRO, robust invariance/tube MPC, multistage time-consistent DRO (SDDP/DRMDP), conformal prediction, martingale concentration bounds, decentralized ADMM, min-cut reliability certificates, online Lyapunov/OCO control, and convex-conic hydraulics (plus some nonconvex SOS/CBF extensions). However, the assessment correctly identifies concrete missing pillars rel
-2026-03-01 19:35:39.813 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation result: validated=True
-2026-03-01 19:35:39.813 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation reasoning: The continue_brainstorm decision is accurate. The current database is indeed strong on Wasserstein/KL DRO, robust invariance/tube MPC, multistage time-consistent DRO (SDDP/DRMDP), conformal prediction, martingale concentration bounds, decentralized ADMM, min-cut reliability certificates, online Lyap...
-2026-03-01 19:35:39.831 - backend.autonomous.core.autonomous_coordinator - INFO - Completion review: CONTINUE BRAINSTORM
-2026-03-01 19:35:52.128 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission ee2ef953-4b3f-4791-a3c1-93f6572e8729 (iteration 16)
-2026-03-01 19:36:08.626 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission f1bb618c-3885-4bf9-b98c-ec72e3cb5ffc (iteration 5)
-2026-03-01 19:36:11.150 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:36:11.160 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #23
-2026-03-01 19:36:11.160 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:36:11.160 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 11)
-2026-03-01 19:36:11.160 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 23)
-2026-03-01 19:36:11.160 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:36:11.209 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:36:11.209 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:36:11.209 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 13 total chunks
-2026-03-01 19:36:11.226 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #24
-2026-03-01 19:36:11.226 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:36:11.226 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:36:11.226 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 9)
-2026-03-01 19:36:11.226 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 24)
-2026-03-01 19:36:11.226 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:36:11.226 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:36:11.226 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:36:11.226 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:36:11.241 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 20 total chunks
-2026-03-01 19:36:11.251 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #25
-2026-03-01 19:36:11.251 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:36:11.251 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:36:11.251 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 12)
-2026-03-01 19:36:11.259 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 25)
-2026-03-01 19:36:11.262 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:36:11.262 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:36:11.262 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:36:11.262 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:36:11.262 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 23 total chunks
-2026-03-01 19:36:11.276 - backend.aggregator.core.coordinator - INFO - Validator iteration 13 - batch validating 3 submissions: ['20d5c83b-3e74-44c3-be9b-1eadd357c344', '0f0e35cf-c6a5-4668-bf0a-64db129b2dfa', 'c60a6a74-b8aa-432f-b755-53d8b433f145']
-2026-03-01 19:36:11.276 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:36:11.276 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:36:12.060 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:36:12.060 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=1024
-2026-03-01 19:36:45.072 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 9bb9b66e-9a78-4ada-a64f-84320a8b61d3 (iteration 17)
-2026-03-01 19:36:58.654 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 8f2a7033-6845-4ca4-bcfa-f6421142a0d8 (iteration 13)
-2026-03-01 19:37:00.854 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:37:00.870 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #26
-2026-03-01 19:37:00.870 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:37:00.870 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 13)
-2026-03-01 19:37:00.870 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 26)
-2026-03-01 19:37:00.886 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:37:00.936 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:37:00.937 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:37:00.937 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 18 total chunks
-2026-03-01 19:37:00.954 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #27
-2026-03-01 19:37:00.954 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:37:00.954 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:37:00.954 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 10)
-2026-03-01 19:37:00.954 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 27)
-2026-03-01 19:37:00.954 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:37:00.954 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:37:00.954 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:37:00.954 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:37:00.954 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 27 total chunks
-2026-03-01 19:37:00.970 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #28
-2026-03-01 19:37:00.970 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:37:00.970 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:37:00.970 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 14)
-2026-03-01 19:37:00.970 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 28)
-2026-03-01 19:37:00.988 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:37:00.988 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:37:00.988 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:37:00.988 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:37:00.988 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 29 total chunks
-2026-03-01 19:37:01.002 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:37:01.002 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:37:01.002 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:37:01.002 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #4
-2026-03-01 19:37:01.003 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=28 (every 7 acceptances)
-2026-03-01 19:37:01.003 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 28 % 7 == 0
-2026-03-01 19:37:01.003 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=1, removals_executed=1
-2026-03-01 19:37:01.003 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #4 (triggered at 28 acceptances)
-2026-03-01 19:37:01.004 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:37:01.004 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:37:01.004 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:37:01.004 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:37:01.004 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 27 submissions
-2026-03-01 19:37:01.004 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 146025 chars
-2026-03-01 19:37:01.021 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (44068 tokens)
-2026-03-01 19:37:01.021 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:37:01.021 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:37:01.021 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 152211 chars
-2026-03-01 19:37:01.054 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 45369, Max allowed: 1969500
-2026-03-01 19:37:01.054 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:37:01.054 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:37:01.054 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 27 submissions
-2026-03-01 19:37:01.054 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_017
-2026-03-01 19:37:01.902 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:37:01.902 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 19:37:33.851 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 9a27c098-068c-46d1-96dd-2fba92c39ae9 (iteration 18)
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1271 chars
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique mathematical contributions, perspectives, or techniques that advance the goal of rigorous optimization/control for integrated water-renewable systems. While there are thematic overlaps (e.g., multiple DRO/MPC variants, hydraulic relaxations), each offers distinct elements: specific theorems/proofs (e.g., #1 foundational Wasserstein DRO planning reformulation; #10 martingale Freedman bounds; #19 KL-DRO entropic dual; #22 unimodal moment tightening), unique models (e.g., #9 Port-Hamiltonian passivity; #13 cut-based max-flow; #15 Koopman spectral lifting; #24 aquifer exponential-sum convolution), handling of particular challenges (e.g., #16/#21/#28 progressive hydraulic relaxations for power-cone/radial/looped; #20 DR-CBF hard safety; #23 SOS polynomial RCI; #25 DR Nash equilibria), or computational frameworks (e.g., #6 DR-SDDP multistage; #11 decentralized ADMM; #26 tree DP decompositi
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique mathematical contributions, perspectives, or techniques that advance the goal of rigorous optimization/control for integrated water-renewable systems. While there are thematic overlaps (e.g., multiple DRO/MPC variants, hydraulic relaxations), each offers distinct elements: specific theorems/proofs (e.g., #1 foundational Wasserstein DRO planning reformulation; #10 martingale Freedman bounds; #19 KL-DRO entropic dual; #22 unimodal moment tightening), unique models (e.g., #9 Port-Hamiltonian passivity; #13 cut-based max-flow; #15 Koopman spectral lifting; #24 aquifer exponential-sum convolution), handling of particular challenges (e.g., #16/#21/#28 progressive hydraulic relaxations for power-cone/radial/looped; #20 DR-CBF hard safety; #23 SOS polynomial RCI; #25 DR Nash equilibria), or computational frameworks (e.g., #6 DR-SDDP multistage; #11 decentralized ADMM; #26 tree DP decomposition). No submission is fully redundant, contradictory, or superseded; each adds verifiable value (e.g., different ambiguity sets, exactness conditions, convergence proofs) enhancing solution diversity. Conservative approach: database quality maintained without removal.'}
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical contributions, perspectives, or techniques that advance the goal of rigorous optimization/control for integrated water-renewable systems. While there are thematic overlaps (e.g., multiple DRO/MPC variants, hydraulic relaxations), each offers distinct eleme
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical contributions, perspectives, or techniques that advance the goal of rigorous optimization/control for integrated water-renewable systems. While there are th
-2026-03-01 19:37:53.498 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:37:53.498 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:37:53.498 - backend.aggregator.core.coordinator - INFO - Cleanup review #4: No removal needed
-2026-03-01 19:37:53.498 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:37:53.498 - backend.aggregator.core.coordinator - INFO - Validator iteration 14 - batch validating 3 submissions: ['d6dd4b18-b15f-409e-9831-5661c5459ceb', 'ee2ef953-4b3f-4791-a3c1-93f6572e8729', 'f1bb618c-3885-4bf9-b98c-ec72e3cb5ffc']
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:37:53.498 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:38:10.213 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission ca646294-7878-4e8e-a084-ee5ed9233b10 (iteration 14)
-2026-03-01 19:38:27.444 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission af837b51-c794-4567-a300-9542012bc147 (iteration 19)
-2026-03-01 19:38:48.008 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:38:48.025 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #29
-2026-03-01 19:38:48.025 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:38:48.025 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 11)
-2026-03-01 19:38:48.025 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 29)
-2026-03-01 19:38:48.025 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:38:48.040 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:38:48.040 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:38:48.042 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 9 total chunks
-2026-03-01 19:38:48.058 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #30
-2026-03-01 19:38:48.058 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:38:48.058 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:38:48.058 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 15)
-2026-03-01 19:38:48.058 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 30)
-2026-03-01 19:38:48.058 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:38:48.058 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:38:48.058 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:38:48.058 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:38:48.074 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 52 total chunks
-2026-03-01 19:38:48.091 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #31
-2026-03-01 19:38:48.092 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:38:48.092 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:38:48.092 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 5)
-2026-03-01 19:38:48.092 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 31)
-2026-03-01 19:38:48.096 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:38:48.096 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:38:48.096 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:38:48.096 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:38:48.098 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 48 total chunks
-2026-03-01 19:38:48.109 - backend.aggregator.core.coordinator - INFO - Validator iteration 15 - batch validating 3 submissions: ['9bb9b66e-9a78-4ada-a64f-84320a8b61d3', '8f2a7033-6845-4ca4-bcfa-f6421142a0d8', '9a27c098-068c-46d1-96dd-2fba92c39ae9']
-2026-03-01 19:38:48.109 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:38:48.109 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:38:49.358 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:38:49.358 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=512
-2026-03-01 19:38:50.075 - backend.autonomous.core.autonomous_coordinator - INFO - Running completion review at 31 acceptances
-2026-03-01 19:38:50.108 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Direct injection of brainstorm (49213 tokens <= 310000 available)
-2026-03-01 19:38:50.142 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Generating assessment with model openai/gpt-5.2 (prompt=52631t, RAG=False, task_id=auto_cr_004)
-2026-03-01 19:39:29.271 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 09ddfb09-55a3-4054-953a-3a2281ad9367 (iteration 20)
-2026-03-01 19:39:41.303 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission d3cf1848-da1b-4774-856b-262a08ce3ba0 (iteration 15)
-2026-03-01 19:39:43.686 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:39:43.704 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #32
-2026-03-01 19:39:43.704 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:39:43.704 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 16)
-2026-03-01 19:39:43.704 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 32)
-2026-03-01 19:39:43.704 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:39:43.768 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:39:43.768 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:39:43.769 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 9 total chunks
-2026-03-01 19:39:43.785 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #33
-2026-03-01 19:39:43.785 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:39:43.785 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:39:43.785 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 12)
-2026-03-01 19:39:43.785 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 33)
-2026-03-01 19:39:43.785 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:39:43.785 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:39:43.785 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:39:43.785 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:39:43.785 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 18 total chunks
-2026-03-01 19:39:43.803 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #34
-2026-03-01 19:39:43.803 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:39:43.803 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:39:43.803 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 17)
-2026-03-01 19:39:43.803 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 34)
-2026-03-01 19:39:43.803 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:39:43.803 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:39:43.803 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:39:43.803 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:39:43.821 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 79 total chunks
-2026-03-01 19:39:43.823 - backend.aggregator.core.coordinator - INFO - Validator iteration 16 - batch validating 3 submissions: ['ca646294-7878-4e8e-a084-ee5ed9233b10', 'af837b51-c794-4567-a300-9542012bc147', '09ddfb09-55a3-4054-953a-3a2281ad9367']
-2026-03-01 19:39:43.823 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:39:43.823 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:39:45.101 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-03-01 19:39:45.102 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=256
-2026-03-01 19:39:58.401 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 769db3e7-d8af-47e3-8877-952a15800226 (iteration 6)
-2026-03-01 19:40:07.382 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validating with SAME model openai/gpt-5.2 (prompt=51352t, RAG=False, task_id=auto_cr_005)
-2026-03-01 19:40:25.648 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 46511b0d-6961-4e7b-ae74-ad1968edc153 (iteration 21)
-2026-03-01 19:40:46.562 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:40:46.580 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #35
-2026-03-01 19:40:46.580 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:40:46.580 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 13)
-2026-03-01 19:40:46.580 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 35)
-2026-03-01 19:40:46.580 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:40:46.580 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:40:46.580 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:40:46.580 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 18 total chunks
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #5
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=35 (every 7 acceptances)
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 35 % 7 == 0
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=1, removals_executed=1
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #5 (triggered at 35 acceptances)
-2026-03-01 19:40:46.597 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:40:46.597 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:40:46.597 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:40:46.597 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:40:46.597 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 34 submissions
-2026-03-01 19:40:46.597 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 186699 chars
-2026-03-01 19:40:46.630 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (56267 tokens)
-2026-03-01 19:40:46.630 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:40:46.630 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:40:46.630 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 192885 chars
-2026-03-01 19:40:46.663 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 57568, Max allowed: 1969500
-2026-03-01 19:40:46.663 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:40:46.663 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:40:46.663 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 34 submissions
-2026-03-01 19:40:46.663 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_021
-2026-03-01 19:40:46.846 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:40:46.846 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-03-01 19:41:16.460 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 1b80dd3b-f96f-4282-836d-9f25e4c5cb64 (iteration 16)
-2026-03-01 19:41:18.376 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission f3a9d4e4-5a92-4635-a643-fb1d494b7504 (iteration 22)
-2026-03-01 19:41:29.174 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation raw content (first 500 chars): {
-  "validated": true,
-  "reasoning": "The continue_brainstorm decision is accurate given the current database. While the submissions cover many major optimization/control pillars (Wasserstein/KL/moment DRO, multistage time-consistent control, MPC/RCI/viability, conformal sets, martingale bounds, decentralized algorithms, hydraulics convexifications/relaxations, SOS/SDP tools, and EVT tails), the assessment correctly identifies several concrete missing areas that would materially strengthen a ri
-2026-03-01 19:41:29.174 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation result: validated=True
-2026-03-01 19:41:29.174 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation reasoning: The continue_brainstorm decision is accurate given the current database. While the submissions cover many major optimization/control pillars (Wasserstein/KL/moment DRO, multistage time-consistent control, MPC/RCI/viability, conformal sets, martingale bounds, decentralized algorithms, hydraulics conv...
-2026-03-01 19:41:29.206 - backend.autonomous.core.autonomous_coordinator - INFO - Completion review: CONTINUE BRAINSTORM
-2026-03-01 19:41:34.974 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:41:34.974 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:41:34.974 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1148 chars
-2026-03-01 19:41:34.974 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique mathematical contributions, perspectives, or techniques that enhance solution diversity for the water-energy optimization goal. While there are thematic overlaps (e.g., multiple DRO variants with Wasserstein ambiguity, hydraulic relaxations across #16, #21, #28, MPC extensions in #5, #7, #12), no submission is fully redundant, contradicted, or superseded: each offers distinct proofs (e.g., exact reformulations, convergence theorems), physics modeling (e.g., aquifer convolution #24, quality blending #35, EVT tails #31), control structures (e.g., DRMDP #8, CBF #20, zonotopic RCI #32), or scalability (e.g., tree DP #26, submodular discrete #29, decentralized Nash #25). Hydraulics modules complementarily cover power-cone general (#16), radial SOCP (#21), looped SDP (#28) with topology-specific exactness. DRO flavors (KL #19, moment #27, comonotone #34, nested #33) address different ambig
-2026-03-01 19:41:34.974 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:41:34.990 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique mathematical contributions, perspectives, or techniques that enhance solution diversity for the water-energy optimization goal. While there are thematic overlaps (e.g., multiple DRO variants with Wasserstein ambiguity, hydraulic relaxations across #16, #21, #28, MPC extensions in #5, #7, #12), no submission is fully redundant, contradicted, or superseded: each offers distinct proofs (e.g., exact reformulations, convergence theorems), physics modeling (e.g., aquifer convolution #24, quality blending #35, EVT tails #31), control structures (e.g., DRMDP #8, CBF #20, zonotopic RCI #32), or scalability (e.g., tree DP #26, submodular discrete #29, decentralized Nash #25). Hydraulics modules complementarily cover power-cone general (#16), radial SOCP (#21), looped SDP (#28) with topology-specific exactness. DRO flavors (KL #19, moment #27, comonotone #34, nested #33) address different ambiguity geometries without overlap. Conservative approach: database quality maintained with full diversity; no single weakest candidate for removal.'}
-2026-03-01 19:41:34.990 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:41:34.990 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical contributions, perspectives, or techniques that enhance solution diversity for the water-energy optimization goal. While there are thematic overlaps (e.g., multiple DRO variants with Wasserstein ambiguity, hydraulic relaxations across #16, #21, #28, MPC ex
-2026-03-01 19:41:34.990 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:41:34.990 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical contributions, perspectives, or techniques that enhance solution diversity for the water-energy optimization goal. While there are thematic overlaps (e.g.,
-2026-03-01 19:41:34.990 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:41:34.990 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:41:34.990 - backend.aggregator.core.coordinator - INFO - Cleanup review #5: No removal needed
-2026-03-01 19:41:34.990 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:41:34.990 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #36
-2026-03-01 19:41:34.990 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:41:34.990 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 18)
-2026-03-01 19:41:35.006 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 36)
-2026-03-01 19:41:35.006 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:41:35.007 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:41:35.007 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:41:35.007 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 7 total chunks
-2026-03-01 19:41:35.025 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #37
-2026-03-01 19:41:35.025 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:41:35.025 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:41:35.025 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 19)
-2026-03-01 19:41:35.025 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 37)
-2026-03-01 19:41:35.035 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:41:35.036 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:41:35.036 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:41:35.036 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:41:35.036 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 11 total chunks
-2026-03-01 19:41:35.041 - backend.aggregator.core.coordinator - INFO - Validator iteration 17 - batch validating 3 submissions: ['d3cf1848-da1b-4774-856b-262a08ce3ba0', '769db3e7-d8af-47e3-8877-952a15800226', '46511b0d-6961-4e7b-ae74-ad1968edc153']
-2026-03-01 19:41:35.041 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:41:35.041 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:41:35.398 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:41:35.400 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=1024
-2026-03-01 19:42:12.403 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 2ad63c06-51f8-4ef8-85c1-405fe898a233 (iteration 23)
-2026-03-01 19:42:31.351 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:42:31.351 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #38
-2026-03-01 19:42:31.351 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:42:31.351 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 14)
-2026-03-01 19:42:31.351 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 38)
-2026-03-01 19:42:31.351 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:42:31.351 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:42:31.351 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:42:31.351 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 28 total chunks
-2026-03-01 19:42:31.370 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #39
-2026-03-01 19:42:31.370 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:42:31.370 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:42:31.370 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 6)
-2026-03-01 19:42:31.386 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 39)
-2026-03-01 19:42:31.390 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:42:31.390 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:42:31.391 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:42:31.391 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:42:31.393 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 36 total chunks
-2026-03-01 19:42:31.401 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #40
-2026-03-01 19:42:31.401 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:42:31.401 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:42:31.401 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 20)
-2026-03-01 19:42:31.401 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 40)
-2026-03-01 19:42:31.401 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:42:31.401 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:42:31.401 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:42:31.401 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:42:31.417 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 31 total chunks
-2026-03-01 19:42:31.419 - backend.aggregator.core.coordinator - INFO - Validator iteration 18 - batch validating 3 submissions: ['1b80dd3b-f96f-4282-836d-9f25e4c5cb64', 'f3a9d4e4-5a92-4635-a643-fb1d494b7504', '2ad63c06-51f8-4ef8-85c1-405fe898a233']
-2026-03-01 19:42:31.419 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:42:31.419 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:42:33.000 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 38686950-433e-40cd-8deb-9a28c961ba80 (iteration 17)
-2026-03-01 19:42:33.083 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:42:33.083 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 19:43:19.195 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 2ab2e277-5207-4fdf-a7db-6191b8f7880b (iteration 24)
-2026-03-01 19:43:32.111 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:43:32.127 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #41
-2026-03-01 19:43:32.127 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:43:32.127 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 15)
-2026-03-01 19:43:32.127 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 41)
-2026-03-01 19:43:32.127 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:43:32.127 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:43:32.127 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:43:32.127 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 11 total chunks
-2026-03-01 19:43:32.146 - backend.autonomous.core.autonomous_coordinator - INFO - Running completion review at 41 acceptances
-2026-03-01 19:43:32.146 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #42
-2026-03-01 19:43:32.146 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:43:32.146 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:43:32.146 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 21)
-2026-03-01 19:43:32.146 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 42)
-2026-03-01 19:43:32.146 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:43:32.161 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:43:32.161 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:43:32.161 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:43:32.164 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 52 total chunks
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #6
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=42 (every 7 acceptances)
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 42 % 7 == 0
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=1, removals_executed=1
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #6 (triggered at 42 acceptances)
-2026-03-01 19:43:32.178 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:43:32.178 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:43:32.178 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:43:32.178 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:43:32.178 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 41 submissions
-2026-03-01 19:43:32.178 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 221731 chars
-2026-03-01 19:43:32.211 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (66977 tokens)
-2026-03-01 19:43:32.211 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:43:32.211 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:43:32.211 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 227917 chars
-2026-03-01 19:43:32.244 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 68278, Max allowed: 1969500
-2026-03-01 19:43:32.244 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:43:32.244 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:43:32.244 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 41 submissions
-2026-03-01 19:43:32.244 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_024
-2026-03-01 19:43:32.295 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Direct injection of brainstorm (66977 tokens <= 310000 available)
-2026-03-01 19:43:32.327 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Generating assessment with model openai/gpt-5.2 (prompt=71385t, RAG=False, task_id=auto_cr_006)
-2026-03-01 19:43:32.911 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-03-01 19:43:32.911 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=256
-2026-03-01 19:43:36.444 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 544b5cc7-e864-4b9e-83f7-5bdbc6f19005 (iteration 18)
-2026-03-01 19:43:58.975 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 930cd494-136a-4bd8-94f4-8a008143110e (iteration 25)
-2026-03-01 19:44:00.207 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validating with SAME model openai/gpt-5.2 (prompt=69019t, RAG=False, task_id=auto_cr_007)
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1161 chars
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique mathematical contributions, perspectives, or extensions that enhance solution diversity for the water-energy optimization goal. While there is thematic overlap (e.g., multiple DRO variants with Wasserstein ambiguity sets in #1, #3, #5, #6, #11, #12, etc., or hydraulic relaxations in #16, #21, #28), each introduces distinct elements: specific theorems (e.g., tractable reformulations for multistage DR-SDDP in #6, zonotopic RCI in #32, aquifer convolution in #24), novel uncertainty models (conformal in #7/#12, KL in #19, copula in #38, EVT tails in #31), control structures (pH passivity #9, CBF safety #20, OCO drift #14, coalitions #42), physics handling (quality blending #35/#40, bilinear desal #18/#36), or computational methods (submodular discrete #29, tree DP #26, Benson CVO #41). No submission is fully covered/redundant/superseded; earlier ones serve as foundational 'shared' module
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': "All submissions provide unique mathematical contributions, perspectives, or extensions that enhance solution diversity for the water-energy optimization goal. While there is thematic overlap (e.g., multiple DRO variants with Wasserstein ambiguity sets in #1, #3, #5, #6, #11, #12, etc., or hydraulic relaxations in #16, #21, #28), each introduces distinct elements: specific theorems (e.g., tractable reformulations for multistage DR-SDDP in #6, zonotopic RCI in #32, aquifer convolution in #24), novel uncertainty models (conformal in #7/#12, KL in #19, copula in #38, EVT tails in #31), control structures (pH passivity #9, CBF safety #20, OCO drift #14, coalitions #42), physics handling (quality blending #35/#40, bilinear desal #18/#36), or computational methods (submodular discrete #29, tree DP #26, Benson CVO #41). No submission is fully covered/redundant/superseded; earlier ones serve as foundational 'shared' modules explicitly composed upon by later ones. No contradictions or conflicts with math principles. Retaining all maintains a high-quality, diverse knowledge base."}
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical contributions, perspectives, or extensions that enhance solution diversity for the water-energy optimization goal. While there is thematic overlap (e.g., multiple DRO variants with Wasserstein ambiguity sets in #1, #3, #5, #6, #11, #12, etc., or hydraulic
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:44:16.373 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical contributions, perspectives, or extensions that enhance solution diversity for the water-energy optimization goal. While there is thematic overlap (e.g., mu
-2026-03-01 19:44:16.373 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:44:16.373 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:44:16.373 - backend.aggregator.core.coordinator - INFO - Cleanup review #6: No removal needed
-2026-03-01 19:44:16.373 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:44:16.389 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #43
-2026-03-01 19:44:16.389 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:44:16.389 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 22)
-2026-03-01 19:44:16.389 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 43)
-2026-03-01 19:44:16.389 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:44:16.389 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:44:16.389 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:44:16.389 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 12 total chunks
-2026-03-01 19:44:16.407 - backend.aggregator.core.coordinator - INFO - Validator iteration 19 - batch validating 3 submissions: ['38686950-433e-40cd-8deb-9a28c961ba80', '2ab2e277-5207-4fdf-a7db-6191b8f7880b', '544b5cc7-e864-4b9e-83f7-5bdbc6f19005']
-2026-03-01 19:44:16.407 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:44:16.407 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:44:16.622 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:44:16.622 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-03-01 19:44:39.054 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission de21565f-a363-4a97-80cc-b49ead82f9c0 (iteration 26)
-2026-03-01 19:44:58.202 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 6ae99652-b2c2-4e2b-9180-01199ad03dba (iteration 19)
-2026-03-01 19:45:08.800 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation raw content (first 500 chars): {
-  "validated": true,
-  "reasoning": "The prior completion assessment is accurate given the brainstorm database content. The accepted submissions heavily cover DRO (Wasserstein/KL/moments), time-consistent multistage formulations (DR-SDDP/DRMDP/nested distance), MPC/viability/CBF safety layers, hydraulics convexification/relaxations, decomposition/game-theoretic methods, tail-risk ideas, and quality blending. However, the identified gaps are genuinely not addressed in any concrete, central way:
-2026-03-01 19:45:08.816 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation result: validated=True
-2026-03-01 19:45:08.816 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation reasoning: The prior completion assessment is accurate given the brainstorm database content. The accepted submissions heavily cover DRO (Wasserstein/KL/moments), time-consistent multistage formulations (DR-SDDP/DRMDP/nested distance), MPC/viability/CBF safety layers, hydraulics convexification/relaxations, de...
-2026-03-01 19:45:09.999 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:45:10.033 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #44
-2026-03-01 19:45:10.033 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:45:10.033 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 16)
-2026-03-01 19:45:10.033 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 44)
-2026-03-01 19:45:10.033 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:45:10.037 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:45:10.037 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:45:10.037 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 15 total chunks
-2026-03-01 19:45:10.037 - backend.autonomous.core.autonomous_coordinator - INFO - Completion review: CONTINUE BRAINSTORM
-2026-03-01 19:45:10.067 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #45
-2026-03-01 19:45:10.067 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:45:10.067 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:45:10.067 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 23)
-2026-03-01 19:45:10.067 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 45)
-2026-03-01 19:45:10.067 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:45:10.067 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:45:10.067 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:45:10.067 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:45:10.076 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 16 total chunks
-2026-03-01 19:45:10.082 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #46
-2026-03-01 19:45:10.082 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:45:10.082 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:45:10.082 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 17)
-2026-03-01 19:45:10.082 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 46)
-2026-03-01 19:45:10.082 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:45:10.082 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:45:10.082 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:45:10.082 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:45:10.101 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 83 total chunks
-2026-03-01 19:45:10.101 - backend.aggregator.core.coordinator - INFO - Validator iteration 20 - batch validating 3 submissions: ['930cd494-136a-4bd8-94f4-8a008143110e', 'de21565f-a363-4a97-80cc-b49ead82f9c0', '6ae99652-b2c2-4e2b-9180-01199ad03dba']
-2026-03-01 19:45:10.101 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:45:10.101 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:45:11.449 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-03-01 19:45:11.449 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=256
-2026-03-01 19:45:25.815 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 7552ddbc-8ad8-4936-a0c6-95e8823defbe (iteration 7)
-2026-03-01 19:45:49.929 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 773ad632-7842-4cf9-8dc1-3e91727f1aec (iteration 27)
-2026-03-01 19:46:04.377 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 4b2353a3-4004-4ac7-9719-9a3c3f8ca1bb (iteration 20)
-2026-03-01 19:46:12.909 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:46:12.929 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #47
-2026-03-01 19:46:12.929 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:46:12.929 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 24)
-2026-03-01 19:46:12.929 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 47)
-2026-03-01 19:46:12.929 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:46:12.929 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:46:12.929 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:46:12.929 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 12 total chunks
-2026-03-01 19:46:12.961 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #48
-2026-03-01 19:46:12.961 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:46:12.961 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:46:12.961 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 25)
-2026-03-01 19:46:12.961 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 48)
-2026-03-01 19:46:12.961 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:46:12.961 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:46:12.961 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:46:12.961 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:46:12.969 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 17 total chunks
-2026-03-01 19:46:12.976 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #49
-2026-03-01 19:46:12.976 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:46:12.976 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:46:12.976 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 18)
-2026-03-01 19:46:12.976 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 49)
-2026-03-01 19:46:12.976 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:46:12.976 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:46:12.976 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:46:12.976 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:46:12.994 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 25 total chunks
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #7
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=49 (every 7 acceptances)
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 49 % 7 == 0
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=1, removals_executed=1
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #7 (triggered at 49 acceptances)
-2026-03-01 19:46:12.994 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:46:12.994 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:46:12.994 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:46:12.994 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:46:12.994 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 48 submissions
-2026-03-01 19:46:12.994 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 261882 chars
-2026-03-01 19:46:13.043 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (78968 tokens)
-2026-03-01 19:46:13.043 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:46:13.043 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:46:13.043 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 268068 chars
-2026-03-01 19:46:13.093 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 80269, Max allowed: 1969500
-2026-03-01 19:46:13.093 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:46:13.093 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:46:13.093 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 48 submissions
-2026-03-01 19:46:13.093 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_027
-2026-03-01 19:46:13.776 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:46:13.776 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=1024
-2026-03-01 19:46:32.173 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission ad1f8229-ddab-4be4-ab3c-a17ac0e0a23a (iteration 28)
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1156 chars
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique mathematical contributions, techniques, or perspectives that enhance solution diversity and are not fully redundant, contradictory, or superseded. Core DRO frameworks (#1, #3, #6) offer foundational reformulations, multistage extensions, and aquifer-specific details. MPC variants (#2, #5, #7, #12) differ in robust viability, tube-based, conformal, and adaptive ambiguity. Hydraulic relaxations (#16, #21, #28, #44) vary by power-cone/SOCP/SDP for n=1.85/quadratic losses, radial/loops/valves with distinct exactness theorems. Multi-agent (#11, #25, #39, #42) progress from ADMM to Nash/coalitions. Pareto methods (#39, #40, #42) use distinct vector opt/Benson. Aquifer (#24 convolution approx), quality (#35 bilinear SOCP), switched (#47 JSR), spectral (#43, #48 KMEDRO), risk alloc (#46), SSD (#49) each introduce novel UQ/physics/risk models with proofs. No single submission is fully covered
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique mathematical contributions, techniques, or perspectives that enhance solution diversity and are not fully redundant, contradictory, or superseded. Core DRO frameworks (#1, #3, #6) offer foundational reformulations, multistage extensions, and aquifer-specific details. MPC variants (#2, #5, #7, #12) differ in robust viability, tube-based, conformal, and adaptive ambiguity. Hydraulic relaxations (#16, #21, #28, #44) vary by power-cone/SOCP/SDP for n=1.85/quadratic losses, radial/loops/valves with distinct exactness theorems. Multi-agent (#11, #25, #39, #42) progress from ADMM to Nash/coalitions. Pareto methods (#39, #40, #42) use distinct vector opt/Benson. Aquifer (#24 convolution approx), quality (#35 bilinear SOCP), switched (#47 JSR), spectral (#43, #48 KMEDRO), risk alloc (#46), SSD (#49) each introduce novel UQ/physics/risk models with proofs. No single submission is fully covered by others; weaker overlaps (e.g., radial hydraulics #16/#21) retain unique generality/exactness conditions. Database quality maintained without removal.'}
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical contributions, techniques, or perspectives that enhance solution diversity and are not fully redundant, contradictory, or superseded. Core DRO frameworks (#1, #3, #6) offer foundational reformulations, multistage extensions, and aquifer-specific details. M
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical contributions, techniques, or perspectives that enhance solution diversity and are not fully redundant, contradictory, or superseded. Core DRO frameworks (#
-2026-03-01 19:46:52.871 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:46:52.871 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:46:52.871 - backend.aggregator.core.coordinator - INFO - Cleanup review #7: No removal needed
-2026-03-01 19:46:52.871 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:46:52.871 - backend.aggregator.core.coordinator - INFO - Validator iteration 21 - batch validating 3 submissions: ['7552ddbc-8ad8-4936-a0c6-95e8823defbe', '773ad632-7842-4cf9-8dc1-3e91727f1aec', '4b2353a3-4004-4ac7-9719-9a3c3f8ca1bb']
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:46:52.871 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:47:15.552 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 8a47562f-7c7d-40ec-9f52-d458c8f975f1 (iteration 21)
-2026-03-01 19:47:25.535 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission d95df02c-7c7e-4f7b-9299-a98f79287c41 (iteration 29)
-2026-03-01 19:47:49.415 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:47:49.431 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #50
-2026-03-01 19:47:49.431 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:47:49.431 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 7)
-2026-03-01 19:47:49.431 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 50)
-2026-03-01 19:47:49.431 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:47:49.448 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:47:49.448 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:47:49.449 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 21 total chunks
-2026-03-01 19:47:49.465 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #51
-2026-03-01 19:47:49.465 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:47:49.465 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:47:49.465 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 26)
-2026-03-01 19:47:49.465 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 51)
-2026-03-01 19:47:49.465 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:47:49.465 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:47:49.465 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:47:49.465 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:47:49.465 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 25 total chunks
-2026-03-01 19:47:49.483 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #52
-2026-03-01 19:47:49.483 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:47:49.483 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:47:49.483 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 19)
-2026-03-01 19:47:49.483 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 52)
-2026-03-01 19:47:49.499 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:47:49.499 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:47:49.499 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:47:49.499 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:47:49.499 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 31 total chunks
-2026-03-01 19:47:49.499 - backend.aggregator.core.coordinator - INFO - Validator iteration 22 - batch validating 3 submissions: ['ad1f8229-ddab-4be4-ab3c-a17ac0e0a23a', '8a47562f-7c7d-40ec-9f52-d458c8f975f1', 'd95df02c-7c7e-4f7b-9299-a98f79287c41']
-2026-03-01 19:47:49.513 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:47:49.515 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:47:49.648 - backend.autonomous.core.autonomous_coordinator - INFO - Running completion review at 52 acceptances
-2026-03-01 19:47:49.699 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Direct injection of brainstorm (83916 tokens <= 310000 available)
-2026-03-01 19:47:49.750 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Generating assessment with model openai/gpt-5.2 (prompt=89217t, RAG=False, task_id=auto_cr_008)
-2026-03-01 19:47:50.432 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:47:50.432 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 19:47:58.868 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 9b7ea784-c120-4d80-b319-6c1789295988 (iteration 8)
-2026-03-01 19:48:26.294 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 2dbc1f79-b513-4c46-b2c9-fa00d1fa2741 (iteration 30)
-2026-03-01 19:48:45.775 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:48:45.807 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #53
-2026-03-01 19:48:45.807 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:48:45.807 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 27)
-2026-03-01 19:48:45.808 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 53)
-2026-03-01 19:48:45.809 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:48:45.809 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:48:45.809 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:48:45.809 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 6 total chunks
-2026-03-01 19:48:45.827 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #54
-2026-03-01 19:48:45.827 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:48:45.827 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:48:45.827 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 20)
-2026-03-01 19:48:45.827 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 54)
-2026-03-01 19:48:45.827 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:48:45.827 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:48:45.827 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:48:45.827 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:48:45.842 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 44 total chunks
-2026-03-01 19:48:45.843 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #55
-2026-03-01 19:48:45.857 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:48:45.857 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:48:45.857 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 28)
-2026-03-01 19:48:45.858 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 55)
-2026-03-01 19:48:45.859 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:48:45.859 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:48:45.859 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:48:45.859 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:48:45.859 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 41 total chunks
-2026-03-01 19:48:45.876 - backend.aggregator.core.coordinator - INFO - Validator iteration 23 - batch validating 2 submissions: ['9b7ea784-c120-4d80-b319-6c1789295988', '2dbc1f79-b513-4c46-b2c9-fa00d1fa2741']
-2026-03-01 19:48:45.876 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 2 submissions
-2026-03-01 19:48:45.877 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 2 submissions
-2026-03-01 19:48:46.859 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:48:46.859 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=512
-2026-03-01 19:48:50.645 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission acaa72f3-daf1-4b92-bc15-4b950c8a8a46 (iteration 22)
-2026-03-01 19:49:12.739 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validating with SAME model openai/gpt-5.2 (prompt=85909t, RAG=False, task_id=auto_cr_009)
-2026-03-01 19:49:17.989 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 97f43706-1628-4e69-a9f5-65f90f287d21 (iteration 31)
-2026-03-01 19:49:43.302 - backend.aggregator.agents.validator - INFO - Batch validation complete: 2/2 accepted
-2026-03-01 19:49:43.328 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #56
-2026-03-01 19:49:43.328 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:49:43.328 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 8)
-2026-03-01 19:49:43.328 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 56)
-2026-03-01 19:49:43.328 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:49:43.328 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:49:43.328 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:49:43.335 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 9 total chunks
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #8
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=56 (every 7 acceptances)
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 56 % 7 == 0
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=1, removals_executed=1
-2026-03-01 19:49:43.339 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #8 (triggered at 56 acceptances)
-2026-03-01 19:49:43.351 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:49:43.351 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:49:43.351 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:49:43.351 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:49:43.352 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 55 submissions
-2026-03-01 19:49:43.352 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 298267 chars
-2026-03-01 19:49:43.401 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (90097 tokens)
-2026-03-01 19:49:43.401 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:49:43.401 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:49:43.401 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 304453 chars
-2026-03-01 19:49:43.436 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 91398, Max allowed: 1969500
-2026-03-01 19:49:43.436 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:49:43.436 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:49:43.436 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 55 submissions
-2026-03-01 19:49:43.436 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_031
-2026-03-01 19:49:43.536 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:49:43.536 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
-2026-03-01 19:50:19.399 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission d9e0619f-3ea4-4687-82c3-869758809621 (iteration 23)
-2026-03-01 19:50:31.129 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation raw content (first 500 chars): {
-  "validated": true,
-  "reasoning": "The prior completion assessment is accurate. A scan of the accepted submissions shows extensive coverage of DRO/MPC/SDDP/DRMDP, invariance/viability, hydraulics relaxations, quality blending, decentralization/game theory, Pareto computation, and scenario reduction. However, the specific gaps cited are genuinely not addressed in a rigorous, explicit way:\n\n1) Contingency/resilience (N-1/N-k, outage sets, component failures, cyber/actuation faults) is not de
-2026-03-01 19:50:31.130 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation result: validated=True
-2026-03-01 19:50:31.130 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation reasoning: The prior completion assessment is accurate. A scan of the accepted submissions shows extensive coverage of DRO/MPC/SDDP/DRMDP, invariance/viability, hydraulics relaxations, quality blending, decentralization/game theory, Pareto computation, and scenario reduction. However, the specific gaps cited a...
-2026-03-01 19:50:31.146 - backend.autonomous.core.autonomous_coordinator - INFO - Completion review: CONTINUE BRAINSTORM
-2026-03-01 19:50:33.297 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 50088585-02d7-4643-8d90-3d2c70f3c99d (iteration 32)
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 891 chars
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique mathematical contributions, theorems, proofs, or model extensions that advance different aspects of the problem (e.g., DRO variants with specific reformulations (#1,3,6,19,22,27), robust MPC/RCI techniques (#2,5,7,23,32,46), hydraulics relaxations (#16,21,28,44), quality blending (#35,39,55), multi-objective Pareto methods (#39,42), aquifer dynamics (#24), conformal adaptations (#7,12,53), multistage/decentralized (#6,11,25,38,42), and niche UQ like SSD (#49), copulas (#38), multi-fidelity (#51), coresets (#52)). No submission is fully redundant, contradicted, or superseded; even overlapping DRO-MPC themes (#5,7,12) differ in guarantees (tube-ISS vs conformal coverage vs adaptive drifting). Diversity maintains solution robustness; database quality preserved without removal."
-}
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique mathematical contributions, theorems, proofs, or model extensions that advance different aspects of the problem (e.g., DRO variants with specific reformulations (#1,3,6,19,22,27), robust MPC/RCI techniques (#2,5,7,23,32,46), hydraulics relaxations (#16,21,28,44), quality blending (#35,39,55), multi-objective Pareto methods (#39,42), aquifer dynamics (#24), conformal adaptations (#7,12,53), multistage/decentralized (#6,11,25,38,42), and niche UQ like SSD (#49), copulas (#38), multi-fidelity (#51), coresets (#52)). No submission is fully redundant, contradicted, or superseded; even overlapping DRO-MPC themes (#5,7,12) differ in guarantees (tube-ISS vs conformal coverage vs adaptive drifting). Diversity maintains solution robustness; database quality preserved without removal.'}
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical contributions, theorems, proofs, or model extensions that advance different aspects of the problem (e.g., DRO variants with specific reformulations (#1,3,6,19,22,27), robust MPC/RCI techniques (#2,5,7,23,32,46), hydraulics relaxations (#16,21,28,44), quali
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:50:46.806 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical contributions, theorems, proofs, or model extensions that advance different aspects of the problem (e.g., DRO variants with specific reformulations (#1,3,6,
-2026-03-01 19:50:46.806 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:50:46.806 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:50:46.806 - backend.aggregator.core.coordinator - INFO - Cleanup review #8: No removal needed
-2026-03-01 19:50:46.806 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:50:46.812 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #57
-2026-03-01 19:50:46.812 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:50:46.812 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 29)
-2026-03-01 19:50:46.812 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 57)
-2026-03-01 19:50:46.812 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:50:46.812 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:50:46.812 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:50:46.812 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 6 total chunks
-2026-03-01 19:50:46.831 - backend.aggregator.core.coordinator - INFO - Validator iteration 24 - batch validating 3 submissions: ['acaa72f3-daf1-4b92-bc15-4b950c8a8a46', '97f43706-1628-4e69-a9f5-65f90f287d21', 'd9e0619f-3ea4-4687-82c3-869758809621']
-2026-03-01 19:50:46.831 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:50:46.831 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:50:46.995 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:50:46.995 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-03-01 19:51:21.673 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 273a7886-e5be-4acd-873d-39351fb897a1 (iteration 24)
-2026-03-01 19:51:38.705 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 45b06e36-3313-42b2-b44c-c0e4e91e2066 (iteration 33)
-2026-03-01 19:51:57.886 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:51:57.903 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #58
-2026-03-01 19:51:57.903 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:51:57.903 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 21)
-2026-03-01 19:51:57.903 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 58)
-2026-03-01 19:51:57.903 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:51:57.903 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:51:57.903 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:51:57.903 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 27 total chunks
-2026-03-01 19:51:57.945 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #59
-2026-03-01 19:51:57.945 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:51:57.945 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:51:57.945 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 30)
-2026-03-01 19:51:57.945 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 59)
-2026-03-01 19:51:57.945 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:51:57.952 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:51:57.953 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:51:57.953 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:51:57.953 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 30 total chunks
-2026-03-01 19:51:57.969 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #60
-2026-03-01 19:51:57.969 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:51:57.969 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:51:57.970 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 22)
-2026-03-01 19:51:57.970 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 60)
-2026-03-01 19:51:57.970 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:51:57.970 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:51:57.970 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:51:57.970 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:51:57.976 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 33 total chunks
-2026-03-01 19:51:57.986 - backend.aggregator.core.coordinator - INFO - Validator iteration 25 - batch validating 3 submissions: ['50088585-02d7-4643-8d90-3d2c70f3c99d', '273a7886-e5be-4acd-873d-39351fb897a1', '45b06e36-3313-42b2-b44c-c0e4e91e2066']
-2026-03-01 19:51:57.986 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:51:57.986 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:51:59.178 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:51:59.178 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 19:52:08.334 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 63a0be3d-e5cc-49e4-8bed-f59e616c9fa3 (iteration 9)
-2026-03-01 19:52:17.267 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission c2ddb538-745b-46fd-9909-71ffc9ca8a49 (iteration 25)
-2026-03-01 19:52:22.682 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 1003f0e1-92bb-4308-a786-1d965bb856c7 (iteration 34)
-2026-03-01 19:52:48.481 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:52:48.498 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #61
-2026-03-01 19:52:48.498 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:52:48.498 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 31)
-2026-03-01 19:52:48.498 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 61)
-2026-03-01 19:52:48.498 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:52:48.498 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:52:48.498 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:52:48.498 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 7 total chunks
-2026-03-01 19:52:48.515 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #62
-2026-03-01 19:52:48.515 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:52:48.515 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:52:48.515 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 23)
-2026-03-01 19:52:48.515 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 62)
-2026-03-01 19:52:48.531 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:52:48.531 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:52:48.531 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:52:48.531 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:52:48.531 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 52 total chunks
-2026-03-01 19:52:48.548 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #63
-2026-03-01 19:52:48.548 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:52:48.548 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:52:48.548 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 32)
-2026-03-01 19:52:48.548 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 63)
-2026-03-01 19:52:48.557 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:52:48.557 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:52:48.557 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:52:48.557 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:52:48.557 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 45 total chunks
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #9
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=63 (every 7 acceptances)
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 63 % 7 == 0
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=1, removals_executed=1
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #9 (triggered at 63 acceptances)
-2026-03-01 19:52:48.565 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:52:48.565 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:52:48.565 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:52:48.565 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:52:48.565 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 62 submissions
-2026-03-01 19:52:48.565 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 334817 chars
-2026-03-01 19:52:48.631 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (101101 tokens)
-2026-03-01 19:52:48.631 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:52:48.631 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:52:48.631 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 341003 chars
-2026-03-01 19:52:48.681 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 102402, Max allowed: 1969500
-2026-03-01 19:52:48.681 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:52:48.681 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:52:48.681 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 62 submissions
-2026-03-01 19:52:48.681 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_034
-2026-03-01 19:52:49.663 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:52:49.663 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=512
-2026-03-01 19:52:50.515 - backend.autonomous.core.autonomous_coordinator - INFO - Running completion review at 63 acceptances
-2026-03-01 19:52:50.581 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Direct injection of brainstorm (101101 tokens <= 310000 available)
-2026-03-01 19:52:50.631 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Generating assessment with model openai/gpt-5.2 (prompt=107246t, RAG=False, task_id=auto_cr_010)
-2026-03-01 19:53:24.661 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission c586b4ab-a2a6-4f3a-afe8-5ccd8169cf03 (iteration 35)
-2026-03-01 19:53:27.811 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 85901409-893e-4184-a20f-fbb5106ac397 (iteration 26)
-2026-03-01 19:53:49.176 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validating with SAME model openai/gpt-5.2 (prompt=103166t, RAG=False, task_id=auto_cr_011)
-2026-03-01 19:53:50.764 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:53:50.774 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:53:50.774 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 965 chars
-2026-03-01 19:53:50.774 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": true,
-  "submission_number": 44,
-  "reasoning": "Submission #44 proposes a Benson-type outer-approximation algorithm using Pascoletti-Serafini scalarizations for computing ε-accurate Pareto fronts in convex multi-objective conic programs, with guarantees on the upper image approximation. This is fully covered by submission #41, which presents the same DR-CVO framework (Distributionally Robust Convex Vector Optimization) with identical algorithmic structure, scalarization subproblems, convergence theorems, and ε-approximation properties, explicitly tailored to DRO constraints in the water-energy context. #44 repeats the same mathematical content (e.g., PS scalarization, supporting hyperplanes from duals, Hausdorff error bounds) without adding unique proofs, extensions (e.g., no new handling of DRO-specific non-smoothness), or perspectives. Given the database's growth, #44 now provides no unique value and is the weaker duplicate."
-}
-2026-03-01 19:53:50.774 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': True, 'submission_number': 44, 'reasoning': "Submission #44 proposes a Benson-type outer-approximation algorithm using Pascoletti-Serafini scalarizations for computing ε-accurate Pareto fronts in convex multi-objective conic programs, with guarantees on the upper image approximation. This is fully covered by submission #41, which presents the same DR-CVO framework (Distributionally Robust Convex Vector Optimization) with identical algorithmic structure, scalarization subproblems, convergence theorems, and ε-approximation properties, explicitly tailored to DRO constraints in the water-energy context. #44 repeats the same mathematical content (e.g., PS scalarization, supporting hyperplanes from duals, Hausdorff error bounds) without adding unique proofs, extensions (e.g., no new handling of DRO-specific non-smoothness), or perspectives. Given the database's growth, #44 now provides no unique value and is the weaker duplicate."}
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=True, submission_number=44
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): Submission #44 proposes a Benson-type outer-approximation algorithm using Pascoletti-Serafini scalarizations for computing ε-accurate Pareto fronts in convex multi-objective conic programs, with guarantees on the upper image approximation. This is fully covered by submission #41, which presents the
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: REMOVAL PROPOSED - submission #44
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - Cleanup review: Proposing removal of submission #44 - Submission #44 proposes a Benson-type outer-approximation algorithm using Pascoletti-Serafini scalarizations for computing ε-accurate Pareto fronts in convex multi-objective conic programs, with guara...
-2026-03-01 19:53:50.776 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal={'submission_number': 44, 'reasoning': "Submission #44 proposes a Benson-type outer-approximation algorithm using Pascoletti-Serafini scalarizations for computing ε-accurate Pareto fronts in convex multi-objective conic programs, with guarantees on the upper image approximation. This is fully covered by submission #41, which presents the same DR-CVO framework (Distributionally Robust Convex Vector Optimization) with identical algorithmic structure, scalarization subproblems, convergence theorems, and ε-approximation properties, explicitly tailored to DRO constraints in the water-energy context. #44 repeats the same mathematical content (e.g., PS scalarization, supporting hyperplanes from duals, Hausdorff error bounds) without adding unique proofs, extensions (e.g., no new handling of DRO-specific non-smoothness), or perspectives. Given the database's growth, #44 now provides no unique value and is the weaker duplicate."}
-2026-03-01 19:53:50.776 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: REMOVAL PROPOSED for submission #44
-2026-03-01 19:53:50.776 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Removal reasoning: Submission #44 proposes a Benson-type outer-approximation algorithm using Pascoletti-Serafini scalarizations for computing ε-accurate Pareto fronts in convex multi-objective conic programs, with guarantees on the upper image approximation. This is fully covered by submission #41, which presents the ...
-2026-03-01 19:53:50.776 - backend.aggregator.core.coordinator - INFO - Cleanup review #9: Removal proposed for submission #44
-2026-03-01 19:53:50.776 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 2: Getting content for submission #44...
-2026-03-01 19:53:50.776 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 2 Complete: Got submission content, length=7462 chars
-2026-03-01 19:53:50.776 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 3: Calling validator.validate_removal()...
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 2: REMOVAL VALIDATION START ==========
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Validating removal of submission #44
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Submission content length: 7462 chars
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Removal reasoning length: 892 chars
-2026-03-01 19:53:50.776 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Full database context length: 334817 chars
-2026-03-01 19:53:50.826 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (101101 tokens)
-2026-03-01 19:53:50.826 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:53:50.826 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:53:50.826 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built removal validation prompt with direct injection, length: 348261 chars
-2026-03-01 19:53:50.876 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 104551, Max allowed: 1969500
-2026-03-01 19:53:50.876 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:53:50.876 - backend.aggregator.agents.validator - INFO - Removal validation: Validating proposed removal of submission #44
-2026-03-01 19:53:50.876 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_035
-2026-03-01 19:54:35.339 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 18325a00-6143-4eec-89c3-6a048477aa69 (iteration 36)
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1093 chars
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "decision": "accept",
-  "reasoning": "Submission #44 is genuinely redundant with submission #41. Both describe the identical Benson-type outer-approximation algorithm for computing ε-accurate Pareto fronts in convex multi-objective conic programs using Pascoletti-Serafini scalarizations, supporting hyperplanes from conic duality, and Hausdorff-type error bounds on the upper image approximation. #41 explicitly frames it as DR-CVO tailored to DRO constraints in water-energy systems, including the same PS subproblem formulation, dual cut generation, convergence theorem, and solver-ready implementation template. #44 repeats this mathematical content verbatim (e.g., PS min τ s.t. f(z) ≤ y - τ d, dual w^⊤ y ≥ inf w^⊤ f with w^⊤ d=1, ε-stopping on max τ^⋆(y) ≤ ε) without adding unique proofs, DRO-specific extensions (e.g., handling non-smoothness), implementation details, or perspectives. The claimed distinction from 'λ-grid' submissions is already covered by #41. Removing #44 objectively
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'decision': 'accept', 'reasoning': "Submission #44 is genuinely redundant with submission #41. Both describe the identical Benson-type outer-approximation algorithm for computing ε-accurate Pareto fronts in convex multi-objective conic programs using Pascoletti-Serafini scalarizations, supporting hyperplanes from conic duality, and Hausdorff-type error bounds on the upper image approximation. #41 explicitly frames it as DR-CVO tailored to DRO constraints in water-energy systems, including the same PS subproblem formulation, dual cut generation, convergence theorem, and solver-ready implementation template. #44 repeats this mathematical content verbatim (e.g., PS min τ s.t. f(z) ≤ y - τ d, dual w^⊤ y ≥ inf w^⊤ f with w^⊤ d=1, ε-stopping on max τ^⋆(y) ≤ ε) without adding unique proofs, DRO-specific extensions (e.g., handling non-smoothness), implementation details, or perspectives. The claimed distinction from 'λ-grid' submissions is already covered by #41. Removing #44 objectively improves the database by eliminating duplication while preserving comprehensive coverage."}
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - decision=accept
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): Submission #44 is genuinely redundant with submission #41. Both describe the identical Benson-type outer-approximation algorithm for computing ε-accurate Pareto fronts in convex multi-objective conic programs using Pascoletti-Serafini scalarizations, supporting hyperplanes from conic duality, and Ha
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: REMOVAL APPROVED for submission #44
-2026-03-01 19:54:48.921 - backend.aggregator.agents.validator - INFO - Removal validation: APPROVED removal of submission #44 - Submission #44 is genuinely redundant with submission #41. Both describe the identical Benson-type outer-approximation algorithm for computing ε-accurate Pareto fronts in convex multi-objective conic ...
-2026-03-01 19:54:48.921 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 3 Complete: removal_validated=True
-2026-03-01 19:54:48.921 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 4: Executing removal of submission #44...
-2026-03-01 19:54:48.921 - backend.aggregator.memory.shared_training - INFO - Removed submission #44 from shared training
-2026-03-01 19:54:48.938 - backend.aggregator.memory.shared_training - INFO - Triggering re-chunking callback after removal of submission #44
-2026-03-01 19:54:48.938 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:54:48.938 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 4 Complete: removal_success=True
-2026-03-01 19:54:48.938 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: REMOVAL EXECUTED SUCCESSFULLY for submission #44
-2026-03-01 19:54:48.938 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Total removals executed: 2
-2026-03-01 19:54:48.938 - backend.aggregator.core.coordinator - INFO - Cleanup review #9: Successfully removed submission #44
-2026-03-01 19:54:48.938 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:54:48.938 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: No new submissions to process
-2026-03-01 19:54:48.954 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (Success=True) ==================
-2026-03-01 19:54:48.954 - backend.aggregator.core.coordinator - INFO - Validator iteration 26 - batch validating 3 submissions: ['63a0be3d-e5cc-49e4-8bed-f59e616c9fa3', 'c2ddb538-745b-46fd-9909-71ffc9ca8a49', '1003f0e1-92bb-4308-a786-1d965bb856c7']
-2026-03-01 19:54:48.954 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:54:48.954 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:55:17.586 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission e9fdd653-8073-4c19-a7c5-5a1bd49be395 (iteration 27)
-2026-03-01 19:55:25.751 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation raw content (first 500 chars): {
-  "validated": true,
-  "reasoning": "The continue_brainstorm decision is accurate. The database is extensive on DRO/MPC/RCI/conic hydraulics/quality/Pareto computation and even touches parameter adaptation (conformal, drifting radii, Fisher-information sensor placement, scenario bounds), but it does not yet provide a rigorous, explicit contingency/resilience optimization layer (N-1/N-k component outages with tractable screening/separation and correctness guarantees). It also lacks a true power
-2026-03-01 19:55:25.751 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation result: validated=True
-2026-03-01 19:55:25.751 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation reasoning: The continue_brainstorm decision is accurate. The database is extensive on DRO/MPC/RCI/conic hydraulics/quality/Pareto computation and even touches parameter adaptation (conformal, drifting radii, Fisher-information sensor placement, scenario bounds), but it does not yet provide a rigorous, explicit...
-2026-03-01 19:55:26.968 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission c9589d8b-494e-41e5-b053-bf053e97fa3b (iteration 37)
-2026-03-01 19:55:26.984 - backend.autonomous.core.autonomous_coordinator - INFO - Completion review: CONTINUE BRAINSTORM
-2026-03-01 19:55:47.799 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:55:47.816 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #64
-2026-03-01 19:55:47.816 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:55:47.816 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 9)
-2026-03-01 19:55:47.816 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 64)
-2026-03-01 19:55:47.816 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:55:47.816 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: No new submissions to process
-2026-03-01 19:55:47.840 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #65
-2026-03-01 19:55:47.840 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:55:47.840 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 24)
-2026-03-01 19:55:47.840 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 65)
-2026-03-01 19:55:47.840 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:55:47.840 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:55:47.840 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:55:47.840 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 15 total chunks
-2026-03-01 19:55:47.864 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #66
-2026-03-01 19:55:47.864 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:55:47.864 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:55:47.864 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 33)
-2026-03-01 19:55:47.864 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 66)
-2026-03-01 19:55:47.864 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:55:47.864 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:55:47.864 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:55:47.864 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:55:47.864 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 16 total chunks
-2026-03-01 19:55:47.882 - backend.aggregator.core.coordinator - INFO - Validator iteration 27 - batch validating 3 submissions: ['c586b4ab-a2a6-4f3a-afe8-5ccd8169cf03', '85901409-893e-4184-a20f-fbb5106ac397', '18325a00-6143-4eec-89c3-6a048477aa69']
-2026-03-01 19:55:47.882 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:55:47.882 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:55:48.366 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:55:48.366 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=1024
-2026-03-01 19:56:19.313 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 6f994fd2-0325-4dce-8618-cba988d0e807 (iteration 38)
-2026-03-01 19:56:35.312 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:56:35.328 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #67
-2026-03-01 19:56:35.328 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:56:35.328 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 34)
-2026-03-01 19:56:35.328 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 67)
-2026-03-01 19:56:35.328 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:56:35.328 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:56:35.328 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:56:35.328 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 15 total chunks
-2026-03-01 19:56:35.345 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #68
-2026-03-01 19:56:35.345 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:56:35.345 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:56:35.345 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 25)
-2026-03-01 19:56:35.345 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 68)
-2026-03-01 19:56:35.360 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:56:35.360 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:56:35.360 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:56:35.360 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:56:35.360 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 35 total chunks
-2026-03-01 19:56:35.378 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #69
-2026-03-01 19:56:35.378 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:56:35.378 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:56:35.378 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 35)
-2026-03-01 19:56:35.378 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 69)
-2026-03-01 19:56:35.378 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:56:35.378 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:56:35.378 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:56:35.378 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:56:35.378 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 31 total chunks
-2026-03-01 19:56:35.395 - backend.aggregator.core.coordinator - INFO - Validator iteration 28 - batch validating 3 submissions: ['e9fdd653-8073-4c19-a7c5-5a1bd49be395', 'c9589d8b-494e-41e5-b053-bf053e97fa3b', '6f994fd2-0325-4dce-8618-cba988d0e807']
-2026-03-01 19:56:35.395 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:56:35.395 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:56:36.287 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 19:56:36.287 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 19:56:58.060 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 825bbdd6-dc84-47ac-a22b-a54825033a7a (iteration 10)
-2026-03-01 19:56:59.559 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission fce4ac15-d84a-4814-8a69-8232b3d71e33 (iteration 39)
-2026-03-01 19:57:19.275 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:57:19.303 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #70
-2026-03-01 19:57:19.303 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:57:19.303 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 26)
-2026-03-01 19:57:19.305 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 70)
-2026-03-01 19:57:19.305 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:57:19.307 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:57:19.307 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:57:19.309 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 13 total chunks
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #10
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=70 (every 7 acceptances)
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 70 % 7 == 0
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=2, removals_executed=2
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #10 (triggered at 70 acceptances)
-2026-03-01 19:57:19.326 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 19:57:19.326 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:57:19.326 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 19:57:19.326 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 19:57:19.326 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 68 submissions
-2026-03-01 19:57:19.326 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 368108 chars
-2026-03-01 19:57:19.391 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (110919 tokens)
-2026-03-01 19:57:19.392 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 19:57:19.392 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 19:57:19.392 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 374294 chars
-2026-03-01 19:57:19.443 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 112220, Max allowed: 1969500
-2026-03-01 19:57:19.443 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 19:57:19.443 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 19:57:19.443 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 68 submissions
-2026-03-01 19:57:19.443 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_039
-2026-03-01 19:57:19.609 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 19:57:19.609 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-03-01 19:57:31.673 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 340cc2f0-8a26-4d79-8e4a-e78d0ab45ded (iteration 28)
-2026-03-01 19:57:46.760 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 6a682f24-635b-4892-b0e6-f6eb578f8ed2 (iteration 40)
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 884 chars
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions provide unique mathematical value through distinct theorems, models, or extensions that complement each other without full redundancy or contradiction. For example, core DRO planning (#1, #3) differ in network/aquifer focus and proofs; MPC variants (#5 tube-DR, #7 conformal-robust, #12 CDRO) offer different guarantees (probabilistic feasibility, coverage, adaptation); hydraulics modules (#16 power-cone radial, #21 SOS nonlinear, #28 SDP looped, #45 valve-SDP) target specific topologies/nonlinearities with exactness certificates; martingale bounds (#10 scalar, #30 vector) build hierarchically; no submission is fully covered/superseded by others, and all enhance solution diversity (decentralized #11, min-cut #13, Koopman #15, etc.). Removal would reduce coverage without quality gain."
-}
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions provide unique mathematical value through distinct theorems, models, or extensions that complement each other without full redundancy or contradiction. For example, core DRO planning (#1, #3) differ in network/aquifer focus and proofs; MPC variants (#5 tube-DR, #7 conformal-robust, #12 CDRO) offer different guarantees (probabilistic feasibility, coverage, adaptation); hydraulics modules (#16 power-cone radial, #21 SOS nonlinear, #28 SDP looped, #45 valve-SDP) target specific topologies/nonlinearities with exactness certificates; martingale bounds (#10 scalar, #30 vector) build hierarchically; no submission is fully covered/superseded by others, and all enhance solution diversity (decentralized #11, min-cut #13, Koopman #15, etc.). Removal would reduce coverage without quality gain.'}
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions provide unique mathematical value through distinct theorems, models, or extensions that complement each other without full redundancy or contradiction. For example, core DRO planning (#1, #3) differ in network/aquifer focus and proofs; MPC variants (#5 tube-DR, #7 conformal-robust, #
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 19:58:19.387 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions provide unique mathematical value through distinct theorems, models, or extensions that complement each other without full redundancy or contradiction. For example, core DRO planning (
-2026-03-01 19:58:19.387 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 19:58:19.387 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 19:58:19.387 - backend.aggregator.core.coordinator - INFO - Cleanup review #10: No removal needed
-2026-03-01 19:58:19.387 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 19:58:19.420 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #71
-2026-03-01 19:58:19.420 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:58:19.420 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 36)
-2026-03-01 19:58:19.420 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 71)
-2026-03-01 19:58:19.420 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:58:19.420 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:58:19.420 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:58:19.420 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 19 total chunks
-2026-03-01 19:58:19.438 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #72
-2026-03-01 19:58:19.438 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:58:19.438 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:58:19.438 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 37)
-2026-03-01 19:58:19.438 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 72)
-2026-03-01 19:58:19.454 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:58:19.454 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:58:19.454 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:58:19.454 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 19:58:19.454 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 20 total chunks
-2026-03-01 19:58:19.470 - backend.aggregator.core.coordinator - INFO - Validator iteration 29 - batch validating 3 submissions: ['825bbdd6-dc84-47ac-a22b-a54825033a7a', 'fce4ac15-d84a-4814-8a69-8232b3d71e33', '340cc2f0-8a26-4d79-8e4a-e78d0ab45ded']
-2026-03-01 19:58:19.470 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:58:19.470 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:58:19.970 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-03-01 19:58:19.970 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=512
-2026-03-01 19:58:37.718 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 8e05e964-6be2-4dc1-bc04-3b04f551375a (iteration 29)
-2026-03-01 19:58:47.418 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission dc1c2007-9272-4dc2-b750-55c6339b14a9 (iteration 41)
-2026-03-01 19:59:03.000 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 19:59:03.033 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #73
-2026-03-01 19:59:03.033 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:59:03.033 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 10)
-2026-03-01 19:59:03.033 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 73)
-2026-03-01 19:59:03.033 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:59:03.033 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 19:59:03.033 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 19:59:03.033 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 10 total chunks
-2026-03-01 19:59:03.051 - backend.autonomous.core.autonomous_coordinator - INFO - Running completion review at 73 acceptances
-2026-03-01 19:59:03.051 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #74
-2026-03-01 19:59:03.051 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:59:03.051 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:59:03.051 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 38)
-2026-03-01 19:59:03.051 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 74)
-2026-03-01 19:59:03.069 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:59:03.070 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:59:03.070 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 19:59:03.070 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 19:59:03.072 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 12 total chunks
-2026-03-01 19:59:03.085 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Direct injection of brainstorm (0 tokens <= 310000 available)
-2026-03-01 19:59:03.085 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #75
-2026-03-01 19:59:03.085 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 19:59:03.085 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 19:59:03.085 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 27)
-2026-03-01 19:59:03.085 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 75)
-2026-03-01 19:59:03.099 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 19:59:03.099 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 19:59:03.099 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 19:59:03.099 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 19:59:03.104 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 64 total chunks
-2026-03-01 19:59:03.104 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Generating assessment with model openai/gpt-5.2 (prompt=6069t, RAG=False, task_id=auto_cr_012)
-2026-03-01 19:59:03.117 - backend.aggregator.core.coordinator - INFO - Validator iteration 30 - batch validating 3 submissions: ['6a682f24-635b-4892-b0e6-f6eb578f8ed2', '8e05e964-6be2-4dc1-bc04-3b04f551375a', 'dc1c2007-9272-4dc2-b750-55c6339b14a9']
-2026-03-01 19:59:03.117 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 19:59:03.117 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 19:59:04.150 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-03-01 19:59:04.150 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=256
-2026-03-01 19:59:20.265 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 4e68179e-cc3b-4771-bce3-173d7a400daa (iteration 11)
-2026-03-01 19:59:42.563 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 69de5168-3ceb-4685-98e6-8d6c88d58efe (iteration 42)
-2026-03-01 19:59:45.096 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 3a9f7320-e43f-426b-ab14-c8b68f3479ee (iteration 30)
-2026-03-01 19:59:57.979 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validating with SAME model openai/gpt-5.2 (prompt=1754t, RAG=False, task_id=auto_cr_013)
-2026-03-01 20:00:03.727 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 20:00:03.744 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #76
-2026-03-01 20:00:03.744 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 20:00:03.744 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 39)
-2026-03-01 20:00:03.744 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 76)
-2026-03-01 20:00:03.744 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 20:00:03.744 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 20:00:03.744 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 20:00:03.744 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 9 total chunks
-2026-03-01 20:00:03.767 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #77
-2026-03-01 20:00:03.767 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 20:00:03.767 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 20:00:03.767 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 28)
-2026-03-01 20:00:03.767 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 77)
-2026-03-01 20:00:03.781 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 20:00:03.781 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 20:00:03.781 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 20:00:03.781 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 20:00:03.781 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 22 total chunks
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW START ==================
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - ================================================================================
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Review #11
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Triggered at total_acceptances=77 (every 7 acceptances)
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Trigger condition check: 77 % 7 == 0
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: Stats - removals_proposed=2, removals_executed=2
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - Starting cleanup review #11 (triggered at 77 acceptances)
-2026-03-01 20:00:03.796 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: >>> PHASE 1: Calling validator.perform_cleanup_review()...
-2026-03-01 20:00:03.796 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 20:00:03.796 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: ========== PHASE 1: CLEANUP REVIEW START ==========
-2026-03-01 20:00:03.796 - backend.aggregator.agents.validator - INFO - ============================================================
-2026-03-01 20:00:03.796 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Database has 75 submissions
-2026-03-01 20:00:03.796 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Formatted submissions length: 402779 chars
-2026-03-01 20:00:03.867 - backend.aggregator.core.context_allocator - INFO - Cleanup: All submissions direct injected (121384 tokens)
-2026-03-01 20:00:03.867 - backend.aggregator.core.context_allocator - INFO - Cleanup: All content fits in direct injection - no RAG needed
-2026-03-01 20:00:03.867 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: All submissions fit in direct injection
-2026-03-01 20:00:03.867 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Built cleanup review prompt with direct injection, length: 408965 chars
-2026-03-01 20:00:03.928 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Final prompt tokens: 122685, Max allowed: 1969500
-2026-03-01 20:00:03.928 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Context window: 2000000
-2026-03-01 20:00:03.928 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Prompt size OK, sending to LLM model: x-ai/grok-4.1-fast
-2026-03-01 20:00:03.928 - backend.aggregator.agents.validator - INFO - Cleanup review: Analyzing 75 submissions
-2026-03-01 20:00:03.928 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Calling LLM with max_tokens=30000, temperature=0.0, task_id=agg_val_042
-2026-03-01 20:00:04.245 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 20:00:04.245 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 2 submissions added, chunk_size=768
-2026-03-01 20:00:52.673 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 2c8e0751-fa7c-4e8d-a38f-28aff831cfa8 (iteration 31)
-2026-03-01 20:00:56.090 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission d2272f08-1349-4056-944d-a39e81600f03 (iteration 43)
-2026-03-01 20:00:57.940 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation raw content (first 500 chars): {
-  "validated": true,
-  "reasoning": "The assessment is accurate given the provided context: the brainstorm database is empty and contains none of the claimed 73 submissions or their substance. Therefore, it is impossible to verify whether key technical pillars (contingency/resilience optimization, endogenous grid/market coupling, statistically defensible robustness calibration under nonstationarity/dependence, and reproducible benchmarks) have been covered. In that situation, choosing \"contin
-2026-03-01 20:00:57.940 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation result: validated=True
-2026-03-01 20:00:57.940 - backend.autonomous.agents.completion_reviewer - INFO - CompletionReviewer: Self-validation reasoning: The assessment is accurate given the provided context: the brainstorm database is empty and contains none of the claimed 73 submissions or their substance. Therefore, it is impossible to verify whether key technical pillars (contingency/resilience optimization, endogenous grid/market coupling, stati...
-2026-03-01 20:00:57.957 - backend.autonomous.core.autonomous_coordinator - INFO - Completion review: CONTINUE BRAINSTORM
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM response received: True
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Response has 1 choices
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: LLM output length: 1912 chars
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Raw LLM output (first 1000 chars):
-{
-  "should_remove": false,
-  "submission_number": null,
-  "reasoning": "All submissions contribute unique mathematical value and perspectives that enhance the knowledge base without redundancy, contradictions, or supersession. Core DRO frameworks (#1, #3, #6, #19, #27) differ in ambiguity sets (Wasserstein planning, multistage aquifer-DRO, KL-entropic, moment-Cantelli) and reformulations (SOCP/MI-SOCP theorems). MPC extensions (#2, #5, #7, #12, #20, #32, #43, #47, #53, #61) provide distinct guarantees (viability-RCI, tube-ISS, conformal coverage, CBF safety, zonotope/JSR switched, spectral-graph, interval-monotone). Hydraulics models (#16 power-cone general n, #21 SOCP quadratic radial, #28 SDP looped, #45 valve-chordal SDP, #64 Forchheimer aquifer, #70 GP Hazen-Williams) target different topologies/nonlinearities with unique exactness proofs. Aquifer/quality (#24 exp-sum convolution, #35 SOCP blending, #40 GP bilinear salinity, #55 SOS ADR) add specialized physics. Reliability certif
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Attempting to parse JSON from LLM output...
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: JSON parsed successfully: {'should_remove': False, 'submission_number': None, 'reasoning': 'All submissions contribute unique mathematical value and perspectives that enhance the knowledge base without redundancy, contradictions, or supersession. Core DRO frameworks (#1, #3, #6, #19, #27) differ in ambiguity sets (Wasserstein planning, multistage aquifer-DRO, KL-entropic, moment-Cantelli) and reformulations (SOCP/MI-SOCP theorems). MPC extensions (#2, #5, #7, #12, #20, #32, #43, #47, #53, #61) provide distinct guarantees (viability-RCI, tube-ISS, conformal coverage, CBF safety, zonotope/JSR switched, spectral-graph, interval-monotone). Hydraulics models (#16 power-cone general n, #21 SOCP quadratic radial, #28 SDP looped, #45 valve-chordal SDP, #64 Forchheimer aquifer, #70 GP Hazen-Williams) target different topologies/nonlinearities with unique exactness proofs. Aquifer/quality (#24 exp-sum convolution, #35 SOCP blending, #40 GP bilinear salinity, #55 SOS ADR) add specialized physics. Reliability certificates (#10 martingale variance, #13 min-cut, #22 unimodal, #30 vector Bernstein, #31 EVT tails, #38 copula, #46 Boole allocation, #58 Max-CVaR, #60 anytime CS, #69 EVaR) offer diverse bounds (tail-specific, joint, anytime). Decentralized/strategic (#11 ADMM, #25 DRNE, #39 GNE VI, #42 coalitions) vary in cooperation (cooperative vs Nash vs hedonic). Scalability/high-d (#43 spectral, #48 MMD kernel, #49 coreset quantize, #50 multi-fid, #61 sliced MaxSW, #62 MaxSW graph, #68 MMD RKHS) address dimension curse uniquely. Multi-obj/Pareto (#41 Benson CVO, #67 monotone policies) provide structure/exact fronts. Others (pH passivity #9, Koopman #15, Lyapunov OCO #14, state-price #62, etc.) add control-theoretic/novelty. No submission is fully covered/superseded; each has specific theorems/models/guarantees advancing solution diversity. 
Conservative retention preserves high-quality, comprehensive database.'}
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Parsed fields - should_remove=False, submission_number=None
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: Reasoning (first 300 chars): All submissions contribute unique mathematical value and perspectives that enhance the knowledge base without redundancy, contradictions, or supersession. Core DRO frameworks (#1, #3, #6, #19, #27) differ in ambiguity sets (Wasserstein planning, multistage aquifer-DRO, KL-entropic, moment-Cantelli)
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - CLEANUP DEBUG: NO REMOVAL NEEDED - should_remove is False
-2026-03-01 20:01:33.586 - backend.aggregator.agents.validator - INFO - Cleanup review: No removal needed - All submissions contribute unique mathematical value and perspectives that enhance the knowledge base without redundancy, contradictions, or supersession. Core DRO frameworks (#1, #3, #6, #19, #27) di
-2026-03-01 20:01:33.586 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: <<< PHASE 1 Complete: removal_proposal=None
-2026-03-01 20:01:33.586 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: No removal proposal returned (None) - cleanup review complete
-2026-03-01 20:01:33.586 - backend.aggregator.core.coordinator - INFO - Cleanup review #11: No removal needed
-2026-03-01 20:01:33.586 - backend.aggregator.core.coordinator - INFO - CLEANUP DEBUG: ================== COORDINATOR CLEANUP REVIEW END (No Removal) ==================
-2026-03-01 20:01:33.620 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #78
-2026-03-01 20:01:33.620 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 20:01:33.620 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 40)
-2026-03-01 20:01:33.620 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 78)
-2026-03-01 20:01:33.620 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 20:01:33.620 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 20:01:33.620 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-03-01 20:01:33.620 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 6 total chunks
-2026-03-01 20:01:33.638 - backend.aggregator.core.coordinator - INFO - Validator iteration 31 - batch validating 3 submissions: ['4e68179e-cc3b-4771-bce3-173d7a400daa', '69de5168-3ceb-4685-98e6-8d6c88d58efe', '3a9f7320-e43f-426b-ab14-c8b68f3479ee']
-2026-03-01 20:01:33.638 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 20:01:33.638 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 20:01:33.820 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-03-01 20:01:33.820 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-03-01 20:02:00.067 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission b51ddd62-1016-4284-aedd-684cf1f03230 (iteration 32)
-2026-03-01 20:02:15.799 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 08057c63-26ca-440c-9ce7-9e34d4df0dd3 (iteration 44)
-2026-03-01 20:02:22.882 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission fb03a689-29d8-4288-b257-f7a0e940779c (iteration 12)
-2026-03-01 20:02:31.480 - backend.aggregator.agents.validator - INFO - Batch validation complete: 3/3 accepted
-2026-03-01 20:02:31.481 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #79
-2026-03-01 20:02:31.481 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 20:02:31.481 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 11)
-2026-03-01 20:02:31.497 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 79)
-2026-03-01 20:02:31.497 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 20:02:31.498 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-03-01 20:02:31.498 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-03-01 20:02:31.499 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 17 total chunks
-2026-03-01 20:02:31.517 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #80
-2026-03-01 20:02:31.517 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 20:02:31.517 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 20:02:31.517 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 41)
-2026-03-01 20:02:31.517 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 80)
-2026-03-01 20:02:31.517 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 20:02:31.517 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 20:02:31.517 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 2 new submissions
-2026-03-01 20:02:31.517 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-03-01 20:02:31.517 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 25 total chunks
-2026-03-01 20:02:31.535 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #81
-2026-03-01 20:02:31.535 - backend.aggregator.core.coordinator - WARNING - Previous re-chunking still in progress, cancelling it...
-2026-03-01 20:02:31.535 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-03-01 20:02:31.535 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 29)
-2026-03-01 20:02:31.535 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 81)
-2026-03-01 20:02:31.549 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking cancelled (newer update triggered)
-2026-03-01 20:02:31.549 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-03-01 20:02:31.549 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 3 new submissions
-2026-03-01 20:02:31.549 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-03-01 20:02:31.549 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 33 total chunks
-2026-03-01 20:02:31.566 - backend.aggregator.core.coordinator - INFO - Validator iteration 32 - batch validating 3 submissions: ['2c8e0751-fa7c-4e8d-a38f-28aff831cfa8', 'd2272f08-1349-4056-944d-a39e81600f03', 'b51ddd62-1016-4284-aedd-684cf1f03230']
-2026-03-01 20:02:31.566 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-03-01 20:02:31.567 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-03-01 20:02:32.465 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-03-01 20:02:32.465 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 3 submissions added, chunk_size=768
-2026-03-01 20:02:33.537 - backend.autonomous.core.autonomous_coordinator - INFO - Hard limit of 80 acceptances reached for topic_001. Forcing paper writing transition.
-2026-03-01 20:02:33.548 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
-2026-03-01 20:02:33.548 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
-2026-03-01 20:02:33.548 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
-2026-03-01 20:02:33.565 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
-2026-03-01 20:02:33.582 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 32
-2026-03-01 20:02:33.582 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 32 iterations - is_running=False
-2026-03-01 20:02:33.582 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
-2026-03-01 20:02:33.582 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared shared_training_memory in-memory data (will reload from file when needed)
-2026-03-01 20:02:33.582 - backend.autonomous.core.autonomous_coordinator - INFO - Starting paper compilation for brainstorm topic_001
-2026-03-01 20:02:33.582 - backend.autonomous.core.autonomous_coordinator - INFO - No papers available for additional reference selection
-2026-03-01 20:02:33.599 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Attempt 1
-2026-03-01 20:02:33.599 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Generating title with model openai/gpt-5.2 (task_id=auto_pt_000)
-2026-03-01 20:02:39.573 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Validating with model x-ai/grok-4.1-fast (task_id=auto_pt_001)
-2026-03-01 20:02:45.463 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Title accepted: 'Multi-Objective Wasserstein Distributionally Robust MPC for Renewable-Powered Integrated Water Systems'
-2026-03-01 20:02:45.482 - backend.autonomous.core.autonomous_coordinator - INFO - Compiling paper: Multi-Objective Wasserstein Distributionally Robust MPC for Renewable-Powered Integrated Water Systems
-2026-03-01 20:02:45.482 - backend.autonomous.core.autonomous_coordinator - INFO - Clearing RAG for autonomous paper compilation...
-2026-03-01 20:02:45.482 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-03-01 20:02:45.531 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-03-01 20:02:45.567 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-03-01 20:02:45.597 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-03-01 20:02:45.630 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-03-01 20:02:45.798 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-03-01 20:02:45.848 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-03-01 20:02:45.881 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-03-01 20:02:45.931 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-03-01 20:02:45.948 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-03-01 20:02:45.948 - backend.autonomous.core.autonomous_coordinator - INFO - RAG cleared successfully
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Initializing compiler coordinator...
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_rag_manager - INFO - Resetting compiler RAG manager state...
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager state reset
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_rag_manager - INFO - Initializing compiler RAG manager...
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_rag_manager - INFO - Updating compiler context window from 131072 to 131072
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager initialized
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Skipping Part 1 aggregator database load (autonomous mode)
-2026-03-01 20:02:45.948 - backend.compiler.agents.high_context_submitter - INFO - High-context submitter initialized with model: openai/gpt-5.2
-2026-03-01 20:02:45.948 - backend.compiler.agents.high_context_submitter - INFO - Context budget: 105572 tokens (window: 131072)
-2026-03-01 20:02:45.948 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_context': provider=openrouter, model=openai/gpt-5.2 via Google
-2026-03-01 20:02:45.948 - backend.compiler.agents.high_param_submitter - INFO - High-param submitter initialized with model: moonshotai/kimi-k2.5
-2026-03-01 20:02:45.948 - backend.compiler.agents.high_param_submitter - INFO - Context budget: 105572 tokens (window: 131072)
-2026-03-01 20:02:45.948 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_param': provider=openrouter, model=moonshotai/kimi-k2.5 via Google
-2026-03-01 20:02:45.948 - backend.compiler.validation.compiler_validator - INFO - Compiler validator initialized with model: x-ai/grok-4.1-fast
-2026-03-01 20:02:45.948 - backend.shared.api_client_manager - INFO - Configured role 'compiler_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 20:02:45.948 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Per-paper model tracking enabled for manual compiler mode
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Compiler coordinator initialized successfully
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Autonomous mode enabled - section order: Body → Conclusion → Intro → Abstract
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Clearing paper and outline...
-2026-03-01 20:02:45.948 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 99, 0 words)
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_rag_manager - INFO - Paper is empty, skipping re-chunking
-2026-03-01 20:02:45.948 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 24)
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_rag_manager - INFO - Outline is empty, skipping re-chunking
-2026-03-01 20:02:45.948 - backend.compiler.memory.critique_memory - INFO - Cleared all critiques from critique memory
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique memory
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Cleared rejection/acceptance logs
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Reset per-paper model tracker
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Reset autonomous section phase to body
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Reset critique phase state
-2026-03-01 20:02:45.948 - backend.compiler.core.compiler_coordinator - INFO - Paper and outline cleared - system reset to fresh start
-2026-03-01 20:02:45.948 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared previous paper/outline for fresh paper paper_001
-2026-03-01 20:02:45.948 - backend.autonomous.core.autonomous_coordinator - INFO - Loading brainstorm database into compiler RAG: backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\brainstorms\brainstorm_topic_001.txt
-2026-03-01 20:02:46.048 - backend.aggregator.ingestion.pipeline - INFO - Ingested brainstorm_topic_001.txt: 1202 total chunks
-2026-03-01 20:03:01.713 - backend.aggregator.core.rag_manager - INFO - Added document: backend\data\auto_sessions\solve_the_global_freshwater_scarcity_crisis_entire_2026-03-01_19-20\brainstorms\brainstorm_topic_001.txt
-2026-03-01 20:03:01.713 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm database loaded into compiler RAG
-2026-03-01 20:03:01.713 - backend.compiler.core.compiler_coordinator - INFO - Starting compiler...
-2026-03-01 20:03:01.713 - backend.compiler.core.compiler_coordinator - INFO - Compiler started successfully
-2026-03-01 20:03:01.713 - backend.autonomous.core.autonomous_coordinator - INFO - Compiler started for paper paper_001
-2026-03-01 20:03:01.713 - backend.compiler.core.compiler_coordinator - INFO - Compiler workflow started
-2026-03-01 20:03:01.713 - backend.compiler.core.compiler_coordinator - INFO - Aggregator monitoring started - will check for new acceptances every 30 seconds
-2026-03-01 20:03:01.729 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: None → body
-2026-03-01 20:03:01.729 - backend.compiler.core.compiler_coordinator - INFO - Starting fresh - no existing paper or outline found
-2026-03-01 20:03:01.729 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 20:03:01.729 - backend.compiler.core.compiler_coordinator - INFO - PHASE 1: ITERATIVE OUTLINE CREATION
-2026-03-01 20:03:01.729 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 20:03:01.729 - backend.compiler.core.compiler_coordinator - INFO -
---- Outline Creation Iteration 1/15 ---
-2026-03-01 20:03:01.729 - backend.compiler.agents.high_context_submitter - INFO - Starting outline creation submission generation...
-2026-03-01 20:03:01.729 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:03:01.729 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_create, query_length=146
-2026-03-01 20:03:55.675 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_create in 53.95s (coverage=0.75, tokens=5800)
-2026-03-01 20:03:55.675 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 53907 chars retrieved
-2026-03-01 20:03:55.675 - backend.compiler.agents.high_context_submitter - INFO - Building outline creation prompt...
-2026-03-01 20:03:55.675 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 71118 chars
-2026-03-01 20:03:55.691 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_000)...
-2026-03-01 20:04:53.936 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 16212 chars
-2026-03-01 20:04:53.936 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:04:53.952 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:04:53.952 - backend.compiler.agents.high_context_submitter - INFO - Outline creation submission generated: 4b936420-bf3a-40cd-8fd9-a8a736a675de, outline_complete=True
-2026-03-01 20:04:53.952 - backend.compiler.validation.compiler_validator - INFO - Validating outline_create submission: 4b936420-bf3a-40cd-8fd9-a8a736a675de
-2026-03-01 20:04:53.952 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_create, operation=full_content
-2026-03-01 20:04:53.968 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_000)...
-2026-03-01 20:05:05.734 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:05:05.753 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_create)
-2026-03-01 20:05:05.753 - backend.compiler.core.compiler_coordinator - INFO - ✓ Iteration 1: Outline ACCEPTED
-2026-03-01 20:05:05.753 - backend.compiler.core.compiler_coordinator - INFO -   Validator feedback: The submission is a complete outline that fully matches the required structure: optional Abstract present and correctly formatted, followed by 'I. Introduction' (exact match), multiple body sections (...
-2026-03-01 20:05:05.753 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 20:05:05.753 - backend.compiler.core.compiler_coordinator - INFO - OUTLINE MARKED COMPLETE BY SUBMITTER - LOCKING
-2026-03-01 20:05:05.753 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-03-01 20:05:05.753 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 25)
-2026-03-01 20:05:06.001 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-03-01 20:05:06.017 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 39 total chunks
-2026-03-01 20:05:06.535 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-03-01 20:05:06.535 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-03-01 20:05:06.535 - backend.compiler.memory.outline_memory - INFO - Outline creation feedback cleared
-2026-03-01 20:05:06.535 - backend.compiler.core.compiler_coordinator - INFO - Outline locked after 1 iterations
-2026-03-01 20:05:06.535 - backend.compiler.core.compiler_coordinator - INFO - Starting initial paper loop...
-2026-03-01 20:05:06.535 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=True, phase=body)
-2026-03-01 20:05:06.535 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:05:06.535 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14748 chars, paper=0 chars
-2026-03-01 20:05:06.535 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 0 chars → 0 chars (markers removed)
-2026-03-01 20:05:06.535 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:05:06.535 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=146
-2026-03-01 20:05:58.580 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 52.04s (coverage=0.81, tokens=5834)
-2026-03-01 20:05:58.580 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 53630 chars retrieved
-2026-03-01 20:05:58.580 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:05:58.580 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 81597 chars
-2026-03-01 20:05:58.596 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_001)...
-2026-03-01 20:06:57.274 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13037 chars
-2026-03-01 20:06:57.274 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:06:57.291 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:06:57.291 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 3604d4d2-7e79-42c8-8c1e-8dd0ea5b4c13 (section_complete=False)
-2026-03-01 20:06:57.291 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 3604d4d2-7e79-42c8-8c1e-8dd0ea5b4c13
-2026-03-01 20:06:57.291 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 12102 -> 12101 chars, new_string: 12102 -> 12101 chars)
-2026-03-01 20:06:57.312 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=full_content
-2026-03-01 20:06:57.314 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_001)...
-2026-03-01 20:07:14.340 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:07:14.356 - backend.compiler.memory.paper_memory - INFO - Paper initialized with placeholders (version 100)
-2026-03-01 20:07:14.356 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:07:14.356 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 39 total chunks
-2026-03-01 20:07:14.906 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:07:14.906 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:07:14.906 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:07:14.921 - backend.compiler.core.compiler_coordinator - INFO - Initial paper portion accepted with placeholders! (1527 words)
-2026-03-01 20:07:14.921 - backend.compiler.core.compiler_coordinator - INFO - Initial paper loop complete
-2026-03-01 20:07:14.921 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-03-01 20:07:14.922 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:07:14.922 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:07:14.923 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14748 chars, paper=12488 chars
-2026-03-01 20:07:14.923 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 12488 chars → 12415 chars (markers removed)
-2026-03-01 20:07:14.923 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:07:14.923 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:08:08.872 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 53.95s (coverage=0.94, tokens=5741)
-2026-03-01 20:08:08.872 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 52070 chars retrieved
-2026-03-01 20:08:08.872 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:08:08.872 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 92376 chars
-2026-03-01 20:08:08.872 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_002)...
-2026-03-01 20:09:04.124 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 11951 chars
-2026-03-01 20:09:04.124 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:09:04.129 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:09:04.129 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: a5e44861-e4af-4fd7-96f3-bd335165dcf9 (section_complete=False)
-2026-03-01 20:09:04.140 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: a5e44861-e4af-4fd7-96f3-bd335165dcf9
-2026-03-01 20:09:04.140 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 10473 -> 10471 chars, new_string: 10473 -> 10471 chars)
-2026-03-01 20:09:04.140 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 20:09:04.140 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary of the control layer. Over horizon H, an MPC subproblem will minimize a scalarization of the'...
-2026-03-01 20:09:04.140 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 11808
-2026-03-01 20:09:04.156 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_002)...
-2026-03-01 20:09:14.179 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:09:14.179 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=503, new_string_len=10471
-2026-03-01 20:09:14.179 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 10471 chars (conclusion boundary preserved)
-2026-03-01 20:09:14.195 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 101, 2753 words)
-2026-03-01 20:09:14.424 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:09:14.424 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 72 total chunks
-2026-03-01 20:09:15.313 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:09:15.313 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:09:15.313 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:09:15.329 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (2753 words)
-2026-03-01 20:09:15.329 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:09:15.329 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:09:15.329 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14748 chars, paper=22961 chars
-2026-03-01 20:09:15.329 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 22961 chars → 22888 chars (markers removed)
-2026-03-01 20:09:15.329 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:09:15.329 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:10:23.180 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 67.85s (coverage=0.96, tokens=6318)
-2026-03-01 20:10:23.180 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 55900 chars retrieved
-2026-03-01 20:10:23.196 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:10:23.196 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 106679 chars
-2026-03-01 20:10:23.196 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_003)...
-2026-03-01 20:11:30.443 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 11767 chars
-2026-03-01 20:11:30.459 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:11:30.459 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:11:30.459 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 7f23c051-ec95-41a4-922e-7b227aa9ebfb (section_complete=False)
-2026-03-01 20:11:30.474 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 7f23c051-ec95-41a4-922e-7b227aa9ebfb
-2026-03-01 20:11:30.474 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 10376 -> 10374 chars, new_string: 10376 -> 10374 chars)
-2026-03-01 20:11:30.474 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 20:11:30.474 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary. The remainder of the paper will primarily use Wasserstein balls around empirical distributi'...
-2026-03-01 20:11:30.490 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 22412
-2026-03-01 20:11:30.490 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_003)...
-2026-03-01 20:11:46.226 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:11:46.226 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=372, new_string_len=10374
-2026-03-01 20:11:46.226 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 10374 chars (conclusion boundary preserved)
-2026-03-01 20:11:46.242 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 102, 3969 words)
-2026-03-01 20:11:46.464 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:11:46.480 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 104 total chunks
-2026-03-01 20:11:47.704 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:11:47.704 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:11:47.719 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:11:47.719 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (3969 words)
-2026-03-01 20:11:47.719 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:11:47.719 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:11:47.725 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14748 chars, paper=33337 chars
-2026-03-01 20:11:47.725 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 33337 chars → 33264 chars (markers removed)
-2026-03-01 20:11:47.725 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:11:47.725 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:12:51.667 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 63.94s (coverage=0.94, tokens=5758)
-2026-03-01 20:12:51.667 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 52962 chars retrieved
-2026-03-01 20:12:51.667 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:12:51.667 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 114117 chars
-2026-03-01 20:12:51.683 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_004)...
-2026-03-01 20:14:25.114 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 14848 chars
-2026-03-01 20:14:25.114 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:14:25.130 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:14:25.130 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 6dcba7a1-d3a1-4bbd-821f-f3185f0f8a07 (section_complete=False)
-2026-03-01 20:14:25.130 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 6dcba7a1-d3a1-4bbd-821f-f3185f0f8a07
-2026-03-01 20:14:25.130 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 13327 -> 13222 chars, new_string: 13327 -> 13222 chars)
-2026-03-01 20:14:25.146 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 20:14:25.146 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLET'...
-2026-03-01 20:14:25.146 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 33162
-2026-03-01 20:14:25.146 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_004)...
-2026-03-01 20:14:41.842 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:14:41.842 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=102, new_string_len=13222
-2026-03-01 20:14:41.842 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 102 chars with 13222 chars
-2026-03-01 20:14:41.866 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 103, 5466 words)
-2026-03-01 20:14:42.095 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:14:42.095 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 147 total chunks
-2026-03-01 20:14:43.885 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:14:43.885 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:14:43.888 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:14:43.888 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (5466 words)
-2026-03-01 20:14:43.888 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:14:43.888 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:14:43.888 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14748 chars, paper=46457 chars
-2026-03-01 20:14:43.888 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 46457 chars → 46384 chars (markers removed)
-2026-03-01 20:14:43.888 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:14:43.888 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:15:42.086 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 58.20s (coverage=0.95, tokens=5519)
-2026-03-01 20:15:42.086 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 49783 chars retrieved
-2026-03-01 20:15:42.086 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:15:42.101 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 124058 chars
-2026-03-01 20:15:42.102 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_005)...
-2026-03-01 20:17:00.264 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 15435 chars
-2026-03-01 20:17:00.264 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:17:00.281 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:17:00.281 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 906adcb9-36d5-470e-96d3-fb9df569c1b1 (section_complete=False)
-2026-03-01 20:17:00.297 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 906adcb9-36d5-470e-96d3-fb9df569c1b1
-2026-03-01 20:17:00.297 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 13812 -> 13810 chars, new_string: 13812 -> 13810 chars)
-2026-03-01 20:17:00.315 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 104)
-2026-03-01 20:17:00.315 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:17:00.315 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 20:17:00.315 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary. Section V introduced the basic DRO objects used later in the paper: Wasserstein-robust expe'...
-2026-03-01 20:17:00.315 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 45929
-2026-03-01 20:17:00.332 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_005)...
-2026-03-01 20:17:13.163 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:17:13.163 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=455, new_string_len=13810
-2026-03-01 20:17:13.163 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 13810 chars after anchor
-2026-03-01 20:17:13.180 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 105, 7385 words)
-2026-03-01 20:17:13.430 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:17:13.446 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 189 total chunks
-2026-03-01 20:17:15.678 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:17:15.678 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:17:15.680 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:17:15.680 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (7385 words)
-2026-03-01 20:17:15.680 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
-2026-03-01 20:17:15.680 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:17:15.692 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=14748 chars, paper=60269 chars
-2026-03-01 20:17:15.692 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 60269 chars → 60196 chars (markers removed)
-2026-03-01 20:17:15.692 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:17:15.694 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=146
-2026-03-01 20:18:09.392 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 53.70s (coverage=0.81, tokens=5931)
-2026-03-01 20:18:09.392 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 54281 chars retrieved
-2026-03-01 20:18:09.392 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
-2026-03-01 20:18:09.392 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 141821 chars
-2026-03-01 20:18:09.409 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_006)...
-2026-03-01 20:18:58.673 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 4444 chars
-2026-03-01 20:18:58.673 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:18:58.673 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:18:58.673 - backend.compiler.agents.high_context_submitter - INFO - Outline update submission generated: 5da4ac83-a972-4ac3-9129-f6f4c301eebd
-2026-03-01 20:18:58.673 - backend.compiler.validation.compiler_validator - INFO - Validating outline_update submission: 5da4ac83-a972-4ac3-9129-f6f4c301eebd
-2026-03-01 20:18:58.673 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 0 -> 0 chars, new_string: 3295 -> 3293 chars)
-2026-03-01 20:18:58.690 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_update, operation=insert_after
-2026-03-01 20:18:58.690 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '      4. Unimodality assumptions realism and how to test/relax them'
-2026-03-01 20:18:58.690 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 13999
-2026-03-01 20:18:58.690 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_006)...
-2026-03-01 20:19:17.822 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:19:17.822 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit_to_outline: operation=insert_after, mode=outline_update
-2026-03-01 20:19:17.822 - backend.compiler.core.compiler_coordinator - INFO - Outline insert after: inserted 3293 chars
-2026-03-01 20:19:17.838 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 26)
-2026-03-01 20:19:18.088 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-03-01 20:19:18.088 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 47 total chunks
-2026-03-01 20:19:18.786 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-03-01 20:19:18.787 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-03-01 20:19:18.788 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_update)
-2026-03-01 20:19:18.788 - backend.compiler.core.compiler_coordinator - INFO - Outline update accepted
-2026-03-01 20:19:18.788 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 20:19:18.788 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:19:18.788 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18041 chars, paper=60269 chars
-2026-03-01 20:19:18.788 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 60269 chars → 60196 chars (markers removed)
-2026-03-01 20:19:18.788 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 20:19:18.788 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 86874 chars
-2026-03-01 20:19:18.805 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_007)...
-2026-03-01 20:20:02.935 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1439 chars
-2026-03-01 20:20:02.935 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:20:02.935 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:20:02.935 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 18a0b441-3348-47a6-8c1d-6ee636b5a4b1 (miniscule=False)
-2026-03-01 20:20:02.952 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 18a0b441-3348-47a6-8c1d-6ee636b5a4b1
-2026-03-01 20:20:02.962 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 106)
-2026-03-01 20:20:02.962 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:20:02.968 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 20:20:02.968 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '(a) Quadratic: represent \\(t_e\\ge q_e^2\\) via a rotated second-order cone (RSOC)\n\\[\n(q_e,1,t_e)\\in \\'...
-2026-03-01 20:20:02.968 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 48324
-2026-03-01 20:20:02.985 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_007)...
-2026-03-01 20:20:19.533 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:20:19.533 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=293, new_string_len=574
-2026-03-01 20:20:19.533 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 293 chars with 574 chars
-2026-03-01 20:20:19.534 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 107, 7426 words)
-2026-03-01 20:20:19.749 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:20:19.750 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 190 total chunks
-2026-03-01 20:20:22.017 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:20:22.017 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:20:22.017 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: review)
-2026-03-01 20:20:22.017 - backend.compiler.core.compiler_coordinator - INFO - Review edit accepted (7426 words)
-2026-03-01 20:20:22.033 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 20:20:22.033 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:20:22.034 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18041 chars, paper=60550 chars
-2026-03-01 20:20:22.034 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 60550 chars → 60477 chars (markers removed)
-2026-03-01 20:20:22.034 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 20:20:22.034 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 87155 chars
-2026-03-01 20:20:22.050 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_008)...
-2026-03-01 20:21:18.230 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 5795 chars
-2026-03-01 20:21:18.230 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:21:18.246 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:21:18.246 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: d319279f-08b0-44fc-b622-2ad3c03de81c (miniscule=False)
-2026-03-01 20:21:18.246 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: d319279f-08b0-44fc-b622-2ad3c03de81c
-2026-03-01 20:21:18.246 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 2508 -> 2507 chars, new_string: 2508 -> 2507 chars)
-2026-03-01 20:21:18.263 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 108)
-2026-03-01 20:21:18.263 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:21:18.283 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 20:21:18.283 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'VI.A.3. A conditional exactness result for inequality-relaxed head-loss constraints\n\nThe inequality '...
-2026-03-01 20:21:18.283 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-03-01 20:21:18.283 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=2422 | first20='VI.A.3. A conditiona' | last20='hysical extra head.\n'
-2026-03-01 20:21:18.283 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=60654 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-03-01 20:21:18.295 - backend.compiler.validation.compiler_validator - WARNING - BACKSLASH_NORMALIZED_MATCH: Exact/hyphen/whitespace match failed but found unique backslash-normalized match at pos 50993. This indicates a model over-escaping quirk.
-2026-03-01 20:21:18.295 - backend.compiler.validation.compiler_validator - WARNING -   Model provided (normalized): 'VI.A.3. A conditional exactness result for inequality-relaxed head-loss constraints\n\nThe inequality '...
-2026-03-01 20:21:18.295 - backend.compiler.validation.compiler_validator - WARNING -   Document actual: 'VI.A.3. A conditional exactness result for inequality-relaxed head-loss constraints\n\nThe inequality '...
-2026-03-01 20:21:18.295 - backend.compiler.validation.compiler_validator - INFO - Unicode hyphen normalization applied - updating old_string to actual document text
-2026-03-01 20:21:18.296 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 50993
-2026-03-01 20:21:18.297 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_008)...
-2026-03-01 20:21:28.830 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:21:28.830 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=2420, new_string_len=2507
-2026-03-01 20:21:28.830 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 2420 chars with 2507 chars
-2026-03-01 20:21:28.846 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 109, 7429 words)
-2026-03-01 20:21:29.029 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:21:29.046 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 192 total chunks
-2026-03-01 20:21:31.311 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:21:31.311 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:21:31.315 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: review)
-2026-03-01 20:21:31.317 - backend.compiler.core.compiler_coordinator - INFO - Review edit accepted (7429 words)
-2026-03-01 20:21:31.317 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-03-01 20:21:31.319 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
-2026-03-01 20:21:31.319 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-03-01 20:21:31.319 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-03-01 20:21:31.323 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=18041 chars, paper=60637 chars
-2026-03-01 20:21:31.323 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-03-01 20:21:31.323 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1147
-2026-03-01 20:22:33.509 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 62.19s (coverage=0.90, tokens=5505)
-2026-03-01 20:22:33.509 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 49703 chars
-2026-03-01 20:22:33.509 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-03-01 20:22:33.525 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_000)...
-2026-03-01 20:24:54.958 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1122 chars
-2026-03-01 20:24:54.961 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-03-01 20:24:54.961 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=standard_enhancement, target_section_len=367
-2026-03-01 20:24:54.961 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: standard_enhancement execution...
-2026-03-01 20:24:54.961 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-03-01 20:24:54.961 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1147
-2026-03-01 20:25:57.378 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 62.42s (coverage=0.90, tokens=5505)
-2026-03-01 20:25:57.378 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-03-01 20:25:57.394 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_001)...
-2026-03-01 20:27:00.475 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 692 chars
-2026-03-01 20:27:00.475 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM refused (Step 1 made mistake)
-2026-03-01 20:27:00.475 - backend.compiler.core.compiler_coordinator - INFO - No rigor enhancement needed
-2026-03-01 20:27:00.491 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: rigor)
-2026-03-01 20:27:00.491 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (first rejection)
-2026-03-01 20:27:00.491 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
-2026-03-01 20:27:00.491 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-03-01 20:27:00.491 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:27:00.491 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:27:00.491 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18041 chars, paper=60637 chars
-2026-03-01 20:27:00.491 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 60637 chars → 60564 chars (markers removed)
-2026-03-01 20:27:00.491 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:27:00.491 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:27:55.669 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 55.18s (coverage=0.96, tokens=5505)
-2026-03-01 20:27:55.669 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 48907 chars retrieved
-2026-03-01 20:27:55.669 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:27:55.669 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 140655 chars
-2026-03-01 20:27:55.687 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_009)...
-2026-03-01 20:29:42.232 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 22894 chars
-2026-03-01 20:29:42.232 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:29:42.249 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:29:42.249 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: b882ee42-d12f-4e6e-b07c-38c71d050e9f (section_complete=False)
-2026-03-01 20:29:42.265 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: b882ee42-d12f-4e6e-b07c-38c71d050e9f
-2026-03-01 20:29:42.265 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 20869 -> 20867 chars, new_string: 20869 -> 20867 chars)
-2026-03-01 20:29:42.283 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 110)
-2026-03-01 20:29:42.283 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:29:42.283 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 20:29:42.283 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary. Section VI provided conic-compatible physical modeling layers: (i) convex epigraphs for hea'...
-2026-03-01 20:29:42.283 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 59901
-2026-03-01 20:29:42.299 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_009)...
-2026-03-01 20:29:53.397 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:29:53.397 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=663, new_string_len=20867
-2026-03-01 20:29:53.397 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 20867 chars after anchor
-2026-03-01 20:29:53.413 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 111, 10138 words)
-2026-03-01 20:29:53.701 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:29:53.714 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 259 total chunks
-2026-03-01 20:29:57.030 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:29:57.030 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:29:57.047 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:29:57.047 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (10138 words)
-2026-03-01 20:29:57.047 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:29:57.047 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:29:57.062 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18041 chars, paper=81506 chars
-2026-03-01 20:29:57.062 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 81506 chars → 81433 chars (markers removed)
-2026-03-01 20:29:57.063 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:29:57.063 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:30:54.510 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 57.45s (coverage=0.96, tokens=5813)
-2026-03-01 20:30:54.510 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 51187 chars retrieved
-2026-03-01 20:30:54.510 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:30:54.510 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 163804 chars
-2026-03-01 20:30:54.527 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_010)...
-2026-03-01 20:32:34.855 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 16979 chars
-2026-03-01 20:32:34.855 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:32:34.873 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:32:34.874 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 42f8c651-c4ea-4ead-83e4-db1c1b4077e1 (section_complete=False)
-2026-03-01 20:32:34.879 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 42f8c651-c4ea-4ead-83e4-db1c1b4077e1
-2026-03-01 20:32:34.879 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 15207 -> 15204 chars, new_string: 15207 -> 15204 chars)
-2026-03-01 20:32:34.898 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 112)
-2026-03-01 20:32:34.904 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:32:34.905 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 20:32:34.905 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary. Section VII specified a closed-loop architecture for Wasserstein DRO-MPC in which WDRO cons'...
-2026-03-01 20:32:34.905 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 80821
-2026-03-01 20:32:34.922 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_010)...
-2026-03-01 20:32:41.805 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:32:41.805 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=612, new_string_len=15204
-2026-03-01 20:32:41.805 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 15204 chars after anchor
-2026-03-01 20:32:41.822 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 113, 11969 words)
-2026-03-01 20:32:42.138 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:32:42.155 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 307 total chunks
-2026-03-01 20:32:45.722 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:32:45.722 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:32:45.722 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:32:45.722 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (11969 words)
-2026-03-01 20:32:45.737 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:32:45.737 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:32:45.738 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18041 chars, paper=96712 chars
-2026-03-01 20:32:45.738 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 96712 chars → 96639 chars (markers removed)
-2026-03-01 20:32:45.738 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:32:45.738 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:33:39.233 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 53.48s (coverage=0.94, tokens=5448)
-2026-03-01 20:33:39.233 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 49036 chars retrieved
-2026-03-01 20:33:39.233 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:33:39.234 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 176859 chars
-2026-03-01 20:33:39.252 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_011)...
-2026-03-01 20:34:58.197 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13510 chars
-2026-03-01 20:34:58.197 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:34:58.214 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:34:58.214 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 60114208-777b-46f0-8829-7a3a7e148ae8 (section_complete=False)
-2026-03-01 20:34:58.227 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 60114208-777b-46f0-8829-7a3a7e148ae8
-2026-03-01 20:34:58.227 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11747 -> 11745 chars, new_string: 11747 -> 11745 chars)
-2026-03-01 20:34:58.248 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 114)
-2026-03-01 20:34:58.248 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:34:58.248 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 20:34:58.248 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary.\nSection VIII described time-consistent extensions beyond standard open-loop MPC: rectangula'...
-2026-03-01 20:34:58.248 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 96099
-2026-03-01 20:34:58.265 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_011)...
-2026-03-01 20:35:08.913 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:35:08.914 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=540, new_string_len=11745
-2026-03-01 20:35:08.914 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 11745 chars after anchor
-2026-03-01 20:35:08.930 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 115, 13197 words)
-2026-03-01 20:35:09.247 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:35:09.264 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 345 total chunks
-2026-03-01 20:35:13.497 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:35:13.497 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:35:13.530 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:35:13.530 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (13197 words)
-2026-03-01 20:35:13.530 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:35:13.530 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:35:13.530 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18041 chars, paper=108459 chars
-2026-03-01 20:35:13.530 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 108459 chars → 108386 chars (markers removed)
-2026-03-01 20:35:13.530 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:35:13.530 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 20:36:08.393 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 54.86s (coverage=0.96, tokens=5549)
-2026-03-01 20:36:08.393 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 50038 chars retrieved
-2026-03-01 20:36:08.393 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 20:36:08.393 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 189608 chars
-2026-03-01 20:36:08.427 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_012)...
-2026-03-01 20:37:17.873 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 13353 chars
-2026-03-01 20:37:17.873 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:37:17.890 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:37:17.890 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 0bc29dde-527f-4650-9406-fb12d6892632 (section_complete=False)
-2026-03-01 20:37:17.906 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 0bc29dde-527f-4650-9406-fb12d6892632
-2026-03-01 20:37:17.906 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11764 -> 11762 chars, new_string: 11764 -> 11762 chars)
-2026-03-01 20:37:17.923 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 116)
-2026-03-01 20:37:17.923 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:37:17.923 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 20:37:17.923 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary.\nSection IX presented three scalability layers for WDRO-MPC in high-dimensional uncertainty '...
-2026-03-01 20:37:17.923 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 107747
-2026-03-01 20:37:17.956 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_012)...
-2026-03-01 20:37:25.890 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:37:25.890 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=639, new_string_len=11762
-2026-03-01 20:37:25.890 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 11762 chars after anchor
-2026-03-01 20:37:25.906 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 117, 14706 words)
-2026-03-01 20:37:26.230 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:37:26.256 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 383 total chunks
-2026-03-01 20:37:30.692 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:37:30.692 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:37:30.705 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 20:37:30.706 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (14706 words)
-2026-03-01 20:37:30.706 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
-2026-03-01 20:37:30.706 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:37:30.706 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18041 chars, paper=120223 chars
-2026-03-01 20:37:30.706 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 120223 chars → 120150 chars (markers removed)
-2026-03-01 20:37:30.706 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:37:30.706 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=146
-2026-03-01 20:38:26.685 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 55.98s (coverage=0.81, tokens=5926)
-2026-03-01 20:38:26.685 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 54246 chars retrieved
-2026-03-01 20:38:26.685 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
-2026-03-01 20:38:26.685 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 205033 chars
-2026-03-01 20:38:26.702 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_013)...
-2026-03-01 20:39:12.751 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1658 chars
-2026-03-01 20:39:12.751 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:39:12.751 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:39:12.751 - backend.compiler.agents.high_context_submitter - INFO - Outline update submission generated: 927c57f6-7d26-47cc-896f-558da65fd1d8
-2026-03-01 20:39:12.767 - backend.compiler.validation.compiler_validator - INFO - Validating outline_update submission: 927c57f6-7d26-47cc-896f-558da65fd1d8
-2026-03-01 20:39:12.767 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 0 -> 0 chars, new_string: 690 -> 686 chars)
-2026-03-01 20:39:12.767 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_update, operation=insert_after
-2026-03-01 20:39:12.767 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '   D. Nonlinear water-quality transport (ADR) and polynomial approximations\n      1. Polynomial ADR '...
-2026-03-01 20:39:12.767 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 6183
-2026-03-01 20:39:12.784 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_013)...
-2026-03-01 20:39:27.169 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:39:27.169 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit_to_outline: operation=insert_after, mode=outline_update
-2026-03-01 20:39:27.169 - backend.compiler.core.compiler_coordinator - INFO - Outline insert after: inserted 686 chars
-2026-03-01 20:39:27.178 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 27)
-2026-03-01 20:39:27.407 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-03-01 20:39:27.414 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 49 total chunks
-2026-03-01 20:39:28.042 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-03-01 20:39:28.042 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-03-01 20:39:28.042 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_update)
-2026-03-01 20:39:28.042 - backend.compiler.core.compiler_coordinator - INFO - Outline update accepted
-2026-03-01 20:39:28.042 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 20:39:28.042 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:39:28.042 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18727 chars, paper=120223 chars
-2026-03-01 20:39:28.042 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 120223 chars → 120150 chars (markers removed)
-2026-03-01 20:39:28.058 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 20:39:28.058 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 147514 chars
-2026-03-01 20:39:28.082 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_014)...
-2026-03-01 20:40:13.700 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 3665 chars
-2026-03-01 20:40:13.700 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:40:13.716 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:40:13.716 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 41fb7dcf-68e9-4cce-b940-1783a7926caf (miniscule=False)
-2026-03-01 20:40:13.716 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 41fb7dcf-68e9-4cce-b940-1783a7926caf
-2026-03-01 20:40:13.716 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 1410 -> 1409 chars, new_string: 1410 -> 1409 chars)
-2026-03-01 20:40:13.732 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 118)
-2026-03-01 20:40:13.732 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:40:13.748 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 20:40:13.748 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Corollary 5.2 (Wasserstein-1 bound for Lipschitz losses).\nLet \\(p=1\\), \\(\\Xi=\\mathbb{R}^d\\), and sup'...
-2026-03-01 20:40:13.748 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 35627
-2026-03-01 20:40:13.764 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_014)...
-2026-03-01 20:40:31.875 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:40:31.875 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=1319, new_string_len=1409
-2026-03-01 20:40:31.875 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 1319 chars with 1409 chars
-2026-03-01 20:40:31.875 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 119, 14687 words)
-2026-03-01 20:40:32.317 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:40:32.351 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 384 total chunks
-2026-03-01 20:40:36.830 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:40:36.830 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:40:36.830 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: review)
-2026-03-01 20:40:36.830 - backend.compiler.core.compiler_coordinator - INFO - Review edit accepted (14687 words)
-2026-03-01 20:40:36.843 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 20:40:36.843 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:40:36.843 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18727 chars, paper=120313 chars
-2026-03-01 20:40:36.843 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 120313 chars → 120240 chars (markers removed)
-2026-03-01 20:40:36.843 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 20:40:36.843 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 147604 chars
-2026-03-01 20:40:36.869 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_015)...
-2026-03-01 20:41:17.147 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1800 chars
-2026-03-01 20:41:17.147 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 20:41:17.147 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 20:41:17.147 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: c0de1247-84e8-4ef2-aea8-21f45fa57ffe (miniscule=False)
-2026-03-01 20:41:17.147 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: c0de1247-84e8-4ef2-aea8-21f45fa57ffe
-2026-03-01 20:41:17.163 - backend.compiler.memory.paper_memory - INFO - Repaired missing markers in paper (version 120)
-2026-03-01 20:41:17.163 - backend.compiler.validation.compiler_validator - INFO - Paper markers were missing and have been repaired
-2026-03-01 20:41:17.163 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 20:41:17.163 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Control. Let u_t \\in \\mathbb{R}^{n_u} denote manipulated decisions, e.g.,\n\\nu_t := \\begin{bmatrix} q'...
-2026-03-01 20:41:17.163 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 2139
-2026-03-01 20:41:17.195 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_015)...
-2026-03-01 20:41:52.189 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=False, rigor=True, placement=True)
-2026-03-01 20:41:52.189 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: review)
-2026-03-01 20:41:52.189 - backend.compiler.core.compiler_coordinator - INFO - Review edit rejected
-2026-03-01 20:41:52.189 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-03-01 20:41:52.189 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
-2026-03-01 20:41:52.189 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-03-01 20:41:52.189 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-03-01 20:41:52.205 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=18727 chars, paper=120417 chars
-2026-03-01 20:41:52.205 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-03-01 20:41:52.205 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1147
-2026-03-01 20:43:00.401 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 68.20s (coverage=0.86, tokens=5818)
-2026-03-01 20:43:00.401 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 52546 chars
-2026-03-01 20:43:00.401 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-03-01 20:43:00.417 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_002)...
-2026-03-01 20:44:48.405 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1220 chars
-2026-03-01 20:44:48.405 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-03-01 20:44:48.405 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=standard_enhancement, target_section_len=474
-2026-03-01 20:44:48.405 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: standard_enhancement execution...
-2026-03-01 20:44:48.421 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-03-01 20:44:48.421 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1147
-2026-03-01 20:45:56.645 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 68.22s (coverage=0.86, tokens=5818)
-2026-03-01 20:45:56.645 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-03-01 20:45:56.662 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_003)...
-2026-03-01 20:48:14.692 - backend.shared.openrouter_client - WARNING - OpenRouter connection error for model 'moonshotai/kimi-k2.5' (attempt 1/3): [ReadError] ReadError('')
-2026-03-01 20:52:33.891 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 9467 chars
-2026-03-01 20:52:33.891 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Rigor enhancement submission generated - b2911509-f6db-441f-ac0e-bae6a7f07a54
-2026-03-01 20:52:33.907 - backend.compiler.validation.compiler_validator - INFO - Validating rigor submission: b2911509-f6db-441f-ac0e-bae6a7f07a54
-2026-03-01 20:52:33.923 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=rigor, operation=replace
-2026-03-01 20:52:33.923 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'V. Wasserstein DRO Building Blocks for MPC\n\nThis section collects distributionally robust optimizati'...
-2026-03-01 20:52:33.923 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 33162
-2026-03-01 20:52:33.942 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_016)...
-2026-03-01 20:52:43.807 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 20:52:43.807 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=replace, old_string_len=278, new_string_len=3831
-2026-03-01 20:52:43.807 - backend.compiler.core.compiler_coordinator - INFO - Replace: replaced 278 chars with 3831 chars
-2026-03-01 20:52:43.823 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 121, 15093 words)
-2026-03-01 20:52:44.188 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 20:52:44.220 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 393 total chunks
-2026-03-01 20:52:49.025 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 20:52:49.025 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 20:52:49.040 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: rigor)
-2026-03-01 20:52:49.040 - backend.compiler.core.compiler_coordinator - INFO - Rigor enhancement accepted (15093 words)
-2026-03-01 20:52:49.040 - backend.compiler.agents.high_param_submitter - INFO - Starting rigor enhancement (Step 1: Planning)...
-2026-03-01 20:52:49.040 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Loading document state for planning...
-2026-03-01 20:52:49.040 - backend.compiler.agents.high_param_submitter - INFO - Step 1: State loaded - outline=18727 chars, paper=123970 chars
-2026-03-01 20:52:49.040 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Retrieving relevant paper sections via RAG...
-2026-03-01 20:52:49.040 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1147
-2026-03-01 20:53:57.748 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 68.71s (coverage=0.90, tokens=5762)
-2026-03-01 20:53:57.748 - backend.compiler.agents.high_param_submitter - INFO - Step 1: RAG retrieval complete - 52131 chars
-2026-03-01 20:53:57.748 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Building planning prompt...
-2026-03-01 20:53:57.764 - backend.compiler.agents.high_param_submitter - INFO - Step 1: Generating LLM completion (task_id=comp_hp_004)...
-2026-03-01 20:56:51.580 - backend.compiler.agents.high_param_submitter - INFO - Step 1: LLM completion received - 1328 chars
-2026-03-01 20:56:51.596 - backend.compiler.agents.high_param_submitter - INFO - Step 1: JSON parsed successfully
-2026-03-01 20:56:51.596 - backend.compiler.agents.high_param_submitter - INFO - Step 1 complete: mode=standard_enhancement, target_section_len=367
-2026-03-01 20:56:51.596 - backend.compiler.agents.high_param_submitter - INFO - Starting Step 2: standard_enhancement execution...
-2026-03-01 20:56:51.596 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Retrieving paper sections via RAG...
-2026-03-01 20:56:51.596 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=1147
-2026-03-01 20:58:00.513 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 68.92s (coverage=0.90, tokens=5762)
-2026-03-01 20:58:00.513 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Building execution prompt...
-2026-03-01 20:58:00.529 - backend.compiler.agents.high_param_submitter - INFO - Step 2: Generating LLM completion (task_id=comp_hp_005)...
-2026-03-01 20:59:48.373 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM completion received - 974 chars
-2026-03-01 20:59:48.375 - backend.compiler.agents.high_param_submitter - INFO - Step 2: LLM refused (Step 1 made mistake)
-2026-03-01 20:59:48.376 - backend.compiler.core.compiler_coordinator - INFO - No rigor enhancement needed
-2026-03-01 20:59:48.376 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: rigor)
-2026-03-01 20:59:48.376 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (first rejection)
-2026-03-01 20:59:48.376 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
-2026-03-01 20:59:48.376 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-03-01 20:59:48.376 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 20:59:48.376 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 20:59:48.390 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18727 chars, paper=123970 chars
-2026-03-01 20:59:48.390 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 123970 chars → 123897 chars (markers removed)
-2026-03-01 20:59:48.390 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 20:59:48.391 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 21:00:53.004 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 64.61s (coverage=0.96, tokens=5900)
-2026-03-01 21:00:53.004 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 52797 chars retrieved
-2026-03-01 21:00:53.004 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 21:00:53.004 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 210732 chars
-2026-03-01 21:00:53.027 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_016)...
-2026-03-01 21:01:57.919 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 12962 chars
-2026-03-01 21:01:57.928 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 21:01:57.935 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 21:01:57.935 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 1900d4a7-9cc7-4f5f-9189-b9261d424230 (section_complete=False)
-2026-03-01 21:01:57.935 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 1900d4a7-9cc7-4f5f-9189-b9261d424230
-2026-03-01 21:01:57.935 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11470 -> 11468 chars, new_string: 11470 -> 11468 chars)
-2026-03-01 21:01:57.951 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 21:01:57.951 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary.\nSection X compared several reliability certification layers and how they plug into multi-ob'...
-2026-03-01 21:01:57.951 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 123267
-2026-03-01 21:01:57.969 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_017)...
-2026-03-01 21:02:10.869 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 21:02:10.869 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=630, new_string_len=11468
-2026-03-01 21:02:10.869 - backend.compiler.core.compiler_coordinator - WARNING - AUTO-CORRECTING BOUNDARY VIOLATION: insert_after anchor is after CONCLUSION_PLACEHOLDER. Relocating insertion to just before the placeholder. Original anchor position: 123897, Conclusion placeholder position: 123795
-2026-03-01 21:02:10.869 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 11468 chars (conclusion boundary preserved)
-2026-03-01 21:02:10.885 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 122, 16510 words)
-2026-03-01 21:02:11.253 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 21:02:11.285 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 430 total chunks
-2026-03-01 21:02:16.304 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 21:02:16.304 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 21:02:16.304 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 21:02:16.318 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (16510 words)
-2026-03-01 21:02:16.318 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 21:02:16.318 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 21:02:16.318 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18727 chars, paper=135440 chars
-2026-03-01 21:02:16.318 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 135440 chars → 135367 chars (markers removed)
-2026-03-01 21:02:16.318 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 21:02:16.318 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 21:03:26.532 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 70.21s (coverage=0.83, tokens=5310)
-2026-03-01 21:03:26.532 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 48120 chars retrieved
-2026-03-01 21:03:26.532 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 21:03:26.532 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 217525 chars
-2026-03-01 21:03:26.566 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_017)...
-2026-03-01 21:04:25.180 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 10664 chars
-2026-03-01 21:04:25.191 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 21:04:25.197 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 21:04:25.197 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 1510b2bd-e366-4c5f-b1b0-852ba19c99a8 (section_complete=False)
-2026-03-01 21:04:25.197 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 1510b2bd-e366-4c5f-b1b0-852ba19c99a8
-2026-03-01 21:04:25.197 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 9258 -> 9256 chars, new_string: 9258 -> 9256 chars)
-2026-03-01 21:04:25.212 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 21:04:25.212 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary.\nSection XI defined extension templates for (i) decentralized multi-agent operation via DR-G'...
-2026-03-01 21:04:25.212 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 134703
-2026-03-01 21:04:25.230 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_018)...
-2026-03-01 21:04:35.063 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 21:04:35.063 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=560, new_string_len=9256
-2026-03-01 21:04:35.075 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 9256 chars (conclusion boundary preserved)
-2026-03-01 21:04:35.080 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 123, 17692 words)
-2026-03-01 21:04:35.604 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 21:04:35.630 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 460 total chunks
-2026-03-01 21:04:41.027 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 21:04:41.027 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 21:04:41.027 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 21:04:41.027 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (17692 words)
-2026-03-01 21:04:41.027 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-03-01 21:04:41.027 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 21:04:41.043 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18727 chars, paper=144698 chars
-2026-03-01 21:04:41.043 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 144698 chars → 144625 chars (markers removed)
-2026-03-01 21:04:41.043 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 21:04:41.043 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 21:05:49.579 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 68.54s (coverage=0.94, tokens=5811)
-2026-03-01 21:05:49.579 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 50969 chars retrieved
-2026-03-01 21:05:49.579 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-03-01 21:05:49.579 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 229632 chars
-2026-03-01 21:05:49.610 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_018)...
-2026-03-01 21:07:44.372 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 23140 chars
-2026-03-01 21:07:44.372 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 21:07:44.388 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 21:07:44.388 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 0070aad6-b42a-453a-b70e-0a3d37acd3bf (section_complete=True)
-2026-03-01 21:07:44.388 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 0070aad6-b42a-453a-b70e-0a3d37acd3bf
-2026-03-01 21:07:44.404 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 21247 -> 21245 chars, new_string: 21247 -> 21245 chars)
-2026-03-01 21:07:44.404 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-03-01 21:07:44.404 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Summary.\nSection XII provided two information-centric extension modules: (i) Fisher-information-awar'...
-2026-03-01 21:07:44.404 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 143910
-2026-03-01 21:07:44.439 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_019)...
-2026-03-01 21:07:56.484 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 21:07:56.484 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=611, new_string_len=21245
-2026-03-01 21:07:56.484 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 21245 chars (conclusion boundary preserved)
-2026-03-01 21:07:56.500 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 124, 20408 words)
-2026-03-01 21:07:56.897 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 21:07:56.948 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 525 total chunks
-2026-03-01 21:08:03.296 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 21:08:03.296 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 21:08:03.296 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 21:08:03.311 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=body, paper_words=20408
-2026-03-01 21:08:03.311 - backend.compiler.core.compiler_coordinator - INFO - Body section complete - transitioning to CRITIQUE PHASE
-2026-03-01 21:08:03.311 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:08:03.311 - backend.compiler.core.compiler_coordinator - INFO - STARTING CRITIQUE PHASE
-2026-03-01 21:08:03.311 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:08:03.311 - backend.compiler.core.compiler_coordinator - INFO - Snapshot pre-critique paper: 165945 chars
-2026-03-01 21:08:03.311 - backend.compiler.memory.critique_memory - INFO - Initialized critique memory for paper_v1 at backend\data\critique_feedback_paper_v1.txt
-2026-03-01 21:08:03.311 - backend.compiler.memory.critique_memory - INFO - Cleared all critiques from critique memory
-2026-03-01 21:08:03.311 - backend.compiler.memory.critique_memory - INFO - Critique file is empty
-2026-03-01 21:08:03.311 - backend.compiler.core.compiler_coordinator - INFO - Critique memory initialized for paper_v1
-2026-03-01 21:08:03.311 - backend.compiler.agents.critique_submitter - INFO - Critique submitter initialized with model google/gemini-3.1-pro-preview
-2026-03-01 21:08:03.311 - backend.compiler.memory.critique_rejection_memory - INFO - Loaded 0 critique rejections
-2026-03-01 21:08:03.327 - backend.compiler.agents.critique_submitter - INFO - Critique submitter rejection memory initialized
-2026-03-01 21:08:03.327 - backend.compiler.memory.critique_rejection_memory - INFO - Reset critique rejection log
-2026-03-01 21:08:03.327 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique rejection feedback for fresh start
-2026-03-01 21:08:03.327 - backend.compiler.core.compiler_coordinator - INFO - Critique submitter created with model: google/gemini-3.1-pro-preview
-2026-03-01 21:08:03.327 - backend.shared.api_client_manager - INFO - Configured role 'compiler_critique_submitter': provider=openrouter, model=google/gemini-3.1-pro-preview via Google
-2026-03-01 21:08:03.327 - backend.shared.api_client_manager - INFO - Configured role 'critique_validator': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 21:08:03.327 - backend.shared.api_client_manager - INFO - Configured role 'critique_cleanup': provider=openrouter, model=x-ai/grok-4.1-fast via Novita
-2026-03-01 21:08:03.327 - backend.compiler.core.compiler_coordinator - INFO - Starting critique aggregation loop (target: 5 total attempts, accepted OR rejected)
-2026-03-01 21:08:03.327 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 0/5, accepted: 0, rejected: 0)
-2026-03-01 21:08:15.020 - backend.shared.json_parser - WARNING - No JSON start character found in content (length=873)
-2026-03-01 21:08:15.020 - backend.shared.json_parser - WARNING - Content preview: '**Considering Peer Review Request**\n\nI\'m focusing on the request for a peer review of "Multi-Objective Wasserstein Distributionally Robust MPC for Renewable-Powered Integrated Water Systems." My curre'...
-2026-03-01 21:08:15.020 - backend.shared.json_parser - ERROR - 🚨 MODEL OUTPUT CONTAINS NO JSON STRUCTURE
-2026-03-01 21:08:15.020 - backend.shared.json_parser - ERROR - This indicates the model spent all tokens on reasoning text
-2026-03-01 21:08:15.020 - backend.shared.json_parser - ERROR - Consider: shorter prompts, or explicit 'JSON ONLY' instruction
-2026-03-01 21:08:15.020 - backend.shared.json_parser - ERROR - parse_json: No JSON found in response - only conversational reasoning text (873 chars). Model likely hit max_tokens before writing JSON. Content starts with: '**Considering Peer Review Request**\n\nI\'m focusing on the request for a peer review of "Multi-Objective Wasserstein Distributionally Robust MPC for Renewable-Powered Integrated Water Systems." My curre'
-2026-03-01 21:08:15.021 - backend.compiler.agents.critique_submitter - ERROR - Error generating critique: No JSON found in response - only conversational reasoning text (873 chars). Model likely hit max_tokens before writing JSON. Content starts with: '**Considering Peer Review Request**\n\nI\'m focusing on the request for a peer review of "Multi-Objective Wasserstein Distributionally Robust MPC for Renewable-Powered Integrated Water Systems." My curre'
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\agents\critique_submitter.py", line 167, in submit_critique
-    data = parse_json(llm_output)
-           ^^^^^^^^^^^^^^^^^^^^^^
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\shared\json_parser.py", line 691, in parse_json
-    sanitized_content = sanitize_json_response(response_content)
-                        ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\shared\json_parser.py", line 153, in sanitize_json_response
-    raise ValueError(
-ValueError: No JSON found in response - only conversational reasoning text (873 chars). Model likely hit max_tokens before writing JSON. Content starts with: '**Considering Peer Review Request**\n\nI\'m focusing on the request for a peer review of "Multi-Objective Wasserstein Distributionally Robust MPC for Renewable-Powered Integrated Water Systems." My curre'
-2026-03-01 21:08:15.022 - backend.compiler.core.compiler_coordinator - WARNING - Critique generation returned None - retrying
-2026-03-01 21:08:20.036 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 0/5, accepted: 0, rejected: 0)
-2026-03-01 21:10:35.633 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #1
-2026-03-01 21:10:35.633 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: 4416559b-703b-481d-85f8-fddc24991fc8
-2026-03-01 21:11:01.767 - backend.compiler.memory.critique_memory - INFO - Added critique #1 to critique memory
-2026-03-01 21:11:01.767 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (1/5): 4416559b-703b-481d-85f8-fddc24991fc8
-2026-03-01 21:11:04.780 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 1/5, accepted: 1, rejected: 0)
-2026-03-01 21:13:32.792 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #2
-2026-03-01 21:13:32.792 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: 02f3b344-38fd-4c14-9e0c-051d4fff2571
-2026-03-01 21:13:47.724 - backend.compiler.memory.critique_memory - INFO - Added critique #2 to critique memory
-2026-03-01 21:13:47.724 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (2/5): 02f3b344-38fd-4c14-9e0c-051d4fff2571
-2026-03-01 21:13:50.724 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 2/5, accepted: 2, rejected: 0)
-2026-03-01 21:16:19.620 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #3
-2026-03-01 21:16:19.626 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: f6f377fa-5ef5-4ab6-b9ab-1ed6e119de8f
-2026-03-01 21:16:36.837 - backend.compiler.memory.critique_memory - INFO - Added critique #3 to critique memory
-2026-03-01 21:16:36.837 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (3/5): f6f377fa-5ef5-4ab6-b9ab-1ed6e119de8f
-2026-03-01 21:16:39.850 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 3/5, accepted: 3, rejected: 0)
-2026-03-01 21:20:27.244 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #4
-2026-03-01 21:20:27.244 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: e9ffe2ea-ad61-4dc8-8ec7-d76778060d3c
-2026-03-01 21:20:35.877 - backend.compiler.memory.critique_memory - INFO - Added critique #4 to critique memory
-2026-03-01 21:20:35.877 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (4/5): e9ffe2ea-ad61-4dc8-8ec7-d76778060d3c
-2026-03-01 21:20:38.875 - backend.compiler.core.compiler_coordinator - INFO - Generating critique (attempts: 4/5, accepted: 4, rejected: 0)
-2026-03-01 21:22:12.740 - backend.compiler.agents.critique_submitter - INFO - Critique submitter generated critique #5
-2026-03-01 21:22:12.740 - backend.compiler.core.compiler_coordinator - INFO - Critique generated: a4c3b298-9fed-4d8b-bc53-3273681c6ffb
-2026-03-01 21:22:23.957 - backend.compiler.memory.critique_memory - INFO - Added critique #5 to critique memory
-2026-03-01 21:22:23.957 - backend.compiler.core.compiler_coordinator - INFO - Critique ACCEPTED (5/5): a4c3b298-9fed-4d8b-bc53-3273681c6ffb
-2026-03-01 21:22:26.972 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete: 5 total attempts (5 accepted, 0 rejected)
-2026-03-01 21:22:26.972 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:22:26.973 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete (5 total attempts) - triggering rewrite decision (attempt 1)
-2026-03-01 21:22:26.973 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:22:26.973 - backend.compiler.core.compiler_coordinator - INFO - Critique submitter generating rewrite decision...
-2026-03-01 21:22:53.156 - backend.compiler.agents.critique_submitter - INFO - Rewrite decision generated: partial_revision
-2026-03-01 21:22:53.156 - backend.compiler.core.compiler_coordinator - INFO - Rewrite decision: partial_revision
-2026-03-01 21:22:53.156 - backend.compiler.core.compiler_coordinator - INFO - Validator reviewing rewrite decision...
-2026-03-01 21:22:53.156 - backend.compiler.validation.compiler_validator - INFO - Validating rewrite decision...
-2026-03-01 21:23:02.588 - backend.compiler.validation.compiler_validator - INFO - Rewrite decision VALIDATED: The partial_revision decision is justified. All five accepted critiques identify specific, localized mathematical errors or structural issues: (1) incorrect Loewner order implication in Proposition 12...
-2026-03-01 21:23:02.588 - backend.compiler.core.compiler_coordinator - INFO - Rewrite decision validated - executing
-2026-03-01 21:23:02.588 - backend.compiler.core.compiler_coordinator - INFO - Decision: PARTIAL REVISION (iterative targeted edits)
-2026-03-01 21:23:02.588 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:23:02.588 - backend.compiler.core.compiler_coordinator - INFO - EXECUTING PARTIAL REVISION (ITERATIVE EDITS)
-2026-03-01 21:23:02.588 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:23:02.588 - backend.compiler.core.compiler_coordinator - INFO - Partial revision initiated (pending successful completion, max: 1)
-2026-03-01 21:23:02.588 - backend.compiler.core.compiler_coordinator - INFO - Paper title unchanged
-2026-03-01 21:23:02.605 - backend.compiler.core.compiler_coordinator - INFO - Starting iterative edit loop...
-2026-03-01 21:23:02.605 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 21:23:40.303 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 21:23:40.303 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified a mathematical error in the proof of Proposition 12.1 regarding the Loewner o...
-2026-03-01 21:23:40.303 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 21:23:46.771 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit directly addresses CRITIQUE #1, which identifies a mathematical error in the proof of Proposition 12.1 regarding the invalid Loewner order pr...
-2026-03-01 21:23:46.771 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 21:23:46.771 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 21:24:25.052 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 21:24:25.052 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified a mathematical error in the proof of Proposition 12.1 regarding the Loewner o...
-2026-03-01 21:24:25.052 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 21:24:30.435 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit directly addresses Critique #1 by correcting the mathematical error in the proof of Proposition 12.1. The original proof incorrectly claimed ...
-2026-03-01 21:24:30.435 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 21:24:30.452 - backend.compiler.core.compiler_coordinator - INFO - Requesting edit #1...
-2026-03-01 21:25:08.651 - backend.compiler.agents.critique_submitter - INFO - Iterative edit #1 proposed: replace (more_edits_needed=True)
-2026-03-01 21:25:08.651 - backend.compiler.core.compiler_coordinator - INFO - Edit proposal: replace - Critique #1 identified a mathematical error in the proof of Proposition 12.1 regarding the Loewner o...
-2026-03-01 21:25:08.651 - backend.compiler.validation.compiler_validator - INFO - Validating partial revision edit...
-2026-03-01 21:25:13.701 - backend.compiler.validation.compiler_validator - INFO - Partial revision edit VALIDATED: The edit directly addresses Critique #1 by correcting the mathematical error in the proof of Proposition 12.1. The original proof incorrectly claimed ...
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - ERROR - Error in iterative edit loop: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-Traceback (most recent call last):
-  File "C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-main\backend\compiler\core\compiler_coordinator.py", line 2888, in _execute_partial_revision
-    success = await self._apply_edit(operation, old_string, new_string)
-                    ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-TypeError: CompilerCoordinator._apply_edit() takes 3 positional arguments but 4 were given
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - ERROR - Max consecutive failures (3) reached - stopping iterative loop
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - Iterative edit loop complete: 0 successful, 3 failed
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - Ending critique phase (rewrite=False)
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - Critique phase complete - transitioning to CONCLUSION phase
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - Title unchanged - continuing to conclusion
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - PARTIAL REVISION COMPLETE - Continuing to CONCLUSION
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - ================================================================================
-2026-03-01 21:25:13.701 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (20408 words)
-2026-03-01 21:25:13.701 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: body → conclusion
-2026-03-01 21:25:13.720 - backend.compiler.memory.paper_memory - INFO - Placeholders check: All sections either have placeholders or actual content
-2026-03-01 21:25:13.720 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=conclusion)
-2026-03-01 21:25:13.720 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 21:25:13.736 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18727 chars, paper=165945 chars
-2026-03-01 21:25:13.737 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 165945 chars → 165872 chars (markers removed)
-2026-03-01 21:25:13.737 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-03-01 21:25:13.737 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=647
-2026-03-01 21:26:28.698 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 74.96s (coverage=0.94, tokens=5585)
-2026-03-01 21:26:28.698 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 49290 chars retrieved
-2026-03-01 21:26:28.698 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: conclusion...
-2026-03-01 21:26:28.698 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 248961 chars
-2026-03-01 21:26:28.731 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_019)...
-2026-03-01 21:26:57.697 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 7623 chars
-2026-03-01 21:26:57.701 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 21:26:57.701 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 21:26:57.701 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 83b9f51e-12ae-4aca-8d91-8c22137e2c75 (section_complete=True)
-2026-03-01 21:26:57.714 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 83b9f51e-12ae-4aca-8d91-8c22137e2c75
-2026-03-01 21:26:57.714 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=replace
-2026-03-01 21:26:57.714 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: '[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLET'...
-2026-03-01 21:26:57.714 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 165770
-2026-03-01 21:26:57.746 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_024)...
-2026-03-01 21:27:09.214 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-03-01 21:27:09.245 - backend.compiler.memory.paper_memory - INFO - Placeholder replaced (version 125)
-2026-03-01 21:27:09.663 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-03-01 21:27:09.696 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 547 total chunks
-2026-03-01 21:27:16.646 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-03-01 21:27:16.646 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-03-01 21:27:16.646 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-03-01 21:27:16.663 - backend.compiler.core.compiler_coordinator - INFO - Phase transition requested: current=conclusion, paper_words=21234
-2026-03-01 21:27:16.663 - backend.compiler.core.compiler_coordinator - INFO - Phase transition: conclusion → introduction (explicit section_complete)
-2026-03-01 21:27:16.663 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (21234 words)
-2026-03-01 21:27:16.663 - backend.compiler.core.compiler_coordinator - INFO - Skipping outline update - body construction complete
-2026-03-01 21:27:16.663 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements...
-2026-03-01 21:27:16.663 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-03-01 21:27:16.673 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=18727 chars, paper=172761 chars
-2026-03-01 21:27:16.673 - backend.compiler.agents.high_context_submitter - INFO - Paper stripped: 172761 chars → 172688 chars (markers removed)
-2026-03-01 21:27:16.673 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-03-01 21:27:16.673 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 202196 chars
-2026-03-01 21:27:16.696 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_020)...
-2026-03-01 21:27:16.763 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: conclusion → introduction
-2026-03-01 21:27:58.395 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 1876 chars
-2026-03-01 21:27:58.395 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-03-01 21:27:58.395 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-03-01 21:27:58.395 - backend.compiler.agents.high_context_submitter - INFO - Review submission generated: 94862a12-1c41-4af1-935a-b3f99753c724 (miniscule=False)
-2026-03-01 21:27:58.410 - backend.compiler.validation.compiler_validator - INFO - Validating review submission: 94862a12-1c41-4af1-935a-b3f99753c724
-2026-03-01 21:27:58.410 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 732 -> 731 chars, new_string: 732 -> 731 chars)
-2026-03-01 21:27:58.411 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=review, operation=replace
-2026-03-01 21:27:58.411 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Control. Let u_t \\in \\mathbb{R}^{n_u} denote manipulated decisions, e.g.,\n\\nu_t := \\begin{bmatrix} q'...
-2026-03-01 21:27:58.411 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 2139
-2026-03-01 21:27:58.445 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_025)...
-2026-03-01 21:28:06.464 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coher
\ No newline at end of file
diff --git a/requirements.txt b/requirements.txt
index ff65e9d..ec7f494 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -11,12 +11,12 @@ rank-bm25>=0.2.2
 
 # Data processing
 numpy>=1.26.0
-pydantic>=2.5.3
+pydantic>=2.5.3,<=2.12.4
 pydantic-settings>=2.1.0
 
 # Utilities
 python-dotenv>=1.0.0
-aiofiles>=23.2.1
+aiofiles>=23.2.1,<25.0
 tiktoken>=0.5.2
 
 # PDF generation (headless Chromium via Playwright - full rendering fidelity)

From 20910d1532d03f27d0f878b10ece68837da18f86 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Wed, 8 Apr 2026 20:03:48 -0500
Subject: [PATCH 02/32] Fix CodeQL alerts: secure backend secret storage, safe
 path resolution

---
 .cursor/rules/api-key-controls.mdc            |   4 +-
 ...program-directory-and-file-definitions.mdc |   4 +-
 README.md                                     |  28 +-
 backend/api/main.py                           |  30 +-
 backend/api/routes/autonomous.py              | 164 +++++------
 backend/api/routes/compiler.py                |  12 +
 backend/api/routes/openrouter.py              |  24 +-
 .../autonomous/core/autonomous_coordinator.py |   4 +-
 .../autonomous/memory/final_answer_memory.py  |  42 ++-
 backend/autonomous/memory/paper_library.py    |  25 +-
 .../autonomous/memory/research_metadata.py    |   6 +-
 backend/autonomous/memory/session_manager.py  |  12 +-
 backend/shared/critique_memory.py             | 268 +++++++-----------
 backend/shared/path_safety.py                 |  43 +++
 backend/shared/secret_store.py                |  96 +++++++
 frontend/src/App.jsx                          |  42 +--
 frontend/src/components/BoostControlModal.jsx |  15 +-
 .../src/components/OpenRouterApiKeyModal.jsx  |  50 +++-
 .../autonomous/AutonomousResearchSettings.jsx |  32 +--
 .../components/compiler/CompilerSettings.jsx  |  40 +--
 requirements.txt                              |   1 +
 21 files changed, 540 insertions(+), 402 deletions(-)
 create mode 100644 backend/shared/path_safety.py
 create mode 100644 backend/shared/secret_store.py

diff --git a/.cursor/rules/api-key-controls.mdc b/.cursor/rules/api-key-controls.mdc
index d247fc1..30c1ea0 100644
--- a/.cursor/rules/api-key-controls.mdc
+++ b/.cursor/rules/api-key-controls.mdc
@@ -192,6 +192,8 @@ Predictions refresh: after initialization, each task completion, mode switches,
 
 ## Configuration Persistence
 
-**localStorage:** `openrouter_api_key`, `workflow_panel_collapsed`, `aggregatorConfig`, `compiler_settings`, `autonomousConfig` (includes `freeModelLooping`, `freeModelAutoSelector`)
+**Secure backend storage (OS keyring):** OpenRouter global API key and Wolfram Alpha API key persist via `backend/shared/secret_store.py` using the OS keychain/keyring. Restored into backend memory on startup in `backend/api/main.py`.
+
+**localStorage:** `workflow_panel_collapsed`, `aggregatorConfig`, `compiler_settings`, `autonomousConfig` (includes `freeModelLooping`, `freeModelAutoSelector`)
 
 **Session (in-memory):** fallback state per role, boosted task IDs, boost next count, boosted categories, completed task IDs, free model manager state. Boost logs persist to file (`boost_api_log.txt`).
diff --git a/.cursor/rules/program-directory-and-file-definitions.mdc b/.cursor/rules/program-directory-and-file-definitions.mdc
index 4dea653..86e5844 100644
--- a/.cursor/rules/program-directory-and-file-definitions.mdc
+++ b/.cursor/rules/program-directory-and-file-definitions.mdc
@@ -28,7 +28,9 @@ project-root/
 │   │   ├── utils.py                     # Common utilities
 │   │   ├── json_parser.py               # JSON parsing with sanitization for LLM quirks
 │   │   ├── critique_memory.py           # Paper critique persistence (saves up to 10 validator critiques per paper)
-│   │   └── critique_prompts.py          # Default critique prompt and builder function for validator critiques 
+│   │   ├── critique_prompts.py          # Default critique prompt and builder function for validator critiques
+│   │   ├── secret_store.py              # Secure API key persistence via OS keyring (OpenRouter, Wolfram Alpha)
+│   │   └── path_safety.py               # Safe path resolution helpers (realpath/normpath containment checks)
 │   ├── aggregator/                      # AGGREGATOR 
 │   │   ├── __init__.py
 │   │   ├── core/
diff --git a/README.md b/README.md
index a737b0a..c6ab89f 100644
--- a/README.md
+++ b/README.md
@@ -1,12 +1,12 @@
-# MOTO - S.T.E.M. Mathematics Variant
-# Autonomous AI/ASI Deep Research Harness
+# MOTO Autonomous ASI - Novel S.T.E.M. Solution Variant for ASI Automated Theory Generation
+# Autonomous Superintelligence Deep Research Harness
 **Version: 1.0.5**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
 [![Node.js 16+](https://img.shields.io/badge/node-16+-green.svg)](https://nodejs.org/)
 
-**A breakthrough in AI and autonmated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration changes how we look at AI weights, a specific combination of reiterative brainstorming, validation, feedback, pruning allow for superintelligence exploration and data extraction from nearly any combination of AI models. This is useful for any discipline with an interest in creative and novel solution generation for mathematics: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for other research topics such as general academic research, chat bots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
+**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers, powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration changes how we look at AI weights: a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and data extraction from nearly any combination of AI models. This is useful for any discipline with an interest in creative and novel solution generation for mathematics: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for other research topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
 
 ### The Core Discovery: Top-P Exploration (Solution Basin Aggregation)
 
@@ -20,9 +20,7 @@ Once a brainstorm is sufficiently explored, MOTO writes a research paper from it
 
 MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its experimental mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models over 131,000 token context limits, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is an experimental system; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
 
-MOTO may produce many brilliant papers as it runs, these start-up papers are answers that rival traditional paid cloud deep research functions. As the user, observe MOTO as often or as little as you'd like - skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its experimental mode, a final answer beyond the growing collection of related papers. In this mode, we have found quality can vary - however that is because MOTO is capable of autonomously deciding if it should output a shortform answer, like traditional cloud deep research - or whether to collect existing pre-final answer papers and write a long-form academic volume. With models over 131,000 token context limits, the harness is easily capable of producing final volumes with over 40,000 words, and MOTO produces this book-length content autonomously. It should be noted that this long-form answer is often so detailed that for any AI critique it requires the system to fully direct-inject the paper content. Providing an attempt at a novel 40,000 academic volume to a cloud agent using RAG (summarization-like techniques) may provide mixed results. MOTO strives to direct inject all content where possible. The built in “critique” feature allows the user to direct inject the full 40,000+ word volume into nearly any AI model of their choice. If the system decides to do a long form answer it will collect any relevant papers it has written, take only the best and related ones, organize them into chapters, write any gap papers, write the conclusion, and then lastly write the introduction chapter. This reverse order, body first, conclusion second, then introduction portion(s) last is crucial to allow MOTO the ability to be creative as it write. 
The traditional introduction -> body -> conclusion writing style ensures we limit any non-Markovian constraints on the creative process. In other words, if the system wrote its introduction first, the body paragraphs are locked in and bound to the rules the introduction set. Writing the body section first gives the system greater freedom to discover as it writes as it is not bound by a detailed introduction. MOTO is an experimental system, the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
-
-Give the program a try, MOTO is as cool as it sounds – there is a one-click installer. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green “< > Code” drop-down menu on the top right of this GitHub page, download the zip file, extract it to your desktop then double-click "Press to Launch MOTO.bat". Put in your OpenRouter.AI API key (or optionally connect LM studio for faster  performance), select your agents in the settings profile – if desired and you are unsure you may use the preselected “fastest” profile.
+Give the program a try, MOTO is as cool as it sounds – there is a one-click installer. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green “< > Code” drop-down menu on the top right of this GitHub page, download the zip file, extract it to your desktop then double-click "Press to Launch MOTO.bat". Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), select your agents in the settings profile – if desired and you are unsure you may use the preselected “fastest” profile.
 
 ***Now you are set up and every time you press launch your home lab is ready for your prompt!*** **Give MOTO the toughest question you can think of and press start to begin YOUR creations!**
 
@@ -32,12 +30,12 @@ Give the program a try, MOTO is as cool as it sounds – there is a one-click in
 
 ## Outline of "MOTO - S.T.E.M. Mathematics Variant"
 
-MOTO (Multi-Output Token Orchestrator) is a high-risk high-reward (novelty seeking AI) mathematics researcher designed to run for days at a time after pressing start without user interaction. This program can support multiple simultaneous models working in parallel from either local host LM studio, OpenRouter API key, or both.
+MOTO (Multi-Output Token Orchestrator) is a high-risk high-reward (novelty seeking AI) mathematics researcher designed to run for days at a time after pressing start without user interaction. This program can support multiple simultaneous models working in parallel from either local host LM Studio, OpenRouter API key, or both.
 
 ### Key Features
 
 - 🤖 **Autonomous Topic Selection, Brainstorming, and Paper Generation**: AI chooses research avenues based on high-level goals and produces you a final answer with ZERO extra user input. Let MOTO run for days using the best models without touching it, or for a few hours using a faster draft model. How deep you research and how long it takes is left up to you, the user.
-- **OpenRouter Integration**: Supports both local (LM Studio) and cloud (OpenRouter) models. Use your local LM studio models ran offline from your computer or add your OpenRouter API key to compete and team up 3rd party models from the largest closed source LLMs like ChatGPT, Claude, DeepSeek, Gemini and Perplexity
+- **OpenRouter Integration**: Supports both local (LM Studio) and cloud (OpenRouter) models. Use your local LM Studio models run offline from your computer or add your OpenRouter API key to compete and team up 3rd party models from the largest closed source LLMs like ChatGPT, Claude, DeepSeek, Gemini and Perplexity
 
 ---
 
@@ -50,9 +48,9 @@ Before installation, you need:
 1. **Python 3.8+** - [Download here](https://www.python.org/downloads/)
    - ⚠️ **IMPORTANT**: Check "Add Python to PATH" during installation
 2. **Node.js 16+** - [Download here](https://nodejs.org/)
-3. **LM Studio** (optional but HIGHLY recommended - otherwise your system will need to pay OpenRouter for RAG embedding calls, which is very slow compared to LM studio's local embeddings) - [Download here](https://lmstudio.ai/)
-   - If using open router, then download and load at least one model (e.g., DeepSeek, Llama, Qwen - older models and some models below 12 billion parameters may struggle, however it is always worth a try!)
-   - **Load the LM Studio RAG agent [optional but HIGHLY recommended for much faster outputs/answers]**: Load the embedding model `nomic-ai/nomic-embed-text-v1.5` in your LM studio "Developer" tab (server tab) (search for "nomic-ai/nomic-embed-text-v1.5" to download it in the LM studio downloads center). Please note: you may need to enable "Power User" or "Developer" to see this developer tab - this server will let you load the amount and capacity of simultaneous models that your PC will suport. In this develop tab is where you load both your nomic-ai embedding agent and any optional local hosted agents you want to use in the program (I.e. GPT OSS 20b, DeepSeek 32B, etc). **If you do not not download LM studio and enable the Nomic agent the system will run much slower and cost a slightly more due to having to use the paid service OpenRouter for RAG calls.**
+3. **LM Studio** (optional but HIGHLY recommended - otherwise your system will need to pay OpenRouter for RAG embedding calls, which is very slow compared to LM Studio's local embeddings) - [Download here](https://lmstudio.ai/)
+   - If using OpenRouter, then download and load at least one model (e.g., DeepSeek, Llama, Qwen - older models and some models below 12 billion parameters may struggle, however it is always worth a try!)
+   - **Load the LM Studio RAG agent [optional but HIGHLY recommended for much faster outputs/answers]**: Load the embedding model `nomic-ai/nomic-embed-text-v1.5` in your LM Studio "Developer" tab (server tab) (search for "nomic-ai/nomic-embed-text-v1.5" to download it in the LM Studio downloads center). Please note: you may need to enable "Power User" or "Developer" to see this developer tab - this server will let you load the amount and capacity of simultaneous models that your PC will support. This developer tab is where you load both your nomic-ai embedding agent and any optional locally hosted agents you want to use in the program (e.g., GPT OSS 20b, DeepSeek 32B, etc.). **If you do not download LM Studio and enable the Nomic agent the system will run much slower and cost slightly more due to having to use the paid service OpenRouter for RAG calls.**
    - Start the local server (port 1234)
 4. **If using cloud AI - Get an OpenRouter API key**: Sign up at OpenRouter.ai and get a paid or free API key to use the most powerful cloud models available from your favorite providers. OpenRouter may also offer a certain amount of free API calls per day with your account key. When you download the MOTO deep research harness, you can see which models are free by checking the "show only free models" check box(es) in the MOTO app settings.
 5. **On first startup, pick your provider path**: After you acknowledge the disclaimer, MOTO will prompt you to either enter an OpenRouter key or confirm that LM Studio is running. If you save an OpenRouter key there, the recommended default autonomous profile is applied immediately so you can open Settings and see it already selected.
@@ -127,7 +125,7 @@ Before installation, you need:
 - **Backend**: Python 3.8+, FastAPI, Uvicorn
 - **Frontend**: React, Vite, Tailwind CSS
 - **AI**: LM Studio API, OpenRouter API
-- **RAG**: ChromaDB, Nomic Embeddings, or OpenRouter embeddings fallback if LM studio is unavailable (not recommended - slower).
+- **RAG**: ChromaDB, Nomic Embeddings, or OpenRouter embeddings fallback if LM Studio is unavailable (not recommended - slower).
 - **WebSocket**: Real-time updates
 
 ### Key Components
@@ -233,7 +231,7 @@ All configurable per role:
 - Review validator reasoning in logs
 - Ensure prompt is clear and specific
 - Use larger models for better results
-- View the learning curve analysis on the Intrafere.com website and ensure you are not just at a learning curve wall - 100's of rejections in a row before the first acceptance in the brainstorming session can be common.
+- View the learning curve analysis on the Intrafere.com website and ensure you are not just at a learning curve wall - 100s of rejections in a row before the first acceptance in the brainstorming session can be common.
 
 **System running slow**
 - Use faster/smaller models
@@ -253,10 +251,10 @@ All configurable per role:
 - Check logs for detailed token usage
 
 **JSON and output errors**
-- Monitor your model(s) output(s) occassionally to see if its stuck in output loops and is repeatedly utilizing its entire output token budget - this is a sign the model runtime instance from either LM Studio or OpenRouter has corrupted. If this is the case you will either need to Switch OpenRouter hosts for that model, switch models, or if using LM studio you must unload and reload the model. However if this happens once, it is likely to happen again so you should either try to switch hosts (if using OpenRouter), switch runtime engines (if using LM studio), or switch models entirely as some models may be more vulnerable to this than others. This issue does not appear to be related to MOTO harness and the MOTO developers have no control over this deterministic model-loop corruption state. The repetitive nature of the harness appear to stress certain engines, for example when using AMD comptable engines, ROCm *may* have more instabilities than Vulkan as of 1/11/2026. This is an odd bug and it is unclear if this is related to the 3rd party runtime engine's K/V caching mechanism or some other feature of the code. If you find any information on this bug please submit it to the GitHub.
+- Monitor your model(s) output(s) occasionally to see if it's stuck in output loops and is repeatedly utilizing its entire output token budget - this is a sign the model runtime instance from either LM Studio or OpenRouter has corrupted. If this is the case you will either need to switch OpenRouter hosts for that model, switch models, or if using LM Studio you must unload and reload the model. However if this happens once, it is likely to happen again so you should either try to switch hosts (if using OpenRouter), switch runtime engines (if using LM Studio), or switch models entirely as some models may be more vulnerable to this than others. This issue does not appear to be related to the MOTO harness and the MOTO developers have no control over this deterministic model-loop corruption state. The repetitive nature of the harness appears to stress certain engines, for example when using AMD compatible engines, ROCm *may* have more instabilities than Vulkan as of 1/11/2026. This is an odd bug and it is unclear if this is related to the 3rd party runtime engine's K/V caching mechanism or some other feature of the code. If you find any information on this bug please submit it to GitHub.
 
 **JSON truncation errors**
-- Ensure you are not experiencing the output error looping mentioned above that some LLM runtime engines seem to experience, if your JSON truncation is not a result of looping then you should try increasing your models max output tokens. It is highly likely that your model was truncated because you did not set enough output tokens (20% or more of your token budget being allotted for token output is standard practice, longer thinking models like DeepSeek V3.2 Speciale may require much larger splits such as (164K total tokens, 64K reserved for output tokens), however most models function great closer to the 20% output budget mark.
+- Ensure you are not experiencing the output error looping mentioned above that some LLM runtime engines seem to experience. If your JSON truncation is not a result of looping then you should try increasing your model's max output tokens. It is highly likely that your model was truncated because you did not set enough output tokens. Allotting 20% or more of your token budget to output is standard practice; longer thinking models like DeepSeek V3.2 Speciale may require much larger splits (e.g., 164K total tokens with 64K reserved for output tokens), however most models function great closer to the 20% output budget mark.
 ---
 
 ## 📚 Documentation
diff --git a/backend/api/main.py b/backend/api/main.py
index 4639098..b78f433 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -8,6 +8,7 @@
 from backend.api.middleware import setup_middleware
 from backend.api.routes import aggregator, websocket, compiler, autonomous, boost, workflow, openrouter, download
 from backend.shared.lm_studio_client import lm_studio_client
+from backend.shared.config import rag_config, system_config
 from backend.aggregator.core.coordinator import coordinator
 from backend.compiler.core.compiler_coordinator import compiler_coordinator
 from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
@@ -30,6 +31,34 @@ async def lifespan(app: FastAPI):
     """Lifespan events for the FastAPI app."""
     # Startup
     logger.info("Starting ASI Aggregator System...")
+
+    # Restore securely persisted provider credentials before the UI checks status.
+    from backend.shared.api_client_manager import api_client_manager
+    try:
+        from backend.shared.secret_store import (
+            SecretStoreError,
+            load_openrouter_api_key,
+            load_wolfram_api_key,
+        )
+        from backend.shared.wolfram_alpha_client import initialize_wolfram_client
+
+        openrouter_api_key = load_openrouter_api_key()
+        if openrouter_api_key:
+            rag_config.openrouter_api_key = openrouter_api_key
+            rag_config.openrouter_enabled = True
+            api_client_manager.set_openrouter_api_key(openrouter_api_key)
+            logger.info("Restored OpenRouter API key from secure backend storage")
+
+        wolfram_api_key = load_wolfram_api_key()
+        if wolfram_api_key:
+            initialize_wolfram_client(wolfram_api_key)
+            system_config.wolfram_alpha_api_key = wolfram_api_key
+            system_config.wolfram_alpha_enabled = True
+            logger.info("Restored Wolfram Alpha API key from secure backend storage")
+    except SecretStoreError as e:
+        logger.warning(f"Secure credential storage unavailable on startup: {e}")
+    except Exception as e:
+        logger.warning(f"Failed to restore provider credentials on startup: {e}")
     
     # Test LM Studio connection (non-blocking - system works without it)
     connected = await lm_studio_client.test_connection()
@@ -78,7 +107,6 @@ async def lifespan(app: FastAPI):
     boost_manager.set_broadcast_callback(websocket.broadcast_event)
     
     # Set API client manager broadcaster (token tracking, rate limits, fallbacks)
-    from backend.shared.api_client_manager import api_client_manager
     api_client_manager.set_broadcast_callback(websocket.broadcast_event)
     
     logger.info("ASI Aggregator System ready")
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index e101281..b07716b 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -4,17 +4,20 @@
 """
 import asyncio
 import logging
-import os
 from pathlib import Path
 from typing import Optional, Any, Dict
 from fastapi import APIRouter, HTTPException, BackgroundTasks
 
 from backend.shared.models import AutonomousResearchStartRequest, CritiqueRequest
+from backend.shared.path_safety import (
+    resolve_path_within_root,
+    validate_single_path_component,
+)
 from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
 from backend.autonomous.memory.research_metadata import research_metadata, ResearchMetadata
 from backend.autonomous.memory.brainstorm_memory import brainstorm_memory, BrainstormMemory
 from backend.autonomous.memory.paper_library import paper_library, PaperLibrary
-from backend.autonomous.memory.final_answer_memory import final_answer_memory
+from backend.autonomous.memory.final_answer_memory import final_answer_memory, FinalAnswerMemory
 from backend.autonomous.memory.session_manager import session_manager
 from backend.autonomous.memory.autonomous_api_logger import autonomous_api_logger
 from backend.aggregator.core.coordinator import coordinator
@@ -38,7 +41,9 @@ def _validate_history_session_id(session_id: str) -> None:
     if session_id == "legacy":
         return
 
-    if session_id in {".", ".."} or "/" in session_id or "\\" in session_id:
+    try:
+        validate_single_path_component(session_id, "session ID")
+    except ValueError:
         raise HTTPException(status_code=400, detail=f"Invalid session ID: {session_id}")
 
 
@@ -72,10 +77,12 @@ def _resolve_history_session_paths(session_id: str) -> Dict[str, Path]:
             "workflow_state_path": Path(system_config.auto_workflow_state_file),
         }
     else:
-        sessions_root = Path(system_config.auto_sessions_base_dir).resolve()
-        session_root = (sessions_root / session_id).resolve()
-
-        if session_root.parent != sessions_root:
+        try:
+            session_root = resolve_path_within_root(
+                Path(system_config.auto_sessions_base_dir),
+                validate_single_path_component(session_id, "session ID"),
+            )
+        except ValueError:
             raise HTTPException(status_code=400, detail=f"Invalid session ID: {session_id}")
 
         if not session_root.exists():
@@ -98,6 +105,34 @@ def _resolve_history_session_paths(session_id: str) -> Dict[str, Path]:
     return paths
 
 
+def _resolve_final_answer_dir(answer_id: str) -> Path:
+    """Resolve an existing legacy/session final-answer directory; raises HTTP 400 for an invalid ID, 404 if absent."""
+    from backend.shared.config import system_config
+
+    if answer_id == "legacy":
+        base_dir = Path(system_config.data_dir) / "auto_final_answer"
+    else:
+        try:
+            session_dir = resolve_path_within_root(
+                Path(system_config.auto_sessions_base_dir),
+                validate_single_path_component(answer_id, "final answer ID"),
+            )
+        except ValueError:
+            raise HTTPException(status_code=400, detail=f"Invalid final answer ID: {answer_id}")
+
+        base_dir = session_dir / "final_answer"
+
+    if not base_dir.exists():
+        raise HTTPException(status_code=404, detail=f"Final answer not found: {answer_id}")
+
+    return base_dir
+
+
+def _build_scoped_final_answer_memory(answer_id: str) -> FinalAnswerMemory:
+    """Create a temporary FinalAnswerMemory rooted at one validated answer directory."""
+    return FinalAnswerMemory.build_scoped_memory(_resolve_final_answer_dir(answer_id))
+
+
 def _build_scoped_paper_library(paths: Dict[str, Path]) -> PaperLibrary:
     """Create a temporary PaperLibrary rooted at one legacy/session papers directory."""
     scoped_library = PaperLibrary()
@@ -194,7 +229,7 @@ async def _generate_autonomous_paper_critique(
     paper_id: str,
     paper_title: str,
     content: str,
-    base_path: str,
+    base_dir: Path,
     request: Optional[CritiqueRequest] = None,
 ) -> Dict[str, Any]:
     """Generate and persist a critique for an autonomous Stage 2 paper."""
@@ -281,7 +316,7 @@ async def _generate_autonomous_paper_critique(
         full_critique=critique_data.get("full_critique", ""),
     )
 
-    saved_critique = await save_critique("autonomous_paper", critique, paper_id, base_path)
+    saved_critique = await save_critique("autonomous_paper", critique, paper_id, base_dir)
     return {
         "success": True,
         "critique": saved_critique.model_dump(),
@@ -294,12 +329,12 @@ async def _get_autonomous_paper_critiques_response(
     *,
     paper_id: str,
     paper_title: str,
-    base_path: str,
+    base_dir: Path,
 ) -> Dict[str, Any]:
     """Load critique history for an autonomous Stage 2 paper."""
     from backend.shared.critique_memory import get_critiques
 
-    critiques = await get_critiques("autonomous_paper", paper_id, base_path)
+    critiques = await get_critiques("autonomous_paper", paper_id, base_dir)
     return {
         "success": True,
         "paper_id": paper_id,
@@ -338,7 +373,7 @@ async def _delete_autonomous_paper_from_scope(
         raise HTTPException(status_code=404, detail=f"Paper not found: {paper_id}")
 
     paper_path = scoped_paper_library.get_paper_path(paper_id)
-    base_path = os.path.dirname(paper_path)
+    base_dir = Path(paper_path).parent
     source_brainstorms = metadata.source_brainstorm_ids or []
 
     success = await scoped_paper_library.delete_paper(paper_id)
@@ -359,7 +394,7 @@ async def _delete_autonomous_paper_from_scope(
             )
 
     try:
-        await clear_critiques("autonomous_paper", paper_id, base_path)
+        await clear_critiques("autonomous_paper", paper_id, base_dir)
         logger.info(f"Cleared critiques for deleted paper {paper_id}")
     except Exception as e:
         logger.warning(f"Failed to clear critiques for paper {paper_id}: {e}")
@@ -662,14 +697,14 @@ async def get_all_papers():
         for p in papers:
             # Get latest critique for this paper
             paper_path = paper_library.get_paper_path(p.paper_id)
-            base_path = None
+            base_dir = None
             if paper_path:
-                base_path = str(Path(paper_path).parent)
+                base_dir = Path(paper_path).parent
             
             latest_critique = await get_latest_critique(
                 paper_type="autonomous_paper",
                 paper_id=p.paper_id,
-                base_path=base_path
+                base_dir=base_dir
             )
             
             # Calculate average rating if critique exists
@@ -1752,18 +1787,8 @@ async def get_final_answer_archived_papers(answer_id: str):
     Returns:
         List of paper metadata
     """
-    from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
-    from backend.shared.config import system_config
-    from pathlib import Path
-    
     try:
-        # Create temporary memory instance with correct path
-        memory = FinalAnswerMemory()
-        if answer_id == "legacy":
-            memory._base_dir = Path(system_config.data_dir) / "auto_final_answer"
-        else:
-            memory._base_dir = Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer"
-        
+        memory = _build_scoped_final_answer_memory(answer_id)
         papers = await memory.get_archived_papers_list()
         return {"papers": papers}
     except Exception as e:
@@ -1783,18 +1808,8 @@ async def get_final_answer_archived_paper(answer_id: str, paper_id: str):
     Returns:
         Paper content, abstract, outline, metadata
     """
-    from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
-    from backend.shared.config import system_config
-    from pathlib import Path
-    
     try:
-        # Create temporary memory instance with correct path
-        memory = FinalAnswerMemory()
-        if answer_id == "legacy":
-            memory._base_dir = Path(system_config.data_dir) / "auto_final_answer"
-        else:
-            memory._base_dir = Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer"
-        
+        memory = _build_scoped_final_answer_memory(answer_id)
         paper = await memory.get_archived_paper(paper_id)
         if paper is None:
             raise HTTPException(status_code=404, detail=f"Archived paper {paper_id} not found")
@@ -1818,18 +1833,8 @@ async def get_final_answer_archived_brainstorms(answer_id: str):
     Returns:
         List of brainstorm metadata
     """
-    from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
-    from backend.shared.config import system_config
-    from pathlib import Path
-    
     try:
-        # Create temporary memory instance with correct path
-        memory = FinalAnswerMemory()
-        if answer_id == "legacy":
-            memory._base_dir = Path(system_config.data_dir) / "auto_final_answer"
-        else:
-            memory._base_dir = Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer"
-        
+        memory = _build_scoped_final_answer_memory(answer_id)
         brainstorms = await memory.get_archived_brainstorms_list()
         return {"brainstorms": brainstorms}
     except Exception as e:
@@ -1849,18 +1854,8 @@ async def get_final_answer_archived_brainstorm(answer_id: str, topic_id: str):
     Returns:
         Brainstorm content and metadata
     """
-    from backend.autonomous.memory.final_answer_memory import FinalAnswerMemory
-    from backend.shared.config import system_config
-    from pathlib import Path
-    
     try:
-        # Create temporary memory instance with correct path
-        memory = FinalAnswerMemory()
-        if answer_id == "legacy":
-            memory._base_dir = Path(system_config.data_dir) / "auto_final_answer"
-        else:
-            memory._base_dir = Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer"
-        
+        memory = _build_scoped_final_answer_memory(answer_id)
         brainstorm = await memory.get_archived_brainstorm(topic_id)
         if brainstorm is None:
             raise HTTPException(status_code=404, detail=f"Archived brainstorm {topic_id} not found")
@@ -1906,13 +1901,13 @@ async def request_paper_critique(paper_id: str, request: CritiqueRequest = None)
             raise HTTPException(status_code=404, detail=f"Paper content not found: {paper_id}")
 
         paper_path = paper_library.get_paper_path(paper_id)
-        base_path = os.path.dirname(paper_path)
+        base_dir = Path(paper_path).parent
 
         return await _generate_autonomous_paper_critique(
             paper_id=paper_id,
             paper_title=metadata.title,
             content=content,
-            base_path=base_path,
+            base_dir=base_dir,
             request=request,
         )
     except HTTPException:
@@ -1939,12 +1934,12 @@ async def get_paper_critiques(paper_id: str):
             raise HTTPException(status_code=404, detail=f"Paper not found: {paper_id}")
 
         paper_path = paper_library.get_paper_path(paper_id)
-        base_path = os.path.dirname(paper_path)
+        base_dir = Path(paper_path).parent
 
         return await _get_autonomous_paper_critiques_response(
             paper_id=paper_id,
             paper_title=metadata.title,
-            base_path=base_path,
+            base_dir=base_dir,
         )
     except HTTPException:
         raise
@@ -1980,11 +1975,9 @@ async def delete_paper_critiques(paper_id: str, confirm: bool = False):
         if not metadata:
             raise HTTPException(status_code=404, detail=f"Paper not found: {paper_id}")
         
-        # Get session-aware base path for critique storage
-        paper_path = paper_library.get_paper_path(paper_id)
-        base_path = os.path.dirname(paper_path)
+        base_dir = Path(paper_library.get_paper_path(paper_id)).parent
         
-        await clear_critiques("autonomous_paper", paper_id, base_path)
+        await clear_critiques("autonomous_paper", paper_id, base_dir)
         
         return {
             "success": True,
@@ -2031,7 +2024,7 @@ async def request_history_paper_critique(
             paper_id=paper_id,
             paper_title=metadata.title,
             content=content,
-            base_path=str(paths["papers_dir"]),
+            base_dir=paths["papers_dir"],
             request=request,
         )
     except HTTPException:
@@ -2056,7 +2049,7 @@ async def get_history_paper_critiques(session_id: str, paper_id: str):
         return await _get_autonomous_paper_critiques_response(
             paper_id=paper_id,
             paper_title=metadata.title,
-            base_path=str(paths["papers_dir"]),
+            base_dir=paths["papers_dir"],
         )
     except HTTPException:
         raise
@@ -2088,13 +2081,11 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
     Returns:
         The critique with ratings and feedback
     """
-    from backend.shared.config import system_config
     from backend.shared.critique_prompts import build_critique_prompt, DEFAULT_CRITIQUE_PROMPT
     from backend.shared.critique_memory import save_critique
     from backend.shared.models import PaperCritique, CritiqueRequest
     from backend.shared.api_client_manager import api_client_manager
     from backend.shared.utils import count_tokens
-    from pathlib import Path
     import uuid
     from datetime import datetime
     
@@ -2112,12 +2103,7 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
         if not content:
             raise HTTPException(status_code=404, detail=f"Final answer content not found: {answer_id}")
         
-        # Determine session-aware base path for critique storage
-        # Final answers can be in legacy or session-based locations
-        if answer_id == "legacy":
-            base_path = str(Path(system_config.data_dir) / "auto_final_answer")
-        else:
-            base_path = str(Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer")
+        base_dir = _resolve_final_answer_dir(answer_id)
         
         # Try to get validator config from request body first (allows critiques without starting research)
         # Then fall back to autonomous coordinator's stored config
@@ -2246,7 +2232,7 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
         )
         
         # Save the critique with session-aware path
-        saved_critique = await save_critique("final_answer", critique, answer_id, base_path)
+        saved_critique = await save_critique("final_answer", critique, answer_id, base_dir)
         
         return {
             "success": True,
@@ -2274,8 +2260,6 @@ async def get_final_answer_critiques(answer_id: str):
         List of critiques for the final answer
     """
     from backend.shared.critique_memory import get_critiques
-    from backend.shared.config import system_config
-    from pathlib import Path
     
     try:
         # Verify final answer exists
@@ -2285,14 +2269,10 @@ async def get_final_answer_critiques(answer_id: str):
         if not final_answer:
             raise HTTPException(status_code=404, detail=f"Final answer not found: {answer_id}")
         
-        # Determine session-aware base path for critique storage
-        if answer_id == "legacy":
-            base_path = str(Path(system_config.data_dir) / "auto_final_answer")
-        else:
-            base_path = str(Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer")
+        base_dir = _resolve_final_answer_dir(answer_id)
         
         title = final_answer.get("title", "Final Answer")
-        critiques = await get_critiques("final_answer", answer_id, base_path)
+        critiques = await get_critiques("final_answer", answer_id, base_dir)
         
         return {
             "success": True,
@@ -2322,8 +2302,6 @@ async def delete_final_answer_critiques(answer_id: str, confirm: bool = False):
         Success status
     """
     from backend.shared.critique_memory import clear_critiques
-    from backend.shared.config import system_config
-    from pathlib import Path
     
     try:
         if not confirm:
@@ -2339,13 +2317,9 @@ async def delete_final_answer_critiques(answer_id: str, confirm: bool = False):
         if not final_answer:
             raise HTTPException(status_code=404, detail=f"Final answer not found: {answer_id}")
         
-        # Determine session-aware base path for critique storage
-        if answer_id == "legacy":
-            base_path = str(Path(system_config.data_dir) / "auto_final_answer")
-        else:
-            base_path = str(Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer")
+        base_dir = _resolve_final_answer_dir(answer_id)
         
-        await clear_critiques("final_answer", answer_id, base_path)
+        await clear_critiques("final_answer", answer_id, base_dir)
         
         return {
             "success": True,
diff --git a/backend/api/routes/compiler.py b/backend/api/routes/compiler.py
index 34cd872..cb41ef0 100644
--- a/backend/api/routes/compiler.py
+++ b/backend/api/routes/compiler.py
@@ -737,6 +737,7 @@ async def set_wolfram_api_key(request: dict):
     Returns:
         Success status and validation result
     """
+    from backend.shared.secret_store import SecretStoreError, store_wolfram_api_key
     from backend.shared.wolfram_alpha_client import initialize_wolfram_client, get_wolfram_client
     
     try:
@@ -761,6 +762,9 @@ async def set_wolfram_api_key(request: dict):
         # Store in system config
         system_config.wolfram_alpha_api_key = api_key
         system_config.wolfram_alpha_enabled = True
+
+        # Persist to secure backend storage so the key survives restarts.
+        store_wolfram_api_key(api_key)
         
         logger.info("Wolfram Alpha API key set and validated")
         
@@ -770,6 +774,9 @@ async def set_wolfram_api_key(request: dict):
             "test_result": test_result
         }
         
+    except SecretStoreError as e:
+        logger.error(f"Failed to persist Wolfram Alpha API key securely: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
     except HTTPException:
         raise
     except Exception as e:
@@ -785,6 +792,7 @@ async def clear_wolfram_api_key():
     Returns:
         Success status
     """
+    from backend.shared.secret_store import SecretStoreError, clear_wolfram_api_key as clear_persisted_wolfram_api_key
     from backend.shared.wolfram_alpha_client import clear_wolfram_client
     
     try:
@@ -794,6 +802,7 @@ async def clear_wolfram_api_key():
         # Clear from config
         system_config.wolfram_alpha_api_key = None
         system_config.wolfram_alpha_enabled = False
+        clear_persisted_wolfram_api_key()
         
         logger.info("Wolfram Alpha API key cleared")
         
@@ -802,6 +811,9 @@ async def clear_wolfram_api_key():
             "message": "Wolfram Alpha API key cleared"
         }
         
+    except SecretStoreError as e:
+        logger.error(f"Failed to clear Wolfram Alpha API key from secure storage: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
     except Exception as e:
         logger.error(f"Failed to clear Wolfram Alpha API key: {e}")
         raise HTTPException(status_code=500, detail=str(e))
diff --git a/backend/api/routes/openrouter.py b/backend/api/routes/openrouter.py
index 4f6c586..80e2642 100644
--- a/backend/api/routes/openrouter.py
+++ b/backend/api/routes/openrouter.py
@@ -22,6 +22,11 @@
 from backend.shared.openrouter_client import OpenRouterClient
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.free_model_manager import free_model_manager
+from backend.shared.secret_store import (
+    SecretStoreError,
+    clear_openrouter_api_key,
+    store_openrouter_api_key,
+)
 from backend.shared.models import FreeModelSettings
 
 router = APIRouter()
@@ -83,11 +88,12 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
         Success status and validation result
     """
     try:
-        if not request.api_key:
+        api_key = request.api_key.strip()
+        if not api_key:
             raise HTTPException(status_code=400, detail="API key is required")
         
         # Validate API key by testing connection
-        client = OpenRouterClient(request.api_key)
+        client = OpenRouterClient(api_key)
         try:
             models = await client.list_models()
             
@@ -98,11 +104,14 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
                 )
             
             # Store the API key globally
-            rag_config.openrouter_api_key = request.api_key
+            rag_config.openrouter_api_key = api_key
             rag_config.openrouter_enabled = True
             
             # Also configure the API client manager
-            api_client_manager.set_openrouter_api_key(request.api_key)
+            api_client_manager.set_openrouter_api_key(api_key)
+
+            # Persist to secure OS-backed storage so the key survives restarts.
+            store_openrouter_api_key(api_key)
             
             # Reset exhaustion flags so roles can retry OpenRouter
             free_model_manager.clear_account_exhaustion()
@@ -121,6 +130,9 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
         finally:
             await client.close()
             
+    except SecretStoreError as e:
+        logger.error(f"Failed to persist OpenRouter API key securely: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
     except HTTPException:
         raise
     except Exception as e:
@@ -143,6 +155,7 @@ async def clear_api_key() -> Dict[str, Any]:
         rag_config.openrouter_api_key = None
         rag_config.openrouter_enabled = False
         api_client_manager.set_openrouter_api_key(None)
+        clear_openrouter_api_key()
         
         logger.info("Global OpenRouter API key cleared")
         
@@ -150,6 +163,9 @@ async def clear_api_key() -> Dict[str, Any]:
             "success": True,
             "message": "OpenRouter API key cleared"
         }
+    except SecretStoreError as e:
+        logger.error(f"Failed to clear OpenRouter API key from secure storage: {e}")
+        raise HTTPException(status_code=500, detail=str(e))
     except Exception as e:
         logger.error(f"Failed to clear OpenRouter API key: {e}")
         raise HTTPException(status_code=500, detail=f"Failed to clear API key: {str(e)}")
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index 1319faa..d741024 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -3935,12 +3935,12 @@ async def _auto_generate_paper_critique(
             
             paper_path = paper_library.get_paper_path(paper_id)  # Synchronous, returns str
             if paper_path:
-                base_path = Path(paper_path).parent
+                paper_dir = Path(paper_path).parent
                 await save_critique(
                     paper_type="autonomous_paper",
                     critique=critique,
                     paper_id=paper_id,
-                    base_path=str(base_path)
+                    base_dir=paper_dir
                 )
                 logger.info(
                     f"Auto-critique saved for paper {paper_id}: "
diff --git a/backend/autonomous/memory/final_answer_memory.py b/backend/autonomous/memory/final_answer_memory.py
index 4b58ae0..b1ca815 100644
--- a/backend/autonomous/memory/final_answer_memory.py
+++ b/backend/autonomous/memory/final_answer_memory.py
@@ -14,6 +14,10 @@
 import aiofiles
 
 from backend.shared.config import system_config
+from backend.shared.path_safety import (
+    resolve_path_within_root,
+    validate_single_path_component,
+)
 from backend.shared.models import (
     FinalAnswerState,
     CertaintyAssessment,
@@ -53,6 +57,35 @@ def __init__(self):
         # In-memory state
         self._state: Optional[FinalAnswerState] = None
         self._session_manager = None
+
+    @classmethod
+    def build_scoped_memory(cls, base_dir: Path) -> "FinalAnswerMemory":
+        """Create an instance whose base, state, volume, rejections and final-volume paths sit in ``base_dir``; the caller must pass a validated directory."""
+        memory = cls()
+        memory._base_dir = base_dir
+        memory._state_path = base_dir / "final_answer_state.json"
+        memory._volume_path = base_dir / "volume_organization.json"
+        memory._rejections_path = base_dir / "tier3_rejections.txt"
+        memory._final_volume_path = base_dir / "final_volume.txt"
+        return memory
+
+    @staticmethod
+    def resolve_answer_base_dir(answer_id: str) -> Optional[Path]:
+        """Return the legacy/session final-answer directory, or None when the ID is invalid or the directory is missing."""
+        if answer_id == "legacy":
+            base_dir = Path(system_config.data_dir) / "auto_final_answer"
+        else:
+            try:
+                session_dir = resolve_path_within_root(
+                    Path(system_config.auto_sessions_base_dir),
+                    validate_single_path_component(answer_id, "final answer ID"),
+                )
+            except ValueError:
+                return None
+
+            base_dir = session_dir / "final_answer"
+
+        return base_dir if base_dir.exists() else None
     
     def set_session_manager(self, session_manager) -> None:
         """Set session manager for session-based path resolution."""
@@ -1441,13 +1474,8 @@ async def get_final_answer_by_id(self, answer_id: str) -> Optional[Dict[str, Any
             - content: Full text of volume/paper
             - chapters: List of chapter details (long form only)
         """
-        # Determine location
-        if answer_id == "legacy":
-            base_dir = Path(system_config.data_dir) / "auto_final_answer"
-        else:
-            base_dir = Path(system_config.data_dir) / "auto_sessions" / answer_id / "final_answer"
-        
-        if not base_dir.exists():
+        base_dir = self.resolve_answer_base_dir(answer_id)
+        if not base_dir:
             return None
         
         state_path = base_dir / "final_answer_state.json"
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index aa009af..24cf6e9 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -14,6 +14,10 @@
 
 from backend.shared.config import system_config
 from backend.shared.models import PaperMetadata
+from backend.shared.path_safety import (
+    resolve_path_within_root,
+    validate_single_path_component,
+)
 
 logger = logging.getLogger(__name__)
 
@@ -115,12 +119,15 @@ def get_history_papers_dir(self, session_id: str) -> Optional[Path]:
             papers_dir = Path(system_config.auto_papers_dir)
             return papers_dir if papers_dir.exists() else None
 
-        if not session_id or session_id in {".", ".."} or "/" in session_id or "\\" in session_id:
+        try:
+            safe_session_id = validate_single_path_component(session_id, "session ID")
+        except ValueError:
             return None
 
-        sessions_root = Path(system_config.auto_sessions_base_dir).resolve()
-        session_dir = (sessions_root / session_id).resolve()
-        if session_dir.parent != sessions_root:
+        try:
+            sessions_root = Path(system_config.auto_sessions_base_dir)
+            session_dir = resolve_path_within_root(sessions_root, safe_session_id)
+        except ValueError:
             return None
 
         papers_dir = session_dir / "papers"
@@ -132,7 +139,11 @@ async def _get_history_user_prompt(self, session_id: str) -> str:
             metadata_path = Path(system_config.auto_research_metadata_file)
             default_prompt = "Legacy research session"
         else:
-            metadata_path = Path(system_config.auto_sessions_base_dir) / session_id / "session_metadata.json"
+            papers_dir = self.get_history_papers_dir(session_id)
+            if not papers_dir:
+                return "Unknown research question"
+
+            metadata_path = papers_dir.parent / "session_metadata.json"
             default_prompt = "Unknown research question"
 
         if not metadata_path.exists():
@@ -177,7 +188,7 @@ async def _list_history_papers_from_directory(self, papers_dir: Path, session_id
             latest_critique = await get_latest_critique(
                 paper_type="autonomous_paper",
                 paper_id=metadata.paper_id,
-                base_path=str(papers_dir)
+                base_dir=papers_dir
             )
 
             history_papers.append({
@@ -243,7 +254,7 @@ async def get_history_paper(self, session_id: str, paper_id: str) -> Optional[Di
         latest_critique = await get_latest_critique(
             paper_type="autonomous_paper",
             paper_id=paper_id,
-            base_path=str(papers_dir)
+            base_dir=papers_dir
         )
 
         return {
diff --git a/backend/autonomous/memory/research_metadata.py b/backend/autonomous/memory/research_metadata.py
index 1375987..c801537 100644
--- a/backend/autonomous/memory/research_metadata.py
+++ b/backend/autonomous/memory/research_metadata.py
@@ -12,6 +12,7 @@
 
 from backend.shared.config import system_config
 from backend.shared.models import BrainstormMetadata, PaperMetadata
+from backend.shared.path_safety import resolve_path_within_root
 
 logger = logging.getLogger(__name__)
 
@@ -41,7 +42,10 @@ def set_session_manager(self, session_manager) -> None:
         """Set session manager for session-based path resolution."""
         self._session_manager = session_manager
         if session_manager and session_manager.is_session_active:
-            session_path = session_manager.session_path
+            session_path = resolve_path_within_root(
+                session_manager.session_path.parent,
+                session_manager.session_path.name,
+            )
             self._metadata_path = session_path / "session_metadata.json"
             self._stats_path = session_path / "session_stats.json"
             self._workflow_state_path = session_path / "workflow_state.json"
diff --git a/backend/autonomous/memory/session_manager.py b/backend/autonomous/memory/session_manager.py
index d6e452e..fa9be68 100644
--- a/backend/autonomous/memory/session_manager.py
+++ b/backend/autonomous/memory/session_manager.py
@@ -12,6 +12,11 @@
 from datetime import datetime
 import aiofiles
 
+from backend.shared.path_safety import (
+    resolve_path_within_root,
+    validate_single_path_component,
+)
+
 logger = logging.getLogger(__name__)
 
 
@@ -170,7 +175,12 @@ async def resume_session(self, session_id: str, base_dir: str = "backend/data/au
         """
         async with self._lock:
             self._base_dir = Path(base_dir)
-            self._session_path = self._base_dir / session_id
+            try:
+                safe_session_id = validate_single_path_component(session_id, "session ID")
+                self._session_path = resolve_path_within_root(self._base_dir, safe_session_id)
+            except ValueError as e:
+                logger.error(f"Invalid session ID: {session_id} ({e})")
+                return None
             
             if not self._session_path.exists():
                 logger.error(f"Session not found: {session_id}")
diff --git a/backend/shared/critique_memory.py b/backend/shared/critique_memory.py
index 5c4b2aa..a57cfc0 100644
--- a/backend/shared/critique_memory.py
+++ b/backend/shared/critique_memory.py
@@ -19,22 +19,23 @@
    - Final answers: backend/data/auto_sessions/{session_id}/final_answer/
    - Created for new research sessions
 
-HOW TO USE base_path PARAMETER:
-- For session-based papers: Pass the paper's directory from paper_library.get_paper_path()
-- For final answers: Pass the final answer's base directory
-- If base_path is None, falls back to legacy paths (for backward compatibility)
+HOW TO USE base_dir PARAMETER:
+- For session-based papers: pass the trusted papers directory as a pathlib.Path
+- For final answers: pass the trusted final answer directory as a pathlib.Path
+- If base_dir is None, storage falls back to legacy paths (for backward compatibility)
 
-The compiler paper type always uses a single global file and ignores base_path.
+The compiler paper type always uses a single global file and ignores base_dir.
 """
 
 import json
-import os
 import logging
+from pathlib import Path
 from typing import List, Optional, Literal
 from datetime import datetime
 import uuid
 
 from backend.shared.models import PaperCritique
+from backend.shared.path_safety import validate_single_path_component
 
 logger = logging.getLogger(__name__)
 
@@ -45,164 +46,136 @@
 PaperType = Literal["autonomous_paper", "final_answer", "compiler_paper"]
 
 
+def _get_legacy_data_dir() -> Path:
+    """Return the shared legacy data directory for critique storage."""
+    return Path(__file__).resolve().parents[1] / "data"
+
+
 def _get_critiques_file_path(
     paper_type: PaperType,
     paper_id: Optional[str] = None,
-    base_path: Optional[str] = None
-) -> str:
+    base_dir: Optional[Path] = None
+) -> Path:
     """
     Get the file path for storing critiques based on paper type.
-    
+
     Args:
         paper_type: Type of paper ("autonomous_paper", "final_answer", "compiler_paper")
         paper_id: Required for autonomous_paper type (used in filename)
-        base_path: Optional override path. If provided, critiques are stored here
-                   instead of legacy paths. This enables session-aware storage.
-        
+        base_dir: Optional trusted directory (a Path; created if missing) for session-aware storage.
+
     Returns:
         Path to the critiques JSON file
     """
-    # If base_path is provided, use it for session-aware storage
-    if base_path:
-        os.makedirs(base_path, exist_ok=True)
-        
+    safe_paper_id = None
+    if paper_id:
+        safe_paper_id = validate_single_path_component(paper_id, "paper ID")
+
+    if base_dir is not None:
+        base_dir.mkdir(parents=True, exist_ok=True)
+
         if paper_type == "autonomous_paper":
-            if not paper_id:
+            if not safe_paper_id:
                 raise ValueError("paper_id is required for autonomous_paper type")
-            return os.path.join(base_path, f"paper_{paper_id}_critiques.json")
-        
-        elif paper_type == "final_answer":
-            # Final answer critiques stored in the final answer directory
-            return os.path.join(base_path, "final_answer_critiques.json")
-        
-        elif paper_type == "compiler_paper":
-            # Compiler always uses global path (ignore base_path)
-            pass  # Fall through to legacy handling
-        
-        else:
+            return base_dir / f"paper_{safe_paper_id}_critiques.json"
+
+        if paper_type == "final_answer":
+            return base_dir / "final_answer_critiques.json"
+
+        if paper_type != "compiler_paper":
             raise ValueError(f"Unknown paper_type: {paper_type}")
-    
-    # Legacy paths (fallback when base_path not provided)
-    data_dir = os.path.join(os.path.dirname(os.path.dirname(__file__)), "data")
-    
+
+    data_dir = _get_legacy_data_dir()
+
     if paper_type == "autonomous_paper":
-        if not paper_id:
+        if not safe_paper_id:
             raise ValueError("paper_id is required for autonomous_paper type")
-        papers_dir = os.path.join(data_dir, "auto_papers")
-        os.makedirs(papers_dir, exist_ok=True)
-        return os.path.join(papers_dir, f"paper_{paper_id}_critiques.json")
-    
-    elif paper_type == "final_answer":
-        final_answer_dir = os.path.join(data_dir, "auto_final_answer")
-        os.makedirs(final_answer_dir, exist_ok=True)
-        return os.path.join(final_answer_dir, "final_answer_critiques.json")
-    
-    elif paper_type == "compiler_paper":
-        os.makedirs(data_dir, exist_ok=True)
-        return os.path.join(data_dir, "compiler_paper_critiques.json")
-    
-    else:
-        raise ValueError(f"Unknown paper_type: {paper_type}")
+        papers_dir = data_dir / "auto_papers"
+        papers_dir.mkdir(parents=True, exist_ok=True)
+        return papers_dir / f"paper_{safe_paper_id}_critiques.json"
+
+    if paper_type == "final_answer":
+        final_answer_dir = data_dir / "auto_final_answer"
+        final_answer_dir.mkdir(parents=True, exist_ok=True)
+        return final_answer_dir / "final_answer_critiques.json"
+
+    if paper_type == "compiler_paper":
+        data_dir.mkdir(parents=True, exist_ok=True)
+        return data_dir / "compiler_paper_critiques.json"
+
+    raise ValueError(f"Unknown paper_type: {paper_type}")
 
 
 async def save_critique(
     paper_type: PaperType,
     critique: PaperCritique,
     paper_id: Optional[str] = None,
-    base_path: Optional[str] = None
+    base_dir: Optional[Path] = None
 ) -> PaperCritique:
     """
     Save a critique to the paper's critique history.
-    
+
     Maintains a maximum of MAX_CRITIQUES_PER_PAPER critiques per paper.
     Oldest critiques are removed when the limit is exceeded.
-    
-    Args:
-        paper_type: Type of paper
-        critique: The PaperCritique to save
-        paper_id: Required for autonomous_paper type
-        base_path: Optional override path for session-aware storage.
-                   If provided, critiques are stored in this directory.
-                   If None, falls back to legacy paths.
-        
-    Returns:
-        The saved PaperCritique (with generated critique_id if not set)
     """
-    file_path = _get_critiques_file_path(paper_type, paper_id, base_path)
-    
-    # Ensure critique has an ID
+    file_path = _get_critiques_file_path(paper_type, paper_id, base_dir)
+
     if not critique.critique_id:
         critique.critique_id = str(uuid.uuid4())[:8]
-    
-    # Load existing critiques
-    critiques = await get_critiques(paper_type, paper_id, base_path)
-    
-    # Add new critique at the beginning (newest first)
+
+    critiques = await get_critiques(paper_type, paper_id, base_dir)
     critiques.insert(0, critique)
-    
-    # Enforce max limit (remove oldest)
+
     while len(critiques) > MAX_CRITIQUES_PER_PAPER:
         removed = critiques.pop()
-        logger.info(f"Removed oldest critique {removed.critique_id} to maintain limit of {MAX_CRITIQUES_PER_PAPER}")
-    
-    # Save to file
+        logger.info(
+            f"Removed oldest critique {removed.critique_id} "
+            f"to maintain limit of {MAX_CRITIQUES_PER_PAPER}"
+        )
+
     critiques_data = [c.model_dump() for c in critiques]
-    
-    # Convert datetime objects to ISO format strings for JSON serialization
-    for c in critiques_data:
-        if isinstance(c.get("date"), datetime):
-            c["date"] = c["date"].isoformat()
-    
+    for critique_dict in critiques_data:
+        if isinstance(critique_dict.get("date"), datetime):
+            critique_dict["date"] = critique_dict["date"].isoformat()
+
     try:
         with open(file_path, "w", encoding="utf-8") as f:
             json.dump(critiques_data, f, indent=2, default=str)
-        logger.info(f"Saved critique {critique.critique_id} for {paper_type}" + 
-                   (f" paper_id={paper_id}" if paper_id else "") +
-                   (f" at {file_path}" if base_path else ""))
+        logger.info(
+            f"Saved critique {critique.critique_id} for {paper_type}"
+            + (f" paper_id={paper_id}" if paper_id else "")
+            + (f" at {file_path}" if base_dir else "")
+        )
     except Exception as e:
         logger.error(f"Failed to save critique: {e}")
         raise
-    
+
     return critique
 
 
 async def get_critiques(
     paper_type: PaperType,
     paper_id: Optional[str] = None,
-    base_path: Optional[str] = None
+    base_dir: Optional[Path] = None
 ) -> List[PaperCritique]:
-    """
-    Get all critiques for a paper.
-    
-    Args:
-        paper_type: Type of paper
-        paper_id: Required for autonomous_paper type
-        base_path: Optional override path for session-aware storage.
-                   If provided, looks for critiques in this directory.
-                   If None, falls back to legacy paths.
-        
-    Returns:
-        List of PaperCritique objects (newest first)
-    """
-    file_path = _get_critiques_file_path(paper_type, paper_id, base_path)
-    
-    if not os.path.exists(file_path):
+    """Get all critiques for a paper, newest first (empty list if none are stored)."""
+    file_path = _get_critiques_file_path(paper_type, paper_id, base_dir)
+    if not file_path.exists():
         return []
-    
+
     try:
         with open(file_path, "r", encoding="utf-8") as f:
             critiques_data = json.load(f)
-        
+
         critiques = []
-        for c in critiques_data:
-            # Convert ISO format strings back to datetime
-            if isinstance(c.get("date"), str):
+        for critique_dict in critiques_data:
+            if isinstance(critique_dict.get("date"), str):
                 try:
-                    c["date"] = datetime.fromisoformat(c["date"])
+                    critique_dict["date"] = datetime.fromisoformat(critique_dict["date"])
                 except ValueError:
-                    c["date"] = datetime.now()
-            critiques.append(PaperCritique(**c))
-        
+                    critique_dict["date"] = datetime.now()
+            critiques.append(PaperCritique(**critique_dict))
+
         return critiques
     except json.JSONDecodeError as e:
         logger.error(f"Failed to parse critiques file {file_path}: {e}")
@@ -215,34 +188,23 @@ async def get_critiques(
 async def clear_critiques(
     paper_type: PaperType,
     paper_id: Optional[str] = None,
-    base_path: Optional[str] = None
+    base_dir: Optional[Path] = None
 ) -> bool:
-    """
-    Delete all critiques for a paper.
-    
-    Args:
-        paper_type: Type of paper
-        paper_id: Required for autonomous_paper type
-        base_path: Optional override path for session-aware storage.
-                   If provided, deletes critiques from this directory.
-                   If None, falls back to legacy paths.
-        
-    Returns:
-        True if file was deleted, False if it didn't exist
-    """
-    file_path = _get_critiques_file_path(paper_type, paper_id, base_path)
-    
-    if os.path.exists(file_path):
+    """Delete all critiques for a paper; return True if a file was removed, else False."""
+    file_path = _get_critiques_file_path(paper_type, paper_id, base_dir)
+    if file_path.exists():
         try:
-            os.remove(file_path)
-            logger.info(f"Cleared critiques for {paper_type}" + 
-                       (f" paper_id={paper_id}" if paper_id else "") +
-                       (f" at {file_path}" if base_path else ""))
+            file_path.unlink()
+            logger.info(
+                f"Cleared critiques for {paper_type}"
+                + (f" paper_id={paper_id}" if paper_id else "")
+                + (f" at {file_path}" if base_dir else "")
+            )
             return True
         except Exception as e:
             logger.error(f"Failed to delete critiques file {file_path}: {e}")
             raise
-    
+
     return False
 
 
@@ -250,48 +212,26 @@ async def get_critique_by_id(
     paper_type: PaperType,
     critique_id: str,
     paper_id: Optional[str] = None,
-    base_path: Optional[str] = None
+    base_dir: Optional[Path] = None
 ) -> Optional[PaperCritique]:
-    """
-    Get a specific critique by its ID.
-    
-    Args:
-        paper_type: Type of paper
-        critique_id: The critique ID to find
-        paper_id: Required for autonomous_paper type
-        base_path: Optional override path for session-aware storage
-        
-    Returns:
-        The PaperCritique if found, None otherwise
-    """
-    critiques = await get_critiques(paper_type, paper_id, base_path)
-    
+    """Get a specific critique by its ID, or None if no critique matches."""
+    critiques = await get_critiques(paper_type, paper_id, base_dir)
+
     for critique in critiques:
         if critique.critique_id == critique_id:
             return critique
-    
+
     return None
 
 
 async def get_latest_critique(
     paper_type: PaperType,
     paper_id: Optional[str] = None,
-    base_path: Optional[str] = None
+    base_dir: Optional[Path] = None
 ) -> Optional[PaperCritique]:
-    """
-    Get the most recent critique for a paper.
-    
-    Args:
-        paper_type: Type of paper
-        paper_id: Required for autonomous_paper type
-        base_path: Optional override path for session-aware storage
-        
-    Returns:
-        The most recent PaperCritique if any exist, None otherwise
-    """
-    critiques = await get_critiques(paper_type, paper_id, base_path)
-    
+    """Get the most recent critique for a paper (stored newest first), or None if there are none."""
+    critiques = await get_critiques(paper_type, paper_id, base_dir)
     if critiques:
-        return critiques[0]  # Already sorted newest first
-    
+        return critiques[0]
+
     return None
diff --git a/backend/shared/path_safety.py b/backend/shared/path_safety.py
new file mode 100644
index 0000000..a9a0379
--- /dev/null
+++ b/backend/shared/path_safety.py
@@ -0,0 +1,43 @@
+"""
+Helpers for resolving user-influenced paths within trusted storage roots.
+"""
+import os
+from pathlib import Path
+
+
+def validate_single_path_component(value: str, label: str = "path component") -> str:
+    """Return value stripped of surrounding whitespace if it is a single safe path component; raise ValueError otherwise."""
+    normalized = (value or "").strip()
+    if not normalized:
+        raise ValueError(f"{label} is required")
+
+    if normalized in {".", ".."}:
+        raise ValueError(f"Invalid {label}: {value}")
+
+    separators = {os.path.sep}
+    if os.path.altsep:
+        separators.add(os.path.altsep)
+
+    if any(separator in normalized for separator in separators):
+        raise ValueError(f"Invalid {label}: {value}")
+
+    return normalized
+
+
+def resolve_path_within_root(root: Path, *unsafe_parts: str) -> Path:
+    """
+    Resolve an untrusted relative path within a trusted root.
+
+    Both paths are normalized with normpath/realpath (so symlinks are resolved)
+    before the containment check; raises ValueError if the result escapes the root.
+    """
+    root_real = os.path.realpath(os.path.normpath(str(root)))
+    candidate_real = os.path.realpath(
+        os.path.normpath(os.path.join(root_real, *unsafe_parts))
+    )
+
+    root_prefix = root_real if root_real.endswith(os.sep) else root_real + os.sep
+    if candidate_real != root_real and not candidate_real.startswith(root_prefix):
+        raise ValueError("Resolved path escapes trusted root")
+
+    return Path(candidate_real)
diff --git a/backend/shared/secret_store.py b/backend/shared/secret_store.py
new file mode 100644
index 0000000..c80181c
--- /dev/null
+++ b/backend/shared/secret_store.py
@@ -0,0 +1,96 @@
+"""
+Secure secret persistence for API keys.
+
+Stores user-provided credentials in the OS-backed keyring instead of browser
+storage so keys survive restarts without being written to frontend localStorage.
+"""
+from typing import Optional
+import logging
+
+import keyring
+from keyring.errors import KeyringError, PasswordDeleteError
+
+logger = logging.getLogger(__name__)
+
+_SERVICE_NAME = "MOTO-Autonomous-ASI"
+_OPENROUTER_KEY = "openrouter_api_key"
+_WOLFRAM_KEY = "wolfram_alpha_api_key"
+
+
+class SecretStoreError(RuntimeError):
+    """Raised when the secure secret store is unavailable or fails."""
+
+
+def _normalize_secret(value: Optional[str]) -> Optional[str]:
+    """Trim whitespace and collapse empty values to None."""
+    if value is None:
+        return None
+
+    stripped = value.strip()
+    return stripped or None
+
+
+def _get_secret(secret_name: str) -> Optional[str]:
+    """Load a secret from the OS-backed keyring."""
+    try:
+        return _normalize_secret(keyring.get_password(_SERVICE_NAME, secret_name))
+    except KeyringError as exc:
+        raise SecretStoreError(
+            "Secure credential storage is unavailable. Please ensure the OS keyring is accessible."
+        ) from exc
+
+
+def _set_secret(secret_name: str, secret_value: str) -> None:
+    """Persist a secret to the OS-backed keyring."""
+    normalized = _normalize_secret(secret_value)
+    if not normalized:
+        raise ValueError("Secret value is required")
+
+    try:
+        keyring.set_password(_SERVICE_NAME, secret_name, normalized)
+    except KeyringError as exc:
+        raise SecretStoreError(
+            "Failed to persist the credential in the OS keyring."
+        ) from exc
+
+
+def _delete_secret(secret_name: str) -> None:
+    """Delete a persisted secret if one exists."""
+    try:
+        keyring.delete_password(_SERVICE_NAME, secret_name)
+    except PasswordDeleteError:
+        return
+    except KeyringError as exc:
+        raise SecretStoreError(
+            "Failed to delete the credential from the OS keyring."
+        ) from exc
+
+
+def load_openrouter_api_key() -> Optional[str]:
+    """Load the persisted global OpenRouter API key."""
+    return _get_secret(_OPENROUTER_KEY)
+
+
+def store_openrouter_api_key(api_key: str) -> None:
+    """Persist the global OpenRouter API key securely."""
+    _set_secret(_OPENROUTER_KEY, api_key)
+
+
+def clear_openrouter_api_key() -> None:
+    """Delete the persisted global OpenRouter API key."""
+    _delete_secret(_OPENROUTER_KEY)
+
+
+def load_wolfram_api_key() -> Optional[str]:
+    """Load the persisted Wolfram Alpha API key."""
+    return _get_secret(_WOLFRAM_KEY)
+
+
+def store_wolfram_api_key(api_key: str) -> None:
+    """Persist the Wolfram Alpha API key securely."""
+    _set_secret(_WOLFRAM_KEY, api_key)
+
+
+def clear_wolfram_api_key() -> None:
+    """Delete the persisted Wolfram Alpha API key."""
+    _delete_secret(_WOLFRAM_KEY)
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index 9d32b8c..d98a3b8 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -357,17 +357,7 @@ function App() {
       console.error('Failed to check OpenRouter key status:', err);
     }
 
-    let finalHasOpenRouterKey = Boolean(keyStatus.has_key);
-    const storedKey = localStorage.getItem('openrouter_api_key');
-    if (storedKey && !finalHasOpenRouterKey) {
-      try {
-        await openRouterAPI.setApiKey(storedKey);
-        finalHasOpenRouterKey = true;
-      } catch (err) {
-        console.error('Failed to restore OpenRouter key:', err);
-        localStorage.removeItem('openrouter_api_key');
-      }
-    }
+    const finalHasOpenRouterKey = Boolean(keyStatus.has_key);
     setHasOpenRouterKey(finalHasOpenRouterKey);
 
     let availableModels = [];
@@ -401,42 +391,12 @@ function App() {
     syncProviderAvailability();
   }, [syncProviderAvailability]);
 
-  useEffect(() => {
-    const restoreWolframKey = async () => {
-      const storedWolframKey = localStorage.getItem('wolfram_alpha_api_key');
-      if (!storedWolframKey) {
-        return;
-      }
-
-      try {
-        await api.setWolframApiKey(storedWolframKey);
-      } catch (err) {
-        console.error('Failed to restore Wolfram Alpha key:', err);
-        localStorage.removeItem('wolfram_alpha_api_key');
-      }
-    };
-
-    restoreWolframKey();
-  }, []);
-
   // Periodically re-check OpenRouter key status to keep indicator in sync
   useEffect(() => {
     const interval = setInterval(async () => {
       try {
         const keyStatus = await openRouterAPI.getApiKeyStatus();
         setHasOpenRouterKey(keyStatus.has_key);
-
-        if (!keyStatus.has_key) {
-          const storedKey = localStorage.getItem('openrouter_api_key');
-          if (storedKey) {
-            try {
-              await openRouterAPI.setApiKey(storedKey);
-              setHasOpenRouterKey(true);
-            } catch {
-              // Silent retry next interval
-            }
-          }
-        }
       } catch {
         // Backend unreachable, skip this cycle
       }
diff --git a/frontend/src/components/BoostControlModal.jsx b/frontend/src/components/BoostControlModal.jsx
index 62f736d..2d4345b 100644
--- a/frontend/src/components/BoostControlModal.jsx
+++ b/frontend/src/components/BoostControlModal.jsx
@@ -118,8 +118,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
     }
 
     const initializeModal = async () => {
-      const savedKey = (localStorage.getItem('openrouter_api_key') || '').trim();
-      setApiKey(savedKey);
+      setApiKey('');
       setError('');
       setSuccess('');
 
@@ -133,10 +132,10 @@ export default function BoostControlModal({ isOpen, onClose }) {
         setHasGlobalKey(false);
       }
 
-      const preferredKey = useGlobalKey ? null : savedKey;
+      const preferredKey = null;
       await fetchBoostStatus(preferredKey);
 
-      if (useGlobalKey || savedKey) {
+      if (useGlobalKey) {
         await fetchModels(freeOnly, { silent: true, keyOverride: preferredKey });
       } else {
         setModels([]);
@@ -212,10 +211,6 @@ export default function BoostControlModal({ isOpen, onClose }) {
         response = await boostAPI.updateModel(config);
         
         if (response.success) {
-          if (trimmedApiKey) {
-            localStorage.setItem('openrouter_api_key', trimmedApiKey);
-          }
-          
           setSuccess(`✓ Boost model updated! State preserved: ${response.preserved_state.boost_next_count} next calls`);
           await fetchBoostStatus();
           
@@ -227,10 +222,6 @@ export default function BoostControlModal({ isOpen, onClose }) {
         response = await boostAPI.enable(config);
         
         if (response.success) {
-          if (trimmedApiKey) {
-            localStorage.setItem('openrouter_api_key', trimmedApiKey);
-          }
-          
           setSuccess('✓ Boost enabled successfully!');
           await fetchBoostStatus();
           
diff --git a/frontend/src/components/OpenRouterApiKeyModal.jsx b/frontend/src/components/OpenRouterApiKeyModal.jsx
index 87d52a0..45f4ab3 100644
--- a/frontend/src/components/OpenRouterApiKeyModal.jsx
+++ b/frontend/src/components/OpenRouterApiKeyModal.jsx
@@ -17,6 +17,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
   const [saving, setSaving] = useState(false);
   const [testResult, setTestResult] = useState(null);
   const [error, setError] = useState('');
+  const [hasStoredKey, setHasStoredKey] = useState(false);
 
   // Reset state when modal opens
   useEffect(() => {
@@ -24,16 +25,30 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
       setApiKey('');
       setTestResult(null);
       setError('');
-    }
-  }, [isOpen]);
+      let isCancelled = false;
 
-  // Load existing key from localStorage on mount
-  useEffect(() => {
-    const storedKey = localStorage.getItem('openrouter_api_key');
-    if (storedKey) {
-      setApiKey(storedKey);
+      const loadKeyStatus = async () => {
+        try {
+          const status = await openRouterAPI.getApiKeyStatus();
+          if (!isCancelled) {
+            setHasStoredKey(Boolean(status.has_key));
+          }
+        } catch {
+          if (!isCancelled) {
+            setHasStoredKey(false);
+          }
+        }
+      };
+
+      loadKeyStatus();
+
+      return () => {
+        isCancelled = true;
+      };
     }
-  }, []);
+    setHasStoredKey(false);
+    return undefined;
+  }, [isOpen]);
 
   const handleTestConnection = async () => {
     if (!apiKey.trim()) {
@@ -71,9 +86,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
     try {
       // Save to backend
       await openRouterAPI.setApiKey(apiKey.trim());
-      
-      // Also save to localStorage for persistence
-      localStorage.setItem('openrouter_api_key', apiKey.trim());
+      setHasStoredKey(true);
       
       // Notify parent
       if (onKeySet) {
@@ -91,10 +104,10 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
   const handleClearKey = async () => {
     try {
       await openRouterAPI.clearApiKey();
-      localStorage.removeItem('openrouter_api_key');
       setApiKey('');
       setTestResult(null);
       setError('');
+      setHasStoredKey(false);
     } catch (err) {
       setError(err.message || 'Failed to clear API key');
     }
@@ -195,6 +208,15 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
           </div>
         )}
 
+        {hasStoredKey && !apiKey.trim() && (
+          <div className="test-result-banner test-result-banner--success" style={{
+            marginBottom: '1rem',
+          }}>
+            An OpenRouter API key is already stored securely on the backend for this machine.
+            Enter a new key below to replace it.
+          </div>
+        )}
+
         {/* Action Buttons */}
         <div style={{ display: 'flex', gap: '0.75rem', marginTop: '1.5rem' }}>
           <button
@@ -236,7 +258,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
         </div>
 
         {/* Clear Key Button */}
-        {apiKey && (
+        {(apiKey || hasStoredKey) && (
           <button
             onClick={handleClearKey}
             className="btn-ghost"
@@ -259,7 +281,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
           backgroundColor: '#0d0d1a',
           borderRadius: '6px',
         }}>
-          This API key is stored locally and sent to the backend for OpenRouter API calls.
+          This API key is stored securely through the backend keyring integration and sent to the backend for OpenRouter API calls.
           API Boost can reuse this key automatically, or you can override it inside the boost modal.
         </p>
       </div>
diff --git a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
index fa7110e..e053eee 100644
--- a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
@@ -212,6 +212,7 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
   // Wolfram Alpha settings (shared with compiler)
   const [wolframEnabled, setWolframEnabled] = useState(false);
   const [wolframApiKey, setWolframApiKey] = useState('');
+  const [hasStoredWolframKey, setHasStoredWolframKey] = useState(false);
   const [wolframTestResult, setWolframTestResult] = useState('');
   const [testingWolfram, setTestingWolfram] = useState(false);
   
@@ -375,20 +376,14 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
         console.error('Failed to check OpenRouter key:', err);
       }
       
-      // Restore Wolfram Alpha key from localStorage
-      const storedWolframKey = localStorage.getItem('wolfram_alpha_api_key');
-      if (storedWolframKey) {
-        setWolframApiKey(storedWolframKey);
-        setWolframEnabled(true);
-      } else {
-        try {
-          const wolframStatus = await api.getWolframStatus();
-          if (wolframStatus.enabled) {
-            setWolframEnabled(true);
-          }
-        } catch (err) {
-          console.error('Failed to load Wolfram Alpha status:', err);
+      try {
+        const wolframStatus = await api.getWolframStatus();
+        setHasStoredWolframKey(Boolean(wolframStatus.has_key));
+        if (wolframStatus.enabled) {
+          setWolframEnabled(true);
         }
+      } catch (err) {
+        console.error('Failed to load Wolfram Alpha status:', err);
       }
 
       // Try to fetch fresh LM Studio models
@@ -770,7 +765,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       if (response.success) {
         setWolframTestResult(`✓ Success! Result: ${response.result}`);
         await api.setWolframApiKey(wolframApiKey);
-        localStorage.setItem('wolfram_alpha_api_key', wolframApiKey);
+        setHasStoredWolframKey(true);
         setWolframEnabled(true);
       } else {
         setWolframTestResult('✗ Failed: ' + response.message);
@@ -786,9 +781,9 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   const handleClearWolframKey = async () => {
     try {
       await api.clearWolframApiKey();
-      localStorage.removeItem('wolfram_alpha_api_key');
       setWolframApiKey('');
       setWolframEnabled(false);
+      setHasStoredWolframKey(false);
       setWolframTestResult('Key cleared');
       setTimeout(() => setWolframTestResult(''), 3000);
     } catch (err) {
@@ -1517,9 +1512,14 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                       type="password"
                       value={wolframApiKey}
                       onChange={(e) => setWolframApiKey(e.target.value)}
-                      placeholder="Enter your Wolfram Alpha App ID"
+                      placeholder={hasStoredWolframKey && !wolframApiKey ? "Stored securely on backend. Enter a new App ID to replace it." : "Enter your Wolfram Alpha App ID"}
                       className="input-dark"
                     />
+                    {hasStoredWolframKey && !wolframApiKey && (
+                      <small className="hint-text">
+                        A Wolfram Alpha key is already stored securely on the backend for this machine.
+                      </small>
+                    )}
                   </div>
 
                   <div style={{ display: 'flex', gap: '0.75rem', marginTop: '1rem' }}>
diff --git a/frontend/src/components/compiler/CompilerSettings.jsx b/frontend/src/components/compiler/CompilerSettings.jsx
index fb7f411..e22f2c2 100644
--- a/frontend/src/components/compiler/CompilerSettings.jsx
+++ b/frontend/src/components/compiler/CompilerSettings.jsx
@@ -53,6 +53,7 @@ function CompilerSettings() {
   // Wolfram Alpha settings
   const [wolframEnabled, setWolframEnabled] = useState(false);
   const [wolframApiKey, setWolframApiKey] = useState('');
+  const [hasStoredWolframKey, setHasStoredWolframKey] = useState(false);
   const [wolframTestResult, setWolframTestResult] = useState('');
   const [testingWolfram, setTestingWolfram] = useState(false);
 
@@ -129,24 +130,18 @@ function CompilerSettings() {
         }
       }
       
-      // Restore Wolfram Alpha key from localStorage
-      const storedWolframKey = localStorage.getItem('wolfram_alpha_api_key');
-      if (storedWolframKey) {
-        setWolframApiKey(storedWolframKey);
-        setWolframEnabled(true);
-      } else {
-        const loadWolframStatus = async () => {
-          try {
-            const response = await api.getWolframStatus();
-            if (response.enabled) {
-              setWolframEnabled(true);
-            }
-          } catch (err) {
-            console.error('Failed to load Wolfram Alpha status:', err);
+      const loadWolframStatus = async () => {
+        try {
+          const response = await api.getWolframStatus();
+          setHasStoredWolframKey(Boolean(response.has_key));
+          if (response.enabled) {
+            setWolframEnabled(true);
           }
-        };
-        loadWolframStatus();
-      }
+        } catch (err) {
+          console.error('Failed to load Wolfram Alpha status:', err);
+        }
+      };
+      loadWolframStatus();
       
       setIsLoaded(true);
       setLoadingModels(false);
@@ -317,7 +312,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       if (response.success) {
         setWolframTestResult(`✓ Success! Result: ${response.result}`);
         await api.setWolframApiKey(wolframApiKey);
-        localStorage.setItem('wolfram_alpha_api_key', wolframApiKey);
+        setHasStoredWolframKey(true);
         setWolframEnabled(true);
       } else {
         setWolframTestResult('✗ Failed: ' + response.message);
@@ -333,9 +328,9 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   const handleClearWolframKey = async () => {
     try {
       await api.clearWolframApiKey();
-      localStorage.removeItem('wolfram_alpha_api_key');
       setWolframApiKey('');
       setWolframEnabled(false);
+      setHasStoredWolframKey(false);
       setWolframTestResult('Key cleared');
       setTimeout(() => setWolframTestResult(''), 3000);
     } catch (err) {
@@ -719,10 +714,15 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 type="password"
                 value={wolframApiKey}
                 onChange={(e) => setWolframApiKey(e.target.value)}
-                placeholder="Enter your Wolfram Alpha App ID"
+                placeholder={hasStoredWolframKey && !wolframApiKey ? "Stored securely on backend. Enter a new App ID to replace it." : "Enter your Wolfram Alpha App ID"}
                 className="input-dark"
                 style={{ marginBottom: '0.5rem' }}
               />
+              {hasStoredWolframKey && !wolframApiKey && (
+                <small className="hint-text">
+                  A Wolfram Alpha key is already stored securely on the backend for this machine.
+                </small>
+              )}
             </div>
             
             <div className="provider-toggle-group" style={{ marginTop: '0.75rem' }}>
diff --git a/requirements.txt b/requirements.txt
index ec7f494..5f1af5b 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -18,6 +18,7 @@ pydantic-settings>=2.1.0
 python-dotenv>=1.0.0
 aiofiles>=23.2.1,<25.0
 tiktoken>=0.5.2
+keyring>=25.6.0
 
 # PDF generation (headless Chromium via Playwright - full rendering fidelity)
 playwright>=1.40.0

From 36259f9647d582a99969986306bce4683a6c39c6 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Wed, 8 Apr 2026 21:18:41 -0500
Subject: [PATCH 03/32] Fix CodeQL alerts: secure backend secret storage, safe
 path resolution

---
 Press to Launch MOTO.bat                      | 24 ++++++++--
 README.md                                     | 28 +++++++----
 _moto_internal_launcher.ps1                   | 23 +++++++--
 .../autonomous/FinalAnswerLibrary.jsx         |  2 +-
 frontend/src/utils/autonomousProfiles.js      | 48 +++++++++++++------
 5 files changed, 93 insertions(+), 32 deletions(-)

diff --git a/Press to Launch MOTO.bat b/Press to Launch MOTO.bat
index 52710c8..0b6b42c 100644
--- a/Press to Launch MOTO.bat	
+++ b/Press to Launch MOTO.bat	
@@ -140,8 +140,15 @@ if not exist "frontend" (
     exit /b 1
 )
 pushd frontend
-call npm install
-if errorlevel 1 (
+set "SHOW_VULN_RESTART_HINT="
+set "NPM_INSTALL_LOG=%TEMP%\moto_npm_install_%RANDOM%_%RANDOM%.log"
+call npm install >"%NPM_INSTALL_LOG%" 2>&1
+set "NPM_INSTALL_EXIT=%ERRORLEVEL%"
+type "%NPM_INSTALL_LOG%"
+findstr /i /c:"vulnerabilit" "%NPM_INSTALL_LOG%" 2>nul | findstr /i /v /c:"found 0 vulnerabilities" >nul 2>&1
+if not errorlevel 1 set "SHOW_VULN_RESTART_HINT=1"
+del "%NPM_INSTALL_LOG%" >nul 2>&1
+if not "%NPM_INSTALL_EXIT%"=="0" (
     echo.
     echo ============================================================
     echo ERROR: Failed to install Node.js dependencies
@@ -155,7 +162,14 @@ if errorlevel 1 (
     pause
     exit /b 1
 )
-echo Fixing known vulnerabilities - if a vulnerability was found restart your terminal after completion...
+if defined SHOW_VULN_RESTART_HINT (
+    echo.
+    echo NOTE: npm reported vulnerability warnings during install.
+    echo MOTO is running npm audit fix automatically right now.
+    echo After startup finishes, restart this terminal / launcher once to check whether the warning is gone.
+    echo.
+)
+echo Fixing known vulnerabilities automatically...
 call npm audit fix >nul 2>&1
 popd
 echo Node.js dependencies installed successfully!
@@ -298,6 +312,10 @@ echo.
 echo Browser opened automatically to: http://localhost:5173
 echo If it didn't open, open that URL manually.
 echo.
+if defined SHOW_VULN_RESTART_HINT (
+echo If you saw npm vulnerability warnings earlier, restart this terminal / launcher once now that startup is complete.
+echo.
+)
 echo To stop the system: Close both service windows
 echo.
 echo This launcher window can now be closed.
diff --git a/README.md b/README.md
index c6ab89f..21f3af8 100644
--- a/README.md
+++ b/README.md
@@ -366,19 +366,27 @@ All content generated by this system is for informational purposes only. Papers
 
 ## 📊 System Requirements
 
-### Minimum
+### Option 1 - Local Large-Model / Large-MoE Setup
 
-- **OS**: Windows 10+, macOS 10.15+, Linux
-- **RAM**: 16GB (for running local models)
-- **Storage**: 10GB free space
-- **Internet**: Required for package installation and OpenRouter
+Best if you want to run local models in LM Studio, especially models above 20B parameters or larger MoE-style models.
 
-### Recommended
+- **OS**: Windows 10+, macOS 12+, Linux
+- **RAM**: 32GB+ recommended
+- **Storage**: 50GB+ free space for models and project data
+- **GPU**: 16GB+ VRAM recommended for practical local inference on 20B+ class models
+- **Internet**: Required for installation; optional afterward if staying local-only
 
-- **OS**: Windows 11, macOS 12+, Linux
-- **RAM**: 32GB+ (for larger models)
-- **Storage**: 50GB+ (for multiple models)
-- **GPU**: NVIDIA GPU with 8GB+ VRAM (for faster inference)
+### Option 2 - OpenRouter-Only Setup
+
+Best if you want the lightest local hardware requirements and are comfortable running inference in the cloud through OpenRouter.
+
+- **OS**: Windows, macOS, Linux, or Raspberry Pi OS
+- **RAM**: 4GB minimum, 8GB recommended
+- **Storage**: 5GB+ free space
+- **GPU**: Not required
+- **Internet**: Required
+
+Because the heavy model inference happens on OpenRouter, MOTO can run on very modest local hardware in this mode, including a Raspberry Pi, as long as it can run Python, Node.js, and maintain a stable internet connection.
 
 ---
 
diff --git a/_moto_internal_launcher.ps1 b/_moto_internal_launcher.ps1
index 8e21bba..26f7bc2 100644
--- a/_moto_internal_launcher.ps1
+++ b/_moto_internal_launcher.ps1
@@ -136,12 +136,19 @@ try {
     }
     
     Set-Location frontend
+    $showVulnerabilityRestartHint = $false
     if (-not (Test-Path "node_modules")) {
         Write-Host "Installing Node.js dependencies..." -ForegroundColor Yellow
         Write-Host "This may take a few minutes..." -ForegroundColor Yellow
         Write-Host ""
-        npm install
-        if ($LASTEXITCODE -ne 0) {
+        $npmInstallLog = Join-Path $env:TEMP ("moto_npm_install_{0}.log" -f ([guid]::NewGuid().ToString("N")))
+        npm install 2>&1 | Tee-Object -FilePath $npmInstallLog
+        $npmInstallExit = $LASTEXITCODE
+        if (Test-Path $npmInstallLog) {
+            $showVulnerabilityRestartHint = Select-String -Path $npmInstallLog -Pattern '[1-9]\d*\s+(\w+\s+)*vulnerabilit' -Quiet  # nonzero count in any npm wording; "found 0 vulnerabilities" does not match
+            Remove-Item -Path $npmInstallLog -Force -ErrorAction SilentlyContinue
+        }
+        if ($npmInstallExit -ne 0) {
             Write-Host ""
             Write-Host "============================================================" -ForegroundColor Red
             Write-Host "ERROR: Failed to install Node.js dependencies" -ForegroundColor Red
@@ -157,7 +164,13 @@ try {
     } else {
         Write-Host "Node.js dependencies already installed" -ForegroundColor Green
     }
-    Write-Host "Fixing known vulnerabilities..." -ForegroundColor Yellow
+    if ($showVulnerabilityRestartHint) {
+        Write-Host "" 
+        Write-Host "NOTE: npm reported vulnerability warnings during install." -ForegroundColor Yellow
+        Write-Host "MOTO is running npm audit fix automatically right now." -ForegroundColor Yellow
+        Write-Host "After startup finishes, restart this terminal / launcher once to check whether the warning is gone." -ForegroundColor Yellow
+    }
+    Write-Host "Fixing known vulnerabilities automatically..." -ForegroundColor Yellow
     npm audit fix 2>&1 | Out-Null
     Set-Location ..
     Write-Host ""
@@ -297,6 +310,10 @@ try {
     Write-Host ""
     Write-Host "If it didn't open, open that URL manually." -ForegroundColor Yellow
     Write-Host ""
+    if ($showVulnerabilityRestartHint) {
+        Write-Host "If you saw npm vulnerability warnings earlier, restart this terminal / launcher once now that startup is complete." -ForegroundColor Yellow
+        Write-Host ""
+    }
     Write-Host "To stop the system: Close both service windows" -ForegroundColor Yellow
     Write-Host ""
     Write-Host "This launcher window can now be closed." -ForegroundColor Green
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
index 24a963f..e39a523 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
@@ -1,4 +1,4 @@
-import React, { useState, useEffect } from 'react';
+import React, { useState, useEffect, useMemo } from 'react';
 import LatexRenderer from '../LatexRenderer';
 import PaperCritiqueModal from '../PaperCritiqueModal';
 import { autonomousAPI } from '../../services/api';
diff --git a/frontend/src/utils/autonomousProfiles.js b/frontend/src/utils/autonomousProfiles.js
index d626853..b3d998c 100644
--- a/frontend/src/utils/autonomousProfiles.js
+++ b/frontend/src/utils/autonomousProfiles.js
@@ -189,16 +189,34 @@ export const RECOMMENDED_PROFILES = {
     },
   },
   [RECOMMENDED_CHEAPER_PROFILE_KEY]: {
-    name: 'Cheaper, lower knowledge',
+    name: 'Cheaper, lower-knowledge validator',
     numSubmitters: 3,
-    submitters: Array.from({ length: 3 }, () => ({
-      modelId: 'qwen/qwen3.5-flash-02-23',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 1048576,
-      maxOutputTokens: 65500,
-    })),
+    submitters: [
+      {
+        modelId: 'moonshotai/kimi-k2.5',
+        provider: 'openrouter',
+        openrouterProvider: 'SiliconFlow',
+        lmStudioFallbackId: null,
+        contextWindow: 262000,
+        maxOutputTokens: 40000,
+      },
+      {
+        modelId: 'openai/gpt-oss-120b',
+        provider: 'openrouter',
+        openrouterProvider: 'Groq',
+        lmStudioFallbackId: null,
+        contextWindow: 131072,
+        maxOutputTokens: 25000,
+      },
+      {
+        modelId: 'deepseek/deepseek-v3.2',
+        provider: 'openrouter',
+        openrouterProvider: 'AtlasCloud',
+        lmStudioFallbackId: null,
+        contextWindow: 163800,
+        maxOutputTokens: 30000,
+      },
+    ],
     validator: {
       modelId: 'qwen/qwen3.5-flash-02-23',
       provider: 'openrouter',
@@ -208,15 +226,15 @@ export const RECOMMENDED_PROFILES = {
       maxOutputTokens: 65500,
     },
     highContext: {
-      modelId: 'qwen/qwen3.5-flash-02-23',
+      modelId: 'moonshotai/kimi-k2.5',
       provider: 'openrouter',
-      openrouterProvider: null,
+      openrouterProvider: 'SiliconFlow',
       lmStudioFallbackId: null,
-      contextWindow: 1048576,
-      maxOutputTokens: 65500,
+      contextWindow: 262000,
+      maxOutputTokens: 40000,
     },
     highParam: {
-      modelId: 'qwen/qwen3.5-flash-02-23',
+      modelId: 'google/gemini-3.1-pro-preview',
       provider: 'openrouter',
       openrouterProvider: null,
       lmStudioFallbackId: null,
@@ -224,7 +242,7 @@ export const RECOMMENDED_PROFILES = {
       maxOutputTokens: 65500,
     },
     critique: {
-      modelId: 'qwen/qwen3.5-flash-02-23',
+      modelId: 'google/gemini-3.1-pro-preview',
       provider: 'openrouter',
       openrouterProvider: null,
       lmStudioFallbackId: null,

From bfec33f6ad87705f3672f327889809043115ce21 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Wed, 8 Apr 2026 21:37:24 -0500
Subject: [PATCH 04/32] Fix CodeQL alerts: secure backend secret storage, safe
 path resolution

---
 .cursor/rules/api-key-controls.mdc            |   6 +-
 .../rules/part-3-autonomous-research-mode.mdc |   8 +-
 backend/shared/critique_memory.py             | 105 +++++++++++++-----
 3 files changed, 87 insertions(+), 32 deletions(-)

diff --git a/.cursor/rules/api-key-controls.mdc b/.cursor/rules/api-key-controls.mdc
index 30c1ea0..58f22d7 100644
--- a/.cursor/rules/api-key-controls.mdc
+++ b/.cursor/rules/api-key-controls.mdc
@@ -9,10 +9,10 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic
 
 **Key Features:**
 - **Per-Role OpenRouter Selection**: Each role independently uses LM Studio or OpenRouter
-- **Global OpenRouter API Key**: Single key for all per-role OpenRouter selections (separate from boost)
+- **Global OpenRouter API Key**: Single key for all per-role OpenRouter selections. Boost can reuse it when no explicit boost-only override key is provided.
 - **LM Studio Fallback**: Optional fallback per role on credit exhaustion
 - **Free Model Cooldown Handling**: SERIAL BOTTLENECK pause, free model looping, and auto-selector backup (see below)
-- **Boost Mode**: Separate boost API key for selective task acceleration via three modes:
+- **Boost Mode**: Selective task acceleration via three modes, using either an explicit boost override key or the active global OpenRouter key:
   - **Boost Next X Calls**: Counter-based, next X API calls regardless of task ID
   - **Category Boost**: Role-based, boosts all calls for specific role categories
   - **Per-task Toggle**: Task ID based (legacy)
@@ -67,7 +67,7 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic
 
 #### BoostManager (`backend/shared/boost_manager.py`)
 - Singleton. Key methods: `set_boost_config`, `clear_boost`, `set_boost_next_count`, `toggle_category_boost`, `toggle_task_boost`, `should_use_boost` (main check for coordinators), `consume_boost_count` (only after successful boost call), `is_task_boosted` (DO NOT USE in coordinators — legacy only)
-- Boost uses a **separate** OpenRouter API key. Temporary `OpenRouterClient` created per boosted task, closed immediately after.
+- Boost can use an **explicit override** OpenRouter API key, or it falls back to the active global OpenRouter key. A temporary `OpenRouterClient` is created per boosted task and closed immediately after.
 
 #### BoostLogger (`backend/shared/boost_logger.py`)
 - Singleton. Log file: `backend/data/boost_api_log.txt`
diff --git a/.cursor/rules/part-3-autonomous-research-mode.mdc b/.cursor/rules/part-3-autonomous-research-mode.mdc
index fb31b54..a284f38 100644
--- a/.cursor/rules/part-3-autonomous-research-mode.mdc
+++ b/.cursor/rules/part-3-autonomous-research-mode.mdc
@@ -1326,10 +1326,10 @@ backend/data/auto_sessions/{session_id}/final_answer/    # Session final answers
 4. Memory modules handle path resolution automatically
 
 **Critique Storage Integration:**
-- Critiques are stored in `.critiques/` subdirectory within each paper's directory
-- `critique_memory.py` accepts `base_path` parameter for session-awareness
-- When paper is deleted, critiques are automatically cleaned up from correct location
-- Path is derived from `paper_library.get_paper_path(paper_id)` which returns session-aware paths
+- Critiques are stored as JSON files inside the resolved storage directory: legacy `auto_papers/` or `auto_final_answer/`, or session-scoped `papers/` or `final_answer/`
+- `critique_memory.py` accepts `base_dir` for session-aware storage and revalidates it against trusted roots before file access
+- When a paper or final answer is deleted, critiques are automatically cleaned up from the matching resolved storage location
+- Callers derive the directory from session-aware memory/path helpers before invoking critique storage
 
 **Important for New Features:**
 - Always use memory module methods (e.g., `paper_library.get_paper_path()`) to get paths
diff --git a/backend/shared/critique_memory.py b/backend/shared/critique_memory.py
index a57cfc0..bfbae69 100644
--- a/backend/shared/critique_memory.py
+++ b/backend/shared/critique_memory.py
@@ -34,8 +34,12 @@
 from datetime import datetime
 import uuid
 
+from backend.shared.config import system_config
 from backend.shared.models import PaperCritique
-from backend.shared.path_safety import validate_single_path_component
+from backend.shared.path_safety import (
+    resolve_path_within_root,
+    validate_single_path_component,
+)
 
 logger = logging.getLogger(__name__)
 
@@ -51,6 +55,69 @@ def _get_legacy_data_dir() -> Path:
     return Path(__file__).resolve().parents[1] / "data"
 
 
+def _get_legacy_critiques_dir(paper_type: PaperType) -> Path:
+    """Return the trusted legacy (non-session) critique directory for `paper_type`; raise ValueError if it is unknown."""
+    data_dir = _get_legacy_data_dir()
+
+    if paper_type == "autonomous_paper":
+        return resolve_path_within_root(data_dir, "auto_papers")
+
+    if paper_type == "final_answer":
+        return resolve_path_within_root(data_dir, "auto_final_answer")
+
+    if paper_type == "compiler_paper":
+        return data_dir  # compiler critiques live directly in the legacy data directory
+
+    raise ValueError(f"Unknown paper_type: {paper_type}")
+
+
+def _resolve_session_critiques_dir(base_dir: Path, paper_type: PaperType) -> Path:
+    """
+    Rebuild a session-aware critique directory from validated components.
+
+    This prevents callers from passing arbitrary absolute paths into critique
+    file operations. Only `<session_id>/papers` and `<session_id>/final_answer`
+    directories under the trusted sessions root are allowed; other locations raise ValueError.
+    """
+    sessions_root = Path(system_config.auto_sessions_base_dir)
+    candidate_dir = Path(base_dir)
+    expected_leaf = "papers" if paper_type == "autonomous_paper" else "final_answer"  # every other type maps to final_answer
+
+    try:
+        relative_dir = candidate_dir.resolve(strict=False).relative_to(  # ValueError if outside the sessions root
+            sessions_root.resolve(strict=False)
+        )
+    except ValueError as exc:
+        raise ValueError(f"Untrusted critique storage directory: {base_dir}") from exc
+
+    if len(relative_dir.parts) != 2 or relative_dir.parts[1] != expected_leaf:  # must be exactly <session_id>/<expected_leaf>
+        raise ValueError(f"Untrusted critique storage directory: {base_dir}")
+
+    safe_session_id = validate_single_path_component(relative_dir.parts[0], "session ID")
+    return resolve_path_within_root(sessions_root, safe_session_id, expected_leaf)  # rebuilt from validated parts, not from base_dir
+
+
+def _resolve_trusted_critiques_dir(
+    paper_type: PaperType,
+    base_dir: Optional[Path] = None,
+) -> Path:
+    """
+    Resolve critique storage to a trusted legacy or session-scoped directory; `base_dir` is validated, never used as-is.
+    """
+    if paper_type == "compiler_paper":
+        return _get_legacy_critiques_dir(paper_type)  # base_dir is ignored for compiler papers
+
+    legacy_dir = _get_legacy_critiques_dir(paper_type)
+    if base_dir is None:
+        return legacy_dir
+
+    candidate_dir = Path(base_dir)
+    if candidate_dir.resolve(strict=False) == legacy_dir.resolve(strict=False):  # caller passed the legacy dir explicitly
+        return legacy_dir
+
+    return _resolve_session_critiques_dir(candidate_dir, paper_type)  # raises ValueError for untrusted locations
+
+
 def _get_critiques_file_path(
     paper_type: PaperType,
     paper_id: Optional[str] = None,
@@ -71,37 +138,25 @@ def _get_critiques_file_path(
     if paper_id:
         safe_paper_id = validate_single_path_component(paper_id, "paper ID")
 
-    if base_dir is not None:
-        base_dir.mkdir(parents=True, exist_ok=True)
-
-        if paper_type == "autonomous_paper":
-            if not safe_paper_id:
-                raise ValueError("paper_id is required for autonomous_paper type")
-            return base_dir / f"paper_{safe_paper_id}_critiques.json"
-
-        if paper_type == "final_answer":
-            return base_dir / "final_answer_critiques.json"
-
-        if paper_type != "compiler_paper":
-            raise ValueError(f"Unknown paper_type: {paper_type}")
-
-    data_dir = _get_legacy_data_dir()
-
     if paper_type == "autonomous_paper":
         if not safe_paper_id:
             raise ValueError("paper_id is required for autonomous_paper type")
-        papers_dir = data_dir / "auto_papers"
-        papers_dir.mkdir(parents=True, exist_ok=True)
-        return papers_dir / f"paper_{safe_paper_id}_critiques.json"
+        critiques_dir = _resolve_trusted_critiques_dir(paper_type, base_dir)
+        critiques_dir.mkdir(parents=True, exist_ok=True)
+        return resolve_path_within_root(
+            critiques_dir,
+            f"paper_{safe_paper_id}_critiques.json",
+        )
 
     if paper_type == "final_answer":
-        final_answer_dir = data_dir / "auto_final_answer"
-        final_answer_dir.mkdir(parents=True, exist_ok=True)
-        return final_answer_dir / "final_answer_critiques.json"
+        critiques_dir = _resolve_trusted_critiques_dir(paper_type, base_dir)
+        critiques_dir.mkdir(parents=True, exist_ok=True)
+        return resolve_path_within_root(critiques_dir, "final_answer_critiques.json")
 
     if paper_type == "compiler_paper":
-        data_dir.mkdir(parents=True, exist_ok=True)
-        return data_dir / "compiler_paper_critiques.json"
+        critiques_dir = _resolve_trusted_critiques_dir(paper_type, base_dir)
+        critiques_dir.mkdir(parents=True, exist_ok=True)
+        return resolve_path_within_root(critiques_dir, "compiler_paper_critiques.json")
 
     raise ValueError(f"Unknown paper_type: {paper_type}")
 

From 1b6429af9802481a81b7eebc212d896ef2a896cf Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Sun, 19 Apr 2026 15:01:06 -0500
Subject: [PATCH 05/32] v1.0.6: security hardening, empirical-provenance
 guardrails, boost UX improvements, bug fixes

---
 .cursor/rules/api-key-controls.mdc            |  29 +-
 .cursor/rules/json-prompt-design.mdc          |  15 +-
 ...t-2-compiler-tool-design-specification.mdc |   2 +
 .../rules/part-3-autonomous-research-mode.mdc |  39 +-
 ...program-directory-and-file-definitions.mdc |  22 +-
 .github/ISSUE_TEMPLATE/bug_report.yml         |  81 ++++
 .github/ISSUE_TEMPLATE/config.yml             |   5 +
 .github/ISSUE_TEMPLATE/feature_request.yml    |  57 +++
 .github/pull_request_template.md              |  28 ++
 .gitignore                                    |   1 +
 ...aunch MOTO.bat => Click To Launch MOTO.bat |   0
 README.md                                     |  14 +-
 _moto_internal_launcher.ps1                   |  46 +-
 backend/aggregator/agents/submitter.py        |  24 +-
 backend/aggregator/agents/validator.py        |  30 +-
 backend/aggregator/core/coordinator.py        | 125 +++---
 .../aggregator/prompts/submitter_prompts.py   |  26 +-
 .../aggregator/prompts/validator_prompts.py   |  88 ++--
 backend/api/main.py                           |   4 +-
 backend/api/routes/aggregator.py              |  10 +-
 backend/api/routes/autonomous.py              | 210 ++++++++-
 backend/api/routes/boost.py                   |  38 +-
 backend/api/routes/compiler.py                |   1 +
 backend/api/routes/websocket.py               |   4 +-
 .../autonomous/agents/completion_reviewer.py  |   2 +-
 .../final_answer/answer_format_selector.py    |   2 +-
 .../agents/final_answer/certainty_assessor.py |   2 +-
 .../agents/final_answer/volume_organizer.py   |   2 +-
 .../autonomous/agents/paper_title_selector.py |   5 +-
 .../autonomous/agents/reference_selector.py   |  53 ++-
 backend/autonomous/agents/topic_selector.py   |   2 +-
 backend/autonomous/agents/topic_validator.py  |   2 +-
 .../autonomous/core/autonomous_coordinator.py | 284 +++++++-----
 .../autonomous/memory/brainstorm_memory.py    |  13 +-
 backend/autonomous/memory/paper_library.py    |  87 +++-
 .../autonomous/memory/research_metadata.py    |   9 +-
 .../autonomous/prompts/completion_prompts.py  |  28 +-
 .../prompts/final_answer_prompts.py           | 102 +----
 .../prompts/paper_continuation_prompts.py     |  19 +-
 .../prompts/paper_redundancy_prompts.py       |  14 +-
 .../prompts/paper_reference_prompts.py        | 154 +++----
 .../autonomous/prompts/paper_title_prompts.py |  61 +--
 backend/autonomous/prompts/topic_prompts.py   |  28 +-
 .../validation/paper_redundancy_checker.py    |   2 +-
 .../compiler/agents/high_context_submitter.py |  23 +-
 .../compiler/agents/high_param_submitter.py   |   9 +
 backend/compiler/core/compiler_coordinator.py | 125 ++++--
 .../compiler/prompts/construction_prompts.py  | 112 ++---
 backend/compiler/prompts/critique_prompts.py  | 115 +++--
 backend/compiler/prompts/outline_prompts.py   |  93 ++--
 backend/compiler/prompts/review_prompts.py    |  59 ++-
 backend/compiler/prompts/rigor_prompts.py     |  14 +-
 .../compiler/validation/compiler_validator.py | 105 +++--
 backend/shared/api_client_manager.py          | 189 +++++++-
 backend/shared/boost_logger.py                |   3 +-
 backend/shared/boost_manager.py               | 215 ++++++---
 backend/shared/config.py                      |   3 +-
 backend/shared/critique_memory.py             |  10 +-
 backend/shared/free_model_manager.py          |  86 ++--
 backend/shared/models.py                      |   4 +-
 frontend/package-lock.json                    |  10 +-
 frontend/package.json                         |   2 +-
 frontend/src/App.jsx                          | 165 ++++---
 frontend/src/components/BoostControlModal.jsx |  85 +++-
 frontend/src/components/BoostLogs.css         | 361 ---------------
 frontend/src/components/BoostLogs.jsx         | 239 ----------
 frontend/src/components/WorkflowPanel.css     | 253 +++--------
 frontend/src/components/WorkflowPanel.jsx     | 410 +++++-------------
 .../autonomous/AutonomousResearch.css         |  99 ++++-
 .../autonomous/AutonomousResearchLogs.jsx     |  77 +++-
 .../autonomous/AutonomousResearchSettings.jsx |   6 +-
 .../components/autonomous/BrainstormList.jsx  |   2 +-
 .../autonomous/FinalAnswerLibrary.css         |  17 +-
 .../autonomous/FinalAnswerLibrary.jsx         |   5 +-
 .../autonomous/Stage2PaperHistory.jsx         |   5 +-
 frontend/src/index.css                        |  33 +-
 frontend/src/services/api.js                  |  44 +-
 frontend/src/services/websocket.js            |   6 +-
 frontend/src/utils/autonomousProfiles.js      |  46 +-
 package-lock.json                             |   4 +-
 package.json                                  |   2 +-
 81 files changed, 2488 insertions(+), 2318 deletions(-)
 create mode 100644 .github/ISSUE_TEMPLATE/bug_report.yml
 create mode 100644 .github/ISSUE_TEMPLATE/config.yml
 create mode 100644 .github/ISSUE_TEMPLATE/feature_request.yml
 create mode 100644 .github/pull_request_template.md
 rename Press to Launch MOTO.bat => Click To Launch MOTO.bat (100%)
 delete mode 100644 frontend/src/components/BoostLogs.css
 delete mode 100644 frontend/src/components/BoostLogs.jsx

diff --git a/.cursor/rules/api-key-controls.mdc b/.cursor/rules/api-key-controls.mdc
index 58f22d7..83e40ac 100644
--- a/.cursor/rules/api-key-controls.mdc
+++ b/.cursor/rules/api-key-controls.mdc
@@ -5,17 +5,16 @@ alwaysApply: false
 
 ## Overview
 
-Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic workflow prediction panel showing the next 20 API calls with boost feature.
+Enables OpenRouter integration with automatic LM Studio fallback, plus boost controls and research metrics in the workflow panel.
 
 **Key Features:**
 - **Per-Role OpenRouter Selection**: Each role independently uses LM Studio or OpenRouter
 - **Global OpenRouter API Key**: Single key for all per-role OpenRouter selections. Boost can reuse it when no explicit boost-only override key is provided.
 - **LM Studio Fallback**: Optional fallback per role on credit exhaustion
 - **Free Model Cooldown Handling**: SERIAL BOTTLENECK pause, free model looping, and auto-selector backup (see below)
-- **Boost Mode**: Selective task acceleration via three modes, using either an explicit boost override key or the active global OpenRouter key:
+- **Boost Mode**: Selective task acceleration via two modes, using either an explicit boost override key or the active global OpenRouter key:
   - **Boost Next X Calls**: Counter-based, next X API calls regardless of task ID
-  - **Category Boost**: Role-based, boosts all calls for specific role categories
-  - **Per-task Toggle**: Task ID based (legacy)
+  - **Category Boost**: Role-based, boosts all calls for specific role categories (Aggregator and Compiler only; Autonomous agents inherit from their parent roles automatically)
 - **System works without LM Studio**: Defaults to OpenRouter when LM Studio unavailable
 
 ---
@@ -51,7 +50,6 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic
 **Boost Mode Priority** (`should_use_boost(task_id)`):
 1. Boost Next X: `boost_next_count > 0` → True
 2. Category Boost: `_extract_role_prefix(task_id) in boosted_categories` → True
-3. Per-task Toggle: `task_id in boosted_task_ids` → True
 
 **Counter Decrement:** `boost_next_count` decrements ONLY on successful boost API calls. Failed/exhausted calls do NOT decrement.
 
@@ -66,15 +64,17 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus a dynamic
 - `autonomous_*` → "Autonomous"
 
 #### BoostManager (`backend/shared/boost_manager.py`)
-- Singleton. Key methods: `set_boost_config`, `clear_boost`, `set_boost_next_count`, `toggle_category_boost`, `toggle_task_boost`, `should_use_boost` (main check for coordinators), `consume_boost_count` (only after successful boost call), `is_task_boosted` (DO NOT USE in coordinators — legacy only)
+- Singleton. Key methods: `set_boost_config`, `clear_boost`, `set_boost_next_count`, `toggle_category_boost`, `should_use_boost` (main check for coordinators), `consume_boost_count` (only after successful boost call)
 - Boost can use an **explicit override** OpenRouter API key, or it falls back to the active global OpenRouter key. A temporary `OpenRouterClient` is created per boosted task and closed immediately after.
+- **Autonomous agent task ID inheritance**: All autonomous orchestration agents use parent role task ID prefixes — Topic Selector/Completion Reviewer/Reference Selector/Paper Title Selector/Tier 3 agents use `agg_sub1_*`; Topic Validator/Redundancy Checker use `agg_val_*`. Boosting a parent role automatically covers all autonomous agents that run on that model.
 
 #### BoostLogger (`backend/shared/boost_logger.py`)
 - Singleton. Log file: `backend/data/boost_api_log.txt`
 - Methods: `log_api_call`, `get_logs(limit)`, `clear_logs`, `get_stats`
+- Boost logs are merged into the main API call log view; boost endpoints remain available for boost-only debugging.
 
-#### Workflow Task Generation (Direct from Agent Sequences)
-Coordinators read actual agent `task_sequence` counters — no prediction. Task IDs exactly match what agents will generate.
+#### Workflow Task Generation (Internal Backend Tracking)
+Coordinators track task IDs internally for boost routing. The frontend does NOT display predicted task lists.
 - Aggregator: `agg_sub{N}_{seq:03d}`, `agg_val_{seq:03d}`
 - Compiler: `comp_hc_{seq:03d}`, `comp_hp_{seq:03d}`, `comp_val_{seq:03d}`
 - Autonomous: `auto_te_{seq:03d}`, `auto_tev_{seq:03d}`, `auto_ts_{seq:03d}`, `auto_tv_{seq:03d}`
@@ -93,9 +93,9 @@ Predictions refresh: after initialization, each task completion, mode switches,
 
 ## WebSocket Events
 
-**Workflow:** `workflow_updated` (tasks+mode), `task_started` (task_id), `task_completed` (task_id+sequence), `token_usage_updated` (total_input, total_output, by_model, elapsed_seconds)
+**Workflow:** `workflow_updated` (mode), `token_usage_updated` (total_input, total_output, by_model, elapsed_seconds)
 
-**Boost:** `boost_enabled` (model_id, provider, context_window, max_output_tokens), `boost_disabled`, `task_boost_toggled` (task_id, boosted), `boost_next_count_updated` (count), `category_boost_toggled` (category, boosted), `boost_credits_exhausted` (task_id, message)
+**Boost:** `boost_enabled` (model_id, provider, context_window, max_output_tokens), `boost_disabled`, `boost_next_count_updated` (count), `category_boost_toggled` (category, boosted), `boost_credits_exhausted` (task_id, message)
 
 **Fallback:** `openrouter_fallback` (role_id, reason, message, fallback_model), `openrouter_fallback_failed` (role_id, reason, message), `openrouter_fallbacks_reset` (reset_roles, message)
 
@@ -115,11 +115,10 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - `GET /api/boost/status` — Current config, counts, categories
 - `POST /api/boost/set-next-count` — Set Boost Next X counter `{ "count": int }`
 - `POST /api/boost/toggle-category/{category}` — Toggle category boost
-- `GET /api/boost/categories?mode=` — Available categories for mode
-- `POST /api/boost/toggle-task/{task_id}` — Legacy per-task boost toggle
+- `GET /api/boost/categories?mode=` — All categories (mode param ignored, always returns all)
 - `GET /api/boost/openrouter-models` — Fetch OpenRouter models (Bearer key header)
 - `GET /api/boost/model-providers?model_id=` — Providers for a model
-- `GET /api/boost/logs?limit=` — Recent boost logs
+- `GET /api/boost/logs?limit=` — Recent boost-only logs (debug)
 - `POST /api/boost/clear-logs` — Clear logs
 
 ### OpenRouter (`backend/api/routes/openrouter.py`)
@@ -136,7 +135,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - `GET /api/model-cache` — Cached model ID mapping (display_name → api_id)
 
 ### Workflow (`backend/api/routes/workflow.py`)
-- `GET /api/workflow/predictions` — Next 20 predicted tasks
+- `GET /api/workflow/predictions` — Current workflow mode (also returns tasks for internal use)
 - `GET /api/workflow/history?limit=` — Completed tasks
 - `GET /api/token-stats` — Cumulative token usage (total_input, total_output, by_model, elapsed_seconds)
 
@@ -196,4 +195,4 @@ Predictions refresh: after initialization, each task completion, mode switches,
 
 **localStorage:** `workflow_panel_collapsed`, `aggregatorConfig`, `compiler_settings`, `autonomousConfig` (includes `freeModelLooping`, `freeModelAutoSelector`)
 
-**Session (in-memory):** fallback state per role, boosted task IDs, boost next count, boosted categories, completed task IDs, free model manager state. Boost logs persist to file (`boost_api_log.txt`).
+**Session (in-memory):** fallback state per role, boosted task IDs, boost next count, boosted categories, completed task IDs, free model manager state. Boost logs persist to file (`boost_api_log.txt`) and are merged into the main API call log view.
diff --git a/.cursor/rules/json-prompt-design.mdc b/.cursor/rules/json-prompt-design.mdc
index bae4719..ee05f4d 100644
--- a/.cursor/rules/json-prompt-design.mdc
+++ b/.cursor/rules/json-prompt-design.mdc
@@ -2424,21 +2424,21 @@ Proceed Without References:
 
 **File:** `backend/autonomous/prompts/paper_reference_prompts.py`
 
-**Function:** `get_reference_selection_json_schema()`
+**Function:** `get_reference_selection_json_schema(max_papers)`
 
 ```
 REQUIRED JSON FORMAT:
 {
-  "selected_papers": ["array of up to 6 paper_ids"],
+  "selected_papers": ["array of paper_ids, at most the caller-provided cap (max_papers)"],
   "reasoning": "string - Why these specific papers are very useful for the upcoming paper"
 }
 
 FIELD REQUIREMENTS:
-- selected_papers: Array of paper IDs (maximum 6, can be empty)
+- selected_papers: Array of paper IDs (maximum = caller-provided cap, can be empty)
 - reasoning: ALWAYS required
 
 CONSTRAINTS:
-- Maximum 6 papers can be selected (hard limit for context budget)
+- Caller supplies the cap: 3 for the normal topic-cycle reference workflow, 6 for Tier 3 short-form reference selection
 - Papers must be selected from those shown in expansion request
 
 EXAMPLE:
@@ -2620,9 +2620,10 @@ All Part 3 prompts follow similar assembly patterns to Part 1 and Part 2:
 - Purpose: Add additional relevant papers based on brainstorm insights
 
 **Paper Title Selection:**
-- Brainstorm database (RAG)
-- Existing paper titles from same brainstorm
-- Selected reference papers (if any, RAG)
+- Brainstorm summary (direct injection; no full brainstorm RAG)
+- Existing paper titles and abstracts from same brainstorm
+- Selected reference paper title/abstract summaries (if any, direct injection)
+- Validated candidate titles from title exploration (direct injection)
 
 **Paper Compilation:**
 - Uses Part 2 Compiler context (outline, paper, brainstorm DB, reference papers)
diff --git a/.cursor/rules/part-2-compiler-tool-design-specification.mdc b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
index 4559443..dfabd4f 100644
--- a/.cursor/rules/part-2-compiler-tool-design-specification.mdc
+++ b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
@@ -11,6 +11,8 @@ Compiler runs independently from aggregator (manual start via API only). Strict
 
 Reads aggregator database + user prompt, distills into a single coherent paper. 1 high-context submitter + 1 high-param submitter + 1 validator. Sequential workflow (no parallel submitters).
 
+Aggregator/brainstorm database material is high-priority optional source context, not a mandatory checklist. Compiler submitters may selectively use, synthesize beyond, or depart from database material when that better serves the user's prompt and remains rigorous. Validator must not reject solely for selective non-use of database material.
+
 **Context Anchors**:
 - **Paper Anchor**: `[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]`
 - **Outline Anchor** (two lines): `[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]` then `[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]`
diff --git a/.cursor/rules/part-3-autonomous-research-mode.mdc b/.cursor/rules/part-3-autonomous-research-mode.mdc
index a284f38..cf0d7e6 100644
--- a/.cursor/rules/part-3-autonomous-research-mode.mdc
+++ b/.cursor/rules/part-3-autonomous-research-mode.mdc
@@ -59,11 +59,13 @@ The autonomous coordinator USES actual Part 1 aggregator infrastructure for brai
 ### Part 2 Compiler Integration (Tier 2)
 The autonomous coordinator USES actual Part 2 compiler infrastructure for paper compilation:
 - Creates separate `CompilerCoordinator` instance per paper
-- Configures with brainstorm database as primary source
-- Adds reference papers (up to 6) to RAG context if selected
+- Configures with brainstorm database as high-priority optional source material
+- Adds reference papers to RAG context if any were selected (topic-cycle cap 3; Tier 3 short-form cap 6)
 - Monitors compiler progress to detect abstract completion (final section)
 - Extracts abstract from completed paper for metadata storage
 
+Compiler submitters may selectively use, synthesize beyond, or depart from brainstorm material when that better serves the user's prompt and remains rigorous. Validator must not reject solely for selective non-use of brainstorm/database material.
+
 **Critical Implementation Details**:
 - **system_config propagation (REQUIRED)**: Before creating `CompilerCoordinator`, autonomous mode MUST write all compiler context/token settings to `system_config` (e.g., `system_config.compiler_high_context_context_window = self._high_context_context`). Compiler modules read from `system_config` at init — the manual `/api/compiler/start` route does this, but autonomous mode bypasses that route and must do it explicitly. Applies to both `_compile_paper_from_brainstorm()` and `_compile_tier3_paper()`.
 - Constrains section order: Body → Conclusion → Introduction → Abstract
@@ -224,7 +226,7 @@ After topic selection is validated, the reference selector:
 1. Reviews ALL completed paper abstracts
 2. Requests expansion of papers that would be VERY USEFUL for brainstorm exploration
 3. Reviews full content of expanded papers
-4. Selects up to 6 papers to use as context during brainstorming
+4. Selects up to 3 papers to use as topic-cycle base context during brainstorming
 5. Selected papers are loaded into brainstorm aggregator as `user_files`
 
 ### Why Outlines Are Included
@@ -242,11 +244,12 @@ After topic selection is validated, the reference selector:
 - Outlines are fetched from `paper_{paper_id}_outline.txt`
 - If outline is unavailable, displays "[Not available]"
 - Outlines are included in BOTH abstract review (Step 1) AND full paper review (Step 2)
+- Paper titles shown during reference review and later selected-reference contexts include compact validator-review snapshots: initial system critique always, plus up to the latest 4 user-triggered critiques when available. Snapshot content is model ID + novelty/correctness/impact ratings only (no feedback text).
 
 ### Two-Step Browsing Workflow
 
 **Step 1**: Review abstracts+outlines → Request expansion of promising papers  
-**Step 2**: Review full content → Final selection (max 6 papers)
+**Step 2**: Review full content → Final selection (max 3 papers)
 
 Context: Direct inject if fits (~40% budget), RAG if too large. No truncation.
 
@@ -257,7 +260,7 @@ Context: Direct inject if fits (~40% budget), RAG if too large. No truncation.
 - Current brainstorm topic prompt (direct injection)
 - ALL Tier 2 paper titles + abstracts + outlines (direct injection if fits, RAG if too large)
 
-JSON schemas defined in `json-prompt-design.mdc`. Two-step: submitter requests paper expansions (`expand_papers`, `proceed_without_references`), then makes final selection (`selected_papers`). Max 6 papers total.
+JSON schemas defined in `json-prompt-design.mdc`. Two-step: submitter requests paper expansions (`expand_papers`, `proceed_without_references`), then makes final selection (`selected_papers`). Max 3 papers total for the topic cycle.
 
 **Context Handling (DIRECT INJECTION FIRST, RAG SECOND):**
 
@@ -274,7 +277,7 @@ JSON schemas defined in `json-prompt-design.mdc`. Two-step: submitter requests p
 - Submitter CHOOSES which papers to expand (not automatic expansion of all papers)
 - Submitter makes FINAL selection after reviewing full content
 - System intelligently handles large papers via RAG when needed
-- Maximum 6 papers enforced across both selection modes
+- Maximum 3 papers enforced across the topic-cycle selection modes
 
 ### Context for Pre-Brainstorm Reference Selection
 - User's high-level research prompt (direct injection)
@@ -284,7 +287,7 @@ JSON schemas defined in `json-prompt-design.mdc`. Two-step: submitter requests p
 
 ### Key Design Points
 - **Same references persist**: References selected here are used for BOTH brainstorming AND paper writing
-- **Additional selection later**: AI can select MORE references (up to 6 total) before paper writing
+- **Additional selection later**: AI can select MORE references (up to 3 total) before paper writing
 - **No re-selection/removal**: Already-selected references remain selected throughout topic cycle
 
 ---
@@ -445,7 +448,7 @@ Once completion review decides WRITE_PAPER (and self-validates), the system tran
 
 **SKIP THIS STEP if**:
 - No Tier 2 papers exist yet, OR
-- Already at max capacity (6 papers selected during pre-brainstorm)
+- Already at max capacity (3 papers selected during pre-brainstorm)
 
 **Context**:
 - Papers already selected for brainstorming (shown as "ALREADY SELECTED")
@@ -455,7 +458,7 @@ Once completion review decides WRITE_PAPER (and self-validates), the system tran
 **Key Differences from Pre-Brainstorm Selection**:
 - Shows which papers are ALREADY SELECTED (cannot be removed)
 - Only shows papers NOT YET selected for expansion
-- Maximum additional papers = 6 - (already selected count)
+- Maximum additional papers = 3 - (already selected count)
 - Benefits from brainstorm insights to identify newly-relevant papers
 
 ### Two-Step Browsing Workflow (Additional Mode)
@@ -467,7 +470,7 @@ Same two-step browsing workflow as pre-brainstorm selection (expand request →
 - Rejects if reasoning is unsound or selection doesn't align with brainstorm content
 - Rejection feedback goes to rolling cache
 
-**Final Reference List**: Already-selected papers + newly-selected papers (max 6 total)
+**Final Reference List**: Already-selected papers + newly-selected papers (max 3 total)
 
 ### Paper Title Exploration (Pre-Title Candidate Brainstorm)
 
@@ -497,8 +500,8 @@ Same two-step browsing workflow as pre-brainstorm selection (expand request →
 
 **Context**:
 - User's high-level research prompt
-- Current brainstorm database (RAG)
-- Selected reference papers (if any, RAG)
+- Current brainstorm summary (direct injection; no full brainstorm RAG in title selection)
+- Selected reference paper summaries (if any, direct injection)
 - ALL existing paper titles from THIS brainstorm topic (direct injection)
 - ALL existing paper abstracts from THIS brainstorm topic (if any, direct injection)
 - **5 validated candidate titles from Paper Title Exploration phase** (direct injection)
@@ -521,10 +524,11 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `paper_title`, `reasoni
 
 **Validator Role**:
 - Topic validator reviews title selection
+- Validator also sees selected reference paper summaries (if any) so acceptance/rejection reflects the intended paper scope
 - Rejects if title is too similar to **EXISTING COMPLETED PAPERS** from this brainstorm (NOT brainstorm submissions!)
 - Rejects if title doesn't align with brainstorm content
 - DO NOT reject simply because title reflects brainstorm submission content - that is INTENDED behavior
-- Rejection feedback goes to rolling cache
+- Rejection feedback is threaded into subsequent retries within the current title-selection loop (keeps last 5 attempts in local retry history)
 
 ---
 
@@ -872,7 +876,7 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `answer_format` (short_
 
 **Workflow**:
 
-1. **Reference Selection**: Browse all papers, select up to 6 for direct injection
+1. **Reference Selection**: Browse all papers, select up to 6 for Tier 3 short-form context
 2. **Title Selection**: Title that directly answers user's prompt (uses existing `PaperTitleSelectorAgent`)
 3. **Paper Compilation**: Use existing Tier 2 compiler infrastructure
    - Outline creation → Body → Conclusion → Introduction → Abstract
@@ -912,6 +916,8 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `volume_title`, `chapte
 2. **Conclusion Paper**: Synthesizes all chapters, directly answers user's question
 3. **Introduction Paper**: Frames the volume, provides roadmap (written LAST)
 
+**Chapter Reference Scope**: Gap/introduction/conclusion chapter writing uses all `existing_paper` chapters chosen for the organized volume as references. There is no separate 6-paper selector inside long-form chapter writing.
+
 **Volume Assembly**: After all chapters are written:
 - Papers are combined into final volume
 - Displayed in "FINAL ANSWER" section of GUI
@@ -1517,7 +1523,8 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
   - Constrained section order (body → conclusion → intro → abstract)
   - AI-generated paper titles instead of user-provided prompts
   - Reference paper selection workflow
-  - Brainstorm database as primary source
+  - Brainstorm database as high-priority optional source material
+  - Selective non-use of brainstorm/database material is allowed when the resulting paper is stronger, rigorous, and aligned with the prompt
 
 ### Running Modes
 - **Part 1, Part 2, and Part 3 remain user-selectable modes**
@@ -1599,7 +1606,7 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 5. **Paper is NOT complete until abstract is written AND validated** - Sequential order must complete
 6. **Same model MUST self-validate completion review decisions** - SPECIAL SELF-VALIDATION MODE
 7. **Completion review counts both acceptances and removals** - Pruning counts toward 10-acceptance trigger
-8. **Maximum 6 reference papers total** - Context budget constraint (applies to brainstorm AND paper writing)
+8. **Maximum 3 topic-cycle base reference papers total** - Applies across pre-brainstorm + additional selection for brainstorm/Tier 2 paper writing. Tier 3 short-form keeps its own 6-paper selection cap, and Tier 3 long-form chapter writing uses all selected `existing_paper` volume chapters as references.
 9. **Paper section order is FIXED**: Body → Conclusion → Introduction → Abstract - Cannot skip or reorder
 10. **Paper redundancy review is CONSERVATIVE** - Maximum 1 removal per cycle, when in doubt keep
 11. **Workflow state is ALWAYS persisted for crash recovery** - System auto-resumes from last checkpoint on restart
diff --git a/.cursor/rules/program-directory-and-file-definitions.mdc b/.cursor/rules/program-directory-and-file-definitions.mdc
index 86e5844..b0eb31e 100644
--- a/.cursor/rules/program-directory-and-file-definitions.mdc
+++ b/.cursor/rules/program-directory-and-file-definitions.mdc
@@ -18,7 +18,7 @@ project-root/
 │   │   ├── lm_studio_client.py          # LM Studio HTTP API client
 │   │   ├── openrouter_client.py         # OpenRouter HTTP API client (credit exhaustion detection)
 │   │   ├── api_client_manager.py        # Unified API router (OpenRouter/LM Studio fallback + boost)
-│   │   ├── boost_manager.py             # Singleton boost manager (tracks boosted tasks)
+│   │   ├── boost_manager.py             # Singleton boost manager (tracks boost modes: next-count, always-prefer, category)
 │   │   ├── boost_logger.py              # Boost API call logger (persists to boost_api_log.txt)
 │   │   ├── workflow_predictor.py        # Predicts next 20 API calls (mode-specific algorithms)
 │   │   ├── free_model_manager.py        # Free model rotation/cooldown singleton (looping + auto-selector backup)
@@ -222,7 +222,7 @@ project-root/
 │   │   │       ├── BrainstormList.jsx       # List all brainstorm topics with status
 │   │   │       ├── PaperLibrary.jsx         # Grid view of completed papers (title + abstract)
 │   │   │       ├── AutonomousResearchSettings.jsx  # Model configs for all roles
-│   │   │       ├── AutonomousResearchLogs.jsx      # Metrics, graphs, event log
+│   │   │       ├── AutonomousResearchLogs.jsx      # Metrics, graphs, event log, combined API call logs
 │   │   │       ├── LivePaperProgress.jsx    # Real-time Tier 2 paper display (embedded in interface)
 │   │   │       ├── LiveTier3Progress.jsx    # Real-time Tier 3 final answer display (embedded in interface)
 │   │   │       ├── FinalAnswerView.jsx      # TIER 3 - Final answer tab (separate tab for completed answers)
@@ -237,12 +237,10 @@ project-root/
 │   │   ├── CritiqueNotificationStack.jsx # Persistent popup notifications for high-scoring critiques (≥7.0 avg)
 │   │   ├── CreditExhaustionNotificationStack.jsx # Persistent red notifications for OpenRouter credit exhaustion with "Retry OpenRouter" reset button
 │   │   ├── HungConnectionNotificationStack.jsx # Persistent amber notifications for API calls exceeding 15 minutes (possible hung connections)
-│   │   ├── BoostLogs.jsx                # Boost API call log viewer
-│   │   ├── BoostLogs.css                # Boost logs styles
-│   │   ├── BoostControlModal.jsx        # Modal for boost configuration (next-X, category, per-task)
+│   │   ├── BoostControlModal.jsx        # Modal for boost configuration (next-X, category, always-prefer)
 │   │   ├── BoostControlModal.css        # Boost control modal styles
-│   │   ├── WorkflowPanel.jsx            # Workflow prediction panel (next 20 API calls display)
-│   │   ├── WorkflowPanel.css            # Workflow panel styles
+│   │   ├── WorkflowPanel.jsx            # Boost controls panel (Boost Next X, Always Prefer, Category Boost, token stats, research timer)
+│   │   ├── WorkflowPanel.css            # Boost controls panel styles
 │   │   ├── TextFileUploader.jsx         # User file upload component
 │   │   ├── TextFileUploader.css         # File uploader styles
 │   │   ├── OpenRouterPrivacyWarningModal.jsx # Privacy policy error modal (OpenRouter data sharing)
@@ -269,7 +267,7 @@ project-root/
 ├── requirements.txt                     # Python dependencies
 ├── package.json                         # Root scripts
 ├── SECURITY.md                          # Security policy and private vulnerability reporting
-├── Press to Launch MOTO.bat             # The user's one-click program launcher.
+├── Click To Launch MOTO.bat             # The user's one-click program launcher.
 └── _moto_internal_launcher.ps1          # Internal PowerShell launcher (not for direct user use)
 
 ## File Purpose Descriptions
@@ -281,9 +279,9 @@ project-root/
 - `lm_studio_client.py`: LM Studio HTTP client (completions, embeddings, model listing)
 - `openrouter_client.py`: OpenRouter HTTP client (credit exhaustion detection, fallback)
 - `api_client_manager.py`: Unified API router (OpenRouter/LM Studio fallback + boost + model tracking)
-- `boost_manager.py`: Singleton boost manager (tracks boosted tasks, broadcasts events)
-- `boost_logger.py`: Boost API call logger (persists to `boost_api_log.txt`)
-- `workflow_predictor.py`: Predicts next 20 API calls (mode-specific algorithms)
+- `boost_manager.py`: Singleton boost manager (three modes: Boost Next X Calls, Always Prefer Boost, Category Boost; broadcasts events)
+- `boost_logger.py`: Boost API call logger (persists boost-routed calls for the combined API log view)
+- `workflow_predictor.py`: Predicts next 20 API calls for internal boost routing (not displayed in UI)
 - `free_model_manager.py`: Free model rotation/cooldown singleton (looping, auto-selector `openrouter/free`, account exhaustion detection)
 - `wolfram_alpha_client.py`: Wolfram Alpha API client for rigor verification
 - `rag_lock.py`: Global RAG operation lock (prevents collision, retry logic for reads)
@@ -325,5 +323,5 @@ project-root/
 - **Aggregator**: `AggregatorInterface.jsx`, `AggregatorSettings.jsx`, `AggregatorLogs.jsx`, `LiveResults.jsx`
 - **Compiler**: `CompilerInterface.jsx`, `CompilerSettings.jsx`, `CompilerLogs.jsx`, `LivePaper.jsx`
 - **Autonomous**: `AutonomousResearchInterface.jsx`, `BrainstormList.jsx`, `PaperLibrary.jsx`, `AutonomousResearchSettings.jsx`, `AutonomousResearchLogs.jsx`, `LivePaperProgress.jsx`, `LiveTier3Progress.jsx`, `FinalAnswerView.jsx`, `FinalAnswerLibrary.jsx`, `ArchiveViewerModal.jsx`
-- **Shared**: `StartupProviderSetupModal.jsx`, `OpenRouterApiKeyModal.jsx`, `PaperCritiqueModal.jsx`, `CritiqueNotificationStack.jsx`, `CreditExhaustionNotificationStack.jsx`, `HungConnectionNotificationStack.jsx`, `BoostLogs.jsx`, `BoostControlModal.jsx`, `WorkflowPanel.jsx`, `TextFileUploader.jsx`, `OpenRouterPrivacyWarningModal.jsx`, `LatexRenderer.jsx` (dual view, KaTeX, theorem parsing), `LatexRenderer.css`
+- **Shared**: `StartupProviderSetupModal.jsx`, `OpenRouterApiKeyModal.jsx`, `PaperCritiqueModal.jsx`, `CritiqueNotificationStack.jsx`, `CreditExhaustionNotificationStack.jsx`, `HungConnectionNotificationStack.jsx`, `BoostControlModal.jsx`, `WorkflowPanel.jsx`, `TextFileUploader.jsx`, `OpenRouterPrivacyWarningModal.jsx`, `LatexRenderer.jsx` (dual view, KaTeX, theorem parsing), `LatexRenderer.css`
 - **Utils**: `downloadHelpers.js` (PDF/raw download), `modelCache.js` (display_name → api_id lookup), `autonomousProfiles.js` (shared recommended-profile definitions + persistence helpers), `disclaimerHelper.js` (frontend-only disclaimer injection), `api.js`, `websocket.js`
diff --git a/.github/ISSUE_TEMPLATE/bug_report.yml b/.github/ISSUE_TEMPLATE/bug_report.yml
new file mode 100644
index 0000000..57df786
--- /dev/null
+++ b/.github/ISSUE_TEMPLATE/bug_report.yml
@@ -0,0 +1,81 @@
+name: Bug report
+description: Report a reproducible problem in MOTO.
+title: "[Bug]: "
+body:
+  - type: checkboxes
+    attributes:
+      label: Before submitting
+      description: Confirm the following before opening a public issue.
+      options:
+        - label: I searched existing issues and did not find a duplicate.
+          required: true
+        - label: I reviewed the relevant documentation in `README.md`, `CONTRIBUTING.md`, or `.cursor/rules/` when applicable.
+          required: false
+        - label: This is not a security vulnerability or secret exposure. I will use `security@intrafere.com` for security reports.
+          required: true
+  - type: dropdown
+    id: area
+    attributes:
+      label: Affected area
+      description: Which part of the project is impacted?
+      options:
+        - Aggregator (Tier 1)
+        - Compiler (Tier 2)
+        - Autonomous Research (Tier 3)
+        - Frontend / UI
+        - API / backend
+        - Documentation
+        - Other
+    validations:
+      required: true
+  - type: textarea
+    id: description
+    attributes:
+      label: Describe the bug
+      description: Clear description of what is happening.
+      placeholder: The compiler validator rejects a valid section update after the outline is accepted...
+    validations:
+      required: true
+  - type: textarea
+    id: reproduce
+    attributes:
+      label: Steps to reproduce
+      description: List the exact steps needed to trigger the problem.
+      placeholder: |
+        1. Open...
+        2. Click...
+        3. Start...
+        4. Observe...
+    validations:
+      required: true
+  - type: textarea
+    id: expected
+    attributes:
+      label: Expected behavior
+      description: What did you expect to happen instead?
+    validations:
+      required: true
+  - type: textarea
+    id: environment
+    attributes:
+      label: Environment
+      description: Include anything relevant about your setup.
+      placeholder: |
+        - OS: Windows 11
+        - Python version:
+        - Node.js version:
+        - LM Studio version:
+        - Models used:
+    validations:
+      required: true
+  - type: textarea
+    id: logs
+    attributes:
+      label: Logs and screenshots
+      description: Paste relevant backend logs, browser console output, stack traces, or screenshots.
+      render: shell
+  - type: textarea
+    id: additional
+    attributes:
+      label: Additional context
+      description: Add any other details that might help reproduce or diagnose the issue.
diff --git a/.github/ISSUE_TEMPLATE/config.yml b/.github/ISSUE_TEMPLATE/config.yml
new file mode 100644
index 0000000..e57ccf1
--- /dev/null
+++ b/.github/ISSUE_TEMPLATE/config.yml
@@ -0,0 +1,5 @@
+blank_issues_enabled: false
+contact_links:
+  - name: Report a security vulnerability
+    url: https://github.com/Intrafere/MOTO-Autonomous-ASI/security/policy
+    about: Do not open a public issue for security reports. Follow the Security Policy and email security@intrafere.com instead.
diff --git a/.github/ISSUE_TEMPLATE/feature_request.yml b/.github/ISSUE_TEMPLATE/feature_request.yml
new file mode 100644
index 0000000..922ca52
--- /dev/null
+++ b/.github/ISSUE_TEMPLATE/feature_request.yml
@@ -0,0 +1,57 @@
+name: Feature request
+description: Suggest an improvement or new capability for MOTO.
+title: "[Feature]: "
+body:
+  - type: checkboxes
+    attributes:
+      label: Before submitting
+      description: Confirm the following before opening a feature request.
+      options:
+        - label: I searched existing issues and did not find a duplicate request.
+          required: true
+        - label: I reviewed the relevant architecture notes in `.cursor/rules/` for the areas this may affect.
+          required: false
+  - type: textarea
+    id: problem
+    attributes:
+      label: Problem to solve
+      description: What problem, limitation, or missing workflow are you trying to address?
+      placeholder: It is difficult to see why a Tier 3 phase was skipped when reviewing past sessions...
+    validations:
+      required: true
+  - type: textarea
+    id: solution
+    attributes:
+      label: Proposed solution
+      description: Describe the behavior or capability you want to add.
+    validations:
+      required: true
+  - type: textarea
+    id: alternatives
+    attributes:
+      label: Alternatives considered
+      description: Describe any alternatives or workarounds you have considered.
+  - type: checkboxes
+    id: impact
+    attributes:
+      label: Likely impact areas
+      description: Select every area this request may affect.
+      options:
+        - label: Aggregator (Tier 1)
+        - label: Compiler (Tier 2)
+        - label: Autonomous Research (Tier 3)
+        - label: RAG / retrieval pipeline
+        - label: Backend API
+        - label: Frontend / UI
+        - label: Documentation
+  - type: textarea
+    id: architecture
+    attributes:
+      label: Architecture impact
+      description: Explain any expected impact on workflows, models, persistence, or UI behavior.
+      placeholder: This would add a new Tier 3 status event and a small settings toggle in the autonomous UI...
+  - type: textarea
+    id: context
+    attributes:
+      label: Additional context
+      description: Add mockups, examples, related issues, or anything else that helps explain the request.
diff --git a/.github/pull_request_template.md b/.github/pull_request_template.md
new file mode 100644
index 0000000..aec49a5
--- /dev/null
+++ b/.github/pull_request_template.md
@@ -0,0 +1,28 @@
+> Do not use a public pull request for an undisclosed security vulnerability. Report security concerns privately to `security@intrafere.com` instead.
+
+## Summary
+- Briefly describe the change.
+- Explain why it was needed.
+
+## Related Issue
+Fixes #
+
+## Testing
+- [ ] Tested with LM Studio models
+- [ ] Tested with OpenRouter models
+- [ ] Tested aggregator workflow
+- [ ] Tested compiler workflow
+- [ ] Tested autonomous research
+- [ ] UI changes work in Chrome/Firefox/Edge
+
+## Screenshots (if UI changes)
+[Add screenshots]
+
+## Checklist
+- [ ] Code follows style guidelines
+- [ ] Documentation updated
+- [ ] No new warnings/errors
+- [ ] Tested on Windows/Mac/Linux (if applicable)
+
+## Notes for Reviewers
+- Include any extra context, tradeoffs, or follow-up work here.
diff --git a/.gitignore b/.gitignore
index fa067da..4aee7fb 100644
--- a/.gitignore
+++ b/.gitignore
@@ -82,6 +82,7 @@ backend/data/chroma_db/*
 !backend/data/chroma_db/.gitkeep
 
 backend/data/boost_api_log.txt
+backend/data/boost_state.json
 backend/data/model_cache.json
 backend/data/paper_version_*.txt
 backend/data/critique_feedback_*.txt
diff --git a/Press to Launch MOTO.bat b/Click To Launch MOTO.bat
similarity index 100%
rename from Press to Launch MOTO.bat
rename to Click To Launch MOTO.bat
diff --git a/README.md b/README.md
index 21f3af8..7e2b85c 100644
--- a/README.md
+++ b/README.md
@@ -1,16 +1,16 @@
 # MOTO Autonomous ASI - Novel S.T.E.M. Solution Variant for ASI Automated Theory Generation
 # Autonomous Superintelligence Deep Research Harness
-**Version: 1.0.5**
+**Version: 1.0.6**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
 [![Node.js 16+](https://img.shields.io/badge/node-16+-green.svg)](https://nodejs.org/)
 
-**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration changes how we look at AI weights, a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and data extraction from nearly any combination of AI models. This is useful for any discipline with an interest in creative and novel solution generation for mathematics: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for other research topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
+**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assists in deciphering how we explore AI weights: a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. This is useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
 
-### The Core Discovery: Top-P Exploration (Solution Basin Aggregation)
+### The Core Discovery: Top-P Exploration
 
-MOTO is built on a [key insight](https://intrafere.com/structured-brainstorming-validated-feedback/) about how generative transformers operate: **transformers predict what tokens come next, so providing them with their own prior ideas enables deeper probing of the solution space**. This is called **solution basin aggregation** — each brainstorming pass explores a richer, more informed landscape, and the cross-recombination of "mined" knowledge compounds to create new insights that do not exist from the model's training alone. Intrafere considers this the mechanism that produces [ASI-like results](https://intrafere.com/structured-brainstorming-validated-feedback/) in practice. MOTO essentially "mines" creativity from a transformer's knowledge set, and this compounding effect is what differentiates it from traditional single-pass AI.
+MOTO is built on a [key insight](https://intrafere.com/structured-brainstorming-validated-feedback/) about how generative transformers operate: **transformers predict what tokens come next, so providing them with their own prior ideas enables deeper probing of the solution space**. At Intrafere, we have been calling this constrained brainstorming **solution basin aggregation** — each round of brainstorming explores a richer, more informed landscape, and the cross-recombination of "mined" knowledge compounds to create new insights that do not exist from the model's training alone. Intrafere considers this the mechanism that produces [ASI-like results](https://intrafere.com/structured-brainstorming-validated-feedback/) in practice. MOTO essentially "mines" creativity from a transformer's knowledge set, and this compounding effect is what differentiates it from traditional single-pass AI.
 
 The brainstorming phase runs **multiple submitters in parallel**, each independently exploring the solution space, funneled into a **single bottleneck validator** — a completely separate model instance whose only job is to decide whether each submission genuinely advances the knowledge base. This architectural separation between creative exploration and critical evaluation mitigates the hallucination loops and drift that plague single-model autonomous agents. Every rejection carries specific feedback that steers the next round of exploration, so failure is never wasted. Iterative pruning continuously removes entries that become redundant as stronger ideas emerge, producing an ever-denser, self-refining knowledge base. [View the learning curve data](https://intrafere.com/motos-brainstorming-potential-data/) for empirical evidence of this approach.
 
@@ -20,7 +20,7 @@ Once a brainstorm is sufficiently explored, MOTO writes a research paper from it
 
 MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its experimental mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models over 131,000 token context limits, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is an experimental system; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
 
-Give the program a try, MOTO is as cool as it sounds – there is a one-click installer. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green “< > Code” drop-down menu on the top right of this GitHub page, download the zip file, extract it to your desktop then double-click "Press to Launch MOTO.bat". Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), select your agents in the settings profile – if desired and you are unsure you may use the preselected “fastest” profile.
+Give the program a try; MOTO is as cool as it sounds – there is a one-click installer. Use the two links below to download Python and Node.js; they should automatically install in seconds. Once those are downloaded, click the green “< > Code” drop-down menu on the top right of this GitHub page, download the zip file, extract it to your desktop, then double-click "Click To Launch MOTO.bat". Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance) and select your agents in the settings profile – if you are unsure, you may use the preselected “fastest” profile instead.
 
 ***Now you are set up and every time you press launch your home lab is ready for your prompt!*** **Give MOTO the toughest question you can think of and press start to begin YOUR creations!**
 
@@ -61,7 +61,7 @@ Before installation, you need:
 
 1. Clone or download this repository
 2. Start LM Studio and load your models and "nomic-embed-text-v1.5" agent **and/or** have your OpenRouter API key ready
-3. **Double-click `Press to Launch MOTO.bat`**
+3. **Double-click `Click To Launch MOTO.bat`**
 4. After acknowledging the disclaimer, choose one of the startup setup paths:
    - Enter your OpenRouter API key
    - Confirm that LM Studio is already running with a loaded model
@@ -155,7 +155,7 @@ moto-math-variant/
 │       └── services/        # API and WebSocket clients
 ├── .cursor/
 │   └── rules/               # AI agent design specifications (full system documentation)
-├── Press to Launch MOTO.bat  # One-click Windows launcher
+├── Click To Launch MOTO.bat  # One-click Windows launcher
 ├── requirements.txt         # Python dependencies
 └── package.json             # Node.js dependencies
 ```
diff --git a/_moto_internal_launcher.ps1 b/_moto_internal_launcher.ps1
index 26f7bc2..7d45baa 100644
--- a/_moto_internal_launcher.ps1
+++ b/_moto_internal_launcher.ps1
@@ -1,5 +1,5 @@
 # MOTO Internal Launcher (PowerShell)
-# This is an internal script. Use "Press to Launch MOTO.bat" instead.
+# This is an internal script. Use "Click To Launch MOTO.bat" instead.
 # If needed manually: powershell -ExecutionPolicy Bypass -File _moto_internal_launcher.ps1
 
 # ================================================================
@@ -140,30 +140,30 @@ try {
     if (-not (Test-Path "node_modules")) {
         Write-Host "Installing Node.js dependencies..." -ForegroundColor Yellow
         Write-Host "This may take a few minutes..." -ForegroundColor Yellow
-        Write-Host ""
-        $npmInstallLog = Join-Path $env:TEMP ("moto_npm_install_{0}.log" -f ([guid]::NewGuid().ToString("N")))
-        npm install 2>&1 | Tee-Object -FilePath $npmInstallLog
-        $npmInstallExit = $LASTEXITCODE
-        if (Test-Path $npmInstallLog) {
-            $showVulnerabilityRestartHint = Select-String -Path $npmInstallLog -Pattern "vulnerabilities found" -Quiet
-            Remove-Item -Path $npmInstallLog -Force -ErrorAction SilentlyContinue
-        }
-        if ($npmInstallExit -ne 0) {
-            Write-Host ""
-            Write-Host "============================================================" -ForegroundColor Red
-            Write-Host "ERROR: Failed to install Node.js dependencies" -ForegroundColor Red
-            Write-Host "============================================================" -ForegroundColor Red
-            Write-Host ""
-            Write-Host "Please check:" -ForegroundColor Yellow
-            Write-Host "- Internet connection is working" -ForegroundColor Yellow
-            Write-Host "- package.json exists in frontend directory" -ForegroundColor Yellow
-            Set-Location ..
-            Exit-WithPause -ExitCode 1
-        }
-        Write-Host "Node.js dependencies installed successfully" -ForegroundColor Green
     } else {
-        Write-Host "Node.js dependencies already installed" -ForegroundColor Green
+        Write-Host "Updating Node.js dependencies..." -ForegroundColor Yellow
+    }
+    Write-Host ""
+    $npmInstallLog = Join-Path $env:TEMP ("moto_npm_install_{0}.log" -f ([guid]::NewGuid().ToString("N")))
+    npm install 2>&1 | Tee-Object -FilePath $npmInstallLog
+    $npmInstallExit = $LASTEXITCODE
+    if (Test-Path $npmInstallLog) {
+        $showVulnerabilityRestartHint = Select-String -Path $npmInstallLog -Pattern "vulnerabilities found" -Quiet
+        Remove-Item -Path $npmInstallLog -Force -ErrorAction SilentlyContinue
+    }
+    if ($npmInstallExit -ne 0) {
+        Write-Host ""
+        Write-Host "============================================================" -ForegroundColor Red
+        Write-Host "ERROR: Failed to install Node.js dependencies" -ForegroundColor Red
+        Write-Host "============================================================" -ForegroundColor Red
+        Write-Host ""
+        Write-Host "Please check:" -ForegroundColor Yellow
+        Write-Host "- Internet connection is working" -ForegroundColor Yellow
+        Write-Host "- package.json exists in frontend directory" -ForegroundColor Yellow
+        Set-Location ..
+        Exit-WithPause -ExitCode 1
     }
+    Write-Host "Node.js dependencies up to date" -ForegroundColor Green
     if ($showVulnerabilityRestartHint) {
         Write-Host "" 
         Write-Host "NOTE: npm reported vulnerability warnings during install." -ForegroundColor Yellow
diff --git a/backend/aggregator/agents/submitter.py b/backend/aggregator/agents/submitter.py
index de2e5b3..12123ec 100644
--- a/backend/aggregator/agents/submitter.py
+++ b/backend/aggregator/agents/submitter.py
@@ -145,18 +145,9 @@ async def _run_loop(self) -> None:
                 await asyncio.sleep(2)
                 
             except FreeModelExhaustedError as e:
-                if e.soonest_retry:
-                    import time as _time
-                    wait_secs = max(0, e.soonest_retry - _time.time())
-                    wait_mins = round(wait_secs / 60, 1)
-                    logger.warning(
-                        f"SERIAL BOTTLENECK: Submitter {self.submitter_id} paused for "
-                        f"{wait_mins} minutes (all free models rate-limited)"
-                    )
-                    await asyncio.sleep(wait_secs)
-                else:
-                    logger.error(f"Submitter {self.submitter_id}: all free models exhausted: {e}")
-                    await asyncio.sleep(60)
+                # All free models exhausted after retries - wait briefly and retry
+                logger.warning(f"Submitter {self.submitter_id}: all free models exhausted: {e}")
+                await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
             except Exception as e:
                 logger.error(f"Submitter {self.submitter_id} error on iteration {iteration}: {e}", exc_info=True)
                 await asyncio.sleep(5)
@@ -236,6 +227,7 @@ async def _generate_submission(self) -> Optional[Submission]:
             
             # Generate completion with retry for 400 errors
             response = None
+            call_metadata = {}
             max_retries = 3  # 400 errors won't fix themselves - fail fast
             
             for attempt in range(max_retries):
@@ -249,6 +241,7 @@ async def _generate_submission(self) -> Optional[Submission]:
                         temperature=0.0,  # Deterministic generation - evolving context provides diversity
                         max_tokens=self.max_output_tokens  # Per-submitter max output tokens
                     )
+                    call_metadata = api_client_manager.extract_call_metadata(response)
                     break  # Success
                     
                 except (httpx.HTTPStatusError, ValueError) as e:
@@ -277,7 +270,7 @@ async def _generate_submission(self) -> Optional[Submission]:
                     raise
                 except RuntimeError as e:
                     if "credits exhausted" in str(e).lower():
-                        raise FreeModelExhaustedError(str(e), soonest_retry=None)
+                        raise FreeModelExhaustedError(str(e))
                     logger.error(f"Submitter {self.submitter_id}: Unexpected error during completion: {e}")
                     if self.task_tracking_callback:
                         self.task_tracking_callback("completed", task_id)
@@ -389,6 +382,7 @@ async def _generate_submission(self) -> Optional[Submission]:
                         )
                     
                     if retry_response_1.get("choices"):
+                        call_metadata = api_client_manager.extract_call_metadata(retry_response_1)
                         retry_output_1 = retry_response_1["choices"][0]["message"]["content"]
                         
                         try:
@@ -460,6 +454,7 @@ async def _generate_submission(self) -> Optional[Submission]:
                                     )
                                 
                                 if retry_response_2.get("choices"):
+                                    call_metadata = api_client_manager.extract_call_metadata(retry_response_2)
                                     retry_output_2 = retry_response_2["choices"][0]["message"]["content"]
                                     
                                     try:
@@ -526,7 +521,8 @@ async def _generate_submission(self) -> Optional[Submission]:
                 chunk_size_used=chunk_size,
                 metadata={
                     "chunk_size": chunk_size,
-                    "rag_used": bool(allocation["rag_context"])
+                    "rag_used": bool(allocation["rag_context"]),
+                    "llm_call": call_metadata,
                 }
             )
             
diff --git a/backend/aggregator/agents/validator.py b/backend/aggregator/agents/validator.py
index 4094ef5..5eff887 100644
--- a/backend/aggregator/agents/validator.py
+++ b/backend/aggregator/agents/validator.py
@@ -3,7 +3,7 @@
 Always uses 512-char chunks for consistency.
 """
 import asyncio
-from typing import Optional, Dict, Callable, List
+from typing import Optional, Dict, Callable, List, Any
 import logging
 import httpx
 
@@ -191,6 +191,7 @@ async def _assess_quality(self, submission: Submission) -> ValidationResult:
             
             # Generate validation with retry for 400 errors
             response = None
+            call_metadata = {}
             max_retries = 3  # 400 errors won't fix themselves - fail fast
             
             for attempt in range(max_retries):
@@ -204,6 +205,7 @@ async def _assess_quality(self, submission: Submission) -> ValidationResult:
                         temperature=0.0,  # Deterministic validation - evolving context provides diversity
                         max_tokens=rag_config.validator_max_output_tokens  # User-configurable max output tokens
                     )
+                    call_metadata = api_client_manager.extract_call_metadata(response)
                     break  # Success
                     
                 except (httpx.HTTPStatusError, ValueError) as e:
@@ -367,6 +369,7 @@ async def _assess_quality(self, submission: Submission) -> ValidationResult:
                         )
                     
                     if retry_response.get("choices"):
+                        call_metadata = api_client_manager.extract_call_metadata(retry_response)
                         retry_output = retry_response["choices"][0]["message"]["content"]
                         
                         try:
@@ -417,7 +420,8 @@ async def _assess_quality(self, submission: Submission) -> ValidationResult:
                 reasoning=parsed["reasoning"],
                 summary=summary,
                 contradiction_check_passed=True,
-                json_valid=True
+                json_valid=True,
+                metadata={"llm_call": call_metadata}
             )
             
             return result
@@ -620,6 +624,7 @@ async def _assess_batch_quality(self, submissions: List[Submission]) -> List[Val
                 self.task_tracking_callback("started", task_id)
             
             # Generate validation using api_client_manager for boost support
+            call_metadata = {}
             response = await api_client_manager.generate_completion(
                 task_id=task_id,
                 role_id=self.role_id,
@@ -628,6 +633,7 @@ async def _assess_batch_quality(self, submissions: List[Submission]) -> List[Val
                 temperature=0.0,
                 max_tokens=rag_config.validator_max_output_tokens
             )
+            call_metadata = api_client_manager.extract_call_metadata(response)
             
             if not response or not response.get("choices"):
                 logger.error("Batch validator: No choices in response")
@@ -655,7 +661,9 @@ async def _assess_batch_quality(self, submissions: List[Submission]) -> List[Val
             except Exception as e:
                 logger.warning(f"Batch validator: JSON parse failed: {e}")
                 # Attempt conversational retry
-                parsed = await self._retry_batch_json_parse(prompt, llm_output, batch_size, task_id)
+                parsed, retry_call_metadata = await self._retry_batch_json_parse(prompt, llm_output, batch_size, task_id)
+                if retry_call_metadata:
+                    call_metadata = retry_call_metadata
                 if parsed is None:
                     return [
                         ValidationResult(
@@ -663,7 +671,8 @@ async def _assess_batch_quality(self, submissions: List[Submission]) -> List[Val
                             decision="reject",
                             reasoning=f"Validator JSON error: {e}",
                             summary="Validator output error",
-                            json_valid=False
+                            json_valid=False,
+                            metadata={"llm_call": call_metadata}
                         )
                         for s in submissions
                     ]
@@ -729,7 +738,8 @@ async def _assess_batch_quality(self, submissions: List[Submission]) -> List[Val
                     reasoning=reasoning,
                     summary=summary,
                     contradiction_check_passed=True,
-                    json_valid=True
+                    json_valid=True,
+                    metadata={"llm_call": call_metadata}
                 ))
             
             # Notify task completed successfully
@@ -763,7 +773,7 @@ async def _retry_batch_json_parse(
         failed_output: str, 
         batch_size: int,
         task_id: str
-    ) -> Optional[Dict]:
+    ) -> tuple[Optional[Dict], Dict[str, Any]]:
         """
         Attempt conversational retry for batch JSON parsing.
         
@@ -774,7 +784,7 @@ async def _retry_batch_json_parse(
             task_id: Task ID for tracking retry attempt
         
         Returns:
-            Parsed JSON dict if successful, None otherwise
+            Tuple of (parsed JSON dict if successful, call metadata dict)
         """
         logger.info("Batch validator: Attempting conversational retry for JSON parse")
         
@@ -805,6 +815,7 @@ async def _retry_batch_json_parse(
         )
         
         try:
+            call_metadata = {}
             # CRITICAL FIX: Truncate failed output to prevent context overflow during retry
             max_failed_output_chars = 2000  # ~500 tokens - enough for error context
             if len(failed_output) > max_failed_output_chars:
@@ -848,16 +859,17 @@ async def _retry_batch_json_parse(
                     temperature=0.0,
                     max_tokens=rag_config.validator_max_output_tokens  # Respect max_tokens on retry
                 )
+            call_metadata = api_client_manager.extract_call_metadata(retry_response)
             
             if retry_response.get("choices"):
                 retry_output = retry_response["choices"][0]["message"]["content"]
                 parsed = parse_json(retry_output)
                 logger.info("Batch validator: Conversational retry succeeded!")
-                return parsed
+                return parsed, call_metadata
         except Exception as e:
             logger.warning(f"Batch validator: Retry failed - {e}")
         
-        return None
+        return None, {}
     
     def _get_system_prompt(self) -> str:
         """Get system prompt for single submission."""
diff --git a/backend/aggregator/core/coordinator.py b/backend/aggregator/core/coordinator.py
index 3767c89..344065a 100644
--- a/backend/aggregator/core/coordinator.py
+++ b/backend/aggregator/core/coordinator.py
@@ -18,6 +18,7 @@
 from backend.shared.workflow_predictor import workflow_predictor
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.free_model_manager import free_model_manager
 from backend.aggregator.agents.submitter import SubmitterAgent
 from backend.aggregator.agents.validator import ValidatorAgent
 from backend.aggregator.core.queue_manager import queue_manager
@@ -165,6 +166,7 @@ async def initialize(
         # Store configurations
         self.submitter_configs = submitter_configs
         self.validator_model = validator_model
+        self.validator_provider = validator_provider
         
         # Override validator context window if provided
         if validator_context_window is not None:
@@ -504,19 +506,18 @@ async def start(self) -> None:
         self.is_running = True
         logger.info("Starting coordinator...")
         
+        # Reset free model manager state for fresh start
+        free_model_manager.reset()
+        
         # Refresh workflow predictions at start
         await self.refresh_workflow_predictions()
         
         if self.single_model_mode:
             # Single-model mode: Round-based sequential workflow
-            # NOTE: Boost routing (if enabled) is INDEPENDENT - it only affects which API
-            # each call uses (OpenRouter vs LM Studio), not whether calls are parallel/serial
             logger.info("Starting single-model workflow (sequential submitters + validator)")
             self._main_task = asyncio.create_task(self._single_model_workflow())
         else:
             # Multi-model mode: Parallel submitters + independent validator
-            # NOTE: Boost can be active here - submitters run in parallel regardless,
-            # boost only affects which API endpoint each call uses
             logger.info("Starting multi-model workflow (parallel submitters)")
             for submitter in self.submitters:
                 await submitter.start()
@@ -617,28 +618,14 @@ async def _validator_loop(self) -> None:
                 logger.info(f"Validator loop cancelled at iteration {iteration}")
                 break
             except FreeModelExhaustedError as e:
-                if e.soonest_retry:
-                    wait_secs = max(0, e.soonest_retry - time.time())
-                    wait_mins = round(wait_secs / 60, 1)
-                    logger.warning(
-                        f"SERIAL BOTTLENECK: Validator paused for {wait_mins} minutes "
-                        f"(all free models rate-limited)"
-                    )
-                    if self.broadcast_callback:
-                        await self.broadcast_callback("serial_bottleneck_paused", {
-                            "role_id": "aggregator_validator",
-                            "model": str(e),
-                            "wait_seconds": round(wait_secs),
-                            "resume_at": time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(e.soonest_retry)),
-                        })
-                    await asyncio.sleep(wait_secs)
-                    if self.broadcast_callback:
-                        await self.broadcast_callback("serial_bottleneck_resumed", {
-                            "role_id": "aggregator_validator",
-                        })
-                else:
-                    logger.error(f"Validator: all free models exhausted, no cooldown info: {e}")
-                    await asyncio.sleep(60)
+                # All free models exhausted after retries - wait briefly and retry
+                logger.warning(f"Validator: all free models exhausted: {e}")
+                if self.broadcast_callback:
+                    await self.broadcast_callback("free_models_exhausted", {
+                        "role_id": "aggregator_validator",
+                        "message": str(e),
+                    })
+                await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
             except Exception as e:
                 logger.error(f"Validator loop error on iteration {iteration}: {e}", exc_info=True)
                 await asyncio.sleep(2)
@@ -733,28 +720,14 @@ async def _single_model_workflow(self) -> None:
                 logger.info(f"Single-model workflow cancelled at round {round_number}")
                 break
             except FreeModelExhaustedError as e:
-                if e.soonest_retry:
-                    wait_secs = max(0, e.soonest_retry - time.time())
-                    wait_mins = round(wait_secs / 60, 1)
-                    logger.warning(
-                        f"SERIAL BOTTLENECK: Single-model workflow paused for {wait_mins} minutes "
-                        f"(all free models rate-limited)"
-                    )
-                    if self.broadcast_callback:
-                        await self.broadcast_callback("serial_bottleneck_paused", {
-                            "role_id": "aggregator_single_model",
-                            "model": str(e),
-                            "wait_seconds": round(wait_secs),
-                            "resume_at": time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(e.soonest_retry)),
-                        })
-                    await asyncio.sleep(wait_secs)
-                    if self.broadcast_callback:
-                        await self.broadcast_callback("serial_bottleneck_resumed", {
-                            "role_id": "aggregator_single_model",
-                        })
-                else:
-                    logger.error(f"Single-model workflow: all free models exhausted, no cooldown info: {e}")
-                    await asyncio.sleep(60)
+                # All free models exhausted after retries - wait briefly and retry
+                logger.warning(f"Single-model workflow: all free models exhausted: {e}")
+                if self.broadcast_callback:
+                    await self.broadcast_callback("free_models_exhausted", {
+                        "role_id": "aggregator_single_model",
+                        "message": str(e),
+                    })
+                await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
             except Exception as e:
                 logger.error(f"Single-model workflow error at round {round_number}: {e}", exc_info=True)
                 await asyncio.sleep(5)
@@ -769,22 +742,40 @@ async def _handle_acceptance(self, submission: Submission, result: ValidationRes
         await shared_training_memory.add_accepted_submission(submission.content)
         
         # Notify submitter
-        submitter = self.submitters[submission.submitter_id - 1]
-        await submitter.handle_acceptance()
+        submitter = next((s for s in self.submitters if s.submitter_id == submission.submitter_id), None)
+        if submitter:
+            await submitter.handle_acceptance()
         
         # Get submitter config for model info
         submitter_config = self.submitter_configs[submission.submitter_id - 1] if submission.submitter_id <= len(self.submitter_configs) else None
+        submitter_call = submission.metadata.get("llm_call", {}) if submission.metadata else {}
+        validator_call = result.metadata.get("llm_call", {}) if result.metadata else {}
+        configured_submitter_model = submitter_config.model_id if submitter_config else (submitter.model_name if submitter else "unknown")
+        configured_submitter_provider = submitter_config.provider if submitter_config else ("openrouter" if submission.submitter_id == 11 else "lm_studio")
+        actual_submitter_model = submitter_call.get("effective_model") or configured_submitter_model
+        actual_submitter_provider = submitter_call.get("provider") or configured_submitter_provider
+        actual_validator_model = validator_call.get("effective_model") or self.validator_model
+        actual_validator_provider = validator_call.get("provider") or self.validator_provider
         
         # Broadcast
         await self._broadcast("submission_accepted", {
             "submission_id": submission.submission_id,
             "submitter_id": submission.submitter_id,
-            "submitter_model": submitter_config.model_id if submitter_config else submitter.model_name,
-            "submitter_provider": submitter_config.provider if submitter_config else "lm_studio",
+            "submitter_model": actual_submitter_model,
+            "submitter_provider": actual_submitter_provider,
+            "submitter_configured_model": configured_submitter_model,
+            "submitter_configured_provider": configured_submitter_provider,
+            "submitter_boosted": bool(submitter_call.get("boosted", False)),
+            "submitter_boost_mode": submitter_call.get("boost_mode"),
             "content": submission.content,
             "reasoning": result.reasoning,
             "total_acceptances": self.total_acceptances,
-            "validator_model": self.validator_model
+            "validator_model": actual_validator_model,
+            "validator_provider": actual_validator_provider,
+            "validator_configured_model": self.validator_model,
+            "validator_configured_provider": self.validator_provider,
+            "validator_boosted": bool(validator_call.get("boosted", False)),
+            "validator_boost_mode": validator_call.get("boost_mode"),
         })
         
         logger.info(f"Accepted submission from submitter {submission.submitter_id} (total: {self.total_acceptances})")
@@ -808,21 +799,39 @@ async def _handle_rejection(self, submission: Submission, result: ValidationResu
         self.total_rejections += 1
         
         # Notify submitter (stores last 5 rejections in local memory)
-        submitter = self.submitters[submission.submitter_id - 1]
-        await submitter.handle_rejection(result.summary, submission.content)
+        submitter = next((s for s in self.submitters if s.submitter_id == submission.submitter_id), None)
+        if submitter:
+            await submitter.handle_rejection(result.summary, submission.content)
         
         # Get submitter config for model info
         submitter_config = self.submitter_configs[submission.submitter_id - 1] if submission.submitter_id <= len(self.submitter_configs) else None
+        submitter_call = submission.metadata.get("llm_call", {}) if submission.metadata else {}
+        validator_call = result.metadata.get("llm_call", {}) if result.metadata else {}
+        configured_submitter_model = submitter_config.model_id if submitter_config else (submitter.model_name if submitter else "unknown")
+        configured_submitter_provider = submitter_config.provider if submitter_config else ("openrouter" if submission.submitter_id == 11 else "lm_studio")
+        actual_submitter_model = submitter_call.get("effective_model") or configured_submitter_model
+        actual_submitter_provider = submitter_call.get("provider") or configured_submitter_provider
+        actual_validator_model = validator_call.get("effective_model") or self.validator_model
+        actual_validator_provider = validator_call.get("provider") or self.validator_provider
         
         # Broadcast
         await self._broadcast("submission_rejected", {
             "submission_id": submission.submission_id,
             "submitter_id": submission.submitter_id,
-            "submitter_model": submitter_config.model_id if submitter_config else submitter.model_name,
-            "submitter_provider": submitter_config.provider if submitter_config else "lm_studio",
+            "submitter_model": actual_submitter_model,
+            "submitter_provider": actual_submitter_provider,
+            "submitter_configured_model": configured_submitter_model,
+            "submitter_configured_provider": configured_submitter_provider,
+            "submitter_boosted": bool(submitter_call.get("boosted", False)),
+            "submitter_boost_mode": submitter_call.get("boost_mode"),
             "reasoning": result.reasoning,
             "total_rejections": self.total_rejections,
-            "validator_model": self.validator_model
+            "validator_model": actual_validator_model,
+            "validator_provider": actual_validator_provider,
+            "validator_configured_model": self.validator_model,
+            "validator_configured_provider": self.validator_provider,
+            "validator_boosted": bool(validator_call.get("boosted", False)),
+            "validator_boost_mode": validator_call.get("boost_mode"),
         })
         
         logger.info(f"Rejected submission from submitter {submission.submitter_id} (total: {self.total_rejections})")
diff --git a/backend/aggregator/prompts/submitter_prompts.py b/backend/aggregator/prompts/submitter_prompts.py
index 78ffd08..5bb1fbf 100644
--- a/backend/aggregator/prompts/submitter_prompts.py
+++ b/backend/aggregator/prompts/submitter_prompts.py
@@ -3,6 +3,17 @@
 """
 
 
+EMPIRICAL_PROVENANCE_RULES = """EMPIRICAL PROVENANCE RULES:
+- Classify concrete claims as one of: theoretical claim, literature claim, empirical claim, or artifact claim.
+- Theoretical claims must be supported by sound reasoning, derivation, proof sketch, or explicit assumptions.
+- Literature claims must name the external source in-text; never rely on vague phrases like "studies show" or "prior work proves" without identifying the source.
+- Empirical claims include benchmark numbers, latency, throughput, speedup, accuracy, perplexity, hardware performance, ablation outcomes, and measured implementation results.
+- Artifact claims include statements about code, kernels, logs, experiments, reproductions, or accompanying implementations.
+- DO NOT present empirical or artifact claims as facts unless they are backed by an explicit external citation or a provided artifact in context.
+- If such support is absent, rewrite the idea as a hypothesis, design intuition, proposed experiment, expected benefit, or future-work suggestion.
+- NEVER invent experiments, benchmark numbers, hardware measurements, datasets, citations, or code artifacts."""
+
+
 def get_submitter_system_prompt() -> str:
     """Get system prompt for submitter agents."""
     return """You are a mathematical submitter in an AI cluster working to solve complex mathematical problems. Your role is to:
@@ -23,17 +34,11 @@ def get_submitter_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -59,6 +64,7 @@ def get_submitter_system_prompt() -> str:
 - Avoid redundancy with existing accepted submissions
 - Focus on increasing solution availability or narrowing the search space
 - Present rigorous mathematical arguments
+- Unsupported empirical or artifact claims must be framed as proposals, hypotheses, or future work rather than as completed results
 
 Your submission will be validated against these criteria:
 - Does it meaningfully advance the solution space?
diff --git a/backend/aggregator/prompts/validator_prompts.py b/backend/aggregator/prompts/validator_prompts.py
index 50da411..52822de 100644
--- a/backend/aggregator/prompts/validator_prompts.py
+++ b/backend/aggregator/prompts/validator_prompts.py
@@ -3,6 +3,17 @@
 """
 
 
+EMPIRICAL_PROVENANCE_VALIDATION_RULES = """EMPIRICAL PROVENANCE RULES:
+- Classify concrete claims as one of: theoretical claim, literature claim, empirical claim, or artifact claim.
+- Theoretical claims must be supported by sound reasoning, derivation, proof sketch, or explicit assumptions.
+- Literature claims must identify the external source in-text; vague references like "studies show" are not sufficient.
+- Empirical claims include benchmark numbers, latency, throughput, speedup, accuracy, perplexity, hardware performance, ablations, and measured outcomes.
+- Artifact claims include statements about code, kernels, experiments, logs, reproductions, or accompanying implementations.
+- REJECT empirical or artifact claims that are presented as established facts without explicit external citation or a provided artifact in context.
+- If a submission offers an unsupported benchmark-style idea that is still useful, it must be framed as a proposed experiment, hypothesis, expected benefit, or future-work direction rather than as a completed result.
+- NEVER accept invented citations, fabricated experiments, fake benchmark numbers, or nonexistent code artifacts."""
+
+
 def get_validator_system_prompt() -> str:
     """Get system prompt for validator agent."""
     return """You are a validation agent in an AI cluster. Your role is to evaluate mathematical submissions and decide whether they should be added to the shared knowledge base.
@@ -18,17 +29,11 @@ def get_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
 
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -48,6 +53,7 @@ def get_validator_system_prompt() -> str:
 - Is the submission grounded in established mathematical principles and rigorous logic?
 - Does the submission avoid unfounded claims or logical fallacies?
 - Is the submission based on proven mathematical theorems and valid reasoning?
+- Are any empirical or artifact claims properly cited or backed by a provided artifact rather than asserted from nowhere?
 
 VALIDATION DECISION RULES:
 A submission should be ACCEPTED if it:
@@ -64,6 +70,7 @@ def get_validator_system_prompt() -> str:
 5. Is obviously unhelpful or time-wasting content
 6. Contains logical fallacies or mathematically unsound reasoning
 7. Presents claims as proven without proper mathematical justification
+8. Presents unsupported empirical, benchmark, hardware, or artifact claims as established fact
 
 Ask yourself: "Does adding this submission to our knowledge base make us more capable of solving the user's mathematical prompt than we were without it?"
 
@@ -192,17 +199,11 @@ def get_validator_dual_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -222,6 +223,7 @@ def get_validator_dual_system_prompt() -> str:
 - Is the submission obviously unhelpful or time-wasting content?
 - Is the submission grounded in established mathematical principles and rigorous logic?
 - Does the submission avoid unfounded claims or logical fallacies?
+- Are any empirical or artifact claims properly cited or backed by a provided artifact rather than asserted from nowhere?
 
 VALIDATION DECISION RULES (for each submission):
 A submission should be ACCEPTED if it:
@@ -236,6 +238,7 @@ def get_validator_dual_system_prompt() -> str:
 3. Contains logical contradictions or unsupported claims
 4. Is too vague or generic to be actionable
 5. Contains logical fallacies or mathematically unsound reasoning
+6. Presents unsupported empirical, benchmark, hardware, or artifact claims as established fact
 
 CRITICAL - INTRA-BATCH REDUNDANCY PREVENTION:
 You must make TWO SEPARATE, INDEPENDENT decisions first - one for each submission.
@@ -419,17 +422,11 @@ def get_validator_triple_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
 
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -449,6 +446,7 @@ def get_validator_triple_system_prompt() -> str:
 - Is the submission obviously unhelpful or time-wasting content?
 - Is the submission grounded in established mathematical principles and rigorous logic?
 - Does the submission avoid unfounded claims or logical fallacies?
+- Are any empirical or artifact claims properly cited or backed by a provided artifact rather than asserted from nowhere?
 
 VALIDATION DECISION RULES (for each submission):
 A submission should be ACCEPTED if it:
@@ -463,6 +461,7 @@ def get_validator_triple_system_prompt() -> str:
 3. Contains logical contradictions or unsupported claims
 4. Is too vague or generic to be actionable
 5. Contains logical fallacies or mathematically unsound reasoning
+6. Presents unsupported empirical, benchmark, hardware, or artifact claims as established fact
 
 CRITICAL - INTRA-BATCH REDUNDANCY PREVENTION:
 You must make THREE SEPARATE, INDEPENDENT decisions first - one for each submission.
@@ -682,17 +681,11 @@ def get_cleanup_review_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -712,6 +705,7 @@ def get_cleanup_review_system_prompt() -> str:
 3. Contains information that is now SUPERSEDED by better, more complete submissions
 4. Was MARGINALLY useful initially but provides no unique value given the current database state
 5. Contains claims that CONFLICT with established mathematical principles evident in other submissions
+6. Contains unsupported empirical or artifact claims presented as established fact
 
 REASONS TO KEEP - A submission should be kept if it:
 1. Provides ANY unique information not covered elsewhere
@@ -835,17 +829,11 @@ def get_removal_validation_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
diff --git a/backend/api/main.py b/backend/api/main.py
index b78f433..f716228 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -126,7 +126,7 @@ async def lifespan(app: FastAPI):
 app = FastAPI(
     title="ASI Aggregator System",
     description="AI-powered aggregator with RAG and multi-agent validation",
-    version="1.0.5",
+    version="1.0.6",
     lifespan=lifespan
 )
 
@@ -149,7 +149,7 @@ async def root():
     """Root endpoint."""
     return {
         "name": "ASI Aggregator System",
-        "version": "1.0.5",
+        "version": "1.0.6",
         "status": "running"
     }
 
diff --git a/backend/api/routes/aggregator.py b/backend/api/routes/aggregator.py
index 50715b9..0cb9c14 100644
--- a/backend/api/routes/aggregator.py
+++ b/backend/api/routes/aggregator.py
@@ -11,6 +11,7 @@
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.config import system_config, rag_config
 from backend.shared.token_tracker import token_tracker
+from backend.shared.path_safety import resolve_path_within_root, validate_single_path_component
 from backend.aggregator.core.coordinator import coordinator
 from backend.aggregator.core.context_allocator import context_allocator
 from backend.aggregator.memory.event_log import event_log
@@ -195,9 +196,10 @@ async def clear_all_submissions():
 async def upload_file(file: UploadFile = File(...)):
     """Upload a user file."""
     try:
-        # Save to user_uploads directory
-        file_path = Path(system_config.user_uploads_dir) / file.filename
-        file_path.parent.mkdir(parents=True, exist_ok=True)
+        safe_filename = validate_single_path_component(file.filename, "filename")
+        uploads_dir = Path(system_config.user_uploads_dir)
+        uploads_dir.mkdir(parents=True, exist_ok=True)
+        file_path = resolve_path_within_root(uploads_dir, safe_filename)
         
         async with aiofiles.open(file_path, 'wb') as f:
             content = await file.read()
@@ -205,7 +207,7 @@ async def upload_file(file: UploadFile = File(...)):
         
         return {
             "status": "uploaded",
-            "filename": file.filename,
+            "filename": safe_filename,
             "path": str(file_path)
         }
     except Exception as e:
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index b07716b..f558c48 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -4,8 +4,9 @@
 """
 import asyncio
 import logging
+from datetime import datetime
 from pathlib import Path
-from typing import Optional, Any, Dict
+from typing import Optional, Any, Dict, List
 from fastapi import APIRouter, HTTPException, BackgroundTasks
 
 from backend.shared.models import AutonomousResearchStartRequest, CritiqueRequest
@@ -22,6 +23,7 @@
 from backend.autonomous.memory.autonomous_api_logger import autonomous_api_logger
 from backend.aggregator.core.coordinator import coordinator
 from backend.compiler.core.compiler_coordinator import compiler_coordinator
+from backend.shared.boost_logger import boost_logger
 
 logger = logging.getLogger(__name__)
 
@@ -38,6 +40,196 @@ def _validate_history_session_id(session_id: str) -> None:
     if not session_id:
         raise HTTPException(status_code=400, detail="Session ID is required")
 
+
+def _parse_api_log_timestamp(timestamp: Optional[str]) -> datetime:
+    """Parse an ISO-8601 log timestamp to a naive datetime (aware values become UTC); datetime.min if invalid."""
+    try:
+        # fromisoformat only accepts a trailing "Z" on Python 3.11+, so spell it as an explicit offset.
+        parsed = datetime.fromisoformat(str(timestamp or "").replace("Z", "+00:00"))
+        # Aware and naive datetimes cannot be compared or subtracted, so shift to UTC and drop tzinfo.
+        return parsed if parsed.tzinfo is None else parsed.replace(tzinfo=None) - parsed.utcoffset()
+    except (ValueError, OverflowError):
+        return datetime.min
+
+
+def _normalize_autonomous_api_log(entry: Dict[str, Any]) -> Dict[str, Any]:
+    """Copy an autonomous logger entry into the combined API log shape, defaulting missing fields."""
+    prompt_preview = entry.get("prompt_preview") or ""
+    response_preview = entry.get("response_preview") or ""
+    return dict(
+        entry,
+        source="api",
+        boosted=bool(entry.get("boosted", False)),
+        boost_mode=entry.get("boost_mode"),
+        provider=entry.get("provider") or "unknown",
+        phase=entry.get("phase") or "unknown",
+        prompt_preview=prompt_preview, prompt_full=entry.get("prompt_full") or prompt_preview,
+        response_preview=response_preview, response_full=entry.get("response_full") or response_preview,
+    )
+
+
+def _normalize_boost_api_log(entry: Dict[str, Any]) -> Dict[str, Any]:
+    """Copy a boost logger entry into the shape used by the main API log view."""
+    normalized = dict(entry)
+
+    # Every entry coming from the boost logger is marked as a boosted call.
+    normalized["source"] = "boost"
+    normalized["boosted"] = True
+    normalized["provider"] = entry.get("provider") or "openrouter"
+    normalized["phase"] = entry.get("phase") or "boost"
+
+    # The full text falls back to its preview, and the preview to an empty string.
+    for preview_key, full_key in (("prompt_preview", "prompt_full"), ("response_preview", "response_full")):
+        preview = entry.get(preview_key) or ""
+        normalized[preview_key] = preview
+        normalized[full_key] = entry.get(full_key) or preview
+
+    return normalized
+
+
+def _build_api_log_match_key(entry: Dict[str, Any]) -> tuple:
+    """Return the (task_id, role_id, model, success) tuple used to pair boost and autonomous entries."""
+    # Missing or falsy identifiers collapse to "" so they still compare equal between entries.
+    task_id, role_id, model = (entry.get(name) or "" for name in ("task_id", "role_id", "model"))
+
+    # An entry without a "success" field is treated as successful.
+    succeeded = bool(entry.get("success", True))
+    return (task_id, role_id, model, succeeded)
+
+
+def _merge_combined_api_logs(
+    autonomous_logs: List[Dict[str, Any]],
+    boost_logs: List[Dict[str, Any]],
+    limit: int,
+) -> List[Dict[str, Any]]:
+    """
+    Combine autonomous and boost logs into one newest-first list of at most ``limit`` entries.
+
+    Autonomous boosted calls are often already mirrored into the autonomous logger,
+    so a boost entry is folded into the first not-yet-merged autonomous entry that
+    shares its match key and whose timestamp is within 2 seconds of its own. Boost
+    entries without such a partner are appended as separate rows.
+
+    Args:
+        autonomous_logs: Entries from the autonomous API logger.
+        boost_logs: Entries from the boost logger.
+        limit: Maximum number of merged entries to return.
+
+    Returns:
+        Normalized copies of the entries, sorted by timestamp descending.
+    """
+    combined_logs = [_normalize_autonomous_api_log(entry) for entry in autonomous_logs]
+    candidate_map: Dict[tuple, List[int]] = {}
+    for index, entry in enumerate(combined_logs):
+        candidate_map.setdefault(_build_api_log_match_key(entry), []).append(index)
+
+    # Indices already paired with a boost entry; each autonomous entry absorbs at most one.
+    merged_indices = set()
+
+    for raw_boost_entry in boost_logs:
+        boost_entry = _normalize_boost_api_log(raw_boost_entry)
+        boost_timestamp = _parse_api_log_timestamp(boost_entry.get("timestamp"))
+
+        for index in candidate_map.get(_build_api_log_match_key(boost_entry), []):
+            if index in merged_indices:
+                continue
+
+            existing_entry = combined_logs[index]
+            existing_timestamp = _parse_api_log_timestamp(existing_entry.get("timestamp"))
+            if abs((existing_timestamp - boost_timestamp).total_seconds()) > 2:
+                continue
+
+            merged_indices.add(index)
+            existing_entry["source"] = "api+boost"
+            existing_entry["boosted"] = True
+            # Keep the mode already recorded on the entry when the boost entry carries none.
+            existing_entry["boost_mode"] = boost_entry.get("boost_mode") or existing_entry.get("boost_mode")
+            # Only fill the text fields the autonomous entry is missing.
+            for field in ("prompt_full", "prompt_preview", "response_full", "response_preview"):
+                if not existing_entry.get(field):
+                    existing_entry[field] = boost_entry.get(field) or ""
+            break
+        else:
+            # No autonomous twin was found: the boost call becomes its own row.
+            combined_logs.append(boost_entry)
+
+    combined_logs.sort(
+        key=lambda entry: _parse_api_log_timestamp(entry.get("timestamp")),
+        reverse=True,
+    )
+    return combined_logs[:limit]
+
+
+def _build_combined_api_stats(logs: List[Dict[str, Any]]) -> Dict[str, Any]:
+    """
+    Summarize merged API log entries into aggregate counters.
+
+    Args:
+        logs: Entries in the combined API log shape.
+
+    Returns:
+        Dict with total/successful/failed/boosted call counts, the success rate
+        (0.0 for an empty list), and per-phase, per-model, per-provider,
+        per-source, and per-boost-mode tallies.
+    """
+    tallies: Dict[str, Dict[str, int]] = {
+        "by_phase": {},
+        "by_model": {},
+        "by_provider": {},
+        "by_source": {},
+        "by_boost_mode": {},
+    }
+
+    def bump(bucket: str, label: Any) -> None:
+        """Increment one label inside one tally, treating falsy labels as "unknown"."""
+        counts = tallies[bucket]
+        name = label or "unknown"
+        counts[name] = counts.get(name, 0) + 1
+
+    succeeded = 0
+    boosted = 0
+    for record in logs:
+        # A missing "success" field counts as a success.
+        if record.get("success", True):
+            succeeded += 1
+
+        bump("by_phase", record.get("phase"))
+        bump("by_model", record.get("model"))
+        bump("by_provider", record.get("provider"))
+        bump("by_source", record.get("source"))
+
+        # Boost modes are only tallied for boosted calls.
+        if record.get("boosted"):
+            boosted += 1
+            bump("by_boost_mode", record.get("boost_mode"))
+
+    call_count = len(logs)
+    summary: Dict[str, Any] = {
+        "total_calls": call_count,
+        "successful_calls": succeeded,
+        "failed_calls": call_count - succeeded,
+        "success_rate": succeeded / call_count if call_count else 0.0,
+        "boosted_calls": boosted,
+    }
+    summary.update(tallies)
+    return summary
+
+
+async def _get_combined_api_logs(limit: int = 100) -> Dict[str, Any]:
+    """Return {"logs": the newest `limit` merged entries, "stats": a summary of every fetched entry}."""
+    # Fetch more than `limit` per logger (presumably so merged duplicates do not shrink the page).
+    fetch_limit = max(limit * 3, 300)
+    autonomous_logs = await autonomous_api_logger.get_logs(limit=fetch_limit)
+    boost_logs = await boost_logger.get_logs(limit=fetch_limit)
+
+    # Merge once, untruncated: the page and the stats are two views of the same sorted list.
+    all_logs = _merge_combined_api_logs(
+        autonomous_logs,
+        boost_logs,
+        limit=max(fetch_limit, len(autonomous_logs) + len(boost_logs)),
+    )
+    return {"logs": all_logs[:limit], "stats": _build_combined_api_stats(all_logs)}
+
     if session_id == "legacy":
         return
 
@@ -307,6 +499,7 @@ async def _generate_autonomous_paper_critique(
         host_provider=config["validator_openrouter_provider"],
         date=datetime.now(),
         prompt_used=prompt_to_use,
+        critique_source="user_request",
         novelty_rating=critique_data.get("novelty_rating", 0),
         novelty_feedback=critique_data.get("novelty_feedback", ""),
         correctness_rating=critique_data.get("correctness_rating", 0),
@@ -2222,6 +2415,7 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
             host_provider=validator_openrouter_provider,
             date=datetime.now(),
             prompt_used=prompt_to_use,
+            critique_source="user_request",
             novelty_rating=critique_data.get("novelty_rating", 0),
             novelty_feedback=critique_data.get("novelty_feedback", ""),
             correctness_rating=critique_data.get("correctness_rating", 0),
@@ -2366,13 +2560,12 @@ async def get_autonomous_api_logs(limit: int = 100):
         Dict with logs and statistics
     """
     try:
-        logs = await autonomous_api_logger.get_logs(limit=limit)
-        stats = await autonomous_api_logger.get_stats()
+        combined = await _get_combined_api_logs(limit=limit)
         
         return {
             "success": True,
-            "logs": logs,
-            "stats": stats
+            "logs": combined["logs"],
+            "stats": combined["stats"],
         }
     except Exception as e:
         logger.error(f"Failed to get autonomous API logs: {e}")
@@ -2389,10 +2582,11 @@ async def clear_autonomous_api_logs():
     """
     try:
         await autonomous_api_logger.clear_logs()
+        await boost_logger.clear_logs()
         
         return {
             "success": True,
-            "message": "Autonomous API logs cleared successfully"
+            "message": "Combined API logs cleared successfully"
         }
     except Exception as e:
         logger.error(f"Failed to clear autonomous API logs: {e}")
@@ -2408,11 +2602,11 @@ async def get_autonomous_api_stats():
         Statistics dict (total calls, by phase, by model, success rate, etc.)
     """
     try:
-        stats = await autonomous_api_logger.get_stats()
+        combined = await _get_combined_api_logs(limit=1000)
         
         return {
             "success": True,
-            "stats": stats
+            "stats": combined["stats"]
         }
     except Exception as e:
         logger.error(f"Failed to get autonomous API stats: {e}")
diff --git a/backend/api/routes/boost.py b/backend/api/routes/boost.py
index ff0e9b7..4390021 100644
--- a/backend/api/routes/boost.py
+++ b/backend/api/routes/boost.py
@@ -309,6 +309,40 @@ async def get_model_providers(model_id: str, authorization: Optional[str] = Head
 # NEW: Boost Next X Calls (Counter-based mode)
 # ============================================================
 
+class BoostAlwaysPreferRequest(BaseModel):
+    """Request body for POST /api/boost/set-always-prefer, which toggles always-prefer-boost mode."""
+    enabled: bool  # value handed to boost_manager.set_always_prefer by the route handler
+
+
+@router.post("/api/boost/set-always-prefer")
+async def set_boost_always_prefer(request: BoostAlwaysPreferRequest) -> Dict[str, Any]:
+    """
+    Turn always-prefer-boost mode on or off.
+
+    While the mode is on, every API call tries boost first and falls back to the
+    primary model on any failure. It is mutually exclusive with the next_count and
+    category modes, so the caller should clear those first.
+
+    Raises:
+        HTTPException: 400 if boost is not enabled, 500 on any other failure.
+    """
+    try:
+        if not (boost_manager.boost_config and boost_manager.boost_config.enabled):
+            raise HTTPException(status_code=400, detail="Boost must be enabled first")
+        await boost_manager.set_always_prefer(request.enabled)
+        logger.info(f"Boost always-prefer set to {request.enabled}")
+        if request.enabled:
+            message = "Boost will be attempted for every API call"
+        else:
+            message = "Always-prefer boost disabled"
+        return {"success": True, "enabled": request.enabled, "message": message}
+    except HTTPException:
+        raise
+    except Exception as e:
+        logger.error(f"Failed to set always-prefer boost: {e}")
+        raise HTTPException(status_code=500, detail=f"Failed to set always-prefer: {str(e)}")
+
+
 @router.post("/api/boost/set-next-count")
 async def set_boost_next_count(request: BoostNextCountRequest) -> Dict[str, Any]:
     """
@@ -346,10 +380,6 @@ async def set_boost_next_count(request: BoostNextCountRequest) -> Dict[str, Any]
         raise HTTPException(status_code=500, detail=f"Failed to set count: {str(e)}")
 
 
-# ============================================================
-# NEW: Category Boost (Role-based mode)
-# ============================================================
-
 @router.post("/api/boost/toggle-category/{category}")
 async def toggle_category_boost(category: str) -> Dict[str, Any]:
     """
diff --git a/backend/api/routes/compiler.py b/backend/api/routes/compiler.py
index cb41ef0..eb3ebd3 100644
--- a/backend/api/routes/compiler.py
+++ b/backend/api/routes/compiler.py
@@ -615,6 +615,7 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
             host_provider=validator_openrouter_provider,
             date=datetime.now(),
             prompt_used=prompt_to_use,
+            critique_source="user_request",
             novelty_rating=critique_data.get("novelty_rating", 0),
             novelty_feedback=critique_data.get("novelty_feedback", ""),
             correctness_rating=critique_data.get("correctness_rating", 0),
diff --git a/backend/api/routes/websocket.py b/backend/api/routes/websocket.py
index 4d8e2d1..92b9dda 100644
--- a/backend/api/routes/websocket.py
+++ b/backend/api/routes/websocket.py
@@ -3,6 +3,7 @@
 """
 from fastapi import APIRouter, WebSocket, WebSocketDisconnect
 from typing import List, Dict
+from datetime import datetime
 import asyncio
 import logging
 import json
@@ -34,7 +35,8 @@ async def broadcast(self, event_type: str, data: Dict):
         """Broadcast message to all connected clients."""
         message = json.dumps({
             "type": event_type,
-            "data": data
+            "data": data,
+            "timestamp": datetime.utcnow().isoformat() + "Z"
         })
         
         disconnected = []
diff --git a/backend/autonomous/agents/completion_reviewer.py b/backend/autonomous/agents/completion_reviewer.py
index ea9d8de..4f62e35 100644
--- a/backend/autonomous/agents/completion_reviewer.py
+++ b/backend/autonomous/agents/completion_reviewer.py
@@ -61,7 +61,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_cr_{self.task_sequence:03d}"
+        return f"agg_sub1_{self.task_sequence:03d}"
     
     def _calculate_available_context(self) -> int:
         """Calculate available tokens for brainstorm database content."""
diff --git a/backend/autonomous/agents/final_answer/answer_format_selector.py b/backend/autonomous/agents/final_answer/answer_format_selector.py
index aac0a38..67ab4db 100644
--- a/backend/autonomous/agents/final_answer/answer_format_selector.py
+++ b/backend/autonomous/agents/final_answer/answer_format_selector.py
@@ -68,7 +68,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_fs_{self.task_sequence:03d}"
+        return f"agg_sub1_{self.task_sequence:03d}"
     
     def _calculate_max_input_tokens(self) -> int:
         """Calculate available tokens for input prompt."""
diff --git a/backend/autonomous/agents/final_answer/certainty_assessor.py b/backend/autonomous/agents/final_answer/certainty_assessor.py
index 548ba18..4c04b1e 100644
--- a/backend/autonomous/agents/final_answer/certainty_assessor.py
+++ b/backend/autonomous/agents/final_answer/certainty_assessor.py
@@ -77,7 +77,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_ca_{self.task_sequence:03d}"
+        return f"agg_sub1_{self.task_sequence:03d}"
     
     def _calculate_max_input_tokens(self) -> int:
         """Calculate available tokens for input prompt."""
diff --git a/backend/autonomous/agents/final_answer/volume_organizer.py b/backend/autonomous/agents/final_answer/volume_organizer.py
index 5f5b2d1..57c8f71 100644
--- a/backend/autonomous/agents/final_answer/volume_organizer.py
+++ b/backend/autonomous/agents/final_answer/volume_organizer.py
@@ -76,7 +76,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_vo_{self.task_sequence:03d}"
+        return f"agg_sub1_{self.task_sequence:03d}"
     
     def _calculate_max_input_tokens(self) -> int:
         """Calculate available tokens for input prompt."""
diff --git a/backend/autonomous/agents/paper_title_selector.py b/backend/autonomous/agents/paper_title_selector.py
index e58df59..6107b56 100644
--- a/backend/autonomous/agents/paper_title_selector.py
+++ b/backend/autonomous/agents/paper_title_selector.py
@@ -54,7 +54,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_pt_{self.task_sequence:03d}"
+        return f"agg_sub1_{self.task_sequence:03d}"
     
     async def select_title(
         self,
@@ -122,6 +122,7 @@ async def select_title(
                 topic_prompt,
                 brainstorm_summary,
                 existing_papers_from_brainstorm,
+                reference_papers,
                 selection.paper_title,
                 selection.reasoning
             )
@@ -290,6 +291,7 @@ async def _validate_title(
         topic_prompt: str,
         brainstorm_summary: str,
         existing_papers_from_brainstorm: List[Dict[str, Any]],
+        reference_papers: List[Dict[str, Any]],
         proposed_title: str,
         title_reasoning: str
     ) -> Tuple[bool, str]:
@@ -306,6 +308,7 @@ async def _validate_title(
                 topic_prompt=topic_prompt,
                 brainstorm_summary=brainstorm_summary,
                 existing_papers_from_brainstorm=existing_papers_from_brainstorm,
+                reference_papers=reference_papers,
                 proposed_title=proposed_title,
                 title_reasoning=title_reasoning
             )
diff --git a/backend/autonomous/agents/reference_selector.py b/backend/autonomous/agents/reference_selector.py
index 4e7a741..777e1e3 100644
--- a/backend/autonomous/agents/reference_selector.py
+++ b/backend/autonomous/agents/reference_selector.py
@@ -29,7 +29,7 @@
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.json_parser import parse_json
 from backend.shared.utils import count_tokens
-from backend.shared.config import rag_config
+from backend.shared.config import rag_config, system_config
 from backend.shared.models import ReferenceExpansionRequest, ReferenceSelectionResult
 from backend.autonomous.prompts.paper_reference_prompts import (
     build_reference_expansion_prompt,
@@ -76,7 +76,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_rs_{self.task_sequence:03d}"
+        return f"agg_sub1_{self.task_sequence:03d}"
     
     def _calculate_max_input_tokens(self) -> int:
         """Calculate available tokens for input prompt."""
@@ -89,7 +89,9 @@ async def select_references(
         brainstorm_summary: str,
         available_papers: List[Dict[str, Any]],
         mode: str = "initial",
-        already_selected: List[str] = None
+        already_selected: List[str] = None,
+        already_selected_papers: List[Dict[str, Any]] = None,
+        max_total_papers: Optional[int] = None,
     ) -> List[str]:
         """
         Complete reference selection workflow.
@@ -103,25 +105,37 @@ async def select_references(
             available_papers: List of papers with title, abstract, word count
             mode: Selection mode - "initial" (pre-brainstorm) or "additional" (pre-paper)
             already_selected: List of paper_ids already selected (for "additional" mode)
+            max_total_papers: Total paper cap for this workflow. In "additional" mode,
+                already selected papers count toward this total.
         
         Returns:
-            List of selected paper_ids (max 6 for initial, remaining slots for additional)
+            List of selected paper_ids, capped by the caller's policy
         """
         if already_selected is None:
             already_selected = []
+        if already_selected_papers is None:
+            already_selected_papers = []
+        if max_total_papers is None:
+            max_total_papers = system_config.autonomous_tier3_short_form_max_reference_papers
         
         if not available_papers:
             logger.info(f"ReferenceSelector [{mode}]: No papers available, skipping reference selection")
             return []
         
         # Calculate max papers based on mode
-        max_papers = 6 if mode == "initial" else (6 - len(already_selected))
+        max_papers = max_total_papers if mode == "initial" else (max_total_papers - len(already_selected))
         if max_papers <= 0:
-            logger.info(f"ReferenceSelector [{mode}]: Already at max capacity ({len(already_selected)} papers)")
+            logger.info(
+                f"ReferenceSelector [{mode}]: Already at max capacity "
+                f"({len(already_selected)} of {max_total_papers} papers)"
+            )
             return []
         
-        logger.info(f"ReferenceSelector [{mode}]: Starting selection (max {max_papers} papers, "
-                   f"{len(available_papers)} available, {len(already_selected)} already selected)")
+        logger.info(
+            f"ReferenceSelector [{mode}]: Starting selection "
+            f"(limit={max_papers}, total_cap={max_total_papers}, "
+            f"{len(available_papers)} available, {len(already_selected)} already selected)"
+        )
         
         # Step 1: Show abstracts and ask which to expand
         expansion_request = await self._request_expansion(
@@ -130,7 +144,9 @@ async def select_references(
             brainstorm_summary,
             available_papers,
             mode=mode,
-            already_selected=already_selected
+            already_selected=already_selected,
+            already_selected_papers=already_selected_papers,
+            max_total_papers=max_total_papers,
         )
         
         if expansion_request is None:
@@ -175,7 +191,9 @@ async def _request_expansion(
         brainstorm_summary: str,
         papers_with_abstracts: List[Dict[str, Any]],
         mode: str = "initial",
-        already_selected: List[str] = None
+        already_selected: List[str] = None,
+        already_selected_papers: List[Dict[str, Any]] = None,
+        max_total_papers: int = 6,
     ) -> Optional[ReferenceExpansionRequest]:
         """
         Request which papers to expand (Step 1: abstracts only).
@@ -187,6 +205,8 @@ async def _request_expansion(
         """
         if already_selected is None:
             already_selected = []
+        if already_selected_papers is None:
+            already_selected_papers = []
         
         try:
             # Build prompt based on mode
@@ -196,7 +216,8 @@ async def _request_expansion(
                     user_research_prompt=user_research_prompt,
                     topic_prompt=topic_prompt,
                     brainstorm_summary=brainstorm_summary,
-                    papers_with_abstracts=papers_with_abstracts
+                    papers_with_abstracts=papers_with_abstracts,
+                    max_papers=max_total_papers,
                 )
             else:
                 # Additional: select more papers before paper writing
@@ -205,7 +226,9 @@ async def _request_expansion(
                     topic_prompt=topic_prompt,
                     brainstorm_summary=brainstorm_summary,
                     papers_with_abstracts=papers_with_abstracts,
-                    already_selected=already_selected
+                    already_selected=already_selected,
+                    already_selected_papers=already_selected_papers,
+                    max_total_papers=max_total_papers,
                 )
             
             # Validate prompt size
@@ -293,6 +316,10 @@ async def _get_expanded_papers(
                 expanded.append({
                     "paper_id": paper_id,
                     "title": paper_meta.get("title", "Unknown"),
+                    "reference_title_display": paper_meta.get(
+                        "reference_title_display",
+                        paper_meta.get("title", "Unknown"),
+                    ),
                     "word_count": paper_meta.get("word_count", len(content.split())),
                     "content": content,
                     "outline": outline  # NEW: Include outline
@@ -320,7 +347,7 @@ async def _make_final_selection(
         
         Args:
             mode: "initial" for pre-brainstorm, "additional" for pre-paper
-            max_papers: Maximum papers to select (6 for initial, remaining slots for additional)
+            max_papers: Maximum papers to select for this call
         """
         try:
             max_input = self._calculate_max_input_tokens()
diff --git a/backend/autonomous/agents/topic_selector.py b/backend/autonomous/agents/topic_selector.py
index d4126e5..811a818 100644
--- a/backend/autonomous/agents/topic_selector.py
+++ b/backend/autonomous/agents/topic_selector.py
@@ -63,7 +63,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_ts_{self.task_sequence:03d}"
+        return f"agg_sub1_{self.task_sequence:03d}"
     
     def _calculate_max_input_tokens(self) -> int:
         """Calculate available tokens for input prompt."""
diff --git a/backend/autonomous/agents/topic_validator.py b/backend/autonomous/agents/topic_validator.py
index 23632f2..bb63054 100644
--- a/backend/autonomous/agents/topic_validator.py
+++ b/backend/autonomous/agents/topic_validator.py
@@ -58,7 +58,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_tv_{self.task_sequence:03d}"
+        return f"agg_val_{self.task_sequence:03d}"
     
     def _calculate_max_input_tokens(self) -> int:
         """Calculate available tokens for input prompt."""
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index d741024..abac73a 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -24,6 +24,7 @@
 )
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.free_model_manager import free_model_manager
 from backend.shared.workflow_predictor import workflow_predictor
 from backend.shared.token_tracker import token_tracker
 
@@ -558,6 +559,7 @@ async def _check_resume_state(self) -> None:
             self._current_topic_id = workflow_state.get("current_topic_id")
             self._current_paper_id = workflow_state.get("current_paper_id")
             self._current_reference_papers = workflow_state.get("reference_paper_ids", [])
+            self._current_paper_title = workflow_state.get("current_paper_title")
             self._acceptance_count = workflow_state.get("acceptance_count", 0)
             self._rejection_count = workflow_state.get("rejection_count", 0)
             self._consecutive_rejections = workflow_state.get("consecutive_rejections", 0)
@@ -789,6 +791,40 @@ async def _load_saved_paper_to_compiler(self, paper_id: str) -> None:
                 
         except Exception as e:
             logger.error(f"Failed to load saved paper {paper_id} to compiler: {e}")
+
+    async def _preserve_failed_paper_state(self, paper_id: str, paper_title: str) -> None:
+        """
+        Preserve in-progress paper state after a compiler failure so retries resume.
+
+        This keeps the current paper ID/title and stores the best-known phase in the
+        workflow state. The next compilation attempt will then skip title generation
+        and continue from the current paper/outline instead of restarting from scratch.
+        """
+        current_paper = await compiler_paper_memory.get_paper()
+        current_outline = await outline_memory.get_outline()
+        # Choose the resume phase: existing paper text first, then outline, then prior state.
+        resume_phase = None  # placeholder only; every branch below assigns a value
+        if current_paper and current_paper.strip():
+            resume_phase = self._detect_paper_phase(current_paper)
+        elif current_outline and current_outline.strip():
+            resume_phase = "body"  # an outline exists but no non-blank paper text
+        else:
+            resume_phase = self._resume_paper_phase or "body"  # nothing stored: reuse earlier phase
+        # Keep the ID/title and phase on the coordinator so a later attempt can reuse them.
+        self._current_paper_id = paper_id
+        self._current_paper_title = paper_title
+        self._resume_paper_phase = resume_phase
+        # Write the same phase into the saved workflow state.
+        await self._save_workflow_state(
+            tier="tier2_paper_writing",
+            phase=resume_phase
+        )
+
+        logger.info(
+            f"Preserved failed paper state for resume: paper={paper_id}, "
+            f"phase={resume_phase}, paper_chars={len(current_paper or '')}, "
+            f"outline_chars={len(current_outline or '')}"
+        )
     
     async def _save_workflow_state(self, tier: str = None, phase: str = None) -> None:
         """Save current workflow state for crash recovery."""
@@ -812,6 +848,7 @@ async def _save_workflow_state(self, tier: str = None, phase: str = None) -> Non
             "current_tier": tier or self._state.current_tier,
             "current_topic_id": self._current_topic_id,
             "current_paper_id": self._current_paper_id,
+            "current_paper_title": self._current_paper_title,
             "paper_phase": phase,
             "reference_paper_ids": self._current_reference_papers,  # Persist reference papers across restarts
             "acceptance_count": self._acceptance_count,
@@ -855,6 +892,9 @@ async def start(self) -> None:
         self._stop_event.clear()
         self._state.is_running = True
         
+        # Reset free model manager state for fresh start
+        free_model_manager.reset()
+        
         # Set up autonomous API logging callback
         async def log_callback(task_id, role_id, model, provider, prompt, response, 
                               tokens_used, duration_ms, success, error, phase):
@@ -938,7 +978,9 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                     f"for brainstorm {self._current_topic_id} - retrying..."
                                 )
                                 await asyncio.sleep(5)
-                            if await self._paper_compilation_workflow():
+                            if await self._paper_compilation_workflow(
+                                emit_resume_event=(_resume_paper_attempt == 1)
+                            ):
                                 break
 
                         if not self._stop_event.is_set():
@@ -1325,28 +1367,13 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                     logger.info("Brainstorm cycle complete, returning to topic selection")
 
               except FreeModelExhaustedError as e:
-                if e.soonest_retry:
-                    wait_secs = max(0, e.soonest_retry - time.time())
-                    wait_mins = round(wait_secs / 60, 1)
-                    logger.warning(
-                        f"SERIAL BOTTLENECK: Autonomous research paused for {wait_mins} minutes "
-                        f"(all free models rate-limited)"
-                    )
-                    await self._broadcast("serial_bottleneck_paused", {
-                        "role_id": "autonomous",
-                        "model": str(e),
-                        "wait_seconds": round(wait_secs),
-                        "resume_at": time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(e.soonest_retry)),
-                    })
-                    await asyncio.sleep(wait_secs)
-                    await self._broadcast("serial_bottleneck_resumed", {"role_id": "autonomous"})
-                else:
-                    logger.error(f"AutonomousCoordinator: all free models exhausted, no cooldown: {e}")
-                    await self._broadcast("all_free_models_exhausted", {
-                        "message": f"All free models exhausted: {e}"
-                    })
-                    await self._save_workflow_state()
-                    break
+                # All free models exhausted after retries - wait briefly and retry
+                logger.warning(f"AutonomousCoordinator: all free models exhausted: {e}")
+                await self._broadcast("free_models_exhausted", {
+                    "role_id": "autonomous",
+                    "message": str(e),
+                })
+                await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
 
         except Exception as e:
             logger.error(f"AutonomousCoordinator error: {e}")
@@ -1711,28 +1738,13 @@ async def _resume_research_loop_after_tier3(self) -> None:
                     logger.info("Brainstorm cycle complete, returning to topic selection")
 
               except FreeModelExhaustedError as e:
-                if e.soonest_retry:
-                    wait_secs = max(0, e.soonest_retry - time.time())
-                    wait_mins = round(wait_secs / 60, 1)
-                    logger.warning(
-                        f"SERIAL BOTTLENECK: Resumed research paused for {wait_mins} minutes "
-                        f"(all free models rate-limited)"
-                    )
-                    await self._broadcast("serial_bottleneck_paused", {
-                        "role_id": "autonomous_resumed",
-                        "model": str(e),
-                        "wait_seconds": round(wait_secs),
-                        "resume_at": time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(e.soonest_retry)),
-                    })
-                    await asyncio.sleep(wait_secs)
-                    await self._broadcast("serial_bottleneck_resumed", {"role_id": "autonomous_resumed"})
-                else:
-                    logger.error(f"Resumed research: all free models exhausted, no cooldown: {e}")
-                    await self._broadcast("all_free_models_exhausted", {
-                        "message": f"All free models exhausted: {e}"
-                    })
-                    await self._save_workflow_state()
-                    break
+                # All free models exhausted after retries - wait briefly and retry
+                logger.warning(f"Resumed research: all free models exhausted: {e}")
+                await self._broadcast("free_models_exhausted", {
+                    "role_id": "autonomous_resumed",
+                    "message": str(e),
+                })
+                await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
 
         except Exception as e:
             logger.error(f"Error in resumed research loop: {e}")
@@ -2278,8 +2290,10 @@ async def _pre_brainstorm_reference_selection(self) -> List[str]:
         - Accelerate convergence on valuable insights by standing on prior work
         
         Returns:
-            List of selected paper_ids (max 6)
+            List of selected paper_ids for the topic-cycle base reference cap
         """
+        max_reference_papers = system_config.autonomous_topic_cycle_max_reference_papers
+
         # Get available papers
         papers_summary = await autonomous_rag_manager.get_all_papers_summary()
         
@@ -2309,7 +2323,8 @@ async def _pre_brainstorm_reference_selection(self) -> List[str]:
             brainstorm_summary=brainstorm_summary,
             available_papers=papers_summary,
             mode="initial",  # Pre-brainstorm mode
-            already_selected=[]  # No papers selected yet
+            already_selected=[],  # No papers selected yet
+            max_total_papers=max_reference_papers,
         )
         
         await self._broadcast("reference_selection_complete", {
@@ -2341,6 +2356,35 @@ def _get_reference_paper_paths(self) -> List[str]:
             else:
                 logger.warning(f"Reference paper not found: {paper_path}")
         return paths
+
+    async def _get_reference_paper_details(
+        self,
+        paper_ids: Optional[List[str]] = None
+    ) -> List[Dict[str, Any]]:
+        """
+        Get compact metadata summaries for reference papers used in title prompts.
+        """
+        reference_details: List[Dict[str, Any]] = []
+        # None or an empty list yields an empty result.
+        for paper_id in paper_ids or []:
+            metadata = await paper_library.get_metadata(paper_id)
+            if not metadata:
+                logger.warning(f"Reference paper metadata not found: {paper_id}")
+                continue  # skip this ID; the remaining papers are still returned
+            # The display title is looked up from the paper ID and the stored title.
+            reference_title_display = await paper_library.get_reference_title_display(
+                paper_id,
+                metadata.title,
+            )
+            # One dict per paper, appended in the order the IDs were given.
+            reference_details.append({
+                "paper_id": paper_id,
+                "title": metadata.title,
+                "reference_title_display": reference_title_display,
+                "abstract": metadata.abstract
+            })
+
+        return reference_details
     
     # ========================================================================
     # PHASE 2: BRAINSTORM AGGREGATION
@@ -2970,7 +3014,11 @@ async def _run_completion_review(self) -> bool:
     # PHASE 3: PAPER COMPILATION
     # ========================================================================
     
-    async def _paper_compilation_workflow(self, skip_reference_selection: bool = False) -> bool:
+    async def _paper_compilation_workflow(
+        self,
+        skip_reference_selection: bool = False,
+        emit_resume_event: bool = False
+    ) -> bool:
         """
         Complete paper compilation workflow.
         Order: Reference selection -> Title -> Body -> Conclusion -> Intro -> Abstract
@@ -2981,6 +3029,9 @@ async def _paper_compilation_workflow(self, skip_reference_selection: bool = Fal
         Args:
             skip_reference_selection: If True, skip reference selection (for paper 2/3 
                 from same brainstorm - reuses existing references).
+            emit_resume_event: If True, broadcast `paper_writing_resumed` for a true
+                interrupted-workflow resume. Automatic in-process retries should keep
+                retrying silently and must not be mislabeled as resumed.
         
         Returns:
             True if paper was successfully compiled, False otherwise.
@@ -3001,9 +3052,11 @@ async def _paper_compilation_workflow(self, skip_reference_selection: bool = Fal
             paper_id = self._current_paper_id
             is_resuming_paper = True
             
-            # Get paper title from metadata
+            # Prefer the in-memory/workflow-state title for retries of unsaved papers.
             paper_metadata = await research_metadata.get_paper_entry(paper_id)
-            if paper_metadata:
+            if self._current_paper_title:
+                paper_title = self._current_paper_title
+            elif paper_metadata:
                 paper_title = paper_metadata.get("title", f"Paper {paper_id}")
                 self._current_paper_title = paper_title
             else:
@@ -3023,11 +3076,12 @@ async def _paper_compilation_workflow(self, skip_reference_selection: bool = Fal
             
             logger.info(f"RESUME: Continuing paper {paper_id} compilation (title: {paper_title[:50]}...)")
             
-            await self._broadcast("paper_writing_resumed", {
-                "paper_id": paper_id,
-                "title": paper_title,
-                "source_brainstorm_id": self._current_topic_id
-            })
+            if emit_resume_event:
+                await self._broadcast("paper_writing_resumed", {
+                    "paper_id": paper_id,
+                    "title": paper_title,
+                    "source_brainstorm_id": self._current_topic_id
+                })
         else:
             # FRESH START: Run full title/reference selection workflow
             # Step 1: Reference selection (if papers exist) - skip for continuation papers
@@ -3049,18 +3103,23 @@ async def _paper_compilation_workflow(self, skip_reference_selection: bool = Fal
             existing_papers = await research_metadata.get_papers_by_brainstorm(
                 self._current_topic_id
             )
+            reference_details = await self._get_reference_paper_details(reference_paper_ids)
             
             candidate_titles = await self._paper_title_exploration_phase(
                 topic_prompt=topic_prompt,
                 brainstorm_summary=brainstorm_summary,
-                existing_papers=existing_papers
+                existing_papers=existing_papers,
+                reference_papers=reference_details
             )
             
             if self._stop_event.is_set():
                 return False
             
             # Step 3: Final title selection (informed by candidate titles)
-            paper_title = await self._paper_title_selection(candidate_titles=candidate_titles)
+            paper_title = await self._paper_title_selection(
+                candidate_titles=candidate_titles,
+                reference_papers=reference_details
+            )
             
             if paper_title is None:
                 logger.error("Paper title selection failed")
@@ -3085,7 +3144,10 @@ async def _paper_compilation_workflow(self, skip_reference_selection: bool = Fal
             })
         
         # Save workflow state with paper details
-        await self._save_workflow_state(tier="tier2_paper_writing", phase="outline")
+        await self._save_workflow_state(
+            tier="tier2_paper_writing",
+            phase=(self._resume_paper_phase or "body") if is_resuming_paper else "outline"
+        )
         
         # Step 3: Paper compilation (using Part 2 compiler infrastructure)
         # Pass is_resume flag and phase to preserve existing paper content when resuming
@@ -3097,18 +3159,13 @@ async def _paper_compilation_workflow(self, skip_reference_selection: bool = Fal
             resume_phase=self._resume_paper_phase if is_resuming_paper else None
         )
         
-        # Clear resume state after compilation attempt (whether success or failure)
-        # This prevents stale resume state from affecting future papers
-        if is_resuming_paper:
-            self._resume_paper_phase = None
-        
         if paper_content is None:
             logger.error("Paper compilation failed")
-            # CRITICAL: Clear stale paper_id to prevent future compilations from
-            # entering RESUME MODE for this failed paper with mismatched brainstorm data
-            self._current_paper_id = None
-            self._current_paper_title = None
+            await self._preserve_failed_paper_state(paper_id, paper_title)
             return False
+
+        # Clear resume state after a successful compilation attempt.
+        self._resume_paper_phase = None
         
         # Get final outline
         from backend.compiler.memory.outline_memory import outline_memory as compiler_outline_memory
@@ -3130,21 +3187,26 @@ async def _reference_selection_workflow(self) -> List[str]:
         Run additional reference paper selection workflow before paper writing.
         
         This allows the AI to select ADDITIONAL references discovered to be relevant
-        during brainstorming, up to the 6 paper limit.
+        during brainstorming, while staying within the topic-cycle base reference cap.
         
         The papers already selected during pre-brainstorm reference selection are
         preserved and shown as "ALREADY SELECTED" to the AI.
         
         Returns:
-            Combined list of all selected paper_ids (max 6 total)
+            Combined list of all selected paper_ids for this topic cycle
         """
+        max_reference_papers = system_config.autonomous_topic_cycle_max_reference_papers
+
         # Start with papers already selected during pre-brainstorm
         already_selected = self._current_reference_papers.copy()
         
         # Check how many more we can select
-        remaining_slots = 6 - len(already_selected)
+        remaining_slots = max_reference_papers - len(already_selected)
         if remaining_slots <= 0:
-            logger.info(f"Already have {len(already_selected)} reference papers (max 6), skipping additional selection")
+            logger.info(
+                f"Already have {len(already_selected)} reference papers "
+                f"(max {max_reference_papers}), skipping additional selection"
+            )
             return already_selected
         
         # Get available papers
@@ -3159,6 +3221,10 @@ async def _reference_selection_workflow(self) -> List[str]:
             p for p in papers_summary 
             if p.get("paper_id") not in already_selected
         ]
+        already_selected_details = [
+            p for p in papers_summary
+            if p.get("paper_id") in already_selected
+        ]
         
         if not available_for_selection:
             logger.info("All available papers already selected, skipping additional selection")
@@ -3186,14 +3252,19 @@ async def _reference_selection_workflow(self) -> List[str]:
             brainstorm_summary=brainstorm_summary,
             available_papers=available_for_selection,
             mode="additional",  # Additional selection mode
-            already_selected=already_selected  # Papers already selected
+            already_selected=already_selected,  # Papers already selected
+            already_selected_papers=already_selected_details,
+            max_total_papers=max_reference_papers,
         )
         
-        # Combine with already selected (respecting max 6 limit)
+        # Combine with already selected (respecting the topic-cycle cap)
         combined = already_selected + additional_ids
-        if len(combined) > 6:
-            logger.warning(f"Combined references ({len(combined)}) exceeds limit, truncating to 6")
-            combined = combined[:6]
+        if len(combined) > max_reference_papers:
+            logger.warning(
+                f"Combined references ({len(combined)}) exceeds limit, "
+                f"truncating to {max_reference_papers}"
+            )
+            combined = combined[:max_reference_papers]
         
         # Update current reference papers
         self._current_reference_papers = combined
@@ -3209,11 +3280,18 @@ async def _reference_selection_workflow(self) -> List[str]:
         logger.info(f"Additional reference selection: {len(additional_ids)} new + {len(already_selected)} existing = {len(combined)} total")
         return combined
     
-    async def _paper_title_selection(self, candidate_titles: str = "") -> Optional[str]:
-        """Select paper title, optionally informed by candidate titles from exploration."""
+    async def _paper_title_selection(
+        self,
+        candidate_titles: str = "",
+        reference_papers: Optional[List[Dict[str, Any]]] = None
+    ) -> Optional[str]:
+        """Select paper title, optionally informed by candidate titles and references."""
         metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
         if metadata is None:
             return None
+
+        if reference_papers is None and self._current_reference_papers:
+            reference_papers = await self._get_reference_paper_details(self._current_reference_papers)
         
         # Get brainstorm summary
         brainstorm_summary = await autonomous_rag_manager.get_brainstorm_summary(
@@ -3231,6 +3309,7 @@ async def _paper_title_selection(self, candidate_titles: str = "") -> Optional[s
             topic_prompt=metadata.topic_prompt,
             brainstorm_summary=brainstorm_summary,
             existing_papers_from_brainstorm=existing_papers,
+            reference_papers=reference_papers,
             candidate_titles=candidate_titles,
             stop_event=self._stop_event
         )
@@ -3780,17 +3859,17 @@ async def _handle_paper_completion(
         # Add paper reference to brainstorm
         await brainstorm_memory.add_paper_reference(self._current_topic_id, paper_id)
         
-        # Update counts
-        self._papers_completed_count += 1
-        
-        await self._broadcast("paper_completed", {
-            "paper_id": paper_id,
-            "title": title,
-            "word_count": paper_metadata.word_count
-        })
-        
-        # Trigger auto-critique generation in background (only if marking as complete)
         if mark_complete:
+            # Update counts
+            self._papers_completed_count += 1
+
+            await self._broadcast("paper_completed", {
+                "paper_id": paper_id,
+                "title": title,
+                "word_count": paper_metadata.word_count
+            })
+
+            # Trigger auto-critique generation in background (only if marking as complete)
             asyncio.create_task(self._auto_generate_paper_critique(
                 paper_id=paper_id,
                 paper_title=title
@@ -3921,6 +4000,7 @@ async def _auto_generate_paper_critique(
                 host_provider=self._validator_openrouter_provider,
                 date=datetime.now(),
                 prompt_used=DEFAULT_CRITIQUE_PROMPT,  # Always uses default for auto-critiques
+                critique_source="system_auto",
                 novelty_rating=novelty,
                 novelty_feedback=critique_data.get("novelty_feedback", ""),
                 correctness_rating=correctness,
@@ -4787,6 +4867,8 @@ async def _tier3_reference_selection(
         Select reference papers for Tier 3 final answer.
         Directly selects papers without brainstorm context.
         """
+        max_reference_papers = system_config.autonomous_tier3_short_form_max_reference_papers
+
         # For Tier 3, we browse ALL papers and select those most useful for answering
         selected_ids = await self._reference_selector.select_references(
             user_research_prompt=self._user_research_prompt,
@@ -4794,7 +4876,8 @@ async def _tier3_reference_selection(
             brainstorm_summary="[No brainstorm - Tier 3 operates on completed papers only]",
             available_papers=all_papers,
             mode="initial",  # Fresh selection for Tier 3
-            already_selected=[]
+            already_selected=[],
+            max_total_papers=max_reference_papers,
         )
         
         return selected_ids
@@ -4810,16 +4893,7 @@ async def _tier3_title_selection(
         Runs paper title exploration first to collect 5 candidate titles.
         """
         # Get reference paper details
-        reference_details = []
-        for paper_id in reference_papers:
-            content = await paper_library.get_paper_content(paper_id)
-            metadata = await paper_library.get_metadata(paper_id)
-            if metadata:
-                reference_details.append({
-                    "paper_id": paper_id,
-                    "title": metadata.title,
-                    "abstract": metadata.abstract
-                })
+        reference_details = await self._get_reference_paper_details(reference_papers)
         
         # Run title exploration phase for Tier 3
         topic_prompt = f"[TIER 3 FINAL ANSWER] Certainty: {assessment.certainty_level}"
@@ -4841,6 +4915,7 @@ async def _tier3_title_selection(
             topic_prompt=topic_prompt,
             brainstorm_summary=brainstorm_summary,
             existing_papers_from_brainstorm=[],
+            reference_papers=reference_details,
             candidate_titles=candidate_titles,
             stop_event=self._stop_event
         )
@@ -4995,11 +5070,7 @@ async def _write_volume_chapter(
         ]
         
         # Run title exploration for this chapter
-        ref_details = []
-        for pid in reference_ids:
-            meta = await paper_library.get_metadata(pid)
-            if meta:
-                ref_details.append({"paper_id": pid, "title": meta.title, "abstract": meta.abstract})
+        ref_details = await self._get_reference_paper_details(reference_ids)
         
         candidate_titles = await self._paper_title_exploration_phase(
             topic_prompt=f"[VOLUME CHAPTER: {chapter.chapter_type}] {context}",
@@ -5017,6 +5088,7 @@ async def _write_volume_chapter(
             topic_prompt=f"[VOLUME CHAPTER: {chapter.chapter_type}] {context}",
             brainstorm_summary=f"Known Certainties:\n{assessment.known_certainties_summary}",
             existing_papers_from_brainstorm=[],
+            reference_papers=ref_details,
             candidate_titles=candidate_titles,
             stop_event=self._stop_event
         )
@@ -5271,12 +5343,12 @@ async def refresh_workflow_predictions(self) -> None:
                 # 20 slots: topic selection (submit/validate pairs)
                 for i in range(20):
                     if i % 2 == 0:
-                        task_id = f"auto_ts_{ts_seq:03d}"
+                        task_id = f"agg_sub1_{ts_seq:03d}"
                         role = "Topic Selector"
                         mode = "Topic Selection"
                         ts_seq += 1
                     else:
-                        task_id = f"auto_tv_{tv_seq:03d}"
+                        task_id = f"agg_val_{tv_seq:03d}"
                         role = "Topic Validator"
                         mode = "Topic Validation"
                         tv_seq += 1
diff --git a/backend/autonomous/memory/brainstorm_memory.py b/backend/autonomous/memory/brainstorm_memory.py
index 65bb4ae..33584bf 100644
--- a/backend/autonomous/memory/brainstorm_memory.py
+++ b/backend/autonomous/memory/brainstorm_memory.py
@@ -12,6 +12,7 @@
 
 from backend.shared.config import system_config
 from backend.shared.models import BrainstormMetadata
+from backend.shared.path_safety import validate_single_path_component
 
 logger = logging.getLogger(__name__)
 
@@ -47,9 +48,13 @@ async def initialize(self) -> None:
         self._base_dir.mkdir(parents=True, exist_ok=True)
         logger.info(f"Brainstorm memory initialized at {self._base_dir}")
     
+    def _safe_topic_id(self, topic_id: str) -> str:
+        """Pass topic_id through validate_single_path_component before it is embedded in a file name."""
+        return validate_single_path_component(topic_id, "topic ID")
+
     def _get_database_path(self, topic_id: str) -> Path:
         """Get path to brainstorm database file."""
-        return self._base_dir / f"brainstorm_{topic_id}.txt"
+        return self._base_dir / f"brainstorm_{self._safe_topic_id(topic_id)}.txt"
     
     def get_database_path(self, topic_id: str) -> str:
         """
@@ -63,15 +68,15 @@ def get_database_path(self, topic_id: str) -> str:
     
     def _get_metadata_path(self, topic_id: str) -> Path:
         """Get path to brainstorm metadata JSON file."""
-        return self._base_dir / f"brainstorm_{topic_id}_metadata.json"
+        return self._base_dir / f"brainstorm_{self._safe_topic_id(topic_id)}_metadata.json"
     
     def _get_submitter_rejections_path(self, topic_id: str, submitter_id: int) -> Path:
         """Get path to submitter rejection log file."""
-        return self._base_dir / f"brainstorm_{topic_id}_submitter_{submitter_id}_rejections.txt"
+        return self._base_dir / f"brainstorm_{self._safe_topic_id(topic_id)}_submitter_{submitter_id}_rejections.txt"
     
     def _get_completion_feedback_path(self, topic_id: str) -> Path:
         """Get path to completion feedback file."""
-        return self._base_dir / f"completion_feedback_{topic_id}.txt"
+        return self._base_dir / f"completion_feedback_{self._safe_topic_id(topic_id)}.txt"
     
     # ========================================================================
     # METADATA OPERATIONS
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index 24cf6e9..b643b2c 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -57,9 +57,13 @@ async def initialize(self) -> None:
         self._archive_dir.mkdir(parents=True, exist_ok=True)
         logger.info(f"Paper library initialized at {self._base_dir}")
     
+    def _safe_paper_id(self, paper_id: str) -> str:
+        """Pass paper_id through validate_single_path_component before it is embedded in a file name."""
+        return validate_single_path_component(paper_id, "paper ID")
+
     def _get_paper_path(self, paper_id: str) -> Path:
         """Get path to paper file."""
-        return self._base_dir / f"paper_{paper_id}.txt"
+        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}.txt"
     
     def get_paper_path(self, paper_id: str) -> str:
         """
@@ -83,23 +87,23 @@ def get_outline_path(self, paper_id: str) -> str:
     
     def _get_abstract_path(self, paper_id: str) -> Path:
         """Get path to abstract file."""
-        return self._base_dir / f"paper_{paper_id}_abstract.txt"
+        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_abstract.txt"
     
     def _get_source_brainstorm_path(self, paper_id: str) -> Path:
         """Get path to cached source brainstorm file."""
-        return self._base_dir / f"paper_{paper_id}_source_brainstorm.txt"
+        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_source_brainstorm.txt"
     
     def _get_outline_path(self, paper_id: str) -> Path:
         """Get path to paper outline file."""
-        return self._base_dir / f"paper_{paper_id}_outline.txt"
+        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_outline.txt"
     
     def _get_metadata_path(self, paper_id: str) -> Path:
         """Get path to paper metadata JSON file."""
-        return self._base_dir / f"paper_{paper_id}_metadata.json"
+        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_metadata.json"
     
     def _get_rejections_path(self, paper_id: str) -> Path:
         """Get path to paper compiler rejections file."""
-        return self._base_dir / f"paper_{paper_id}_last_10_rejections.txt"
+        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_last_10_rejections.txt"
 
     # ========================================================================
     # HISTORY HELPERS
@@ -274,6 +278,66 @@ async def get_history_paper(self, session_id: str, paper_id: str) -> Optional[Di
             "content": content,
             "outline": outline,
         }
+
+    @staticmethod
+    def _format_reference_review_entry(label: str, critique: Any) -> str:
+        """Render one critique as '<label> <model_id> N<novelty>/10 C<correctness>/10 I<impact>/10'."""
+        return (
+            f"{label} {critique.model_id} "
+            f"N{critique.novelty_rating}/10 "
+            f"C{critique.correctness_rating}/10 "
+            f"I{critique.impact_rating}/10"
+        )
+
+    async def get_reference_title_display(self, paper_id: str, title: str) -> str:
+        """
+        Build a compact title string that includes reference-review ratings.
+
+        Shows the initial system auto-critique when available, plus the latest
+        four non-system critique runs. Legacy critique files created before
+        critique_source existed fall back to treating the oldest critique as the
+        initial run. NOTE(review): assumes get_critiques returns newest-first.
+        """
+        from backend.shared.critique_memory import get_critiques
+
+        critiques = await get_critiques(
+            paper_type="autonomous_paper",
+            paper_id=paper_id,
+            base_dir=self._base_dir,
+        )
+        if not critiques:
+            return title
+
+        explicit_system = next(
+            (
+                critique
+                for critique in reversed(critiques)
+                if getattr(critique, "critique_source", "unknown") == "system_auto"
+            ),
+            None,
+        )
+        initial_run = explicit_system or critiques[-1]
+        # Identity (not critique_id) marks the initial run, so records without an id still match.
+        initial_label = "System initial:" if explicit_system else "Initial run:"
+
+        review_entries = [self._format_reference_review_entry(initial_label, initial_run)]
+
+        user_runs = []
+        for critique in critiques:
+            if critique is initial_run:
+                continue
+            if getattr(critique, "critique_source", "unknown") == "system_auto":
+                continue
+            user_runs.append(critique)
+            if len(user_runs) >= 4:
+                break
+
+        for idx, critique in enumerate(user_runs, start=1):
+            review_entries.append(
+                self._format_reference_review_entry(f"User#{idx}:", critique)
+            )
+
+        return f"{title} [Validator reviews: {' | '.join(review_entries)}]"
     
     # ========================================================================
     # CONTENT VALIDATION
@@ -709,7 +773,8 @@ async def get_papers_summary(self) -> List[Dict[str, Any]]:
         Returns minimal metadata without full content.
         
         Returns:
-            List of dicts with paper_id, title, abstract, outline, word_count, source_brainstorm_ids, created_at
+            List of dicts with paper_id, title, reference_title_display, abstract,
+            outline, word_count, source_brainstorm_ids, created_at
         """
         return await self.get_all_papers_with_outlines()
     
@@ -719,7 +784,8 @@ async def get_all_papers_with_outlines(self) -> List[Dict[str, Any]]:
         Used for Tier 3 reference selection.
         
         Returns:
-            List of dicts with paper_id, title, abstract, outline, word_count, source_brainstorm_ids
+            List of dicts with paper_id, title, reference_title_display, abstract,
+            outline, word_count, source_brainstorm_ids
         """
         papers = await self.get_all_papers(validate_completeness=True)
         
@@ -727,10 +793,15 @@ async def get_all_papers_with_outlines(self) -> List[Dict[str, Any]]:
         for paper in papers:
             # Fetch outline for this paper
             outline = await self.get_outline(paper.paper_id)
+            reference_title_display = await self.get_reference_title_display(
+                paper.paper_id,
+                paper.title,
+            )
             
             summaries.append({
                 "paper_id": paper.paper_id,
                 "title": paper.title,
+                "reference_title_display": reference_title_display,
                 "abstract": paper.abstract,
                 "outline": outline,  # NEW: Include outline
                 "word_count": paper.word_count,
diff --git a/backend/autonomous/memory/research_metadata.py b/backend/autonomous/memory/research_metadata.py
index c801537..c24a450 100644
--- a/backend/autonomous/memory/research_metadata.py
+++ b/backend/autonomous/memory/research_metadata.py
@@ -223,6 +223,7 @@ def _get_default_workflow_state(self) -> Dict[str, Any]:
             "current_tier": None,  # "tier1_aggregation", "tier2_paper_writing", or "tier3_final_answer"
             "current_topic_id": None,
             "current_paper_id": None,
+            "current_paper_title": None,
             "paper_phase": None,  # "body", "conclusion", "introduction", "abstract"
             "acceptance_count": 0,
             "rejection_count": 0,
@@ -437,7 +438,7 @@ async def register_paper(self, metadata: PaperMetadata) -> None:
             # Update stats
             self._stats["total_papers_completed"] = sum(
                 1 for p in self._data.get("papers", [])
-                if p.get("status") != "archived"
+                if p.get("status") == "complete"
             )
             self._stats["current_paper_id"] = metadata.paper_id
             await self._save_stats()
@@ -485,7 +486,7 @@ async def get_all_papers_summary(self) -> List[Dict[str, Any]]:
         await self._ensure_initialized()
         return [
             p for p in self._data.get("papers", [])
-            if p.get("status") != "archived"
+            if p.get("status") == "complete"
         ]
     
     async def get_brainstorm_entry(self, topic_id: str) -> Optional[Dict[str, Any]]:
@@ -510,7 +511,7 @@ async def get_papers_by_brainstorm(self, topic_id: str) -> List[Dict[str, Any]]:
         return [
             p for p in self._data.get("papers", [])
             if topic_id in p.get("source_brainstorm_ids", [])
-            and p.get("status") != "archived"
+            and p.get("status") == "complete"
         ]
     
     # ========================================================================
@@ -632,7 +633,7 @@ async def delete_paper(self, paper_id: str) -> bool:
                 # Update stats
                 self._stats["total_papers_completed"] = sum(
                     1 for p in self._data.get("papers", [])
-                    if p.get("status") != "archived"
+                    if p.get("status") == "complete"
                 )
                 self._stats["total_papers_archived"] = sum(
                     1 for p in self._data.get("papers", [])
diff --git a/backend/autonomous/prompts/completion_prompts.py b/backend/autonomous/prompts/completion_prompts.py
index f9a6d10..8ac3c59 100644
--- a/backend/autonomous/prompts/completion_prompts.py
+++ b/backend/autonomous/prompts/completion_prompts.py
@@ -25,17 +25,9 @@ def get_completion_review_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -123,17 +115,9 @@ def get_completion_self_validation_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
diff --git a/backend/autonomous/prompts/final_answer_prompts.py b/backend/autonomous/prompts/final_answer_prompts.py
index a8ba969..72bf2f4 100644
--- a/backend/autonomous/prompts/final_answer_prompts.py
+++ b/backend/autonomous/prompts/final_answer_prompts.py
@@ -12,6 +12,8 @@
 """
 from typing import List, Dict, Any
 
+from backend.autonomous.prompts.paper_reference_prompts import get_reference_title_text
+
 
 # ============================================================================
 # PHASE 1: CERTAINTY ASSESSMENT PROMPTS
@@ -33,17 +35,9 @@ def get_certainty_assessment_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -133,17 +127,9 @@ def get_certainty_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -207,17 +193,9 @@ def get_format_selection_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -293,17 +271,9 @@ def get_format_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -365,17 +335,9 @@ def get_final_paper_title_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -440,17 +402,9 @@ def get_volume_organization_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -593,17 +547,9 @@ def get_volume_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -991,7 +937,7 @@ def build_final_paper_title_prompt(
     
     parts.append("REFERENCE PAPERS (informing the answer):\n")
     for p in selected_references:
-        parts.append(f"- {p.get('title')}\n")
+        parts.append(f"- {get_reference_title_text(p)}\n")
     
     parts.append("\n---\n")
     parts.append("Select a title that DIRECTLY ANSWERS the user's question (respond as JSON):")
diff --git a/backend/autonomous/prompts/paper_continuation_prompts.py b/backend/autonomous/prompts/paper_continuation_prompts.py
index 430f7d9..93420e5 100644
--- a/backend/autonomous/prompts/paper_continuation_prompts.py
+++ b/backend/autonomous/prompts/paper_continuation_prompts.py
@@ -26,17 +26,9 @@ def get_continuation_decision_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -119,10 +111,7 @@ def get_continuation_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to verify claims and access current mathematical literature.
-
----
+---
 
 YOUR TASK:
 Validate whether the proposed continuation decision is the best use of research resources.
diff --git a/backend/autonomous/prompts/paper_redundancy_prompts.py b/backend/autonomous/prompts/paper_redundancy_prompts.py
index 944ed54..eb57753 100644
--- a/backend/autonomous/prompts/paper_redundancy_prompts.py
+++ b/backend/autonomous/prompts/paper_redundancy_prompts.py
@@ -24,17 +24,9 @@ def get_paper_redundancy_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
diff --git a/backend/autonomous/prompts/paper_reference_prompts.py b/backend/autonomous/prompts/paper_reference_prompts.py
index 97eb372..19bbb11 100644
--- a/backend/autonomous/prompts/paper_reference_prompts.py
+++ b/backend/autonomous/prompts/paper_reference_prompts.py
@@ -16,12 +16,17 @@
 from typing import List, Dict, Any
 
 
-def get_pre_brainstorm_expansion_system_prompt() -> str:
+def get_reference_title_text(paper: Dict[str, Any]) -> str:
+    """Get the display title for a reference paper, including validator context when available."""
+    return paper.get("reference_title_display") or paper.get("title", "N/A")
+
+
+def get_pre_brainstorm_expansion_system_prompt(max_papers: int) -> str:
     """
     Get system prompt for PRE-BRAINSTORM reference expansion request.
     This is the crucial mechanism for compounding knowledge across research cycles.
     """
-    return """You are selecting reference papers to inform your upcoming BRAINSTORM EXPLORATION. Your role is to:
+    return f"""You are selecting reference papers to inform your upcoming BRAINSTORM EXPLORATION. Your role is to:
 
 1. Review your brainstorm topic that you will explore
 2. Review titles and abstracts of existing papers in the library
@@ -38,17 +43,9 @@ def get_pre_brainstorm_expansion_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -74,7 +71,7 @@ def get_pre_brainstorm_expansion_system_prompt() -> str:
 2. Proceed WITHOUT references (none meet the "very useful" threshold)
 
 IMPORTANT CONSTRAINTS:
-- You can select up to 6 papers maximum
+- You can select up to {max_papers} papers maximum
 - These papers will be available during your entire brainstorm exploration
 - The same papers will also be available during paper writing
 - Quality over quantity - only select papers you genuinely need
@@ -87,11 +84,11 @@ def get_pre_brainstorm_expansion_system_prompt() -> str:
 Output your decision ONLY as JSON in the required format."""
 
 
-def get_additional_reference_expansion_system_prompt() -> str:
+def get_additional_reference_expansion_system_prompt(max_total_papers: int) -> str:
     """
     Get system prompt for ADDITIONAL reference expansion request (before paper writing).
     """
-    return """You are selecting ADDITIONAL reference papers for your upcoming paper compilation. Your role is to:
+    return f"""You are selecting ADDITIONAL reference papers for your upcoming paper compilation. Your role is to:
 
 1. Review your completed brainstorm database
 2. Review titles and abstracts of papers NOT YET selected
@@ -108,17 +105,9 @@ def get_additional_reference_expansion_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -141,7 +130,7 @@ def get_additional_reference_expansion_system_prompt() -> str:
 2. Proceed WITHOUT additional references (already selected papers are sufficient)
 
 IMPORTANT CONSTRAINTS:
-- Check how many slots remain (max 6 total including already selected)
+- Check how many slots remain (max {max_total_papers} total including already selected)
 - Already selected papers WILL be kept - you're only adding new ones
 - Quality over quantity - only add genuinely useful papers
 
@@ -153,9 +142,9 @@ def get_additional_reference_expansion_system_prompt() -> str:
 Output your decision ONLY as JSON in the required format."""
 
 
-def get_reference_expansion_system_prompt() -> str:
+def get_reference_expansion_system_prompt(max_papers: int = 6) -> str:
     """Get system prompt for reference expansion request (Step 1: abstracts only)."""
-    return """You are selecting reference papers for an upcoming mathematical research paper. Your role is to:
+    return f"""You are selecting reference papers for an upcoming mathematical research paper. Your role is to:
 
 1. Review your brainstorm topic and database
 2. Review titles and abstracts of existing papers in the library
@@ -172,17 +161,9 @@ def get_reference_expansion_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -199,7 +180,7 @@ def get_reference_expansion_system_prompt() -> str:
 2. Proceed WITHOUT references (none meet the "very useful" threshold)
 
 IMPORTANT CONSTRAINTS:
-- In the final selection (next step), you can only select up to 6 papers
+- In the final selection (next step), you can only select up to {max_papers} papers
 - You can request to expand as many papers as you want to review
 - Only request expansion for papers that genuinely might be "very useful"
 
@@ -242,13 +223,13 @@ def get_reference_expansion_json_schema() -> str:
 }"""
 
 
-def get_reference_selection_system_prompt() -> str:
+def get_reference_selection_system_prompt(max_papers: int) -> str:
     """Get system prompt for final reference selection (Step 2: full papers)."""
-    return """You are making your FINAL SELECTION of reference papers for an upcoming mathematical research paper. Your role is to:
+    return f"""You are making your FINAL SELECTION of reference papers for an upcoming mathematical research paper. Your role is to:
 
 1. Review your brainstorm topic and database
 2. Review the FULL CONTENT of the papers you requested to expand
-3. Select which papers (up to 6) will be used as references during paper writing
+3. Select which papers (up to {max_papers}) will be used as references during paper writing
 
 ⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
 
@@ -261,22 +242,14 @@ def get_reference_selection_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
 YOUR TASK:
-Make your final selection of reference papers (maximum 6) that will be included in your context during paper compilation.
+Make your final selection of reference papers (maximum {max_papers}) that will be included in your context during paper compilation.
 
 SELECTION CRITERIA:
 - Papers that provide essential mathematical background
@@ -285,7 +258,7 @@ def get_reference_selection_system_prompt() -> str:
 - Papers that present related results you'll reference or extend
 
 CONSTRAINT:
-- Maximum 6 papers can be selected (hard limit for context budget)
+- Maximum {max_papers} papers can be selected (hard limit for context budget)
 - These papers will be RAG'd during paper compilation
 - Your brainstorm database has higher direct injection priority
 
@@ -297,30 +270,31 @@ def get_reference_selection_system_prompt() -> str:
 Output your selection ONLY as JSON in the required format."""
 
 
-def get_reference_selection_json_schema() -> str:
+def get_reference_selection_json_schema(max_papers: int) -> str:
     """Get JSON schema for final reference selection."""
-    return """REQUIRED JSON FORMAT:
-{
-  "selected_papers": ["array of up to 6 paper_ids"],
+    return f"""REQUIRED JSON FORMAT:
+{{
+  "selected_papers": ["array of up to {max_papers} paper_ids"],
   "reasoning": "string - Why these specific papers are very useful for the upcoming paper"
-}
+}}
 
 FIELD REQUIREMENTS:
-- selected_papers: Array of paper IDs (maximum 6, can be empty)
+- selected_papers: Array of paper IDs (maximum {max_papers}, can be empty)
 - reasoning: ALWAYS required
 
 EXAMPLE:
-{
+{{
   "selected_papers": ["paper_003", "paper_007", "paper_011"],
   "reasoning": "After reviewing full content, these three papers provide the most useful reference material: Paper 003 establishes the class field theory foundation needed for our reciprocity discussions. Paper 007's treatment of Galois representations will inform our theoretical sections. Paper 011's computational examples of modular forms will enhance our practical demonstrations. The other expanded papers, while relevant, overlap too much with our brainstorm content or cover tangential topics."
-}"""
+}}"""
 
 
 def build_pre_brainstorm_expansion_prompt(
     user_research_prompt: str,
     topic_prompt: str,
     brainstorm_summary: str,
-    papers_with_abstracts: List[Dict[str, Any]]
+    papers_with_abstracts: List[Dict[str, Any]],
+    max_papers: int
 ) -> str:
     """
     Build the PRE-BRAINSTORM reference expansion prompt.
@@ -336,7 +310,7 @@ def build_pre_brainstorm_expansion_prompt(
         Complete prompt string
     """
     parts = [
-        get_pre_brainstorm_expansion_system_prompt(),
+        get_pre_brainstorm_expansion_system_prompt(max_papers),
         "\n---\n",
         get_reference_expansion_json_schema(),
         "\n---\n",
@@ -351,7 +325,7 @@ def build_pre_brainstorm_expansion_prompt(
         parts.append("EXISTING PAPERS IN LIBRARY (select references to inform your brainstorm):\n")
         for p in papers_with_abstracts:
             parts.append(f"\n--- Paper ID: {p.get('paper_id', 'Unknown')} ---")
-            parts.append(f"\nTitle: {p.get('title', 'N/A')}")
+            parts.append(f"\nTitle: {get_reference_title_text(p)}")
             parts.append(f"\nAbstract: {p.get('abstract', 'N/A')}")
             
             # NEW: Display outline
@@ -381,7 +355,9 @@ def build_additional_reference_expansion_prompt(
     topic_prompt: str,
     brainstorm_summary: str,
     papers_with_abstracts: List[Dict[str, Any]],
-    already_selected: List[str]
+    already_selected: List[str],
+    already_selected_papers: List[Dict[str, Any]],
+    max_total_papers: int
 ) -> str:
     """
     Build the ADDITIONAL reference expansion prompt (before paper writing).
@@ -396,10 +372,10 @@ def build_additional_reference_expansion_prompt(
     Returns:
         Complete prompt string
     """
-    remaining_slots = 6 - len(already_selected)
+    remaining_slots = max(0, max_total_papers - len(already_selected))
     
     parts = [
-        get_additional_reference_expansion_system_prompt(),
+        get_additional_reference_expansion_system_prompt(max_total_papers),
         "\n---\n",
         get_reference_expansion_json_schema(),
         "\n---\n",
@@ -413,7 +389,13 @@ def build_additional_reference_expansion_prompt(
     ]
     
     # Show already selected papers
-    if already_selected:
+    if already_selected_papers:
+        for paper in already_selected_papers:
+            parts.append(
+                f"  - {paper.get('paper_id', 'Unknown')}: "
+                f"{get_reference_title_text(paper)}\n"
+            )
+    elif already_selected:
         for paper_id in already_selected:
             parts.append(f"  - {paper_id}\n")
     else:
@@ -426,7 +408,7 @@ def build_additional_reference_expansion_prompt(
         parts.append(f"ADDITIONAL PAPERS AVAILABLE FOR SELECTION (can add up to {remaining_slots} more):\n")
         for p in papers_with_abstracts:
             parts.append(f"\n--- Paper ID: {p.get('paper_id', 'Unknown')} ---")
-            parts.append(f"\nTitle: {p.get('title', 'N/A')}")
+            parts.append(f"\nTitle: {get_reference_title_text(p)}")
             parts.append(f"\nAbstract: {p.get('abstract', 'N/A')}")
             
             # NEW: Display outline
@@ -455,7 +437,8 @@ def build_reference_expansion_prompt(
     user_research_prompt: str,
     topic_prompt: str,
     brainstorm_summary: str,
-    papers_with_abstracts: List[Dict[str, Any]]
+    papers_with_abstracts: List[Dict[str, Any]],
+    max_papers: int = 6
 ) -> str:
     """
     Build the reference expansion prompt (Step 1: abstracts only).
@@ -472,7 +455,7 @@ def build_reference_expansion_prompt(
         Complete prompt string
     """
     parts = [
-        get_reference_expansion_system_prompt(),
+        get_reference_expansion_system_prompt(max_papers),
         "\n---\n",
         get_reference_expansion_json_schema(),
         "\n---\n",
@@ -489,7 +472,7 @@ def build_reference_expansion_prompt(
         parts.append("EXISTING PAPERS IN LIBRARY (Titles, Abstracts, and Outlines):\n")
         for p in papers_with_abstracts:
             parts.append(f"\n--- Paper ID: {p.get('paper_id', 'Unknown')} ---")
-            parts.append(f"\nTitle: {p.get('title', 'N/A')}")
+            parts.append(f"\nTitle: {get_reference_title_text(p)}")
             parts.append(f"\nAbstract: {p.get('abstract', 'N/A')}")
             
             # NEW: Display outline
@@ -535,21 +518,10 @@ def build_reference_selection_prompt(
     Returns:
         Complete prompt string
     """
-    # Customize system prompt based on mode
-    if mode == "initial":
-        system_intro = """You are making your FINAL SELECTION of reference papers for your upcoming BRAINSTORM EXPLORATION.
-
-These papers will be available during your ENTIRE brainstorm exploration AND paper writing phase.
-This enables compounding knowledge - build upon established frameworks and avoid redundant exploration."""
-    else:
-        system_intro = """You are making your FINAL SELECTION of ADDITIONAL reference papers for paper compilation.
-
-These papers will be added to your existing references for paper writing."""
-    
     parts = [
-        get_reference_selection_system_prompt(),
+        get_reference_selection_system_prompt(max_papers),
         "\n---\n",
-        get_reference_selection_json_schema(),
+        get_reference_selection_json_schema(max_papers),
         "\n---\n",
         f"MODE: {mode.upper()} SELECTION",
         "\n---\n",
@@ -566,7 +538,7 @@ def build_reference_selection_prompt(
     for p in expanded_papers:
         parts.append(f"\n{'=' * 60}")
         parts.append(f"\nPaper ID: {p.get('paper_id', 'Unknown')}")
-        parts.append(f"\nTitle: {p.get('title', 'N/A')}")
+        parts.append(f"\nTitle: {get_reference_title_text(p)}")
         parts.append(f"\nWord Count: {p.get('word_count', 0)}")
         parts.append(f"\n{'=' * 60}")
         
diff --git a/backend/autonomous/prompts/paper_title_prompts.py b/backend/autonomous/prompts/paper_title_prompts.py
index 9f8b2d2..fa25fc3 100644
--- a/backend/autonomous/prompts/paper_title_prompts.py
+++ b/backend/autonomous/prompts/paper_title_prompts.py
@@ -3,14 +3,17 @@
 """
 from typing import List, Dict, Any
 
+from backend.autonomous.prompts.paper_reference_prompts import get_reference_title_text
+
 
 def get_paper_title_system_prompt() -> str:
     """Get system prompt for paper title selection."""
     return """You are selecting a title for a mathematical research paper. Your role is to:
 
 1. Review your brainstorm topic and database content
-2. Review any existing papers generated from this brainstorm (if any)
-3. Select an appropriate, descriptive title for the new paper
+2. Review any selected reference papers informing this paper (if any)
+3. Review any existing papers generated from this brainstorm (if any)
+4. Select an appropriate, descriptive title for the new paper
 
 ⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
 
@@ -23,22 +26,14 @@ def get_paper_title_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
 YOUR TASK:
-Choose a title that accurately captures the mathematical content of your brainstorm.
+Choose a title that accurately captures the mathematical content and scope of the planned paper.
 
 IMPORTANT CLARIFICATION:
 - The brainstorm submissions are the SOURCE MATERIAL for your paper
@@ -94,8 +89,9 @@ def get_paper_title_validator_system_prompt() -> str:
 
 1. Review the proposed title
 2. Review the brainstorm content the paper will be based on
-3. Review any EXISTING COMPLETED PAPERS from the same brainstorm (if any)
-4. Decide if the title is appropriate
+3. Review any selected reference papers informing the paper (if any)
+4. Review any EXISTING COMPLETED PAPERS from the same brainstorm (if any)
+5. Decide if the title is appropriate
 
 ⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
 
@@ -108,17 +104,9 @@ def get_paper_title_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -145,6 +133,7 @@ def get_paper_title_validator_system_prompt() -> str:
 
 ACCEPT the title if:
 - It accurately represents the brainstorm content (this is EXPECTED - the paper is based on the brainstorm!)
+- It remains consistent with the paper's intended scope when selected reference papers are present
 - It is appropriately specific (not too broad or narrow)
 - It differentiates from EXISTING COMPLETED PAPERS from the same brainstorm (if any exist)
 - It follows mathematical paper title conventions
@@ -230,9 +219,13 @@ def build_paper_title_prompt(
     
     # Add selected reference papers if any
     if reference_papers:
-        parts.append("SELECTED REFERENCE PAPERS:\n")
+        parts.append("SELECTED REFERENCE PAPERS (inform this paper's scope and title):\n")
         for p in reference_papers:
-            parts.append(f"\n- {p.get('title', 'N/A')}")
+            abstract = p.get("abstract", "N/A")
+            if isinstance(abstract, str) and len(abstract) > 220:
+                abstract = abstract[:220] + "..."
+            parts.append(f"\n- {p.get('paper_id', 'N/A')}: {get_reference_title_text(p)}")
+            parts.append(f"\n  Abstract: {abstract}")
         parts.append("\n---\n")
     
     # Inject validated candidate titles from exploration phase
@@ -265,7 +258,8 @@ def build_paper_title_validation_prompt(
     brainstorm_summary: str,
     existing_papers_from_brainstorm: List[Dict[str, Any]],
     proposed_title: str,
-    title_reasoning: str
+    title_reasoning: str,
+    reference_papers: List[Dict[str, Any]] = None
 ) -> str:
     """
     Build the paper title validation prompt.
@@ -277,6 +271,7 @@ def build_paper_title_validation_prompt(
         existing_papers_from_brainstorm: Papers already created from this brainstorm
         proposed_title: The proposed paper title
         title_reasoning: The reasoning provided for the title
+        reference_papers: Selected reference papers informing the paper's scope
     
     Returns:
         Complete prompt string
@@ -303,6 +298,16 @@ def build_paper_title_validation_prompt(
         parts.append("\n---\n")
     else:
         parts.append("EXISTING PAPERS FROM THIS BRAINSTORM: None\n---\n")
+
+    if reference_papers:
+        parts.append("SELECTED REFERENCE PAPERS:\n")
+        for p in reference_papers:
+            abstract = p.get("abstract", "N/A")
+            if isinstance(abstract, str) and len(abstract) > 220:
+                abstract = abstract[:220] + "..."
+            parts.append(f"\n- {p.get('paper_id', 'N/A')}: {get_reference_title_text(p)}")
+            parts.append(f"\n  Abstract: {abstract}")
+        parts.append("\n---\n")
     
     # Add proposed title
     parts.append("PROPOSED TITLE:\n")
diff --git a/backend/autonomous/prompts/topic_prompts.py b/backend/autonomous/prompts/topic_prompts.py
index 69b3223..449fef2 100644
--- a/backend/autonomous/prompts/topic_prompts.py
+++ b/backend/autonomous/prompts/topic_prompts.py
@@ -24,17 +24,9 @@ def get_topic_selection_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -144,17 +136,9 @@ def get_topic_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
diff --git a/backend/autonomous/validation/paper_redundancy_checker.py b/backend/autonomous/validation/paper_redundancy_checker.py
index 408294f..276e827 100644
--- a/backend/autonomous/validation/paper_redundancy_checker.py
+++ b/backend/autonomous/validation/paper_redundancy_checker.py
@@ -50,7 +50,7 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
-        return f"auto_prc_{self.task_sequence:03d}"
+        return f"agg_val_{self.task_sequence:03d}"  # NOTE(review): prefix changed from "auto_prc_" - confirm these IDs cannot collide with another component that also emits "agg_val_NNN"
     
     async def check_redundancy(
         self,
diff --git a/backend/compiler/agents/high_context_submitter.py b/backend/compiler/agents/high_context_submitter.py
index b7c5f10..35ff23d 100644
--- a/backend/compiler/agents/high_context_submitter.py
+++ b/backend/compiler/agents/high_context_submitter.py
@@ -594,10 +594,7 @@ async def submit_construction(
             # Check for empty response
             if not response.get("choices") or not response["choices"][0].get("message"):
                 logger.error("construction: LLM returned empty response structure")
-                # Notify task completed (failed but still completed)
-                if self.task_tracking_callback:
-                    self.task_tracking_callback("completed", task_id)
-                return None
+                raise ValueError("LLM returned empty response")
             
             # Extract content from either 'content' or 'reasoning' field
             # Some reasoning models (e.g., DeepSeek R1, certain GPT variants) output JSON in 'reasoning' field
@@ -723,7 +720,7 @@ async def submit_construction(
                 self.task_tracking_callback("completed", task_id)
             return None
     
-    async def submit_review(self) -> Optional[CompilerSubmission]:
+    async def submit_review(self, review_focus: str = "general") -> Optional[CompilerSubmission]:
         """
         Submit paper review (or no-op if no edit needed).
         
@@ -735,7 +732,7 @@ async def submit_review(self) -> Optional[CompilerSubmission]:
         Returns:
             CompilerSubmission if edit needed, None otherwise
         """
-        logger.info("Starting paper review for errors/improvements...")
+        logger.info(f"Starting paper review for errors/improvements (focus={review_focus})...")
         
         try:
             # Get current outline and paper (NO aggregator DB context for this mode)
@@ -754,7 +751,8 @@ async def submit_review(self) -> Optional[CompilerSubmission]:
             prompt = await build_review_prompt(
                 user_prompt=self.user_prompt,
                 current_outline=current_outline,  # ALWAYS fully injected
-                current_paper=paper_for_llm
+                current_paper=paper_for_llm,
+                review_focus=review_focus
             )
             logger.info(f"Prompt built: {len(prompt)} chars")
             
@@ -789,6 +787,12 @@ async def submit_review(self) -> Optional[CompilerSubmission]:
                 temperature=0.0,  # Deterministic generation - evolving context provides diversity
                 max_tokens=system_config.compiler_high_context_max_output_tokens  # User-configurable (outline creation, update, construction, review)
             )
+            
+            # Check for empty response
+            if not response.get("choices") or not response["choices"][0].get("message"):
+                logger.error("review: LLM returned empty response structure")
+                raise ValueError("LLM returned empty response")
+            
             # Extract content from either 'content' or 'reasoning' field
             # Some reasoning models (e.g., DeepSeek R1, certain GPT variants) output JSON in 'reasoning' field
             message = response["choices"][0]["message"]
@@ -844,7 +848,10 @@ async def submit_review(self) -> Optional[CompilerSubmission]:
                 old_string=_normalize_string_field(data.get("old_string", "")),
                 new_string=new_string_content,  # Already normalized above
                 reasoning=data.get("reasoning", ""),
-                metadata={"is_minuscule": is_minuscule}
+                metadata={
+                    "is_minuscule": is_minuscule,
+                    "review_focus": review_focus
+                }
             )
             
             # Notify task completed successfully
diff --git a/backend/compiler/agents/high_param_submitter.py b/backend/compiler/agents/high_param_submitter.py
index 2d9b630..745cda8 100644
--- a/backend/compiler/agents/high_param_submitter.py
+++ b/backend/compiler/agents/high_param_submitter.py
@@ -252,6 +252,9 @@ async def _step1_planning(self) -> Optional[dict]:
         )
         
         # Extract content
+        if not response.get("choices") or not response["choices"][0].get("message"):
+            logger.error("Step 1: LLM returned empty response structure")
+            raise ValueError("LLM returned empty response")
         message = response["choices"][0]["message"]
         llm_output = message.get("content") or message.get("reasoning") or ""
         logger.info(f"Step 1: LLM completion received - {len(llm_output)} chars")
@@ -405,6 +408,9 @@ async def _step2_standard_execution(
             )
             
             # Extract content
+            if not response.get("choices") or not response["choices"][0].get("message"):
+                logger.error("Step 2: LLM returned empty response structure")
+                raise ValueError("LLM returned empty response")
             message = response["choices"][0]["message"]
             llm_output = message.get("content") or message.get("reasoning") or ""
             logger.info(f"Step 2: LLM completion received - {len(llm_output)} chars")
@@ -606,6 +612,9 @@ async def _step2_wolfram_execution(
             )
             
             # Extract content
+            if not response.get("choices") or not response["choices"][0].get("message"):
+                logger.error("Step 2 (Wolfram): LLM returned empty response structure")
+                raise ValueError("LLM returned empty response")
             message = response["choices"][0]["message"]
             llm_output = message.get("content") or message.get("reasoning") or ""
             logger.info(f"Step 2 (Wolfram): LLM completion received - {len(llm_output)} chars")
diff --git a/backend/compiler/core/compiler_coordinator.py b/backend/compiler/core/compiler_coordinator.py
index 6224e27..66e15da 100644
--- a/backend/compiler/core/compiler_coordinator.py
+++ b/backend/compiler/core/compiler_coordinator.py
@@ -17,6 +17,7 @@
 from backend.shared.workflow_predictor import workflow_predictor
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.free_model_manager import free_model_manager
 from backend.shared.json_parser import parse_json
 from backend.shared.utils import count_tokens
 from backend.compiler.agents.high_context_submitter import HighContextSubmitter
@@ -574,6 +575,9 @@ async def start(self) -> None:
         self.is_running = True
         logger.info("Starting compiler...")
         
+        # Reset free model manager state for fresh start
+        free_model_manager.reset()
+        
         # Refresh workflow predictions at start
         await self.refresh_workflow_predictions()
         
@@ -668,29 +672,15 @@ async def _main_workflow(self) -> None:
         except asyncio.CancelledError:
             logger.info("Compiler workflow cancelled")
         except FreeModelExhaustedError as e:
-            if e.soonest_retry:
-                wait_secs = max(0, e.soonest_retry - time.time())
-                wait_mins = round(wait_secs / 60, 1)
-                logger.warning(
-                    f"SERIAL BOTTLENECK: Compiler paused for {wait_mins} minutes "
-                    f"(all free models rate-limited)"
-                )
-                await self._broadcast("serial_bottleneck_paused", {
-                    "role_id": "compiler",
-                    "model": str(e),
-                    "wait_seconds": round(wait_secs),
-                    "resume_at": time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(e.soonest_retry)),
-                })
-                await asyncio.sleep(wait_secs)
-                await self._broadcast("serial_bottleneck_resumed", {"role_id": "compiler"})
-                if self.is_running:
-                    asyncio.create_task(self._main_workflow())
-            else:
-                logger.error(f"Compiler: all free models exhausted, no cooldown: {e}")
-                self.is_running = False
-                await self._broadcast("all_free_models_exhausted", {
-                    "message": f"All free models exhausted for compiler: {e}"
-                })
+            # All free models exhausted after retries - wait briefly and retry
+            logger.warning(f"Compiler: all free models exhausted: {e}")
+            await self._broadcast("free_models_exhausted", {
+                "role_id": "compiler",
+                "message": str(e),
+            })
+            await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
+            if self.is_running:
+                asyncio.create_task(self._main_workflow())
         except Exception as e:
             logger.error(f"Compiler workflow error: {e}", exc_info=True)
             self.is_running = False
@@ -1150,6 +1140,7 @@ async def _rigor_loop(self) -> None:
     
     # Maximum retries for premature decline/completion rejections
     MAX_PREMATURE_RETRIES = 5
+    PRE_ABSTRACT_RED_TEAM_MAX_PASSES = 2
     
     async def _submit_and_validate_construction(self, rejection_feedback: Optional[str] = None, retry_count: int = 0) -> Tuple[bool, Optional[str]]:
         """
@@ -1310,7 +1301,6 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                     self.construction_rejections += 1
                     
                     # Log as rejection
-                    from backend.shared.models import CompilerValidationResult
                     rejection_result = CompilerValidationResult(
                         submission_id=str(uuid.uuid4()),
                         decision="reject",
@@ -1393,7 +1383,6 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                     logger.warning(f"Rejecting empty phase completion: {rejection_reason}")
                     self.construction_rejections += 1
                     
-                    from backend.shared.models import CompilerValidationResult
                     rejection_result = CompilerValidationResult(
                         submission_id=str(uuid.uuid4()),
                         decision="reject",
@@ -1501,7 +1490,6 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                 self.construction_rejections += 1
                 
                 # Create emergency rejection
-                from backend.shared.models import CompilerValidationResult
                 emergency_result = CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
@@ -1709,7 +1697,6 @@ async def _submit_and_validate_outline_update(self) -> bool:
                 self.outline_rejections += 1
                 
                 # Create emergency rejection
-                from backend.shared.models import CompilerValidationResult
                 emergency_result = CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
@@ -1764,31 +1751,39 @@ async def _submit_and_validate_outline_update(self) -> bool:
             logger.info("Outline update rejected")
             return False
     
-    async def _submit_and_validate_review(self) -> bool:
+    async def _submit_and_validate_review(self, review_focus: str = "general") -> bool:
         """Submit and validate review. Returns True if accepted."""
         self.current_mode = "review"
+        review_label = "empirical red-team review" if review_focus == "empirical_red_team" else "review"
         
         submission = None
         try:
-            submission = await self.high_context_submitter.submit_review()
+            submission = await self.high_context_submitter.submit_review(review_focus=review_focus)
         except ValueError as e:
-            logger.error(f"Review context overflow: {e}")
+            logger.error(f"{review_label.capitalize()} context overflow: {e}")
             self.review_declines += 1
             await compiler_rejection_log.add_decline("review", f"Context overflow: {e}")
             await self._broadcast("compiler_decline", {
                 "mode": "review",
+                "review_focus": review_focus,
                 "reasoning": f"Context overflow: {e}"
             })
             return False
         
         if submission is None:
-            logger.info("No review edit needed")
+            logger.info(f"No {review_label} edit needed")
             self.review_declines += 1
-            await compiler_rejection_log.add_decline("review", "No errors or improvements needed")
+            decline_reason = (
+                "No fabricated experiments or unsupported metrics found"
+                if review_focus == "empirical_red_team"
+                else "No errors or improvements needed"
+            )
+            await compiler_rejection_log.add_decline("review", decline_reason)
             
             await self._broadcast("compiler_decline", {
                 "mode": "review",
-                "reasoning": "No errors or improvements needed"
+                "review_focus": review_focus,
+                "reasoning": decline_reason
             })
             
             return False
@@ -1801,7 +1796,8 @@ async def _submit_and_validate_review(self) -> bool:
         
         await self._broadcast("compiler_submission", {
             "mode": "review",
-            "submission_id": submission.submission_id
+            "submission_id": submission.submission_id,
+            "review_focus": review_focus
         })
         
         current_paper = await paper_memory.get_paper()
@@ -1826,7 +1822,6 @@ async def _submit_and_validate_review(self) -> bool:
                 self.review_rejections += 1
                 
                 # Create emergency rejection
-                from backend.shared.models import CompilerValidationResult
                 emergency_result = CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
@@ -1841,6 +1836,7 @@ async def _submit_and_validate_review(self) -> bool:
                 await self._broadcast("compiler_rejection", {
                     "mode": "review",
                     "submission_id": submission.submission_id,
+                    "review_focus": review_focus,
                     "reasoning": "Emergency rejection: exact string match failed"
                 })
                 
@@ -1860,7 +1856,8 @@ async def _submit_and_validate_review(self) -> bool:
             
             await self._broadcast("compiler_acceptance", {
                 "mode": "review",
-                "submission_id": submission.submission_id
+                "submission_id": submission.submission_id,
+                "review_focus": review_focus
             })
             
             await self._broadcast("paper_updated", {
@@ -1868,7 +1865,7 @@ async def _submit_and_validate_review(self) -> bool:
                 "preview": updated_paper[:500]
             })
             
-            logger.info(f"Review edit accepted ({word_count} words)")
+            logger.info(f"{review_label.capitalize()} edit accepted ({word_count} words)")
             return True
         else:
             self.review_rejections += 1
@@ -1878,17 +1875,63 @@ async def _submit_and_validate_review(self) -> bool:
             await self._broadcast("compiler_rejection", {
                 "mode": "review",
                 "submission_id": submission.submission_id,
+                "review_focus": review_focus,
                 "reasoning": result.reasoning
             })
             
-            logger.info("Review edit rejected")
+            logger.info(f"{review_label.capitalize()} edit rejected")
             return False
+
+    async def _run_pre_abstract_red_team_review(self) -> None:
+        """Run up to PRE_ABSTRACT_RED_TEAM_MAX_PASSES empirical red-team review passes before abstract writing, stopping early once a pass applies no edit."""
+        logger.info("=" * 80)
+        logger.info("STARTING PRE-ABSTRACT EMPIRICAL RED-TEAM REVIEW")
+        logger.info("=" * 80)
+
+        await self._broadcast("empirical_red_team_started", {
+            "phase": "pre_abstract",
+            "max_passes": self.PRE_ABSTRACT_RED_TEAM_MAX_PASSES
+        })
+
+        edits_applied = 0
+        passes_run = 0
+
+        for _ in range(self.PRE_ABSTRACT_RED_TEAM_MAX_PASSES):
+            if not self.is_running:  # compiler is no longer running; skip the remaining passes
+                break
+
+            passes_run += 1
+            accepted = await self._submit_and_validate_review(review_focus="empirical_red_team")
+            if not accepted:  # False means no edit was applied this pass (decline, submitter error, or rejection)
+                break
+            edits_applied += 1  # each accepted pass counts as one applied edit
+
+        await self._broadcast("empirical_red_team_complete", {
+            "phase": "pre_abstract",
+            "passes_run": passes_run,
+            "edits_applied": edits_applied
+        })
+
+        logger.info(
+            f"Pre-abstract empirical red-team review complete "
+            f"(passes={passes_run}, edits_applied={edits_applied})"
+        )
     
     async def _submit_and_validate_rigor(self) -> bool:
         """Submit and validate rigor enhancement. Returns True if accepted."""
         self.current_mode = "rigor"
         
-        submission = await self.high_param_submitter.submit_rigor_enhancement()
+        try:
+            submission = await self.high_param_submitter.submit_rigor_enhancement()
+        except ValueError as e:
+            logger.error(f"Rigor enhancement error: {e}")
+            self.rigor_declines += 1
+            await compiler_rejection_log.add_decline("rigor", f"LLM error: {e}")
+            await self._broadcast("compiler_decline", {
+                "mode": "rigor",
+                "reasoning": f"LLM error: {e}"
+            })
+            return False
         
         if submission is None:
             logger.info("No rigor enhancement needed")
@@ -1932,7 +1975,6 @@ async def _submit_and_validate_rigor(self) -> bool:
                 self.rigor_rejections += 1
                 
                 # Create emergency rejection
-                from backend.shared.models import CompilerValidationResult
                 emergency_result = CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
@@ -3568,6 +3610,9 @@ async def _check_phase_transition(self, section_complete: bool = False) -> bool:
             if not has_introduction:
                 logger.error("Cannot transition from introduction phase: No Introduction section found in paper")
                 return False  # Block transition
+
+            logger.info("Introduction complete - running pre-abstract empirical red-team review")
+            await self._run_pre_abstract_red_team_review()
             
             self.autonomous_section_phase = "abstract"
             logger.info("Phase transition: introduction → abstract (explicit section_complete)")
diff --git a/backend/compiler/prompts/construction_prompts.py b/backend/compiler/prompts/construction_prompts.py
index 2c279da..e4fdd54 100644
--- a/backend/compiler/prompts/construction_prompts.py
+++ b/backend/compiler/prompts/construction_prompts.py
@@ -13,6 +13,17 @@
 from backend.compiler.memory.compiler_rejection_log import compiler_rejection_log
 
 
+CONSTRUCTION_EMPIRICAL_PROVENANCE_RULES = """EMPIRICAL PROVENANCE RULES:
+- Classify substantive claims as one of: theoretical claim, literature claim, empirical claim, or artifact claim.
+- Theoretical claims must be supported by sound derivation, proof, or explicit assumptions inside the paper.
+- Literature claims must include explicit in-text citations identifying the external source.
+- Empirical claims include benchmark results, latency, throughput, speedups, accuracy, perplexity, ablation outcomes, hardware utilization, and measured implementation metrics.
+- Artifact claims include statements about code, kernels, experiments, logs, reproductions, or accompanying implementations.
+- Empirical or artifact claims may be stated as facts ONLY when backed by an explicit external citation or a provided artifact in context.
+- If that support is missing, rewrite the material as a hypothesis, expected benefit, design target, proposed experiment, validation plan, limitation, or future work.
+- NEVER invent citations, experiments, benchmark numbers, hardware measurements, datasets, or code artifacts."""
+
+
 # =============================================================================
 # PHASE-SPECIFIC CONSTRUCTION PROMPTS
 # =============================================================================
@@ -32,17 +43,11 @@ def get_body_construction_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + CONSTRUCTION_EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+ The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+ 
+ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -55,6 +60,13 @@ def get_body_construction_system_prompt() -> str:
 
 WHY BODY FIRST? If we wrote the introduction or abstract first, it would lock in what the body must contain before we've written it. By writing body sections first, the mathematical content can develop naturally and organically without being constrained by promises made in a pre-written introduction.
 
+SOURCE USAGE PRINCIPLE:
+- Treat the brainstorm/aggregator database as optional high-value source material and exploration history, not a mandatory checklist
+- Use it when it helps you produce the strongest rigorous paper for the user's prompt
+- You may synthesize beyond brainstorm/database material using sound mathematical reasoning
+- Do NOT force coverage of every source entry
+- Do NOT ignore clearly crucial source material for the scope you are writing
+
 CRITICAL - SYSTEM-MANAGED MARKERS (NOT YOUR OUTPUT):
 
 The paper uses placeholder markers that the SYSTEM adds automatically (you did NOT create these):
@@ -117,11 +129,12 @@ def get_body_construction_system_prompt() -> str:
 CRITICAL REQUIREMENTS:
 - Follow the outline structure for body sections
 - Build upon what's already written
-- Capture relevant content from the aggregator database
+- Use brainstorm/aggregator content when it helps, but you are not required to cover every source entry
 - Do not repeat content already in the document
 - Check for existing section headers before creating new ones
 - Write clear, rigorous mathematical exposition
 - ALL content must be rooted in sound mathematical reasoning
+- Unsupported empirical or artifact claims must be rewritten as hypotheses, validation plans, limitations, or future work instead of being asserted as completed results
 
 EXACT STRING MATCHING FOR EDITS:
 This system uses EXACT STRING MATCHING. To insert or modify content, you must:
@@ -214,17 +227,11 @@ def get_conclusion_construction_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + CONSTRUCTION_EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -306,6 +313,7 @@ def get_conclusion_construction_system_prompt() -> str:
 - Connections between results
 - Brief mention of limitations or open questions (optional)
 - Final remarks on the mathematical significance
+- If empirical validation was not actually supported, state the limitation plainly instead of summarizing unsupported benchmark claims as established fact
 
 CRITICAL - SECTION HEADER FORMAT:
 - Use EXACTLY "Conclusion" as the section header (NO Roman numeral prefix)
@@ -335,6 +343,7 @@ def get_conclusion_construction_system_prompt() -> str:
 - Summarize, don't introduce new material
 - Maintain coherent narrative flow from body to conclusion
 - Write clear, rigorous mathematical exposition
+- Do not convert unsupported empirical ideas into factual claims while summarizing
 
 EXACT STRING MATCHING FOR EDITS:
 This system uses EXACT STRING MATCHING. To replace the conclusion placeholder:
@@ -369,17 +378,11 @@ def get_introduction_construction_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
+""" + CONSTRUCTION_EMPIRICAL_PROVENANCE_RULES + """
 
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -497,6 +500,7 @@ def get_introduction_construction_system_prompt() -> str:
 - Describe results without full proofs
 - Set up the mathematical context
 - Make the reader want to continue reading
+- Do not promise empirical validation, benchmark numbers, or artifacts unless they are explicitly supported
 
 EXACT STRING MATCHING FOR EDITS:
 This system uses EXACT STRING MATCHING. To replace the introduction placeholder:
@@ -531,17 +535,11 @@ def get_abstract_construction_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + CONSTRUCTION_EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -630,6 +628,7 @@ def get_abstract_construction_system_prompt() -> str:
 - Key methods or approaches used
 - Significance of the results
 - Typically 150-300 words
+- Unsupported empirical claims must be reframed as expected benefits, proposed validation, or limitations rather than as verified outcomes
 
 CRITICAL - SECTION HEADER FORMAT:
 - Use EXACTLY "Abstract" as the section header (NO Roman numeral prefix)
@@ -659,6 +658,7 @@ def get_abstract_construction_system_prompt() -> str:
 - Be concise but comprehensive
 - State results, not just topics
 - Avoid technical jargon where possible
+- NEVER summarize unsupported benchmark numbers, hardware measurements, or code artifacts as if they were verified
 
 EXACT STRING MATCHING FOR EDITS:
 This system uses EXACT STRING MATCHING. To replace the abstract placeholder:
@@ -702,23 +702,17 @@ def get_construction_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + CONSTRUCTION_EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
 1. Review the current outline
 2. Review the current document progress (what's already written)
-3. Review the aggregator database
+3. Review any aggregator/brainstorm database evidence that seems useful
 4. Write the next logical portion of the document or expansion of a section
 
 CRITICAL - SECTION ORDER ENFORCEMENT:
@@ -744,12 +738,13 @@ def get_construction_system_prompt() -> str:
 CRITICAL REQUIREMENTS:
 - Follow the outline structure
 - Build upon what's already written
-- Capture relevant content from the aggregator database
+- Use brainstorm/aggregator content when it helps, but you are not required to cover every source entry
 - Maintain coherent narrative flow
 - Write clear, rigorous mathematical exposition
 - Do not repeat content already in the document
 - Check for existing section headers before creating new ones
 - ALL content must be rooted in sound mathematical reasoning
+- Unsupported empirical or artifact claims must be rewritten conservatively rather than asserted as established fact
 
 EXACT STRING MATCHING FOR EDITS:
 This system uses EXACT STRING MATCHING. To insert or modify content, you must:
@@ -1019,12 +1014,19 @@ async def build_construction_prompt(
         parts.append("TASK: Write the NEXT logical portion following the section order (body → conclusion → intro → abstract).")
     
     parts.append("\n---\n")
+    parts.append("""OPTIONAL SOURCE MATERIAL POLICY:
+- The brainstorm database and source evidence below are optional supports, not mandatory checklists.
+- Use them if they help you produce the strongest rigorous paper for the user's prompt.
+- You may synthesize beyond them using sound mathematical reasoning.
+- Do NOT force coverage of every source entry.
+""")
+    parts.append("\n---\n")
     
     if brainstorm_content:
-        parts.append(f"BRAINSTORM DATABASE (editable - you may propose corrections via brainstorm_operation):\n{brainstorm_content}")
+        parts.append(f"BRAINSTORM DATABASE (optional source material; editable via brainstorm_operation):\n{brainstorm_content}")
         parts.append("\n---\n")
     
-    parts.append(f"AGGREGATOR DATABASE EVIDENCE:\n{rag_evidence}")
+    parts.append(f"SOURCE DATABASE EVIDENCE (optional support - use if helpful):\n{rag_evidence}")
     parts.append("\n---\n")
     parts.append("Now generate your submission as JSON (remember to set section_complete appropriately):")
     
diff --git a/backend/compiler/prompts/critique_prompts.py b/backend/compiler/prompts/critique_prompts.py
index b2ebbf8..d5066fa 100644
--- a/backend/compiler/prompts/critique_prompts.py
+++ b/backend/compiler/prompts/critique_prompts.py
@@ -5,6 +5,17 @@
 from typing import Optional, Dict, List
 
 
+CRITIQUE_EMPIRICAL_PROVENANCE_RULES = """EMPIRICAL PROVENANCE RULES:
+- Classify substantive claims as one of: theoretical claim, literature claim, empirical claim, or artifact claim.
+- Theoretical claims must be supported by sound derivation, proof, or explicit assumptions inside the document.
+- Literature claims must identify the external source in-text.
+- Empirical claims include benchmark numbers, latency, throughput, speedups, accuracy, perplexity, hardware metrics, ablations, and measured outcomes.
+- Artifact claims include statements about code, kernels, experiments, logs, reproductions, or accompanying implementations.
+- Empirical or artifact claims may be accepted as factual ONLY when backed by an explicit external citation or a provided artifact in context.
+- If such support is absent, they should be criticized, removed, or rewritten as hypotheses, validation plans, expected benefits, limitations, or future work.
+- Never invent citations, experiments, benchmark numbers, hardware measurements, or code artifacts during critique or rewrite work."""
+
+
 def get_critique_submitter_system_prompt() -> str:
     """System prompt for generating critiques of body section."""
     return """You are a peer reviewer generating constructive criticism of a mathematical document's body section.
@@ -20,23 +31,23 @@ def get_critique_submitter_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
+""" + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
 
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous peer review feedback. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous peer review feedback. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
 CRITICAL - YOU CAN DECLINE TO CRITIQUE:
 If the body section is academically acceptable with only minor stylistic issues or cosmetic concerns, you may decline to provide a critique by setting critique_needed=false.
 
+SOURCE MATERIAL POLICY:
+- The aggregator/brainstorm database and reference papers are optional support for critique, not mandatory checklists
+- Do NOT critique solely because the body does not explicitly cover some source material
+- Do critique omitted material when the omission creates a genuine gap relative to the current outline, stated paper scope, or mathematical goals
+- Focus on whether the paper itself is strong, rigorous, and aligned, not on exhaustively mirroring source inputs
+
 ACADEMICALLY ACCEPTABLE means:
 - No mathematical errors or unsound reasoning
 - No missing proofs or incomplete arguments
@@ -65,6 +76,7 @@ def get_critique_submitter_system_prompt() -> str:
 - Content that doesn't align with the paper title/goal
 - Unfounded claims or logical fallacies
 - Insufficient mathematical rigor for an academic paper
+- Fabricated experiments, unsupported benchmark numbers, uncited literature claims, or nonexistent code/artifact claims
 
 WHAT NOT TO CRITIQUE - Avoid:
 - The conclusion, introduction, or abstract (not written yet)
@@ -77,6 +89,7 @@ def get_critique_submitter_system_prompt() -> str:
 - Be CONSTRUCTIVE: Explain what should change and why
 - Be ACTIONABLE: Provide clear direction for improvement
 - Focus on SUBSTANCE: Mathematical correctness, logical soundness, completeness
+- Explicitly call out unsupported empirical or artifact claims rather than treating them as minor issues
 
 Your critique will be validated against these criteria:
 - Does it identify a legitimate issue that would improve the paper?
@@ -156,17 +169,11 @@ def get_critique_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
+""" + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
 
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to validate peer review critiques. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to validate peer review critiques. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -193,6 +200,7 @@ def get_critique_validator_system_prompt() -> str:
 3. Identifies structural issues affecting coherence
 4. Provides specific, actionable guidance for improvement
 5. Is non-redundant with existing critiques
+6. Correctly flags fabricated experiments, unsupported metrics, uncited external results, or nonexistent artifacts
 
 A critique should be REJECTED if it:
 1. Is vague or unhelpful ("could be better" without specifics)
@@ -211,6 +219,8 @@ def get_critique_validator_system_prompt() -> str:
 - All outline requirements are met
 - Submitter's reasoning for declining is sound and accurate
 - Body meets required criteria for academic mathematical paper
+- There are no unsupported empirical or artifact claims being presented as established fact
+- The body is strong for its chosen scope even if some source material remains unused
 
 REJECT the decline if:
 - Submitter missed substantive issues you can identify
@@ -306,17 +316,11 @@ def get_rewrite_decision_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to make an informed rewrite decision. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to make an informed rewrite decision. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -382,6 +386,11 @@ def get_rewrite_decision_system_prompt() -> str:
 These are labeled clearly as "FAILED - REWRITTEN" versions. Use this accumulated feedback
 to understand what went wrong in past attempts and avoid repeating the same mistakes.
 
+SOURCE MATERIAL POLICY:
+- The aggregator/brainstorm database and reference papers are optional supports during rewrite decisions, not mandatory checklists
+- Do NOT choose PARTIAL_REVISION or TOTAL_REWRITE solely to force coverage of unused source material
+- Do choose revision when the current body is genuinely weak, incomplete for its chosen scope, misaligned with the outline/title, or mathematically unsound
+
 Output your decision ONLY as JSON in this exact format:
 {
   "decision": "continue | partial_revision | total_rewrite",
@@ -460,12 +469,11 @@ def get_rewrite_decision_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities, you are STRONGLY ENCOURAGED to use them to verify claims and decisions.
+""" + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
 
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Use all available resources for validation.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Use internal context and your base knowledge for validation.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -503,6 +511,11 @@ def get_rewrite_decision_validator_system_prompt() -> str:
 - Title change proposed without justification from critiques
 - Decision appears arbitrary or not evidence-based
 
+SOURCE MATERIAL POLICY:
+- The source database is optional support, not a mandatory checklist
+- Do NOT reject a decision solely because it leaves some source material unused
+- Do reject a decision for ignoring source material only when that omission clearly makes the chosen scope weaker, incoherent, or misaligned with the outline/title
+
 Ask yourself: "Is this decision the right response to the accepted critiques? Is the chosen level of revision appropriate?"
 
 Output your decision ONLY as JSON in this exact format:
@@ -603,7 +616,13 @@ def build_critique_prompt(
         "\n---\n",
         f"CURRENT BODY SECTION (to critique):\n{current_body}",
         "\n---\n",
-        f"AGGREGATOR DATABASE (source content):\n{aggregator_db}",
+        """OPTIONAL SOURCE MATERIAL POLICY:
+- The source database below is optional support, not a mandatory checklist.
+- Use it to identify genuine gaps or contradictions if helpful.
+- Do NOT critique solely because some source entries were not used.
+""",
+        "\n---\n",
+        f"SOURCE DATABASE (optional support - use if helpful):\n{aggregator_db}",
     ]
     
     if reference_papers:
@@ -692,7 +711,13 @@ def build_rewrite_decision_prompt(
         "\n---\n",
         f"ALL ACCEPTED CRITIQUES (CURRENT VERSION):\n{critique_feedback}",
         "\n---\n",
-        f"AGGREGATOR DATABASE (original source content):\n{aggregator_db}",
+        """OPTIONAL SOURCE MATERIAL POLICY:
+- The source database below is optional support, not a mandatory checklist.
+- Use it if it helps judge whether the body's chosen scope is genuinely weak, incomplete, or misaligned.
+- Do NOT force rewrite solely to cover unused source material.
+""",
+        "\n---\n",
+        f"SOURCE DATABASE (optional support - use if helpful):\n{aggregator_db}",
     ])
     
     if reference_papers:
@@ -753,7 +778,13 @@ def build_rewrite_decision_validation_prompt(
         "\n---\n",
         f"ALL ACCEPTED CRITIQUES:\n{critique_feedback}",
         "\n---\n",
-        f"AGGREGATOR DATABASE:\n{aggregator_db}",
+        """OPTIONAL SOURCE MATERIAL POLICY:
+- The source database below is optional support, not a mandatory checklist.
+- Use it if needed to judge whether the proposed decision is genuinely stronger or weaker.
+- Do NOT reject solely because not all source material is being used.
+""",
+        "\n---\n",
+        f"SOURCE DATABASE (optional support - use if helpful):\n{aggregator_db}",
         "\n---\n",
         f"PROPOSED DECISION:\n",
         f"Decision: {decision}\n",
@@ -811,6 +842,8 @@ def get_iterative_edit_system_prompt() -> str:
 - Each edit should be substantial and address specific critique feedback
 - Do NOT make cosmetic changes - focus on mathematical/structural issues identified in critiques
 - If you believe all issues are addressed, set more_edits_needed to false
+- If critique issues involve unsupported empirical or artifact claims, remove them or rewrite them as hypotheses, validation plans, expected benefits, limitations, or future work
+- Never preserve fabricated experiments, unsupported benchmark numbers, or nonexistent code claims as if they were verified
 
 Output your response ONLY as JSON in the exact format specified.
 """
@@ -959,6 +992,11 @@ def get_partial_revision_validation_system_prompt() -> str:
 
 The edit is part of an iterative partial revision to address peer review critiques.
 
+EMPIRICAL PROVENANCE RULES:
+- Empirical claims (benchmarks, speedups, latency, accuracy, perplexity, hardware measurements) must not remain stated as fact unless backed by explicit citation or provided artifact support.
+- Artifact claims (code, kernels, experiments, logs, accompanying implementations) must not remain stated as fact unless backed by explicit citation or provided artifact support.
+- If the edit rewrites unsupported empirical/artifact claims into hypotheses, validation plans, expected benefits, limitations, or future work, that is a valid improvement.
+
 YOUR TASK:
 Validate whether this specific edit should be ACCEPTED or REJECTED.
 
@@ -976,6 +1014,7 @@ def get_partial_revision_validation_system_prompt() -> str:
 4. The edit breaks coherence with surrounding content
 5. The edit is mathematically unsound or introduces logical errors
 6. The edit is purely cosmetic and doesn't address critiques
+7. The edit preserves fabricated experiments, unsupported metrics, or nonexistent artifact claims as established fact
 
 Output your decision as JSON.
 """
diff --git a/backend/compiler/prompts/outline_prompts.py b/backend/compiler/prompts/outline_prompts.py
index c5c0fdd..55920f9 100644
--- a/backend/compiler/prompts/outline_prompts.py
+++ b/backend/compiler/prompts/outline_prompts.py
@@ -5,13 +5,21 @@
 from backend.compiler.memory.compiler_rejection_log import compiler_rejection_log
 
 
+OUTLINE_EMPIRICAL_PROVENANCE_RULES = """EMPIRICAL PROVENANCE RULES FOR OUTLINES:
+- Do NOT turn unsupported benchmark-style claims into committed outline sections.
+- Numeric empirical claims in headings or subsection titles (speedup, latency, throughput, perplexity, accuracy, hardware measurements, benchmark names, etc.) are forbidden unless explicitly backed by an external citation or provided artifact in context.
+- If empirical support is missing, describe the material conservatively as a proposed evaluation, validation plan, expected benefit, design target, future-work task, or open question.
+- Literature claims should identify the external source in-text when they are important enough to shape the outline.
+- Never invent citations, experiments, measurements, or code artifacts while constructing an outline."""
+
+
 def get_outline_create_system_prompt() -> str:
     """Get system prompt for initial outline creation."""
     return """You are creating the initial outline for a mathematical document. Your role is to:
 
 1. Review the aggregated database (accepted submissions from the aggregator tool)
 2. Review the user's compiler-directing prompt
-3. Create a comprehensive outline that captures ALL relevant, unique content from the database
+3. Create the strongest rigorous outline you can for the target paper, using the aggregated database whenever it meaningfully helps
 
 ⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
 
@@ -24,17 +32,11 @@ def get_outline_create_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + OUTLINE_EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -149,16 +151,24 @@ def get_outline_create_system_prompt() -> str:
 The outline is a TABLE OF CONTENTS showing section names and subsections. It does NOT contain the actual paper content.
 
 YOUR TASK:
+SOURCE USAGE PRINCIPLE (governs every task item listed below):
+- Treat the aggregator/brainstorm database as optional high-value source material and exploration history, not a mandatory checklist
+- Use it when it helps you achieve the strongest rigorous paper for the user's compiler-directing prompt
+- You may selectively synthesize, extend, or depart from brainstorm/database material if that better serves the paper
+- Do NOT force coverage of every brainstorm/database entry
+- Do NOT ignore clearly crucial source material for the scope you choose
+
 - Produce a numbered outline with major sections and subsections
-- Reflect every non-trivial point from the aggregator database
+- Incorporate the strongest helpful source ideas where appropriate
 - Flag gaps explicitly if the evidence is insufficient
-- Reference supporting content from the aggregator database where appropriate
+- Reference supporting content from the aggregator database where appropriate, but do not mirror it mechanically
 - Ensure outline supports a coherent, logical flow for the final mathematical document
+- Replace unsupported empirical result claims with neutral headings such as "Evaluation Plan", "Proposed Validation", or "Expected Runtime Benefits"
 
 ITERATIVE REFINEMENT PROCESS:
 This is an iterative outline creation phase. You may submit multiple versions:
 
-1. Generate your best outline based on aggregator database and user prompt
+1. Generate your best outline based on the user prompt, your chosen paper scope, and any helpful source material from the aggregator database
 2. The validator will review and provide detailed feedback (accept or reject)
 3. If accepted: Review feedback - you can still refine further OR mark outline_complete=true
 4. If rejected: Review feedback and generate improved outline
@@ -171,7 +181,7 @@ def get_outline_create_system_prompt() -> str:
 - Actionable suggestions for refinement
 
 WHEN TO MARK outline_complete=true (LOCK OUTLINE):
-- The outline comprehensively captures ALL relevant unique content from aggregator database
+- The outline makes strong use of any source material it chooses to use and does not omit clearly crucial material for its chosen scope
 - Required sections (Abstract, Introduction, Body, Conclusion) present with exact names
 - Sections follow logical mathematical progression (definitions → theorems → proofs)
 - The outline optimally serves the paper title and user's compiler-directing prompt
@@ -180,9 +190,10 @@ def get_outline_create_system_prompt() -> str:
 
 WHEN TO MARK outline_complete=false (CONTINUE REFINING):
 - After reviewing validator feedback, you see opportunities for improvement
-- Important content from aggregator database is still missing
+- Clearly crucial source material or supporting structure is still missing
 - Structural organization could be enhanced
 - Subsection granularity needs adjustment
+- You want to incorporate more useful brainstorm/database material
 - You want to incorporate validator suggestions before locking
 
 HARD LIMIT:
@@ -203,14 +214,15 @@ def get_outline_create_system_prompt() -> str:
 
 CRITICAL REQUIREMENTS:
 - The outline MUST include: Introduction, at least one Body section, and Conclusion (Abstract is optional)
-- Every significant piece of unique information from the database should have a place in the outline
+- Clearly crucial source material for the chosen scope should have a place in the outline, but you do NOT need to mirror every brainstorm/database entry
 - The outline should support a coherent, logical flow for the final document
 - Sections should build upon each other logically (definitions → theorems → proofs)
 - The outline should align with the user's compiler-directing prompt goals
 - DO NOT include a separate References or Citations section in the outline
-- All content must be rooted in sound mathematical reasoning from the aggregator database
+- All content must be rooted in sound mathematical reasoning; aggregator/brainstorm material is optional support, not a mandatory checklist
 - NO unfounded claims or logical fallacies
 - Focus on rigorous mathematical arguments
+- DO NOT include unsupported numeric empirical claims in section or subsection headings
 
 The validator will REJECT your outline if:
 - Missing required sections: Introduction or Conclusion
@@ -218,6 +230,7 @@ def get_outline_create_system_prompt() -> str:
 - If Abstract is included, it must use proper format: "Abstract", "I. Abstract", or "0. Abstract" (not descriptive text)
 - Sections are out of order (e.g., Conclusion before body sections)
 - No body sections between Introduction and Conclusion
+- The outline includes unsupported benchmark-style numbers or hardware results as if already established
 
 CRITICAL - HOW TO FIX COMMON REJECTION:
 If validator says "MISSING_REQUIRED_SECTION: Introduction", ensure you have a line with "Introduction" or "I. Introduction".
@@ -258,7 +271,7 @@ def get_outline_update_system_prompt() -> str:
     """Get system prompt for outline updates."""
     return """You are reviewing the current document outline to decide if it needs updating. Your role is to:
 
-1. Review the aggregator database for any content not yet captured in the outline
+1. Review the aggregator database for any source material that may strengthen the outline
 2. Review the current document construction progress
 3. Decide if the outline needs modification to better serve the document
 
@@ -273,17 +286,11 @@ def get_outline_update_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + OUTLINE_EMPIRICAL_PROVENANCE_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -295,9 +302,15 @@ def get_outline_update_system_prompt() -> str:
 4. **Conclusion** - Summary of findings (exactly "Conclusion" or "N. Conclusion")
 
 YOUR TASK:
+SOURCE USAGE PRINCIPLE (governs the update decision described below):
+- Treat the aggregator/brainstorm database as optional support, not a mandatory checklist
+- Update the outline if source material would materially strengthen the paper
+- Do NOT force additions just because a brainstorm/database entry exists
+- Do NOT ignore clearly crucial source material for the scope you are keeping
+
 Decide if the outline requires updates. Consider:
-- Relevance to current content from aggregator database
-- Missing content that should be included in outline
+- Relevance of the current outline to source content that would genuinely help the paper
+- Missing content that should be included in outline to better serve the user prompt
 - Structural issues in current outline
 - Alignment with document construction progress
 
@@ -306,15 +319,16 @@ def get_outline_update_system_prompt() -> str:
 All outline content must be actual section/subsection names and descriptions, not placeholder text.
 
 WHEN TO UPDATE THE OUTLINE (ADDITIONS ONLY):
-- Important content from aggregator DB is missing from current outline
+- Clearly important source content or a better structure is missing from current outline
 - Document construction reveals needed additional sections
-- New pertinent information should be added to complete the document relative to the user-prompt title
+- New pertinent information from source material or rigorous synthesis should be added to better serve the user-prompt title
+- Unsupported empirical claims should be converted into cautious evaluation-plan sections rather than asserted-results sections
 
 CRITICAL: You can ONLY ADD to the outline, NOT delete or remove existing sections.
 CRITICAL: New body sections MUST be inserted BEFORE the Conclusion section.
 
 WHEN NOT TO UPDATE:
-- Current outline already contains all pertinent information
+- Current outline already serves the paper well even if some brainstorm/database items remain unused
 - No new relevant content needs to be added
 
 CRITICAL - SYSTEM-MANAGED MARKERS (NOT YOUR OUTPUT):
@@ -331,11 +345,12 @@ def get_outline_update_system_prompt() -> str:
 The validator checks YOUR SUBMISSION for placeholder text, not the existing outline structure.
 
 CRITICAL REQUIREMENTS FOR UPDATES:
-- All content must be rooted in sound mathematical reasoning from the aggregator database
+- All added content must be rooted in sound mathematical reasoning; source database material is optional support, not a mandatory checklist
 - NO unfounded claims or logical fallacies
 - Focus on rigorous mathematical arguments
 - NEVER change the names of Abstract, Introduction, or Conclusion sections
 - New body sections must be inserted between Introduction and Conclusion
+- DO NOT add unsupported numeric empirical claims in section or subsection headings
 
 EXACT STRING MATCHING FOR EDITS:
 If updating, this system uses EXACT STRING MATCHING. You must:
@@ -435,7 +450,7 @@ def get_outline_json_schema() -> str:
 {
   "content": "Abstract\\n\\nI. Introduction\\n   A. Historical context of circle-squaring\\n   B. Problem statement and impossibility\\n   C. Overview of proof approach\\n\\nII. Preliminaries and Definitions\\n   A. Compass and straightedge constructions\\n   B. Field extensions and constructible numbers\\n   C. Algebraic vs. transcendental numbers\\n   D. Galois theory connections\\n\\nIII. Main Theoretical Results\\n   A. Theorem: Characterization of constructible lengths\\n   B. Theorem: Lindemann-Weierstrass (transcendence of pi)\\n   C. Theorem: Baker's theorem and applications\\n   D. Corollary: Impossibility of squaring the circle\\n\\nIV. Proofs and Derivations\\n   A. Proof of constructibility characterization\\n   B. Outline of Lindemann-Weierstrass proof\\n   C. Derivation of main impossibility result\\n\\nV. Conclusion\\n   A. Summary of impossibility result\\n   B. Related problems and historical significance",
   "outline_complete": true,
-  "reasoning": "Outline now comprehensively captures ALL content from aggregator database. Added Galois theory subsection (addressing feedback from iteration 2). Added Baker's theorem coverage (addressing feedback from iterations 2-4). Structure follows logical progression from basic definitions through theorems to proofs. All required sections present with correct names. Ready to lock and begin paper construction."
+  "reasoning": "Outline now captures the strongest useful source material from the aggregator database while staying focused on the best paper structure for the prompt. Added Galois theory subsection (addressing feedback from iteration 2). Added Baker's theorem coverage (addressing feedback from iterations 2-4). Structure follows logical progression from basic definitions through theorems to proofs. All required sections present with correct names. Ready to lock and begin paper construction."
 }
 
 CRITICAL JSON ESCAPE RULES:
@@ -455,7 +470,7 @@ def get_outline_json_schema() -> str:
   "operation": "insert_after",
   "old_string": "",
   "new_string": "",
-  "reasoning": "The current outline already captures all relevant content from the aggregator database. All theorems and proofs mentioned in accepted submissions have corresponding outline sections."
+  "reasoning": "The current outline already serves the paper well. The strongest useful material from the aggregator database is already represented, and no additional source content is necessary for this scope."
 }
 
 Example (Outline Update - Adding subsection under Section II):
@@ -527,7 +542,7 @@ async def build_outline_create_prompt(
     parts.extend([
         f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
         "\n---\n",
-        f"AGGREGATOR DATABASE EVIDENCE:\n{rag_evidence}",
+        f"SOURCE DATABASE EVIDENCE (optional support - use if helpful):\n{rag_evidence}",
         "\n---\n",
         "Now generate your outline as JSON:"
     ])
@@ -580,7 +595,7 @@ async def build_outline_update_prompt(
     
     if rag_evidence:
         parts.append("\n---\n")
-        parts.append(f"AGGREGATOR DATABASE EVIDENCE:\n{rag_evidence}")
+        parts.append(f"SOURCE DATABASE EVIDENCE (optional support - use if helpful):\n{rag_evidence}")
     
     parts.append("\n---\n")
     parts.append("Now decide if outline update is needed (respond as JSON):")
diff --git a/backend/compiler/prompts/review_prompts.py b/backend/compiler/prompts/review_prompts.py
index edfe381..815d6e4 100644
--- a/backend/compiler/prompts/review_prompts.py
+++ b/backend/compiler/prompts/review_prompts.py
@@ -5,6 +5,39 @@
 from backend.compiler.memory.compiler_rejection_log import compiler_rejection_log
 
 
+EMPIRICAL_PROVENANCE_REVIEW_RULES = """EMPIRICAL PROVENANCE AND CITATION RULES:
+- Classify substantive claims as one of: theoretical claim, literature claim, empirical claim, or artifact claim.
+- Theoretical claims must be supported by sound derivation, proof, or explicit assumptions inside the paper.
+- Literature claims must include explicit in-text citations identifying the external source. Do NOT rely on vague phrases like "studies show" or "the literature suggests".
+- Empirical claims include benchmarks, latency, throughput, speedups, accuracy, perplexity, ablations, wall-clock measurements, hardware utilization numbers, and dataset/task results.
+- Artifact claims include statements about code, kernels, measurements, experiments, benchmark logs, reproductions, or "accompanying" implementations.
+- Empirical or artifact claims are acceptable ONLY if they are backed by an explicit external citation or by a provided artifact in context. If not backed, they must be removed or rewritten as hypotheses, design goals, expected benefits, proposed experiments, or future work.
+- NEVER invent citations, experiments, benchmark numbers, hardware measurements, datasets, or code artifacts.
+- If external information is retained, it must remain explicitly cited in-text. Do NOT imply that unsupported facts were externally verified."""
+
+
+EMPIRICAL_RED_TEAM_REVIEW_FOCUS = """PRE-ABSTRACT EMPIRICAL RED-TEAM TASK:
+Your highest-priority job is to catch and neutralize:
+- fabricated experiments
+- nonexistent code or artifacts
+- unsupported benchmark numbers
+- uncited external results
+- benchmark-shaped claims presented as established facts
+
+Inspect especially for:
+- speedup, latency, throughput, bandwidth, utilization, clock-cycle, memory, or hardware claims
+- accuracy, perplexity, benchmark score, ablation, or evaluation claims
+- mentions of specific hardware (A100, H100, NEON, AVX, tensor cores, etc.) with measured outcomes
+- phrases like "empirical results", "experiments show", "we validate", "measured", "observed", "see accompanying code", or "implementation achieves"
+
+If a claim lacks explicit citation or artifact support, prefer conservative edits that:
+- delete the claim, or
+- rewrite it as hypothesis / expected benefit / design target / proposed experiment / future work, or
+- explicitly state that verification has not been performed.
+
+Do NOT preserve unsupported benchmark numbers merely because they fit the narrative."""
+
+
 def get_review_system_prompt() -> str:
     """Get system prompt for document review/cleanup mode."""
     return """You are reviewing the current mathematical document draft for errors and needed improvements. Your role is to:
@@ -24,17 +57,11 @@ def get_review_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + EMPIRICAL_PROVENANCE_REVIEW_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -79,6 +106,9 @@ def get_review_system_prompt() -> str:
 - Significant clarity improvements possible
 - Forward-looking structural language outside introduction (e.g., 'Section III will...', bulleted lists of future content)
 - Unfounded claims or logical fallacies that should be corrected
+- Unsupported empirical claims, unsupported artifact/code claims, or uncited literature claims
+- Numeric benchmark-style claims in narrative text that are not explicitly sourced
+- Statements implying experiments, measurements, or implementations that are not actually evidenced
 
 WHEN NOT TO MAKE AN EDIT:
 - Document is acceptable for a draft in progress
@@ -182,7 +212,8 @@ def get_review_json_schema() -> str:
 async def build_review_prompt(
     user_prompt: str,
     current_paper: str,
-    current_outline: str
+    current_outline: str,
+    review_focus: str = "general"
 ) -> str:
     """
     Build complete prompt for review mode.
@@ -193,6 +224,7 @@ async def build_review_prompt(
         user_prompt: User's compiler-directing prompt
         current_paper: Current document to review
         current_outline: Current outline for structural reference (always fully injected)
+        review_focus: "general" or "empirical_red_team"
     
     Returns:
         Complete prompt string
@@ -212,6 +244,11 @@ async def build_review_prompt(
 
 LEARN FROM THESE PAST MISTAKES.
 ---
+""")
+
+    if review_focus == "empirical_red_team":
+        parts.append(f"""{EMPIRICAL_RED_TEAM_REVIEW_FOCUS}
+---
 """)
     
     parts.extend([
diff --git a/backend/compiler/prompts/rigor_prompts.py b/backend/compiler/prompts/rigor_prompts.py
index fffae77..56d1c50 100644
--- a/backend/compiler/prompts/rigor_prompts.py
+++ b/backend/compiler/prompts/rigor_prompts.py
@@ -24,17 +24,9 @@
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
-
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---"""
 
diff --git a/backend/compiler/validation/compiler_validator.py b/backend/compiler/validation/compiler_validator.py
index ac68edf..e0806d0 100644
--- a/backend/compiler/validation/compiler_validator.py
+++ b/backend/compiler/validation/compiler_validator.py
@@ -20,6 +20,17 @@
 logger = logging.getLogger(__name__)
 
 
+CLAIM_TYPE_VALIDATION_RULES = """CLAIM TYPE VALIDATION (CRITICAL):
+- Classify substantive claims as one of: theoretical claim, literature claim, empirical claim, or artifact claim.
+- Theoretical claims are acceptable only if they are supported by sound derivation, proof, or explicit assumptions in the document.
+- Literature claims are acceptable only if they include explicit in-text citations identifying the external source. Vague phrases like "studies show" are insufficient.
+- Empirical claims include benchmark numbers, latency, throughput, speedups, accuracy, perplexity, ablations, hardware metrics, measured runtimes, and evaluation outcomes.
+- Artifact claims include statements about code, kernels, experiments, benchmark logs, reproductions, or accompanying implementations.
+- Empirical or artifact claims may be presented as established fact ONLY when backed by an explicit external citation or a provided artifact in context.
+- If empirical or artifact support is absent, acceptable wording is limited to hypothesis, expected benefit, design target, proposed experiment, validation plan, limitation, or future work.
+- Reject content that invents citations, experiments, benchmark numbers, hardware measurements, datasets, or code artifacts."""
+
+
 def _diagnostic_char_info(text: str, max_chars: int = 100) -> str:
     """
     Generate diagnostic information about a string's characters.
@@ -999,6 +1010,18 @@ async def validate_submission(
                 max_tokens=system_config.compiler_validator_max_output_tokens  # User-configurable
             )
             
+            # Check for empty response
+            if not response.get("choices") or not response["choices"][0].get("message"):
+                logger.error("CompilerValidator: LLM returned empty response structure")
+                return CompilerValidationResult(
+                    submission_id=submission.submission_id,
+                    decision="reject",
+                    reasoning="Validation LLM returned empty response (no choices)",
+                    summary="LLM empty response",
+                    json_valid=False,
+                    validation_stage="llm_validation"
+                )
+            
             # Extract content from either 'content' or 'reasoning' field
             # Some reasoning models (e.g., DeepSeek R1, certain GPT variants) output JSON in 'reasoning' field
             message = response["choices"][0]["message"]
@@ -1110,6 +1133,19 @@ async def validate_brainstorm_operation(
                 max_tokens=system_config.compiler_validator_max_output_tokens
             )
             
+            if not response.get("choices") or not response["choices"][0].get("message"):
+                logger.error("CompilerValidator: Brainstorm validation LLM returned empty response")
+                if self.task_tracking_callback:
+                    self.task_tracking_callback("completed", task_id)
+                return CompilerValidationResult(
+                    submission_id=str(uuid.uuid4()),
+                    decision="reject",
+                    reasoning="Validation LLM returned empty response (no choices)",
+                    summary="LLM empty response",
+                    json_valid=False,
+                    validation_stage="llm_validation"
+                )
+            
             message = response["choices"][0]["message"]
             llm_output = message.get("content") or message.get("reasoning") or ""
             
@@ -1310,6 +1346,8 @@ def _build_validation_prompt(
         
         parts.append(f"CURRENT DOCUMENT:\n{current_paper}\n---\n")
         parts.append(f"SUBMISSION TO VALIDATE:\n")
+        if submission.metadata.get("review_focus"):
+            parts.append(f"Review Focus: {submission.metadata['review_focus']}\n")
         parts.append(f"Operation: {submission.operation}\n")
         if submission.old_string:
             parts.append(f"Old String (to find): {submission.old_string}\n")
@@ -1334,17 +1372,11 @@ def _get_outline_validation_system_prompt(self, mode: str) -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + CLAIM_TYPE_VALIDATION_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -1378,17 +1410,24 @@ def _get_outline_validation_system_prompt(self, mode: str) -> str:
 1. SECTION_STRUCTURE: MUST include Introduction, at least one Body section, and Conclusion with exact names (Abstract is optional but recommended)
 2. SECTION_ORDER: [Abstract →] Introduction → Body sections → Conclusion (this exact order, where Abstract is optional)
 3. COHERENCE: Logically structured with clear sections and subsections
-4. COMPLETENESS: Captures all relevant content from aggregator database in relation to what is relevant to the title set in the user prompt
+4. COMPLETENESS: Makes effective use of any source material it chooses to use and does not omit clearly crucial material for its chosen scope
 5. ALIGNMENT: Aligns with user's compiler-directing prompt goals
 6. COMPREHENSIVENESS: Provides sufficient detail to guide mathematical document construction
 7. MATHEMATICAL PROGRESSION: Body sections follow logical progression (definitions → main results → theorems → proofs)
 8. IN-TEXT CITATIONS ONLY: Must NOT include a separate References or Citations section
 9. ANCHOR PRESERVATION: Must not attempt to add content after the end-of-outline anchor markers
-10. LOGICAL GROUNDING: Outline must reference actual content from aggregator database based on sound mathematical principles, not unfounded claims
+10. LOGICAL GROUNDING: Outline may draw from aggregator database material, reference papers, or rigorous reasoning, but it must remain grounded in sound mathematical principles and avoid unfounded claims
 11. NO PLACEHOLDER TEXT: Must not contain any placeholder markers (e.g., "[HARD CODED PLACEHOLDER FOR...", "[PLACEHOLDER FOR...", "TO BE WRITTEN AFTER..."). Placeholders are structural markers only - all submitted content must be actual outline content.
+12. EMPIRICAL PROVENANCE: Must not include unsupported numeric empirical claims in section/subsection headings or outline prose unless explicitly backed by citation or provided artifact support
 
 **CRITICAL**: Criterion #11 checks the SUBMISSION CONTENT ONLY. The CURRENT OUTLINE may contain system-managed anchor markers (normal and expected). Do NOT reject a submission just because anchor markers exist in the current outline - only reject if the SUBMISSION ITSELF contains placeholder or anchor text (pre-validation at line 326 catches this before you see it).
 
+SOURCE MATERIAL POLICY:
+- The aggregator/brainstorm database is optional support, not a mandatory checklist
+- Do NOT reject solely because an outline does not explicitly use or cover database material
+- Do reject if the outline ignores clearly crucial source material in a way that makes its chosen scope weak, incoherent, or misaligned with the user prompt
+- Accept selective or divergent outline structures when they better serve the user's prompt and remain rigorous
+
 YOUR TASK:
 Verify the submission meets ALL criteria above. Accept only if ALL criteria pass. Reject if ANY criterion fails.
 
@@ -1397,11 +1436,12 @@ def _get_outline_validation_system_prompt(self, mode: str) -> str:
 - INCORRECT_SECTION_ORDER: Sections are out of order (must be: [Abstract →] Introduction → Body → Conclusion, where Abstract is optional)
 - INCORRECT_SECTION_NAME: Section names don't match exactly (e.g., "Summary" instead of "Conclusion", "Overview" instead of "Introduction"; if Abstract included, must be "Abstract", "I. Abstract", or "0. Abstract")
 - STRUCTURAL: Body sections not in logical mathematical progression order
-- INCOMPLETENESS: Missing critical content from aggregator database that's relevant to document title
+- INCOMPLETENESS: Missing clearly crucial source material or necessary structure for the chosen scope
 - MISALIGNMENT: Doesn't serve user's compiler-directing prompt goals
 - INSUFFICIENT_DETAIL: Lacks necessary granularity to guide mathematical document construction
 - FORMAT_VIOLATION: Includes separate References/Citations section (NOT allowed)
 - ANCHOR_VIOLATION: Content placed after outline anchor markers
+- EMPIRICAL_PROVENANCE: Unsupported benchmark, hardware, or artifact claim presented as established fact
 
 SECTION NAME VALIDATION (CRITICAL):
 
@@ -1445,7 +1485,7 @@ def _get_outline_validation_system_prompt(self, mode: str) -> str:
             "outline_create": """MODE-SPECIFIC CRITERIA (Outline Creation):
 - Outline MUST include: Introduction, at least one Body section, Conclusion (Abstract is optional)
 - Section names MUST match exactly: "Introduction", "Conclusion" (if Abstract included: "Abstract", "I. Abstract", or "0. Abstract")
-- Outline captures all relevant unique content from aggregator database
+- Outline makes effective use of any helpful aggregator database content when relevant, but need not mirror all entries
 - Outline provides clear structure for mathematical document construction
 - Outline aligns with user's compiler-directing prompt
 - Body sections follow logical mathematical progression
@@ -1559,17 +1599,11 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-WEB SEARCH STRONGLY ENCOURAGED:
-If your model has access to real-time web search capabilities (such as Perplexity Sonar or similar), you are STRONGLY ENCOURAGED to use them to:
-- Verify mathematical claims against current published research
-- Access recent developments and contemporary mathematical literature
-- Cross-reference theorems, proofs, and techniques with authoritative sources
-- Supplement analysis with verified external information
-- Validate approaches against established mathematical consensus
-
-The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use all available resources - internal context as exploration history, your base knowledge for reasoning, and web search (if available) for verification and current information.
+""" + CLAIM_TYPE_VALIDATION_RULES + """
 
-WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth. If you have web search, use it.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
+
+WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
 
 ---
 
@@ -1612,9 +1646,16 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 8. ANCHOR PRESERVATION: Must not attempt to add content after the end-of-document anchor marker ("[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]")
 9. LOGICAL GROUNDING: Must not contain unfounded claims or logical fallacies. All claims must be grounded in established mathematical principles and sound reasoning.
 10. NO PLACEHOLDER TEXT: Must not contain any placeholder markers (e.g., "[HARD CODED PLACEHOLDER FOR...", "[PLACEHOLDER FOR...", "TO BE WRITTEN AFTER..."). Placeholders are structural markers indicating where sections WILL BE written - all submitted content must be actual mathematical prose, not placeholder text.
+11. CLAIM TYPE VALIDATION: The submission must satisfy the acceptance criteria for each theoretical, literature, empirical, and artifact claim it makes
 
 **CRITICAL**: Criterion #10 checks the SUBMISSION CONTENT ONLY. The CURRENT DOCUMENT may contain system-managed placeholders and anchors (normal during construction). Do NOT reject a submission just because placeholders exist in the current document - only reject if the SUBMISSION ITSELF contains placeholder text (pre-validation at line 780 catches this before you see it).
 
+SOURCE MATERIAL POLICY:
+- Brainstorm/aggregator content, reference papers, and the model's rigorous reasoning are all allowed inputs
+- The brainstorm database is optional support, not a mandatory checklist
+- Do NOT reject solely because the submission does not explicitly use brainstorm content or because it departs from brainstorm phrasing
+- Reject only if the submission ignores clearly necessary established content for its claimed scope, conflicts with the outline, or becomes weaker/less rigorous as a result
+
 YOUR TASK:
 Verify the submission meets ALL criteria above. If even ONE criterion fails, reject the submission.
 
@@ -1653,9 +1694,17 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 - Reject if content appears to be a bibliography or reference list
 - In-text citations (if present) should be integrated within the narrative
 
+CLAIM TYPE CHECK (CRITICAL):
+- Theoretical claims: accept only if supported by sound derivation, proof, or explicit assumptions in the document
+- Literature claims: reject if they rely on external facts without explicit in-text citation
+- Empirical claims: reject if benchmark numbers, hardware measurements, speedups, perplexity/accuracy results, or evaluation outcomes are presented as established fact without citation or provided artifact support
+- Artifact claims: reject if the content claims code, experiments, kernels, logs, or accompanying implementations exist without citation or provided artifact support
+- If unsupported empirical/artifact material is phrased as hypothesis, validation plan, limitation, expected benefit, or future work, it may be acceptable
+
 MATHEMATICAL RIGOR CHECK (CRITICAL):
 - Reject if content contains unfounded claims or logical fallacies
 - Accept only content rooted in established mathematical principles and sound reasoning
+- Reject fabricated experiments, nonexistent code/artifact claims, unsupported metrics, or invented citations
 
 """
         
@@ -1679,17 +1728,19 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 MODE-SPECIFIC CRITERIA (Document Construction):
 - Outline Adherence: Follows the outline structure appropriately
 - Logical Flow: Builds logically from existing document content
-- Evidence Integration: Captures relevant aggregator database content
+- Source Use: Any brainstorm/aggregator content that is used is integrated coherently; selective non-use is acceptable when the paper remains stronger, rigorous, and aligned with the prompt
 - Non-Repetition: Doesn't repeat existing document sections
 - Section Uniqueness: Doesn't create section headers that already exist in current document
 - Placement Context: Content fits naturally at the pre-validated location
 - Content Check: No forward-looking structural previews outside introduction
 - Mathematical Accuracy: Content is based on established mathematical principles and sound reasoning
+- Empirical Provenance: Unsupported benchmark or artifact claims are rewritten conservatively, not asserted as verified results
 
 VERIFICATION CHECKLIST:
 ✓ Does it follow the current outline (the outline is the TEMPLATE, not actual content)?
 ✓ Does it build coherently from what's already written in the ACTUAL DOCUMENT?
-✓ Does it integrate content from the aggregator database?
+✓ If it uses brainstorm/aggregator material, does it integrate it coherently?
+✓ If it departs from source material, does the result still better serve the prompt with sound reasoning?
 ✓ Does it avoid repeating existing content in the ACTUAL DOCUMENT?
 ✓ Does it avoid creating duplicate section headers that exist in the CURRENT PAPER/DOCUMENT (NOT the outline template)?
 ✓ Does the new_string content fit naturally at the insertion/replacement location?
@@ -1723,6 +1774,7 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 - Edit maintains or improves overall quality
 - Placement Context: Edit fits naturally at the pre-validated location
 - Content Check: No forward-looking structural previews outside introduction
+- Empirical Provenance: Edit appropriately removes or downgrades unsupported empirical/artifact claims when present
 
 REJECTION FEEDBACK FORMAT:
 If rejecting, use this structure:
@@ -1741,6 +1793,7 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 - Placement Context: Enhancement fits naturally at the pre-validated location
 - Content Check: No forward-looking structural previews outside introduction
 - Mathematical Check: Enhancement provides rigorous, sound mathematical improvements
+- Empirical Provenance: Enhancement does not introduce unsupported benchmark or artifact claims
 
 REJECTION FEEDBACK FORMAT:
 If rejecting, use this structure:
diff --git a/backend/shared/api_client_manager.py b/backend/shared/api_client_manager.py
index 018eef4..47a6a23 100644
--- a/backend/shared/api_client_manager.py
+++ b/backend/shared/api_client_manager.py
@@ -2,10 +2,11 @@
 API Client Manager - Unified manager for routing API calls to OpenRouter or LM Studio.
 Handles fallback on credit exhaustion and boost integration.
 
-Supports three boost modes:
+Supports four boost modes:
 1. Boost Next X Calls - Counter-based, applies to next X API calls
 2. Category Boost - Role-based, boosts all calls for specific role categories
-3. Per-task Toggle - Task ID based (legacy)
+3. Always Prefer Boost - Tries boost for every call, falls back on failure
+4. Per-task Toggle - Task ID based (legacy)
 """
 import asyncio
 import logging
@@ -35,6 +36,7 @@ class APIClientManager:
     Central manager for routing API calls to OpenRouter or LM Studio.
     Handles fallback on credit exhaustion and boost integration.
     """
+    CALL_METADATA_KEY = "_moto_call_metadata"
     
     def __init__(self):
         self._openrouter_client: Optional[OpenRouterClient] = None
@@ -171,6 +173,48 @@ async def _track_model_usage(self, model_id: str) -> None:
                 await self._model_tracking_callback(model_id)
             except Exception as e:
                 logger.error(f"Error in model tracking callback: {e}")
+
+    def _annotate_response_with_call_metadata(
+        self,
+        response: Dict[str, Any],
+        *,
+        task_id: str,
+        role_id: str,
+        configured_model: str,  # model the caller requested
+        actual_model: str,  # model that actually produced the response
+        configured_provider: Optional[str],
+        actual_provider: str,
+        boosted: bool,
+        boost_mode: Optional[str] = None,
+        openrouter_provider: Optional[str] = None,
+    ) -> Dict[str, Any]:
+        """Attach routing details under CALL_METADATA_KEY; mutates and returns response."""
+        if not isinstance(response, dict):
+            return response  # non-dict responses pass through unannotated
+
+        response[self.CALL_METADATA_KEY] = {
+            "task_id": task_id,
+            "role_id": role_id,
+            "configured_model": configured_model,
+            "effective_model": actual_model,
+            "configured_provider": configured_provider or actual_provider,  # fall back when none is configured
+            "effective_provider": actual_provider,
+            "provider": actual_provider,  # same value as "effective_provider"
+            "boosted": boosted,
+            "boost_mode": boost_mode,
+            "openrouter_provider": openrouter_provider,
+        }
+        return response
+
+    def extract_call_metadata(self, response: Optional[Dict[str, Any]]) -> Dict[str, Any]:
+        """Return a shallow copy of the response's routing metadata, or {} if none is attached."""
+        if not isinstance(response, dict):
+            return {}  # covers None and any other non-dict value
+
+        metadata = response.get(self.CALL_METADATA_KEY)
+        if isinstance(metadata, dict):
+            return metadata.copy()  # top-level copy: caller edits do not touch the stored dict
+        return {}
     
     def set_openrouter_api_key(self, api_key: str) -> None:
         """
@@ -223,6 +267,10 @@ def _determine_boost_mode(self, task_id: str) -> Optional[str]:
         if not boost_manager.boost_config or not boost_manager.boost_config.enabled:
             return None
         
+        # Always-prefer takes precedence over the modes below (every call tries boost, falls back on failure)
+        if boost_manager.boost_always_prefer:
+            return "always_prefer"
+        
         # Check boost_next_count first (counter-based mode)
         if boost_manager.boost_next_count > 0:
             return "next_count"
@@ -272,6 +320,11 @@ async def generate_completion(
         Returns:
             API response dict
         """
+        requested_model = model
+        async with self._state_lock:
+            initial_role_config = self._role_model_configs.get(role_id)
+        configured_provider = initial_role_config.provider if initial_role_config else None
+
         # Check if task should use boost (unified check for all boost modes)
         boost_mode = self._determine_boost_mode(task_id)
         
@@ -318,9 +371,33 @@ async def generate_completion(
                     # Calculate duration
                     duration_ms = (time.time() - start_time) * 1000
                     
+                    # Check for missing choices (upstream provider timeout/error)
+                    if not result.get("choices"):
+                        import json as _json
+                        raw_response = _json.dumps(result)[:2000]
+                        logger.error(f"OpenRouter boost response missing 'choices' after {duration_ms:.0f}ms - raw: {raw_response}")
+                        
+                        # Log as failure
+                        await boost_logger.log_boost_call(
+                            task_id=task_id,
+                            role_id=role_id,
+                            model=boost_model,
+                            prompt_preview=prompt_preview,
+                            response_content="",
+                            tokens_used=None,
+                            duration_ms=duration_ms,
+                            success=False,
+                            boost_mode=boost_mode,
+                            error="Response missing 'choices' - upstream provider timeout or error"
+                        )
+                        
+                        # Raise so retry/fallback logic can handle it
+                        raise ValueError(f"OpenRouter response missing 'choices' after {duration_ms:.0f}ms (upstream provider timeout)")
+                    
                     # Extract response content for logging
                     response_content = ""
                     tokens_used = None
+                    
                     if result.get("choices"):
                         message = result["choices"][0].get("message", {})
                         response_content = message.get("content") or message.get("reasoning") or ""
@@ -331,6 +408,19 @@ async def generate_completion(
                         if _pt is not None and _ct is not None:
                             token_tracker.track(boost_model, _pt, _ct)
                             await self._broadcast("token_usage_updated", token_tracker.get_stats())
+
+                    result = self._annotate_response_with_call_metadata(
+                        result,
+                        task_id=task_id,
+                        role_id=role_id,
+                        configured_model=requested_model,
+                        actual_model=boost_model,
+                        configured_provider=configured_provider,
+                        actual_provider="openrouter",
+                        boosted=True,
+                        boost_mode=boost_mode,
+                        openrouter_provider=boost_provider,
+                    )
                     
                     # Log the boost call
                     await boost_logger.log_boost_call(
@@ -408,12 +498,10 @@ async def generate_completion(
                 logger.warning(f"Boost model rate limited for task {task_id}: {e}")
                 
                 # Broadcast rate limit event to frontend
-                retry_after_iso = time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(e.retry_after))
                 await self._broadcast("openrouter_rate_limit", {
                     "model": boost_model,
                     "role_id": role_id,
-                    "retry_after": retry_after_iso,
-                    "message": f"OpenRouter free model rate limit hit. Retrying after 1 hour."
+                    "message": f"OpenRouter rate limit hit for '{boost_model}' after retries exhausted."
                 })
                 
                 # Fall through to primary model (boost has no fallback concept)
@@ -600,11 +688,8 @@ async def generate_completion(
                         await self._broadcast("account_credits_exhausted", {
                             "message": "OpenRouter account free credits depleted. Add credits at openrouter.ai or configure LM Studio fallback."
                         })
-                        rate_limited = self._openrouter_client.get_rate_limited_models()
-                        soonest = free_model_manager.get_soonest_retry(rate_limited)
                         raise FreeModelExhaustedError(
-                            f"Account free credits exhausted and no LM Studio fallback for role '{role_id}'.",
-                            soonest_retry=soonest
+                            f"Account free credits exhausted and no LM Studio fallback for role '{role_id}'."
                         )
                 
                 provider_info = f" via {openrouter_provider}" if openrouter_provider else ""
@@ -629,6 +714,14 @@ async def generate_completion(
                     
                     # Calculate duration and extract response
                     duration_ms = (time.time() - start_time) * 1000
+                    
+                    # Check for missing choices (upstream provider timeout/error)
+                    if not result.get("choices"):
+                        import json as _json
+                        raw_response = _json.dumps(result)[:2000]
+                        logger.error(f"OpenRouter response missing 'choices' after {duration_ms:.0f}ms - raw: {raw_response}")
+                        raise ValueError(f"OpenRouter response missing 'choices' after {duration_ms:.0f}ms (upstream provider timeout)")
+                    
                     response_content = ""
                     tokens_used = None
                     if result.get("choices"):
@@ -641,6 +734,19 @@ async def generate_completion(
                         if _pt is not None and _ct is not None:
                             token_tracker.track(openrouter_model, _pt, _ct)
                             await self._broadcast("token_usage_updated", token_tracker.get_stats())
+
+                    result = self._annotate_response_with_call_metadata(
+                        result,
+                        task_id=task_id,
+                        role_id=role_id,
+                        configured_model=requested_model,
+                        actual_model=openrouter_model,
+                        configured_provider=role_config.provider if role_config else configured_provider or "openrouter",
+                        actual_provider="openrouter",
+                        boosted=False,
+                        boost_mode=None,
+                        openrouter_provider=openrouter_provider,
+                    )
                     
                     # Log to autonomous API logger if callback set
                     if self._autonomous_logger_callback:
@@ -686,35 +792,36 @@ async def generate_completion(
                     
                     logger.warning(f"OpenRouter rate limit for role {role_id}: {e}")
                     
-                    retry_after_iso = time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(e.retry_after))
                     await self._broadcast("openrouter_rate_limit", {
                         "model": openrouter_model,
                         "role_id": role_id,
-                        "retry_after": retry_after_iso,
-                        "message": f"OpenRouter free model rate limit hit for '{openrouter_model}'."
+                        "message": f"OpenRouter rate limit hit for '{openrouter_model}' after retries exhausted."
                     })
                     
+                    # Mark this model as failed for rotation
+                    free_model_manager.mark_model_failed(openrouter_model)
+                    
                     # --- FREE MODEL ROTATION CHAIN ---
                     rotated_result = await self._try_free_model_rotation(
                         task_id=task_id,
                         role_id=role_id,
                         original_model=openrouter_model,
+                        configured_model=requested_model,
+                        configured_provider=role_config.provider if role_config else configured_provider or "openrouter",
                         messages=messages,
                         temperature=temperature,
                         max_tokens=max_tokens or role_config.max_output_tokens,
                         response_format=response_format,
                     )
                     if rotated_result is not None:
+                        free_model_manager.clear_failed_models()  # Success - clear failures
                         return rotated_result
                     
                     # Rotation chain exhausted — try LM Studio fallback
                     if not role_config.lm_studio_fallback_id:
-                        rate_limited = self._openrouter_client.get_rate_limited_models() if self._openrouter_client else {}
-                        soonest = free_model_manager.get_soonest_retry(rate_limited)
                         raise FreeModelExhaustedError(
                             f"All free model options exhausted for role '{role_id}'. "
-                            f"No LM Studio fallback configured.",
-                            soonest_retry=soonest
+                            f"No LM Studio fallback configured."
                         )
                     
                     fallback_model = role_config.lm_studio_fallback_id
@@ -909,6 +1016,14 @@ async def generate_completion(
             
             # Calculate duration and extract response
             duration_ms = (time.time() - start_time) * 1000
+            
+            # Check for missing choices
+            if not result.get("choices"):
+                import json as _json
+                raw_response = _json.dumps(result)[:2000]
+                logger.error(f"LM Studio response missing 'choices' after {duration_ms:.0f}ms - raw: {raw_response}")
+                raise ValueError(f"LM Studio response missing 'choices' after {duration_ms:.0f}ms")
+            
             response_content = ""
             tokens_used = None
             if result.get("choices"):
@@ -921,6 +1036,18 @@ async def generate_completion(
                 if _pt is not None and _ct is not None:
                     token_tracker.track(model, _pt, _ct)
                     await self._broadcast("token_usage_updated", token_tracker.get_stats())
+
+            result = self._annotate_response_with_call_metadata(
+                result,
+                task_id=task_id,
+                role_id=role_id,
+                configured_model=requested_model,
+                actual_model=model,
+                configured_provider=role_config.provider if role_config else configured_provider or "lm_studio",
+                actual_provider="lm_studio",
+                boosted=False,
+                boost_mode=None,
+            )
             
             # Log to autonomous API logger if callback set
             if self._autonomous_logger_callback:
@@ -970,6 +1097,8 @@ async def _try_free_model_rotation(
         task_id: str,
         role_id: str,
         original_model: str,
+        configured_model: str,
+        configured_provider: str,
         messages: List[Dict[str, str]],
         temperature: float,
         max_tokens: int,
@@ -982,14 +1111,12 @@ async def _try_free_model_rotation(
         if not self._openrouter_client:
             return None
 
-        rate_limited = self._openrouter_client.get_rate_limited_models()
-
         # Step 1: Free Model Looping — iterate through available free models
         if free_model_manager.looping_enabled:
             tried_models = {original_model}
             while True:
                 alt_model = free_model_manager.get_alternative_free_model(
-                    original_model, rate_limited, skip_models=tried_models
+                    original_model, skip_models=tried_models
                 )
                 if not alt_model or alt_model in tried_models:
                     break
@@ -1021,11 +1148,22 @@ async def _try_free_model_rotation(
                         if _pt is not None and _ct is not None:
                             token_tracker.track(alt_model, _pt, _ct)
                             await self._broadcast("token_usage_updated", token_tracker.get_stats())
+                    result = self._annotate_response_with_call_metadata(
+                        result,
+                        task_id=task_id,
+                        role_id=role_id,
+                        configured_model=configured_model,
+                        actual_model=alt_model,
+                        configured_provider=configured_provider,
+                        actual_provider="openrouter",
+                        boosted=False,
+                        boost_mode=None,
+                    )
                     if free_model_manager.is_account_exhausted():
                         free_model_manager.clear_account_exhaustion()
                     return result
                 except RateLimitError:
-                    rate_limited = self._openrouter_client.get_rate_limited_models()
+                    free_model_manager.mark_model_failed(alt_model)
                     logger.warning(f"Rotated model {alt_model} also rate-limited, trying next")
                 except CreditExhaustionError as inner_e:
                     logger.warning(f"Rotated model {alt_model} credit exhaustion: {inner_e}")
@@ -1059,6 +1197,17 @@ async def _try_free_model_rotation(
                     if _pt is not None and _ct is not None:
                         token_tracker.track(auto_model, _pt, _ct)
                         await self._broadcast("token_usage_updated", token_tracker.get_stats())
+                result = self._annotate_response_with_call_metadata(
+                    result,
+                    task_id=task_id,
+                    role_id=role_id,
+                    configured_model=configured_model,
+                    actual_model=auto_model,
+                    configured_provider=configured_provider,
+                    actual_provider="openrouter",
+                    boosted=False,
+                    boost_mode=None,
+                )
                 if free_model_manager.is_account_exhausted():
                     free_model_manager.clear_account_exhaustion()
                 return result
diff --git a/backend/shared/boost_logger.py b/backend/shared/boost_logger.py
index 44c43cd..c7b6bd8 100644
--- a/backend/shared/boost_logger.py
+++ b/backend/shared/boost_logger.py
@@ -1,6 +1,7 @@
 """
 Boost Logger - Logs raw API outputs from boost (OpenRouter) API calls.
-Stores logs in a persistent file for viewing in the Boost Logs tab.
+Stores logs in a persistent file so boost-routed calls can be merged into the
+main API call log view.
 """
 import asyncio
 import json
diff --git a/backend/shared/boost_manager.py b/backend/shared/boost_manager.py
index 4417933..9fd8164 100644
--- a/backend/shared/boost_manager.py
+++ b/backend/shared/boost_manager.py
@@ -5,18 +5,34 @@
 Supports three boost modes:
 1. Boost Next X Calls - Counter-based, applies to next X API calls regardless of task ID
 2. Category Boost - Role-based, boosts all calls matching a role prefix (e.g., all Submitter 1 calls)
-3. Per-task Toggle - Task ID based (may have ID matching issues with workflow predictions)
+3. Always Prefer Boost - Every API call attempts boost first; falls back to primary on failure
+
+Autonomous Research mode agents use the same role prefixes as their parent roles:
+- Topic Selector, Completion Reviewer, Reference Selector, Paper Title Selector,
+  Certainty Assessor, Format Selector, Volume Organizer → agg_sub1 (Submitter 1)
+- Topic Validator, Redundancy Checker → agg_val (Agg Validator)
+- Brainstorm aggregation submitters/validator → agg_sub1..10, agg_val (via Coordinator)
+- Paper compilation → comp_hc, comp_hp, comp_val, comp_crit (via CompilerCoordinator)
+
+State is persisted to backend/data/boost_state.json for crash recovery.
 """
 import asyncio
+import json
 import logging
+import os
 from typing import Optional, Set, Callable, Any, Dict, List
 
 from backend.shared.models import BoostConfig
 
 logger = logging.getLogger(__name__)
 
+# Persistence file path
+BOOST_STATE_FILE = os.path.join(os.path.dirname(os.path.dirname(__file__)), 'data', 'boost_state.json')
+
 
-# Category prefixes for different roles
+# Category prefixes for different roles — labels match Settings panel titles exactly.
+# Autonomous Research agents share the same prefixes as their parent roles
+# (see module docstring for full mapping).
 CATEGORY_PREFIXES = {
     # Aggregator
     "agg_sub1": "Submitter 1",
@@ -29,20 +45,12 @@
     "agg_sub8": "Submitter 8",
     "agg_sub9": "Submitter 9",
     "agg_sub10": "Submitter 10",
-    "agg_val": "Aggregator Validator",
+    "agg_val": "Agg Validator",
     # Compiler
-    "comp_hc": "High-Context Submitter",
-    "comp_hp": "High-Param Submitter",
+    "comp_hc": "High-Context Model",
+    "comp_hp": "High-Param Model",
     "comp_val": "Compiler Validator",
-    # Autonomous
-    "auto_te": "Topic Explorer",
-    "auto_tev": "Topic Explorer Validator",
-    "auto_ts": "Topic Selector",
-    "auto_tv": "Topic Validator",
-    "auto_cr": "Completion Reviewer",
-    "auto_rs": "Reference Selector",
-    "auto_pt": "Paper Title Selector",
-    "auto_prc": "Paper Redundancy Checker",
+    "comp_crit": "Critique Submitter",
 }
 
 
@@ -54,7 +62,9 @@ class BoostManager:
     Supports three boost modes:
     - boost_next_count: Boost the next X API calls (counter-based)
     - boosted_categories: Boost all calls for specific role categories
-    - boosted_task_ids: Boost specific task IDs (legacy, may have matching issues)
+    - boost_always_prefer: Try boost first for every API call, fall back on failure
+    
+    State is automatically persisted to disk for crash recovery.
     """
     
     _instance = None
@@ -74,16 +84,78 @@ def __init__(self):
         self.boosted_task_ids: Set[str] = set()
         self._broadcast_callback: Optional[Callable] = None
         
-        # NEW: Counter-based boost mode
+        # Counter-based boost mode
         self.boost_next_count: int = 0
         
-        # NEW: Category-based boost mode (role prefixes like "agg_sub1", "comp_hc")
+        # Category-based boost mode (role prefixes like "agg_sub1", "comp_hc")
         self.boosted_categories: Set[str] = set()
         
+        # Always-prefer boost mode: try boost for every call, fall back on failure
+        self.boost_always_prefer: bool = False
+        
         self._initialized = True
         
+        # Load persisted state on initialization
+        self._load_state()
+        
         logger.info("BoostManager initialized")
     
+    def _load_state(self) -> None:
+        """Load persisted boost state from disk."""
+        try:
+            if os.path.exists(BOOST_STATE_FILE):
+                with open(BOOST_STATE_FILE, 'r', encoding='utf-8') as f:
+                    state = json.load(f)
+                
+                # Restore boost config if it was enabled
+                if state.get('enabled') and state.get('model_id'):
+                    self.boost_config = BoostConfig(
+                        enabled=True,
+                        openrouter_api_key=state.get('api_key', ''),
+                        boost_model_id=state.get('model_id'),
+                        boost_provider=state.get('provider'),
+                        boost_context_window=state.get('context_window', 131072),
+                        boost_max_output_tokens=state.get('max_output_tokens', 25000)
+                    )
+                
+                # Restore boost modes
+                self.boost_next_count = state.get('boost_next_count', 0)
+                self.boosted_categories = set(state.get('boosted_categories', []))
+                self.boost_always_prefer = state.get('boost_always_prefer', False)
+                self.boosted_task_ids = set(state.get('boosted_task_ids', []))
+                
+                logger.info(f"Loaded boost state: enabled={state.get('enabled')}, model={state.get('model_id')}, "
+                           f"next_count={self.boost_next_count}, categories={len(self.boosted_categories)}, "
+                           f"always_prefer={self.boost_always_prefer}")
+        except Exception as e:
+            logger.warning(f"Failed to load boost state: {e}")
+    
+    def _save_state(self) -> None:
+        """Persist current boost state, including the OpenRouter API key in plaintext, to disk."""
+        try:
+            # Ensure data directory exists
+            os.makedirs(os.path.dirname(BOOST_STATE_FILE), exist_ok=True)
+            
+            state = {
+                'enabled': self.boost_config is not None and self.boost_config.enabled,
+                'model_id': self.boost_config.boost_model_id if self.boost_config else None,
+                'provider': self.boost_config.boost_provider if self.boost_config else None,
+                'context_window': self.boost_config.boost_context_window if self.boost_config else 131072,
+                'max_output_tokens': self.boost_config.boost_max_output_tokens if self.boost_config else 25000,
+                'api_key': self.boost_config.openrouter_api_key if self.boost_config else '',
+                'boost_next_count': self.boost_next_count,
+                'boosted_categories': list(self.boosted_categories),
+                'boost_always_prefer': self.boost_always_prefer,
+                'boosted_task_ids': list(self.boosted_task_ids)
+            }
+            
+            with open(BOOST_STATE_FILE, 'w', encoding='utf-8') as f:
+                json.dump(state, f, indent=2)
+            
+            logger.debug("Boost state saved to disk")
+        except Exception as e:
+            logger.warning(f"Failed to save boost state: {e}")
+    
     def set_broadcast_callback(self, callback: Callable) -> None:
         """Set callback for broadcasting WebSocket events."""
         self._broadcast_callback = callback
@@ -109,6 +181,9 @@ async def set_boost_config(self, config: BoostConfig) -> None:
                 f"max_tokens={config.boost_max_output_tokens}"
             )
             
+            # Persist state
+            self._save_state()
+            
             await self._broadcast("boost_enabled", {
                 "model_id": config.boost_model_id,
                 "provider": config.boost_provider,
@@ -125,6 +200,10 @@ async def clear_boost(self) -> None:
                 self.boosted_task_ids.clear()
                 self.boosted_categories.clear()
                 self.boost_next_count = 0
+                self.boost_always_prefer = False
+                
+                # Persist state
+                self._save_state()
                 
                 await self._broadcast("boost_disabled", {})
     
@@ -148,6 +227,9 @@ async def toggle_task_boost(self, task_id: str) -> bool:
                 boosted = True
                 logger.debug(f"Task {task_id} boost enabled")
             
+            # Persist state
+            self._save_state()
+            
             await self._broadcast("task_boost_toggled", {
                 "task_id": task_id,
                 "boosted": boosted
@@ -182,10 +264,35 @@ async def set_boost_next_count(self, count: int) -> None:
             self.boost_next_count = max(0, count)
             logger.info(f"Boost next count set to {self.boost_next_count}")
             
+            # Persist state
+            self._save_state()
+            
             await self._broadcast("boost_next_count_updated", {
                 "count": self.boost_next_count
             })
     
+    async def set_always_prefer(self, enabled: bool) -> None:
+        """
+        Enable or disable always-prefer-boost mode.
+        
+        When enabled, every API call attempts boost first and falls back to the
+        primary model on any failure. Mutually exclusive with next_count and
+        category modes (caller should clear those before enabling this).
+        
+        Args:
+            enabled: True to enable, False to disable
+        """
+        async with self._lock:
+            self.boost_always_prefer = enabled
+            logger.info(f"Boost always-prefer {'enabled' if enabled else 'disabled'}")
+            
+            # Persist state
+            self._save_state()
+            
+            await self._broadcast("boost_always_prefer_updated", {
+                "enabled": enabled
+            })
+
     async def toggle_category_boost(self, category: str) -> bool:
         """
         Toggle boost for an entire category (role prefix).
@@ -206,6 +313,9 @@ async def toggle_category_boost(self, category: str) -> bool:
                 boosted = True
                 logger.info(f"Category {category} boost enabled")
             
+            # Persist state
+            self._save_state()
+            
             await self._broadcast("category_boost_toggled", {
                 "category": category,
                 "boosted": boosted,
@@ -249,6 +359,10 @@ def should_use_boost(self, task_id: str) -> bool:
         if not self.boost_config or not self.boost_config.enabled:
             return False
         
+        # Check always-prefer mode (every call uses boost, fall back on failure)
+        if self.boost_always_prefer:
+            return True
+        
         # Check boost_next_count first (counter-based mode)
         if self.boost_next_count > 0:
             return True
@@ -274,6 +388,9 @@ async def consume_boost_count(self) -> None:
                 self.boost_next_count -= 1
                 logger.debug(f"Boost count consumed, remaining: {self.boost_next_count}")
                 
+                # Persist state
+                self._save_state()
+                
                 await self._broadcast("boost_next_count_updated", {
                     "count": self.boost_next_count
                 })
@@ -292,6 +409,7 @@ def get_boost_status(self) -> Dict[str, Any]:
                 "boosted_task_count": 0,
                 "boost_next_count": 0,
                 "boosted_categories": [],
+                "boost_always_prefer": False,
                 "boosted_tasks": []
             }
         
@@ -303,54 +421,51 @@ def get_boost_status(self) -> Dict[str, Any]:
             "max_output_tokens": self.boost_config.boost_max_output_tokens,
             "boosted_task_count": len(self.boosted_task_ids),
             "boosted_tasks": list(self.boosted_task_ids),
-            # NEW: Include new boost modes
             "boost_next_count": self.boost_next_count,
-            "boosted_categories": list(self.boosted_categories)
+            "boosted_categories": list(self.boosted_categories),
+            "boost_always_prefer": self.boost_always_prefer
         }
     
     def get_available_categories(self, mode: str = "all") -> List[Dict[str, str]]:
         """
-        Get list of available boost categories based on current workflow mode.
+        Get list of all boost categories in the same order as Settings panels.
+        All categories are always returned regardless of mode.
+        
+        Autonomous Research agents automatically inherit boosts from their parent roles:
+        - Submitter 1 (agg_sub1) covers: Topic Selector, Completion Reviewer,
+          Reference Selector, Paper Title Selector, Certainty Assessor, Format Selector,
+          Volume Organizer
+        - Agg Validator (agg_val) covers: Topic Validator, Redundancy Checker
+        - Compiler roles cover paper compilation phases
         
         Args:
-            mode: "aggregator", "compiler", "autonomous", or "all"
+            mode: ignored — kept for API compatibility
             
         Returns:
-            List of category dicts with id and label
+            List of category dicts with id, label, and group
         """
         categories = []
         
-        if mode in ("aggregator", "all"):
-            for i in range(1, 11):
-                categories.append({
-                    "id": f"agg_sub{i}",
-                    "label": f"Sub {i}",
-                    "group": "Aggregator"
-                })
+        # Aggregator (matches AggregatorSettings order: Submitters 1-10, then Validator)
+        for i in range(1, 11):
             categories.append({
-                "id": "agg_val",
-                "label": "Validator",
+                "id": f"agg_sub{i}",
+                "label": f"Submitter {i}",
                 "group": "Aggregator"
             })
-        
-        if mode in ("compiler", "all"):
-            categories.extend([
-                {"id": "comp_hc", "label": "High-Context", "group": "Compiler"},
-                {"id": "comp_hp", "label": "High-Param", "group": "Compiler"},
-                {"id": "comp_val", "label": "Validator", "group": "Compiler"},
-            ])
-        
-        if mode in ("autonomous", "all"):
-            categories.extend([
-                {"id": "auto_te", "label": "Topic Explore", "group": "Autonomous"},
-                {"id": "auto_tev", "label": "Topic Explore Val", "group": "Autonomous"},
-                {"id": "auto_ts", "label": "Topic Sel", "group": "Autonomous"},
-                {"id": "auto_tv", "label": "Topic Val", "group": "Autonomous"},
-                {"id": "auto_cr", "label": "Completion", "group": "Autonomous"},
-                {"id": "auto_rs", "label": "Ref Sel", "group": "Autonomous"},
-                {"id": "auto_pt", "label": "Paper Title", "group": "Autonomous"},
-                {"id": "auto_prc", "label": "Redundancy", "group": "Autonomous"},
-            ])
+        categories.append({
+            "id": "agg_val",
+            "label": "Agg Validator",
+            "group": "Aggregator"
+        })
+        
+        # Compiler (matches CompilerSettings order: Validator, High-Context, High-Param, Critique)
+        categories.extend([
+            {"id": "comp_val", "label": "Compiler Validator", "group": "Compiler"},
+            {"id": "comp_hc", "label": "High-Context Model", "group": "Compiler"},
+            {"id": "comp_hp", "label": "High-Param Model", "group": "Compiler"},
+            {"id": "comp_crit", "label": "Critique Submitter", "group": "Compiler"},
+        ])
         
         return categories
     
diff --git a/backend/shared/config.py b/backend/shared/config.py
index c07c4e4..d220e49 100644
--- a/backend/shared/config.py
+++ b/backend/shared/config.py
@@ -151,7 +151,8 @@ class SystemConfig(BaseSettings):
     # Autonomous workflow settings
     autonomous_completion_review_interval: int = 10  # Every 10 acceptances
     autonomous_paper_redundancy_interval: int = 3  # Every 3 completed papers
-    autonomous_max_reference_papers: int = 6  # Max papers for reference context
+    autonomous_topic_cycle_max_reference_papers: int = 3  # Max pre-brainstorm + additional references per topic cycle
+    autonomous_tier3_short_form_max_reference_papers: int = 6  # Max references for Tier 3 short-form selection
     
     # Wolfram Alpha integration (optional)
     wolfram_alpha_enabled: bool = False
diff --git a/backend/shared/critique_memory.py b/backend/shared/critique_memory.py
index bfbae69..637a639 100644
--- a/backend/shared/critique_memory.py
+++ b/backend/shared/critique_memory.py
@@ -199,10 +199,9 @@ async def save_critique(
         logger.info(
             f"Saved critique {critique.critique_id} for {paper_type}"
             + (f" paper_id={paper_id}" if paper_id else "")
-            + (f" at {file_path}" if base_dir else "")
         )
     except Exception as e:
-        logger.error(f"Failed to save critique: {e}")
+        logger.error(f"Failed to save critique for {paper_type}: {e}")
         raise
 
     return critique
@@ -233,10 +232,10 @@ async def get_critiques(
 
         return critiques
     except json.JSONDecodeError as e:
-        logger.error(f"Failed to parse critiques file {file_path}: {e}")
+        logger.error(f"Failed to parse critiques for {paper_type}: {e}")
         return []
     except Exception as e:
-        logger.error(f"Failed to load critiques from {file_path}: {e}")
+        logger.error(f"Failed to load critiques for {paper_type}: {e}")
         return []
 
 
@@ -253,11 +252,10 @@ async def clear_critiques(
             logger.info(
                 f"Cleared critiques for {paper_type}"
                 + (f" paper_id={paper_id}" if paper_id else "")
-                + (f" at {file_path}" if base_dir else "")
             )
             return True
         except Exception as e:
-            logger.error(f"Failed to delete critiques file {file_path}: {e}")
+            logger.error(f"Failed to delete critiques for {paper_type}: {e}")
             raise
 
     return False
diff --git a/backend/shared/free_model_manager.py b/backend/shared/free_model_manager.py
index 62df1c5..c05f312 100644
--- a/backend/shared/free_model_manager.py
+++ b/backend/shared/free_model_manager.py
@@ -1,8 +1,7 @@
 """
-Free Model Manager - Manages free model rotation, auto-selector backup,
-and account-wide credit exhaustion detection.
+Free Model Manager - Manages free model rotation and account-wide credit exhaustion detection.
 
-When a free OpenRouter model is rate-limited, this manager provides:
+When a free OpenRouter model fails, this manager provides:
 1. Free Model Looping: rotate to next available free model (highest context first)
 2. Auto-Selector Backup: fall back to openrouter/free as last resort
 3. Account Exhaustion Detection: halt all free model requests on 402
@@ -13,6 +12,9 @@
 
 logger = logging.getLogger(__name__)
 
+# How long to remember failed models before allowing retry (seconds)
+FAILED_MODEL_EXPIRY = 300  # 5 minutes
+
 
 class FreeModelManager:
     """Singleton managing free model rotation and account exhaustion state."""
@@ -29,6 +31,9 @@ def __init__(self):
 
         self._account_credits_exhausted: bool = False
         self._account_exhausted_timestamp: float = 0.0
+        
+        # Track models that failed with timestamps (model_id -> failure_time)
+        self._failed_models: Dict[str, float] = {}
 
     def configure(self, looping: bool, auto_selector: bool) -> None:
         """Set free model settings from frontend."""
@@ -38,6 +43,11 @@ def configure(self, looping: bool, auto_selector: bool) -> None:
             f"Free model settings: looping={looping}, auto_selector={auto_selector}"
         )
 
+    def reset(self) -> None:
+        """Clear the failed-model list (other state is left untouched). Call at workflow start."""
+        self._failed_models.clear()
+        logger.debug("FreeModelManager reset - cleared failed models")
+
     def update_cached_models(self, models: List[Dict[str, Any]]) -> None:
         """
         Cache free models sorted by context_length descending.
@@ -63,65 +73,56 @@ def update_cached_models(self, models: List[Dict[str, Any]]) -> None:
         self._cache_timestamp = time.time()
         logger.info(f"Cached {len(free_models)} free models for rotation")
 
+    def _cleanup_expired_failures(self) -> None:
+        """Remove models from failed list if their expiry has passed."""
+        current_time = time.time()
+        expired = [
+            model_id for model_id, fail_time in self._failed_models.items()
+            if current_time - fail_time > FAILED_MODEL_EXPIRY
+        ]
+        for model_id in expired:
+            del self._failed_models[model_id]
+            logger.debug(f"Model {model_id} failure expired, now available for retry")
+
     def get_alternative_free_model(
         self,
         current_model_id: str,
-        rate_limited_models: Dict[str, float],
-        skip_models: Optional[set] = None,
+        skip_models: Optional[Set[str]] = None,
     ) -> Optional[str]:
         """
-        Get the next available (non-rate-limited) free model, sorted by
-        highest context_length first, skipping the current model and any
-        models in skip_models.
+        Get the next available free model, sorted by highest context_length first,
+        skipping the current model and any models in skip_models.
 
-        Returns model ID string or None if all are rate-limited/skipped.
+        Returns model ID string or None if all are skipped.
         """
         if not self._cached_free_models:
             logger.debug("No cached free models available for rotation")
             return None
 
-        current_time = time.time()
+        # Clean up expired failures before checking
+        self._cleanup_expired_failures()
+
         skip = skip_models or set()
+        skip = skip | set(self._failed_models.keys())  # Also skip recently failed models
 
         for m in self._cached_free_models:
             model_id = m.get("id", "")
             if not model_id or model_id == current_model_id or model_id in skip:
                 continue
-
-            limit_time = rate_limited_models.get(model_id)
-            if limit_time is not None:
-                from backend.shared.openrouter_client import OpenRouterClient
-                if current_time - limit_time < OpenRouterClient.RATE_LIMIT_COOLDOWN:
-                    continue
-
             return model_id
 
         return None
-
-    def get_soonest_retry(
-        self, rate_limited_models: Dict[str, float]
-    ) -> Optional[float]:
-        """
-        Get the earliest future timestamp when any rate-limited model becomes available.
-        Filters out already-expired cooldowns.
-        Returns Unix timestamp or None if no active cooldowns remain.
-        """
-        if not rate_limited_models:
-            return None
-
-        from backend.shared.openrouter_client import OpenRouterClient
-        cooldown = OpenRouterClient.RATE_LIMIT_COOLDOWN
-        current_time = time.time()
-
-        soonest = None
-        for model_id, limit_time in rate_limited_models.items():
-            retry_at = limit_time + cooldown
-            if retry_at <= current_time:
-                continue
-            if soonest is None or retry_at < soonest:
-                soonest = retry_at
-
-        return soonest
+    
+    def mark_model_failed(self, model_id: str) -> None:
+        """Mark a model as failed with current timestamp."""
+        self._failed_models[model_id] = time.time()
+        logger.debug(f"Marked model as failed: {model_id} (expires in {FAILED_MODEL_EXPIRY}s)")
+    
+    def clear_failed_models(self) -> None:
+        """Clear the failed models dict (call on successful request)."""
+        if self._failed_models:
+            logger.debug(f"Clearing {len(self._failed_models)} failed models")
+            self._failed_models.clear()
 
     def mark_account_exhausted(self) -> None:
         """Mark that the OpenRouter account has no free credits (402 on free model)."""
@@ -150,6 +151,7 @@ def get_status(self) -> Dict[str, Any]:
             "auto_selector_enabled": self.auto_selector_enabled,
             "cached_free_model_count": len(self._cached_free_models),
             "account_credits_exhausted": self._account_credits_exhausted,
+            "failed_model_count": len(self._failed_models),
         }
 
 
diff --git a/backend/shared/models.py b/backend/shared/models.py
index 830e483..556de7f 100644
--- a/backend/shared/models.py
+++ b/backend/shared/models.py
@@ -53,6 +53,7 @@ class ValidationResult(BaseModel):
     timestamp: datetime = Field(default_factory=datetime.now)
     contradiction_check_passed: bool = True
     json_valid: bool = True
+    metadata: Dict[str, Any] = Field(default_factory=dict)
 
 
 class CleanupReviewResult(BaseModel):
@@ -385,7 +386,7 @@ class ReferenceExpansionRequest(BaseModel):
 
 class ReferenceSelectionResult(BaseModel):
     """Final selection of reference papers."""
-    selected_papers: List[str] = Field(default_factory=list)  # Max 6 paper IDs
+    selected_papers: List[str] = Field(default_factory=list)  # Caller-specific cap
     reasoning: str
 
 
@@ -645,6 +646,7 @@ class PaperCritique(BaseModel):
     host_provider: Optional[str] = None  # e.g., "Anthropic", "Google AI" (for OpenRouter)
     date: datetime = Field(default_factory=datetime.now)
     prompt_used: Optional[str] = None  # The prompt used for this critique (for regeneration)
+    critique_source: Literal["system_auto", "user_request", "unknown"] = "unknown"
     
     # Ratings (1-10 scale)
     novelty_rating: int = Field(default=0, ge=0, le=10)
diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index f90b2df..d914400 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.5",
+  "version": "1.0.6",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "asi-aggregator-frontend",
-      "version": "1.0.5",
+      "version": "1.0.6",
       "license": "MIT",
       "dependencies": {
         "dompurify": "^3.2.4",
@@ -942,9 +942,9 @@
       }
     },
     "node_modules/dompurify": {
-      "version": "3.3.3",
-      "resolved": "https://registry.npmjs.org/dompurify/-/dompurify-3.3.3.tgz",
-      "integrity": "sha512-Oj6pzI2+RqBfFG+qOaOLbFXLQ90ARpcGG6UePL82bJLtdsa6CYJD7nmiU8MW9nQNOtCHV3lZ/Bzq1X0QYbBZCA==",
+      "version": "3.4.0",
+      "resolved": "https://registry.npmjs.org/dompurify/-/dompurify-3.4.0.tgz",
+      "integrity": "sha512-nolgK9JcaUXMSmW+j1yaSvaEaoXYHwWyGJlkoCTghc97KgGDDSnpoU/PlEnw63Ah+TGKFOyY+X5LnxaWbCSfXg==",
       "license": "(MPL-2.0 OR Apache-2.0)",
       "optionalDependencies": {
         "@types/trusted-types": "^2.0.7"
diff --git a/frontend/package.json b/frontend/package.json
index 62fb80b..3cdeaf1 100644
--- a/frontend/package.json
+++ b/frontend/package.json
@@ -1,6 +1,6 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.5",
+  "version": "1.0.6",
   "description": "Frontend UI for MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "author": "Intrafere LLC",
   "license": "MIT",
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index d98a3b8..9df0bde 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -19,7 +19,6 @@ import {
 } from './components/autonomous';
 import WorkflowPanel from './components/WorkflowPanel';
 import BoostControlModal from './components/BoostControlModal';
-import BoostLogs from './components/BoostLogs';
 import StartupProviderSetupModal from './components/StartupProviderSetupModal';
 import OpenRouterApiKeyModal from './components/OpenRouterApiKeyModal';
 import OpenRouterPrivacyWarningModal from './components/OpenRouterPrivacyWarningModal';
@@ -91,8 +90,11 @@ function App() {
   const [manualActiveTab, setManualActiveTab] = useState(
     () => localStorage.getItem(MANUAL_TAB_STORAGE_KEY) || 'aggregator-interface'
   );
-  const [utilityActiveTab, setUtilityActiveTab] = useState(null);
-  const activeTab = utilityActiveTab || (appMode === 'manual' ? manualActiveTab : autonomousActiveTab);
+  const activeTab = appMode === 'manual' ? manualActiveTab : autonomousActiveTab;
+  const shimmerAccentsEnabled = (() => {
+    const saved = localStorage.getItem('banner_shimmer_enabled');
+    return saved !== null ? JSON.parse(saved) : true;
+  })();
   
   // Models list (fetched from API)
   const [models, setModels] = useState([]);
@@ -455,6 +457,8 @@ function App() {
     
     // Helper to add activity with limit (prevents unbounded array growth causing UI freeze)
     const MAX_ACTIVITY_EVENTS = 500;
+    // Helper to get the server-provided timestamp, falling back to client time when absent
+    const getTimestamp = (data) => data?._serverTimestamp || new Date().toISOString();
     const addActivity = (event) => {
       setAutonomousActivity(prev => [...prev, event].slice(-MAX_ACTIVITY_EVENTS));
     };
@@ -487,7 +491,7 @@ function App() {
     unsubscribers.push(websocket.on('topic_exploration_started', (data) => {
       addActivity({
         event: 'topic_exploration_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Topic exploration started (target: ${data.target || 5} candidates${data.resumed_count ? `, resuming with ${data.resumed_count}` : ''})`,
         data
       });
@@ -496,7 +500,7 @@ function App() {
     unsubscribers.push(websocket.on('topic_exploration_progress', (data) => {
       addActivity({
         event: 'topic_exploration_progress',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Exploration candidate ${data.accepted}/${data.target} accepted: ${data.latest_question ? data.latest_question.substring(0, 100) + '...' : ''}`,
         data
       });
@@ -505,7 +509,7 @@ function App() {
     unsubscribers.push(websocket.on('topic_exploration_complete', (data) => {
       addActivity({
         event: 'topic_exploration_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Topic exploration complete: ${data.accepted_count} candidates collected from ${data.total_attempts} attempts`,
         data
       });
@@ -515,7 +519,7 @@ function App() {
     unsubscribers.push(websocket.on('paper_title_exploration_started', (data) => {
       addActivity({
         event: 'paper_title_exploration_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Title exploration started (target: ${data.target || 5} candidate titles)`,
         data
       });
@@ -524,7 +528,7 @@ function App() {
     unsubscribers.push(websocket.on('paper_title_exploration_progress', (data) => {
       addActivity({
         event: 'paper_title_exploration_progress',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Title candidate ${data.accepted}/${data.target} accepted`,
         data
       });
@@ -533,7 +537,7 @@ function App() {
     unsubscribers.push(websocket.on('paper_title_exploration_complete', (data) => {
       addActivity({
         event: 'paper_title_exploration_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Title exploration complete: ${data.accepted_count} candidates collected from ${data.total_attempts} attempts`,
         data
       });
@@ -543,7 +547,7 @@ function App() {
     unsubscribers.push(websocket.on('topic_selected', (data) => {
       addActivity({
         event: 'topic_selected',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Topic selected: ${data.topic_prompt}`,
         data
       });
@@ -552,7 +556,7 @@ function App() {
     unsubscribers.push(websocket.on('topic_selection_rejected', (data) => {
       addActivity({
         event: 'topic_selection_rejected',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Topic selection rejected`,
         data
       });
@@ -563,7 +567,7 @@ function App() {
       const modelName = data.submitter_model ? (data.submitter_model.split('/')[1] || data.submitter_model.substring(0, 15)) : 'N/A';
       addActivity({
         event: 'submission_accepted',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Submitter ${data.submitter_id} [${modelName}]: ✓ ACCEPTED (total: ${data.total_acceptances})`,
         data
       });
@@ -573,7 +577,7 @@ function App() {
       const modelName = data.submitter_model ? (data.submitter_model.split('/')[1] || data.submitter_model.substring(0, 15)) : 'N/A';
       addActivity({
         event: 'submission_rejected',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Submitter ${data.submitter_id} [${modelName}]: ✗ REJECTED (total: ${data.total_rejections})`,
         data
       });
@@ -583,7 +587,7 @@ function App() {
     unsubscribers.push(websocket.on('completion_review_started', (data) => {
       addActivity({
         event: 'completion_review_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Completion review started`,
         data
       });
@@ -592,7 +596,7 @@ function App() {
     unsubscribers.push(websocket.on('completion_review_result', (data) => {
       addActivity({
         event: 'completion_review_result',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Decision: ${data.decision}`,
         data
       });
@@ -601,7 +605,7 @@ function App() {
     unsubscribers.push(websocket.on('manual_paper_writing_triggered', (data) => {
       addActivity({
         event: 'manual_paper_writing_triggered',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Manual override: Forcing paper writing for ${data.topic_id} (${data.submission_count} submissions)`,
         data
       });
@@ -612,7 +616,7 @@ function App() {
       autonomousTierRef.current = 'tier2_paper_writing';
       addActivity({
         event: 'paper_writing_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Paper writing started: ${data.title}`,
         data
       });
@@ -625,7 +629,7 @@ function App() {
       const iterationSuffix = data.iteration ? ` (iteration ${data.iteration})` : '';
       addActivity({
         event: 'compiler_acceptance',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `${modeLabel}: ✓ ACCEPTED${iterationSuffix}`,
         data
       });
@@ -638,7 +642,7 @@ function App() {
       const reason = formatReason(data.reasoning);
       addActivity({
         event: 'compiler_rejection',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `${modeLabel}: ✗ REJECTED${iterationSuffix}${reason ? ` - ${reason}` : ''}`,
         data
       });
@@ -650,7 +654,7 @@ function App() {
       const reason = formatReason(data.reasoning, 100);
       addActivity({
         event: 'compiler_decline',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `${modeLabel}: ↷ DECLINED${reason ? ` - ${reason}` : ''}`,
         data
       });
@@ -660,7 +664,7 @@ function App() {
       if (!isAutonomousTier2Active()) return;
       addActivity({
         event: 'outline_locked',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Outline locked after ${data.total_iterations || data.iteration || '?'} iteration(s)`,
         data
       });
@@ -670,7 +674,7 @@ function App() {
     unsubscribers.push(websocket.on('critique_phase_started', (data) => {
       addActivity({
         event: 'critique_phase_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Critique phase started (Paper v${data.paper_version || '?'}, target: ${data.target_critiques || 5} critiques)`,
         data
       });
@@ -681,7 +685,7 @@ function App() {
       if (data.total_attempts % 2 === 0 || data.total_attempts >= data.target) {
         addActivity({
           event: 'critique_progress',
-          timestamp: new Date().toISOString(),
+          timestamp: getTimestamp(data),
           message: `Critique progress: ${data.acceptances} accepted, ${data.rejections} rejected (${data.total_attempts}/${data.target} attempts)`,
           data
         });
@@ -691,7 +695,7 @@ function App() {
     unsubscribers.push(websocket.on('body_rewrite_started', (data) => {
       addActivity({
         event: 'body_rewrite_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `REWRITE PHASE: Total rewrite started for Paper v${data.version || '?'}${data.title_changed ? ' (Title updated)' : ''}`,
         data
       });
@@ -700,7 +704,7 @@ function App() {
     unsubscribers.push(websocket.on('partial_revision_complete', (data) => {
       addActivity({
         event: 'partial_revision_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `PARTIAL REVISION: Applied ${data.edits_applied || 0} targeted edits (Paper v${data.version || '?'})${data.title_changed ? ' (Title updated)' : ''}`,
         data
       });
@@ -709,7 +713,7 @@ function App() {
     unsubscribers.push(websocket.on('critique_phase_ended', (data) => {
       addActivity({
         event: 'critique_phase_ended',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Critique phase complete (${data.decision || 'unknown'})`,
         data
       });
@@ -718,7 +722,7 @@ function App() {
     unsubscribers.push(websocket.on('critique_phase_skipped', (data) => {
       addActivity({
         event: 'critique_phase_skipped',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Critique phase skipped: ${data.reason || 'user override'}`,
         data
       });
@@ -731,7 +735,7 @@ function App() {
       const trigger = data.trigger || 'complete';
       addActivity({
         event: 'phase_transition',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Phase transition: ${fromPhase} → ${toPhase} (${trigger})`,
         data
       });
@@ -740,7 +744,7 @@ function App() {
     unsubscribers.push(websocket.on('paper_completed', (data) => {
       addActivity({
         event: 'paper_completed',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Paper completed: ${data.title}`,
         data
       });
@@ -751,7 +755,7 @@ function App() {
     unsubscribers.push(websocket.on('paper_redundancy_review', (data) => {
       addActivity({
         event: 'paper_redundancy_review',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Redundancy review: ${data.should_remove ? 'Removing paper' : 'No removal'}`,
         data
       });
@@ -771,7 +775,7 @@ function App() {
       }
       addActivity({
         event: 'auto_research_resumed',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Research resumed (${data?.tier || 'unknown tier'})`,
         data
       });
@@ -792,7 +796,7 @@ function App() {
       autonomousTierRef.current = 'tier3_final_answer';
       addActivity({
         event: 'tier3_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Tier 3 Final Answer generation started`,
         data
       });
@@ -811,7 +815,7 @@ function App() {
       }
       addActivity({
         event: 'tier3_result',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message,
         data
       });
@@ -820,7 +824,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_format_selected', (data) => {
       addActivity({
         event: 'tier3_format_selected',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Answer format: ${data.format === 'short_form' ? 'Short Form (Single Paper)' : 'Long Form (Volume)'}`,
         data
       });
@@ -830,7 +834,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_volume_organized', (data) => {
       addActivity({
         event: 'tier3_volume_organized',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Volume organized: "${data.title}" (${data.chapters?.length || 0} chapters)`,
         data
       });
@@ -839,7 +843,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_chapter_started', (data) => {
       addActivity({
         event: 'tier3_chapter_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Writing chapter ${data.chapter_order}: ${data.title}`,
         data
       });
@@ -848,7 +852,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_chapter_complete', (data) => {
       addActivity({
         event: 'tier3_chapter_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Chapter ${data.chapter_order} complete: ${data.title}`,
         data
       });
@@ -857,7 +861,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_rejection', (data) => {
       addActivity({
         event: 'tier3_rejection',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Tier 3 submission rejected: ${data.phase || 'unknown phase'}`,
         data
       });
@@ -866,7 +870,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_complete', (data) => {
       addActivity({
         event: 'tier3_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `🏆 FINAL ANSWER COMPLETE! ${data.format === 'short_form' ? 'Paper' : 'Volume'}: "${data.title}"`,
         data
       });
@@ -878,7 +882,7 @@ function App() {
     unsubscribers.push(websocket.on('reference_selection_started', (data) => {
       addActivity({
         event: 'reference_selection_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Reference selection started (${data.mode})`,
         data
       });
@@ -887,7 +891,7 @@ function App() {
     unsubscribers.push(websocket.on('reference_selection_complete', (data) => {
       addActivity({
         event: 'reference_selection_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Reference selection complete: ${data.selected_count} papers selected`,
         data
       });
@@ -898,7 +902,7 @@ function App() {
       autonomousTierRef.current = 'tier2_paper_writing';
       addActivity({
         event: 'paper_writing_resumed',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Paper writing resumed: ${data.title}`,
         data
       });
@@ -908,7 +912,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_forced', (data) => {
       addActivity({
         event: 'tier3_forced',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Tier 3 forced with mode: ${data.mode} (${data.completed_papers} papers available)`,
         data
       });
@@ -917,7 +921,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_phase_changed', (data) => {
       addActivity({
         event: 'tier3_phase_changed',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Tier 3 phase: ${data.description || data.phase}`,
         data
       });
@@ -926,7 +930,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_paper_started', (data) => {
       addActivity({
         event: 'tier3_paper_started',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Writing final answer paper: ${data.title}`,
         data
       });
@@ -935,7 +939,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_short_form_complete', (data) => {
       addActivity({
         event: 'tier3_short_form_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Short form paper complete: ${data.title}`,
         data
       });
@@ -944,7 +948,7 @@ function App() {
     unsubscribers.push(websocket.on('tier3_long_form_complete', (data) => {
       addActivity({
         event: 'tier3_long_form_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Long form volume complete: ${data.title} (${data.total_chapters} chapters)`,
         data
       });
@@ -959,7 +963,7 @@ function App() {
       // Also add to activity log
       addActivity({
         event: 'openrouter_privacy_error',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         ...data
       });
     }));
@@ -978,7 +982,7 @@ function App() {
       // Also add to activity log
       addActivity({
         event: 'openrouter_rate_limit',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `⏳ Rate limit: ${data.model} (retry in 1 hour)`,
         ...data
       });
@@ -988,7 +992,7 @@ function App() {
       console.info('Free model rotated:', data);
       addActivity({
         event: 'free_model_rotated',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `🔄 Model rotated: ${data.from_model} → ${data.to_model} (${data.role_id})`,
         ...data
       });
@@ -998,7 +1002,7 @@ function App() {
       console.info('Free model auto-selector used:', data);
       addActivity({
         event: 'free_model_auto_selector_used',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `🔄 Auto-selector backup: openrouter/free used for ${data.role_id}`,
         ...data
       });
@@ -1008,7 +1012,7 @@ function App() {
       console.warn('Serial bottleneck - workflow paused:', data);
       addActivity({
         event: 'serial_bottleneck_paused',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `⏸️ SERIAL BOTTLENECK: ${data.role_id} paused for ${Math.round((data.wait_seconds || 0) / 60)} min`,
         ...data
       });
@@ -1018,7 +1022,7 @@ function App() {
       console.info('Serial bottleneck resolved:', data);
       addActivity({
         event: 'serial_bottleneck_resumed',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `▶️ SERIAL BOTTLENECK resolved: ${data.role_id} resumed`,
         ...data
       });
@@ -1028,7 +1032,7 @@ function App() {
       console.error('All free models exhausted:', data);
       addActivity({
         event: 'all_free_models_exhausted',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `❌ All free models exhausted: ${data.message}`,
         ...data
       });
@@ -1038,7 +1042,7 @@ function App() {
       console.error('Account credits exhausted:', data);
       addActivity({
         event: 'account_credits_exhausted',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `❌ Account free credits depleted: ${data.message}`,
         ...data
       });
@@ -1050,7 +1054,7 @@ function App() {
           role_id: roleId,
           reason: 'account_credits_exhausted',
           message: data.message || 'Account free credits depleted.',
-          timestamp: new Date().toISOString()
+          timestamp: getTimestamp(data)
         }];
       });
     }));
@@ -1060,7 +1064,7 @@ function App() {
       console.warn('OpenRouter fallback triggered:', data);
       addActivity({
         event: 'openrouter_fallback',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `⚠️ OpenRouter credits exhausted for ${data.role_id} — fell back to ${data.fallback_model || 'LM Studio'}`,
         ...data
       });
@@ -1073,7 +1077,7 @@ function App() {
           reason,
           message: data.message,
           fallback_model: data.fallback_model,
-          timestamp: new Date().toISOString()
+          timestamp: getTimestamp(data)
         }];
       });
     }));
@@ -1083,7 +1087,7 @@ function App() {
       console.error('OpenRouter fallback failed:', data);
       addActivity({
         event: 'openrouter_fallback_failed',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `🛑 OpenRouter credits exhausted for ${data.role_id} — NO FALLBACK configured!`,
         ...data
       });
@@ -1094,7 +1098,7 @@ function App() {
           role_id: data.role_id,
           reason: 'no_fallback_configured',
           message: data.message,
-          timestamp: new Date().toISOString()
+          timestamp: getTimestamp(data)
         }];
       });
     }));
@@ -1104,7 +1108,7 @@ function App() {
       console.warn('Boost credits exhausted:', data);
       addActivity({
         event: 'boost_credits_exhausted',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `⚠️ Boost credits exhausted for task ${data.task_id}`,
         ...data
       });
@@ -1115,7 +1119,7 @@ function App() {
           role_id: `Boost (${data.task_id || 'unknown'})`,
           reason: 'boost_credits_exhausted',
           message: data.message || 'Boost API credits exhausted. Falling back to primary model.',
-          timestamp: new Date().toISOString()
+          timestamp: getTimestamp(data)
         }];
       });
     }));
@@ -1124,7 +1128,7 @@ function App() {
       console.info('OpenRouter fallbacks reset:', data);
       addActivity({
         event: 'openrouter_fallbacks_reset',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `OpenRouter reset: ${data.message}`,
         ...data
       });
@@ -1152,7 +1156,7 @@ function App() {
     unsubscribers.push(websocket.on('final_answer_complete', (data) => {
       addActivity({
         event: 'final_answer_complete',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `Final answer complete! Format: ${data.format}`,
         data
       });
@@ -1195,7 +1199,7 @@ function App() {
       // Also add to activity log
       addActivity({
         event: 'high_score_critique',
-        timestamp: new Date().toISOString(),
+        timestamp: getTimestamp(data),
         message: `⭐ High-score critique: ${data.paper_title} (avg: ${data.average_rating})`,
         data
       });
@@ -1386,12 +1390,10 @@ function App() {
 
   const handleModeChange = (nextMode) => {
     setAppMode(nextMode);
-    setUtilityActiveTab(null);
   };
 
   const handleAutonomousTabSelect = (tabId) => {
     setAutonomousActiveTab(tabId);
-    setUtilityActiveTab(null);
     if (appMode !== 'autonomous') {
       setAppMode('autonomous');
     }
@@ -1399,16 +1401,11 @@ function App() {
 
   const handleManualTabSelect = (tabId) => {
     setManualActiveTab(tabId);
-    setUtilityActiveTab(null);
     if (appMode !== 'manual') {
       setAppMode('manual');
     }
   };
 
-  const handleUtilityTabSelect = (tabId) => {
-    setUtilityActiveTab(tabId);
-  };
-
   // Credit exhaustion notification handler
   const handleDismissCreditNotification = (notificationId) => {
     setCreditExhaustionNotifications(prev => prev.filter(n => n.id !== notificationId));
@@ -1529,7 +1526,7 @@ function App() {
   const mainTabs = [
     { id: 'auto-interface', label: 'Start Here: Autonomous Deep Research Controller', group: 'autonomous-main' },
     { id: 'auto-brainstorms', label: 'Autonomous Stage 1: Brainstorms', group: 'autonomous-main' },
-    { id: 'auto-papers', label: 'Autonomous Stage 2: Papers', subtext: '(Less Hallucinatory - Recommended Output)', subtextClass: 'green', group: 'autonomous-main' },
+    { id: 'auto-papers', label: 'Autonomous Stage 2: Papers', group: 'autonomous-main' },
     ...(autonomousConfig.tier3_enabled ? [
       { id: 'auto-final-answer', label: getFinalAnswerLabel(), subtext: '(Very Experimental and Hallucinatory)', group: 'autonomous-main' },
     ] : []),
@@ -1595,14 +1592,10 @@ function App() {
   return (
     <div className="app">
       {/* Banner Section */}
-      <div className={`app-banner ${(() => {
-        const saved = localStorage.getItem('banner_shimmer_enabled');
-        const enabled = saved !== null ? JSON.parse(saved) : true;
-        return !enabled ? 'no-shimmer' : '';
-      })()}`}>
+      <div className={`app-banner ${shimmerAccentsEnabled ? '' : 'no-shimmer'}`}>
         <div className="banner-content">
           <h1 className="banner-title">
-            <span className="banner-moto">M.O.T.O.</span>
+            <span className="banner-moto" aria-label="M.O.T.O.">M.O.T.O.</span>
             <span className="banner-subtitle">Autonomous ASI</span>
           </h1>
           <p className="banner-company">By Intrafere Research Group</p>
@@ -1636,15 +1629,6 @@ function App() {
         >
           ⚡ API Boost
         </button>
-        <button 
-          className="boost-logs-btn"
-          onClick={() => {
-            handleUtilityTabSelect('boost-logs');
-          }}
-          title="View Boost Logs"
-        >
-          Boost Logs
-        </button>
         <button 
           className="openrouter-key-btn"
           onClick={() => {
@@ -1679,7 +1663,7 @@ function App() {
         )}
       </div>
       
-      <div className={`tabs ${appMode === 'manual' ? 'tabs-manual' : ''}`}>
+      <div className={`tabs ${appMode === 'manual' ? 'tabs-manual' : ''} ${shimmerAccentsEnabled ? 'tabs-shimmer-enabled' : ''}`}>
         {appMode === 'autonomous' ? (
           <>
             {mainTabs.map((tab, index) => {
@@ -1837,7 +1821,6 @@ function App() {
               events={autonomousActivity}
             />
           )}
-          {activeTab === 'boost-logs' && <BoostLogs />}
           
           {activeTab === 'aggregator-interface' && (
             <AggregatorInterface
@@ -2047,7 +2030,7 @@ function App() {
               className="footer-link footer-link-github"
             >
               <span className="footer-icon">⭐</span>
-              Star Us on GitHub for More ASI Programs
+              Visit MOTO's GitHub (Star Us for More ASI Programs)
             </a>
           </div>
         </div>
diff --git a/frontend/src/components/BoostControlModal.jsx b/frontend/src/components/BoostControlModal.jsx
index 2d4345b..0a63b7c 100644
--- a/frontend/src/components/BoostControlModal.jsx
+++ b/frontend/src/components/BoostControlModal.jsx
@@ -1,7 +1,9 @@
-import React, { useState, useEffect } from 'react';
+import React, { useState, useEffect, useRef } from 'react';
 import { boostAPI, openRouterAPI } from '../services/api';
 import './BoostControlModal.css';
 
+const BOOST_SETTINGS_STORAGE_KEY = 'boost_modal_settings';
+
 export default function BoostControlModal({ isOpen, onClose }) {
   const [apiKey, setApiKey] = useState('');
   const [boostModel, setBoostModel] = useState('');
@@ -18,8 +20,47 @@ export default function BoostControlModal({ isOpen, onClose }) {
   const [boostStatus, setBoostStatus] = useState(null);
   const [freeOnly, setFreeOnly] = useState(false);
   const [hasGlobalKey, setHasGlobalKey] = useState(false);
+  
+  // Track mouse down position to prevent closing on text selection drag
+  const mouseDownTargetRef = useRef(null);
 
   const hasAvailableKey = Boolean(apiKey.trim() || hasGlobalKey);
+  
+  // Load saved settings from localStorage on mount
+  useEffect(() => {
+    try {
+      const saved = localStorage.getItem(BOOST_SETTINGS_STORAGE_KEY);
+      if (saved) {
+        const settings = JSON.parse(saved);
+        if (settings.boostModel) setBoostModel(settings.boostModel);
+        if (settings.selectedProvider) setSelectedProvider(settings.selectedProvider);
+        if (settings.contextWindow) setContextWindow(settings.contextWindow);
+        if (settings.maxOutputTokens) setMaxOutputTokens(settings.maxOutputTokens);
+        if (settings.freeOnly !== undefined) setFreeOnly(settings.freeOnly);
+      }
+    } catch (e) {
+      console.error('Failed to load boost settings from localStorage:', e);
+    }
+  }, []);
+  
+  // Save settings to localStorage whenever they change
+  useEffect(() => {
+    // Only save if we have meaningful values (not initial empty state)
+    if (boostModel || selectedProvider || contextWindow !== 131072 || maxOutputTokens !== 25000 || freeOnly) {
+      try {
+        const settings = {
+          boostModel,
+          selectedProvider,
+          contextWindow,
+          maxOutputTokens,
+          freeOnly
+        };
+        localStorage.setItem(BOOST_SETTINGS_STORAGE_KEY, JSON.stringify(settings));
+      } catch (e) {
+        console.error('Failed to save boost settings to localStorage:', e);
+      }
+    }
+  }, [boostModel, selectedProvider, contextWindow, maxOutputTokens, freeOnly]);
 
   const fetchProviders = async (modelId, keyOverride = undefined) => {
     if (!modelId) {
@@ -53,6 +94,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
       if (response.status) {
         setBoostStatus(response.status);
         if (response.status.enabled) {
+          // Boost is enabled - use backend values (they're authoritative)
           setBoostModel(response.status.model_id);
           setSelectedProvider(response.status.provider || '');
           setContextWindow(response.status.context_window);
@@ -60,8 +102,23 @@ export default function BoostControlModal({ isOpen, onClose }) {
           if (response.status.model_id) {
             await fetchProviders(response.status.model_id, effectiveKey);
           }
+          
+          // Also save to localStorage so settings persist even if backend restarts
+          try {
+            const settings = {
+              boostModel: response.status.model_id,
+              selectedProvider: response.status.provider || '',
+              contextWindow: response.status.context_window,
+              maxOutputTokens: response.status.max_output_tokens,
+              freeOnly
+            };
+            localStorage.setItem(BOOST_SETTINGS_STORAGE_KEY, JSON.stringify(settings));
+          } catch (e) {
+            console.error('Failed to sync boost settings to localStorage:', e);
+          }
         } else {
           setProviders([]);
+          // Boost not enabled - localStorage values are already loaded in useEffect
         }
       }
     } catch (error) {
@@ -258,11 +315,29 @@ export default function BoostControlModal({ isOpen, onClose }) {
     }
   };
 
+  // Handle overlay click - only close if mousedown AND mouseup both happened on overlay
+  // This prevents closing when user drags to select text in inputs
+  const handleOverlayMouseDown = (e) => {
+    mouseDownTargetRef.current = e.target;
+  };
+  
+  const handleOverlayClick = (e) => {
+    // Only close if both mousedown and click happened on the overlay itself
+    if (e.target === e.currentTarget && mouseDownTargetRef.current === e.currentTarget) {
+      onClose();
+    }
+    mouseDownTargetRef.current = null;
+  };
+
   if (!isOpen) return null;
 
   return (
-    <div className="modal-overlay" onClick={onClose}>
-      <div className="boost-modal" onClick={(e) => e.stopPropagation()}>
+    <div 
+      className="modal-overlay" 
+      onMouseDown={handleOverlayMouseDown}
+      onClick={handleOverlayClick}
+    >
+      <div className="boost-modal">
         <div className="modal-header">
           <h2>API Boost Configuration</h2>
           <button className="close-btn" onClick={onClose}>×</button>
@@ -378,7 +453,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
               <input
                 type="number"
                 value={contextWindow}
-                onChange={(e) => setContextWindow(parseInt(e.target.value))}
+                onChange={(e) => setContextWindow(parseInt(e.target.value) || 131072)}
                 min="4096"
                 max="999999"
                 step="1024"
@@ -391,7 +466,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
               <input
                 type="number"
                 value={maxOutputTokens}
-                onChange={(e) => setMaxOutputTokens(parseInt(e.target.value))}
+                onChange={(e) => setMaxOutputTokens(parseInt(e.target.value) || 25000)}
                 min="1000"
                 max="100000"
                 step="1000"
diff --git a/frontend/src/components/BoostLogs.css b/frontend/src/components/BoostLogs.css
deleted file mode 100644
index 720dd46..0000000
--- a/frontend/src/components/BoostLogs.css
+++ /dev/null
@@ -1,361 +0,0 @@
-.boost-logs-container {
-  padding: 1.5rem;
-  max-width: 1200px;
-  margin: 0 auto;
-}
-
-.boost-logs-header {
-  display: flex;
-  justify-content: space-between;
-  align-items: center;
-  margin-bottom: 1.5rem;
-}
-
-.boost-logs-header h2 {
-  margin: 0;
-  color: var(--gold, #1eff1c);
-  font-size: 1.5rem;
-}
-
-.boost-logs-actions {
-  display: flex;
-  gap: 0.75rem;
-  align-items: center;
-}
-
-.auto-refresh-toggle {
-  display: flex;
-  align-items: center;
-  gap: 0.5rem;
-  color: #888;
-  font-size: 0.9rem;
-  cursor: pointer;
-}
-
-.auto-refresh-toggle input {
-  cursor: pointer;
-}
-
-.refresh-btn {
-  background: #2a2a2a;
-  border: 1px solid #444;
-  border-radius: 4px;
-  padding: 0.5rem;
-  cursor: pointer;
-  font-size: 1rem;
-  transition: all 0.2s;
-}
-
-.refresh-btn:hover {
-  background: #333;
-  border-color: #555;
-}
-
-.clear-btn {
-  background: #dc3545;
-  border: none;
-  border-radius: 4px;
-  padding: 0.5rem 1rem;
-  color: #fff;
-  font-size: 0.9rem;
-  cursor: pointer;
-  transition: background 0.2s;
-}
-
-.clear-btn:hover:not(:disabled) {
-  background: #c82333;
-}
-
-.clear-btn:disabled {
-  background: #555;
-  cursor: not-allowed;
-}
-
-/* Stats */
-.boost-stats {
-  display: grid;
-  grid-template-columns: repeat(4, 1fr);
-  gap: 1rem;
-  margin-bottom: 1rem;
-}
-
-.stat-card {
-  background: var(--surface-3, #22222c);
-  border: 1px solid var(--border-default, rgba(255,255,255,0.1));
-  border-radius: var(--radius-md, 10px);
-  padding: 1rem;
-  text-align: center;
-}
-
-.stat-card.success {
-  border-color: rgba(76, 175, 80, 0.35);
-}
-
-.stat-card.error {
-  border-color: rgba(220, 53, 69, 0.35);
-}
-
-.stat-value {
-  display: block;
-  font-size: 1.75rem;
-  font-weight: 700;
-  color: var(--gold, #1eff1c);
-  margin-bottom: 0.25rem;
-}
-
-.stat-card.success .stat-value {
-  color: #4CAF50;
-}
-
-.stat-card.error .stat-value {
-  color: #dc3545;
-}
-
-.stat-label {
-  font-size: 0.8rem;
-  color: #888;
-  text-transform: uppercase;
-  letter-spacing: 0.5px;
-}
-
-.boost-mode-stats {
-  display: flex;
-  align-items: center;
-  gap: 0.5rem;
-  margin-bottom: 1.5rem;
-  flex-wrap: wrap;
-}
-
-.mode-stats-label {
-  color: #888;
-  font-size: 0.85rem;
-}
-
-.mode-stat-badge {
-  background: #333;
-  border: 1px solid #444;
-  border-radius: 4px;
-  padding: 0.25rem 0.5rem;
-  font-size: 0.8rem;
-  color: #aaa;
-}
-
-/* Logs List */
-.boost-logs-list {
-  border: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
-  border-radius: var(--radius-md, 10px);
-  overflow: hidden;
-}
-
-.logs-loading,
-.logs-empty {
-  padding: 3rem;
-  text-align: center;
-  color: #666;
-}
-
-.logs-empty p {
-  margin: 0.5rem 0;
-}
-
-.logs-empty-hint {
-  font-size: 0.85rem;
-  font-style: italic;
-}
-
-.boost-log-entry {
-  border-bottom: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
-  background: var(--surface-2, #1a1a22);
-}
-
-.boost-log-entry:last-child {
-  border-bottom: none;
-}
-
-.boost-log-entry.success {
-  border-left: 3px solid var(--accent-green, #4CAF50);
-}
-
-.boost-log-entry.error {
-  border-left: 3px solid #dc3545;
-}
-
-.log-summary {
-  display: grid;
-  grid-template-columns: auto 1fr auto auto;
-  gap: 1rem;
-  padding: 1rem;
-  cursor: pointer;
-  align-items: center;
-  transition: background 0.2s;
-}
-
-.log-summary:hover {
-  background: var(--surface-3, #22222c);
-}
-
-.log-status {
-  width: 24px;
-  height: 24px;
-  display: flex;
-  align-items: center;
-  justify-content: center;
-  font-size: 1rem;
-  font-weight: 700;
-}
-
-.boost-log-entry.success .log-status {
-  color: #4CAF50;
-}
-
-.boost-log-entry.error .log-status {
-  color: #dc3545;
-}
-
-.log-info {
-  display: flex;
-  flex-direction: column;
-  gap: 0.25rem;
-  min-width: 0;
-}
-
-.log-task {
-  display: flex;
-  align-items: center;
-  gap: 0.5rem;
-}
-
-.log-task-id {
-  font-weight: 600;
-  color: #fff;
-  font-family: 'Consolas', 'Monaco', monospace;
-  font-size: 0.9rem;
-}
-
-.log-mode-badge {
-  background: var(--gold, #1eff1c);
-  color: #000;
-  padding: 0.15rem 0.4rem;
-  border-radius: var(--radius-sm, 6px);
-  font-size: 0.7rem;
-  font-weight: 600;
-  text-transform: uppercase;
-}
-
-.log-meta {
-  display: flex;
-  gap: 1rem;
-  font-size: 0.8rem;
-  color: #888;
-}
-
-.log-model {
-  max-width: 200px;
-  overflow: hidden;
-  text-overflow: ellipsis;
-  white-space: nowrap;
-}
-
-.log-timestamp {
-  color: #666;
-  font-size: 0.8rem;
-  white-space: nowrap;
-}
-
-.log-expand-icon {
-  color: #666;
-  font-size: 0.8rem;
-}
-
-/* Log Details (Expanded) */
-.log-details {
-  padding: 1rem;
-  background: var(--surface-0, #0b0b0f);
-  border-top: 1px solid var(--border-subtle, rgba(255,255,255,0.07));
-}
-
-.log-detail-section {
-  margin-bottom: 1rem;
-}
-
-.log-detail-section:last-child {
-  margin-bottom: 0;
-}
-
-.log-detail-section h4 {
-  margin: 0 0 0.5rem 0;
-  color: #888;
-  font-size: 0.8rem;
-  text-transform: uppercase;
-  letter-spacing: 0.5px;
-}
-
-.log-detail-section.error h4 {
-  color: #dc3545;
-}
-
-.log-detail-section pre {
-  margin: 0;
-  padding: 0.75rem;
-  background: #1a1a1a;
-  border: 1px solid #333;
-  border-radius: 4px;
-  font-family: 'Consolas', 'Monaco', monospace;
-  font-size: 0.85rem;
-  color: #ccc;
-  white-space: pre-wrap;
-  word-break: break-word;
-  max-height: 300px;
-  overflow-y: auto;
-}
-
-.log-detail-section.error pre {
-  border-color: #dc3545;
-  color: #f8d7da;
-}
-
-.log-preview {
-  max-height: 150px;
-}
-
-.log-response {
-  max-height: 400px;
-}
-
-/* Scrollbar styling */
-.log-detail-section pre::-webkit-scrollbar,
-.boost-logs-list::-webkit-scrollbar {
-  width: 6px;
-}
-
-.log-detail-section pre::-webkit-scrollbar-track,
-.boost-logs-list::-webkit-scrollbar-track {
-  background: #1a1a1a;
-}
-
-.log-detail-section pre::-webkit-scrollbar-thumb,
-.boost-logs-list::-webkit-scrollbar-thumb {
-  background: #444;
-  border-radius: 3px;
-}
-
-.log-detail-section pre::-webkit-scrollbar-thumb:hover,
-.boost-logs-list::-webkit-scrollbar-thumb:hover {
-  background: #555;
-}
-
-/* Responsive */
-@media (max-width: 768px) {
-  .boost-stats {
-    grid-template-columns: repeat(2, 1fr);
-  }
-  
-  .log-summary {
-    grid-template-columns: auto 1fr auto;
-  }
-  
-  .log-timestamp {
-    display: none;
-  }
-}
-
diff --git a/frontend/src/components/BoostLogs.jsx b/frontend/src/components/BoostLogs.jsx
deleted file mode 100644
index f0def8e..0000000
--- a/frontend/src/components/BoostLogs.jsx
+++ /dev/null
@@ -1,239 +0,0 @@
-import React, { useState, useEffect, useCallback } from 'react';
-import { boostAPI } from '../services/api';
-import { websocket } from '../services/websocket';
-import './BoostLogs.css';
-
-export default function BoostLogs() {
-  const [logs, setLogs] = useState([]);
-  const [stats, setStats] = useState(null);
-  const [loading, setLoading] = useState(true);
-  const [expandedIndex, setExpandedIndex] = useState(null);
-  const [autoRefresh, setAutoRefresh] = useState(true);
-
-  // Fetch logs from API
-  const fetchLogs = useCallback(async () => {
-    try {
-      const response = await boostAPI.getLogs(100);
-      if (response.success) {
-        setLogs(response.logs || []);
-        setStats(response.stats || null);
-      }
-    } catch (error) {
-      console.error('Failed to fetch boost logs:', error);
-    } finally {
-      setLoading(false);
-    }
-  }, []);
-
-  // Initial fetch and auto-refresh
-  useEffect(() => {
-    fetchLogs();
-
-    let interval;
-    if (autoRefresh) {
-      interval = setInterval(fetchLogs, 5000);
-    }
-
-    return () => {
-      if (interval) clearInterval(interval);
-    };
-  }, [fetchLogs, autoRefresh]);
-
-  // Handle WebSocket events for real-time updates
-  useEffect(() => {
-    const handleBoostCallCompleted = () => {
-      // Refresh logs when a boost call completes
-      fetchLogs();
-    };
-
-    websocket.on('boost_call_completed', handleBoostCallCompleted);
-    
-    return () => {
-      websocket.off('boost_call_completed', handleBoostCallCompleted);
-    };
-  }, [fetchLogs]);
-
-  // Handle clear logs
-  const handleClearLogs = async () => {
-    if (!window.confirm('Are you sure you want to clear all boost logs?')) {
-      return;
-    }
-
-    try {
-      await boostAPI.clearLogs();
-      setLogs([]);
-      setStats(null);
-      setExpandedIndex(null);
-    } catch (error) {
-      console.error('Failed to clear logs:', error);
-    }
-  };
-
-  // Toggle log expansion
-  const toggleExpand = (index) => {
-    setExpandedIndex(expandedIndex === index ? null : index);
-  };
-
-  // Format timestamp
-  const formatTimestamp = (timestamp) => {
-    try {
-      const date = new Date(timestamp);
-      return date.toLocaleString();
-    } catch {
-      return timestamp;
-    }
-  };
-
-  // Format duration
-  const formatDuration = (ms) => {
-    if (ms === null || ms === undefined) return '-';
-    if (ms < 1000) return `${Math.round(ms)}ms`;
-    return `${(ms / 1000).toFixed(1)}s`;
-  };
-
-  // Get boost mode label
-  const getBoostModeLabel = (mode) => {
-    switch (mode) {
-      case 'next_count': return 'Next X';
-      case 'category': return 'Category';
-      case 'task_id': return 'Task ID';
-      default: return mode || 'Unknown';
-    }
-  };
-
-  return (
-    <div className="boost-logs-container">
-      <div className="boost-logs-header">
-        <h2>Boost API Logs</h2>
-        <div className="boost-logs-actions">
-          <label className="auto-refresh-toggle">
-            <input
-              type="checkbox"
-              checked={autoRefresh}
-              onChange={(e) => setAutoRefresh(e.target.checked)}
-            />
-            Auto-refresh
-          </label>
-          <button onClick={fetchLogs} className="refresh-btn" title="Refresh now">
-            Refresh
-          </button>
-          <button 
-            onClick={handleClearLogs} 
-            className="clear-btn"
-            disabled={logs.length === 0}
-          >
-            Clear Logs
-          </button>
-        </div>
-      </div>
-
-      {/* Stats Summary */}
-      {stats && (
-        <div className="boost-stats">
-          <div className="stat-card">
-            <span className="stat-value">{stats.total_calls}</span>
-            <span className="stat-label">Total Calls</span>
-          </div>
-          <div className="stat-card success">
-            <span className="stat-value">{stats.successful_calls}</span>
-            <span className="stat-label">Successful</span>
-          </div>
-          <div className="stat-card error">
-            <span className="stat-value">{stats.failed_calls}</span>
-            <span className="stat-label">Failed</span>
-          </div>
-          <div className="stat-card">
-            <span className="stat-value">
-              {(stats.success_rate * 100).toFixed(1)}%
-            </span>
-            <span className="stat-label">Success Rate</span>
-          </div>
-        </div>
-      )}
-
-      {/* Stats by Mode */}
-      {stats && stats.by_mode && Object.keys(stats.by_mode).length > 0 && (
-        <div className="boost-mode-stats">
-          <span className="mode-stats-label">By Mode:</span>
-          {Object.entries(stats.by_mode).map(([mode, count]) => (
-            <span key={mode} className="mode-stat-badge">
-              {getBoostModeLabel(mode)}: {count}
-            </span>
-          ))}
-        </div>
-      )}
-
-      {/* Logs List */}
-      <div className="boost-logs-list">
-        {loading ? (
-          <div className="logs-loading">Loading boost logs...</div>
-        ) : logs.length === 0 ? (
-          <div className="logs-empty">
-            <p>No boost API calls logged yet.</p>
-            <p className="logs-empty-hint">
-              Enable boost and make API calls to see logs here.
-            </p>
-          </div>
-        ) : (
-          logs.map((log, index) => (
-            <div 
-              key={index} 
-              className={`boost-log-entry ${log.success ? 'success' : 'error'} ${expandedIndex === index ? 'expanded' : ''}`}
-            >
-              <div 
-                className="log-summary"
-                onClick={() => toggleExpand(index)}
-              >
-                <div className="log-status">
-                  {log.success ? '✓' : '✗'}
-                </div>
-                <div className="log-info">
-                  <div className="log-task">
-                    <span className="log-task-id">{log.task_id}</span>
-                    <span className="log-mode-badge">{getBoostModeLabel(log.boost_mode)}</span>
-                  </div>
-                  <div className="log-meta">
-                    <span className="log-model">{log.model}</span>
-                    <span className="log-duration">{formatDuration(log.duration_ms)}</span>
-                    {log.tokens_used && (
-                      <span className="log-tokens">{log.tokens_used} tokens</span>
-                    )}
-                  </div>
-                </div>
-                <div className="log-timestamp">{formatTimestamp(log.timestamp)}</div>
-                <div className="log-expand-icon">{expandedIndex === index ? '▼' : '▶'}</div>
-              </div>
-
-              {expandedIndex === index && (
-                <div className="log-details">
-                  <div className="log-detail-section">
-                    <h4>Role</h4>
-                    <pre>{log.role_id}</pre>
-                  </div>
-
-                  {log.error && (
-                    <div className="log-detail-section error">
-                      <h4>Error</h4>
-                      <pre>{log.error}</pre>
-                    </div>
-                  )}
-
-                  <div className="log-detail-section">
-                    <h4>Prompt Preview</h4>
-                    <pre className="log-preview">{log.prompt_preview || '(empty)'}</pre>
-                  </div>
-
-                  <div className="log-detail-section">
-                    <h4>Response</h4>
-                    <pre className="log-response">{log.response_full || log.response_preview || '(empty)'}</pre>
-                  </div>
-                </div>
-              )}
-            </div>
-          ))
-        )}
-      </div>
-    </div>
-  );
-}
-
diff --git a/frontend/src/components/WorkflowPanel.css b/frontend/src/components/WorkflowPanel.css
index 36f885f..a47c3e0 100644
--- a/frontend/src/components/WorkflowPanel.css
+++ b/frontend/src/components/WorkflowPanel.css
@@ -144,9 +144,30 @@
 }
 
 .boost-categories {
+  display: flex;
+  flex-direction: column;
+  gap: 0.5rem;
+}
+
+.boost-category-group {
+  display: flex;
+  flex-direction: column;
+  gap: 0.25rem;
+}
+
+.boost-group-label {
+  font-size: 0.68rem;
+  font-weight: 600;
+  text-transform: uppercase;
+  letter-spacing: 0.06em;
+  color: var(--text-muted);
+  padding-left: 0.1rem;
+}
+
+.boost-category-row {
   display: flex;
   flex-wrap: wrap;
-  gap: 0.35rem;
+  gap: 0.3rem;
 }
 
 .category-btn {
@@ -173,201 +194,60 @@
   font-weight: 600;
 }
 
-.boost-disabled-notice {
-  padding: 0.75rem 1rem;
-  background: var(--surface-1);
-  border-bottom: 1px solid var(--border-subtle);
-  font-size: 0.8rem;
-  color: var(--text-muted);
-  text-align: center;
-  font-style: italic;
-}
-
-.workflow-tasks {
-  flex: 1;
-  overflow-y: auto;
-  padding: 0.5rem;
-}
-
-.no-tasks {
-  text-align: center;
-  padding: 2rem 1rem;
-  color: var(--text-muted);
-  font-style: italic;
-}
-
-.task-card {
-  background: var(--surface-3);
-  border: 1px solid var(--border-subtle);
-  border-radius: var(--radius-sm);
-  padding: 0.75rem;
-  margin-bottom: 0.5rem;
-  display: grid;
-  grid-template-columns: auto 1fr auto auto;
-  gap: 0.75rem;
-  align-items: center;
-  transition: all var(--transition-fast);
-}
-
-.task-card:hover:not(.completed) {
-  background: var(--surface-4);
-  border-color: var(--border-default);
-  transform: translateX(-2px);
-}
-
-.task-card.boosted {
-  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
-  border-color: var(--gold);
-  color: #000;
-}
-
-.task-card.boosted .task-role,
-.task-card.boosted .task-mode,
-.task-card.boosted .task-provider {
-  color: #000;
-}
-
-.task-card.active {
-  background: #2563eb;
-  border-color: #3b82f6;
-  animation: pulse 2s ease-in-out infinite;
-}
-
-@keyframes pulse {
-  0%, 100% {
-    opacity: 1;
-  }
-  50% {
-    opacity: 0.8;
-  }
-}
-
-.task-card.completed {
-  background: rgba(76, 175, 80, 0.1);
-  border-color: rgba(76, 175, 80, 0.3);
-  opacity: 0.7;
-}
-
-.task-number {
-  font-weight: 700;
-  font-size: 0.85rem;
-  color: var(--text-muted);
-  min-width: 30px;
-}
-
-.task-card.boosted .task-number {
-  color: #000;
-}
-
-.task-card.active .task-number,
-.task-card.completed .task-number {
-  color: #fff;
-}
-
-.task-info {
-  display: flex;
-  flex-direction: column;
-  gap: 0.25rem;
-}
-
-.task-role {
-  font-weight: 600;
-  font-size: 0.9rem;
-  color: #fff;
-}
-
-.task-mode {
-  font-size: 0.75rem;
-  color: var(--text-secondary);
-}
-
-.task-card.boosted .task-mode {
-  color: #333;
+.boost-always-prefer-row {
+  margin-top: 0.1rem;
 }
 
-.task-badges {
+.boost-always-prefer-label {
   display: flex;
-  gap: 0.5rem;
   align-items: center;
+  gap: 0.5rem;
+  cursor: pointer;
+  font-size: 0.8rem;
+  color: var(--text-secondary);
 }
 
-.boost-icon {
-  font-size: 1.2rem;
-}
-
-.completed-icon {
-  color: #4CAF50;
-  font-size: 1.2rem;
-  font-weight: 700;
+.boost-always-prefer-label:has(.boost-always-prefer-checkbox:not(:disabled)) {
+  color: var(--text-primary);
 }
 
-.active-icon {
-  color: #fff;
-  font-size: 1.2rem;
-  animation: spin 2s linear infinite;
+.boost-always-prefer-checkbox {
+  width: 14px;
+  height: 14px;
+  flex-shrink: 0;
+  accent-color: var(--gold);
+  cursor: pointer;
 }
 
-@keyframes spin {
-  from {
-    transform: rotate(0deg);
-  }
-  to {
-    transform: rotate(360deg);
-  }
+.boost-always-prefer-hint {
+  margin-top: 0.25rem;
+  font-size: 0.72rem;
+  color: var(--gold);
+  font-style: italic;
+  padding-left: 1.5rem;
 }
 
-.task-provider {
+.boost-or-divider {  text-align: center;
   font-size: 0.7rem;
-  font-weight: 600;
   color: var(--text-muted);
-  background: var(--surface-2);
-  padding: 0.25rem 0.5rem;
-  border-radius: var(--radius-sm);
+  letter-spacing: 0.08em;
+  margin: 0.35rem 0;
+  user-select: none;
 }
 
-.task-card.boosted .task-provider {
-  background: rgba(0, 0, 0, 0.2);
-  color: #000;
+.boost-mode-inactive {
+  opacity: 0.35;
+  pointer-events: none;
 }
 
-.workflow-legend {
+.boost-disabled-notice {
   padding: 0.75rem 1rem;
-  border-top: 1px solid var(--border-subtle);
-  background: var(--surface-0);
-  display: grid;
-  grid-template-columns: 1fr 1fr;
-  gap: 0.5rem;
-  font-size: 0.75rem;
-}
-
-.legend-item {
-  display: flex;
-  align-items: center;
-  gap: 0.5rem;
-  color: var(--text-secondary);
-}
-
-.legend-color {
-  width: 16px;
-  height: 16px;
-  border-radius: var(--radius-sm);
-  border: 1px solid var(--border-default);
-}
-
-.legend-color.default {
-  background: var(--surface-3);
-}
-
-.legend-color.boosted {
-  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
-}
-
-.legend-color.active {
-  background: #2563eb;
-}
-
-.legend-color.completed {
-  background: rgba(76, 175, 80, 0.25);
+  background: var(--surface-1);
+  border-bottom: 1px solid var(--border-subtle);
+  font-size: 0.8rem;
+  color: var(--text-muted);
+  text-align: center;
+  font-style: italic;
 }
 
 /* Token Stats & Research Timer */
@@ -505,22 +385,3 @@
 .model-out {
   color: #e8a86a;
 }
-
-/* Scrollbar styling */
-.workflow-tasks::-webkit-scrollbar {
-  width: 6px;
-}
-
-.workflow-tasks::-webkit-scrollbar-track {
-  background: var(--surface-1);
-}
-
-.workflow-tasks::-webkit-scrollbar-thumb {
-  background: var(--surface-4);
-  border-radius: 3px;
-}
-
-.workflow-tasks::-webkit-scrollbar-thumb:hover {
-  background: var(--border-strong);
-}
-
diff --git a/frontend/src/components/WorkflowPanel.jsx b/frontend/src/components/WorkflowPanel.jsx
index efe0569..fd868e7 100644
--- a/frontend/src/components/WorkflowPanel.jsx
+++ b/frontend/src/components/WorkflowPanel.jsx
@@ -13,16 +13,17 @@ const formatTime = (totalSeconds) => {
 };
 
 export default function WorkflowPanel({ isRunning }) {
-  const [tasks, setTasks] = useState([]);
   const [collapsed, setCollapsed] = useState(false);
   const [mode, setMode] = useState('idle');
   
-  // NEW: Boost controls state
+  // Boost controls state
   const [boostNextCount, setBoostNextCount] = useState(0);
   const [boostNextInput, setBoostNextInput] = useState('');
+  const [isEditingBoostNext, setIsEditingBoostNext] = useState(false);
   const [boostedCategories, setBoostedCategories] = useState([]);
   const [availableCategories, setAvailableCategories] = useState([]);
   const [boostEnabled, setBoostEnabled] = useState(false);
+  const [boostAlwaysPrefer, setBoostAlwaysPrefer] = useState(false);
 
   // Token tracking & timer state
   const [tokenStats, setTokenStats] = useState({ total_input: 0, total_output: 0, by_model: {}, elapsed_seconds: 0 });
@@ -43,17 +44,18 @@ export default function WorkflowPanel({ isRunning }) {
         setBoostEnabled(statusResponse.status.enabled);
         setBoostNextCount(statusResponse.status.boost_next_count || 0);
         setBoostedCategories(statusResponse.status.boosted_categories || []);
+        setBoostAlwaysPrefer(statusResponse.status.boost_always_prefer || false);
       }
       
-      // Fetch categories for current mode
-      const categoriesResponse = await boostAPI.getCategories(mode === 'idle' ? 'all' : mode);
+      // Always fetch all categories (no mode filter)
+      const categoriesResponse = await boostAPI.getCategories('all');
       if (categoriesResponse.success) {
         setAvailableCategories(categoriesResponse.categories || []);
       }
     } catch (error) {
       console.debug('Failed to fetch boost status:', error);
     }
-  }, [mode]);
+  }, []);
 
   // Fetch boost status on mount and when running state changes
   // ETERNAL: Always fetch boost status, even when not running
@@ -71,6 +73,12 @@ export default function WorkflowPanel({ isRunning }) {
     }
   }, [boostEnabled, expandPanel]);
 
+  useEffect(() => {
+    if (!isEditingBoostNext) {
+      setBoostNextInput(boostNextCount > 0 ? boostNextCount.toString() : '');
+    }
+  }, [boostNextCount, isEditingBoostNext]);
+
   // Handle setting boost next count
   const handleSetBoostNextCount = async () => {
     const count = parseInt(boostNextInput, 10);
@@ -81,15 +89,26 @@ export default function WorkflowPanel({ isRunning }) {
     try {
       await boostAPI.setNextCount(count);
       setBoostNextCount(count);
-      setBoostNextInput('');
+      setBoostNextInput(count > 0 ? count.toString() : '');
+      setIsEditingBoostNext(false);
     } catch (error) {
       console.error('Failed to set boost count:', error);
     }
   };
 
-  // Handle category toggle
-  const handleCategoryToggle = async (categoryId) => {
+  // Handle always-prefer toggle
+  const handleAlwaysPreferToggle = async () => {
     try {
+      const newValue = !boostAlwaysPrefer;
+      await boostAPI.setAlwaysPrefer(newValue);
+      setBoostAlwaysPrefer(newValue);
+    } catch (error) {
+      console.error('Failed to toggle always-prefer boost:', error);
+    }
+  };
+
+  // Handle category toggle
+  const handleCategoryToggle = async (categoryId) => {    try {
       const response = await boostAPI.toggleCategory(categoryId);
       if (response.success) {
         setBoostedCategories(response.all_boosted_categories || []);
@@ -134,219 +153,42 @@ export default function WorkflowPanel({ isRunning }) {
     return () => clearInterval(interval);
   }, [isRunning]);
 
-  // Poll for workflow predictions when running
+  // Fetch current workflow mode when running
   useEffect(() => {
     if (!isRunning) {
-      setTasks([]);
       setMode('idle');
       return;
     }
 
-    // Helper to merge incoming tasks while preserving local boost state
-    // (in case backend hasn't updated yet)
-    const mergeTasksPreservingBoost = (incomingTasks, existingTasks) => {
-      // Create a map of existing boost states
-      const existingBoostStates = {};
-      existingTasks.forEach(t => {
-        existingBoostStates[t.task_id] = t.using_boost;
-      });
-      
-      // Merge: Use backend boost state if set, otherwise preserve local state
-      return incomingTasks.map(task => ({
-        ...task,
-        // Backend boost state takes precedence, but preserve local if backend shows false
-        // (in case there's a race condition)
-        using_boost: task.using_boost || existingBoostStates[task.task_id] || false
-      }));
-    };
-
-    // Initial fetch
-    const fetchWorkflow = async () => {
+    const fetchMode = async () => {
       try {
         const response = await workflowAPI.getPredictions();
-        console.log('Workflow predictions response:', response);
         if (response.success) {
-          if (response.tasks && response.tasks.length > 0) {
-            // Merge incoming tasks with existing, preserving boost state
-            setTasks(prevTasks => mergeTasksPreservingBoost(response.tasks, prevTasks));
-            setMode(response.mode || 'unknown');
-          } else {
-            // No tasks yet - generate placeholder predictions
-            console.log('No tasks from backend, generating placeholders');
-            setTasks(prevTasks => {
-              // Preserve any existing boost states when generating placeholders
-              const placeholderTasks = generatePlaceholderTasks(response.mode || 'aggregator');
-              return mergeTasksPreservingBoost(placeholderTasks, prevTasks);
-            });
-            setMode(response.mode || 'aggregator');
-          }
+          setMode(response.mode || 'idle');
         }
       } catch (error) {
-        console.error('Failed to fetch workflow predictions:', error);
-        // Generate placeholder tasks on error, preserving boost state
-        setTasks(prevTasks => {
-          const placeholderTasks = generatePlaceholderTasks('aggregator');
-          return mergeTasksPreservingBoost(placeholderTasks, prevTasks);
-        });
-        setMode('aggregator');
+        console.debug('Failed to fetch workflow mode:', error);
       }
     };
 
-    fetchWorkflow();
-
-    // Poll every 3 seconds while running
-    const interval = setInterval(fetchWorkflow, 3000);
-
+    fetchMode();
+    const interval = setInterval(fetchMode, 5000);
     return () => clearInterval(interval);
   }, [isRunning]);
 
-  // Generate placeholder tasks when backend hasn't generated them yet
-  const generatePlaceholderTasks = (detectedMode) => {
-    const tasks = [];
-    const numSubmitters = 3; // Default
-    
-    if (detectedMode === 'aggregator') {
-      // Generate aggregator pattern: S1, S2, S3, V, S1, S2, S3, V...
-      for (let i = 0; i < 20; i++) {
-        const cyclePos = i % 4;
-        if (cyclePos < 3) {
-          const submitterId = cyclePos + 1;
-          tasks.push({
-            task_id: `agg_sub${submitterId}_${String(i).padStart(3, '0')}`,
-            sequence_number: i + 1,
-            role: `Submitter ${submitterId}${submitterId === 1 ? ' (Main Submitter)' : ''}`,
-            mode: null,
-            provider: 'lm_studio',
-            using_boost: false,
-            completed: false,
-            active: false
-          });
-        } else {
-          tasks.push({
-            task_id: `agg_val_${String(i).padStart(3, '0')}`,
-            sequence_number: i + 1,
-            role: 'Validator',
-            mode: null,
-            provider: 'lm_studio',
-            using_boost: false,
-            completed: false,
-            active: false
-          });
-        }
-      }
-    } else if (detectedMode === 'compiler') {
-      // Generate compiler pattern
-      const pattern = ['High-Context', 'Validator', 'High-Context', 'Validator'];
-      for (let i = 0; i < 20; i++) {
-        const role = pattern[i % pattern.length];
-        tasks.push({
-          task_id: `comp_${role === 'Validator' ? 'val' : 'hc'}_${String(i).padStart(3, '0')}`,
-          sequence_number: i + 1,
-          role: role,
-          mode: role === 'High-Context' ? 'Construction' : 'Review',
-          provider: 'lm_studio',
-          using_boost: false,
-          completed: false,
-          active: false
-        });
-      }
-    }
-    
-    return tasks;
-  };
-
   useEffect(() => {
     if (!isRunning) {
       return;
     }
 
-    // Subscribe to workflow events
-    const handleWorkflowUpdated = (data) => {
-      if (data.tasks) {
-        // Merge incoming tasks while preserving local boost state
-        setTasks(prevTasks => {
-          const existingBoostStates = {};
-          prevTasks.forEach(t => {
-            existingBoostStates[t.task_id] = t.using_boost;
-          });
-          
-          return data.tasks.map(task => ({
-            ...task,
-            using_boost: task.using_boost || existingBoostStates[task.task_id] || false
-          }));
-        });
-        setMode(data.mode || 'unknown');
-      }
-    };
-
-    const handleTaskCompleted = async (data) => {
-      // Mark task as completed locally
-      setTasks(prevTasks => 
-        prevTasks.map(task => 
-          task.task_id === data.task_id 
-            ? { ...task, completed: true, active: false }
-            : task
-        )
-      );
-      
-      // Request fresh predictions from backend to get updated task list
-      try {
-        const response = await workflowAPI.getPredictions();
-        if (response.success && response.tasks && response.tasks.length > 0) {
-          setTasks(prevTasks => {
-            // Preserve boost states when merging new predictions
-            const existingBoostStates = {};
-            prevTasks.forEach(t => {
-              existingBoostStates[t.task_id] = t.using_boost;
-            });
-            
-            return response.tasks.map(task => ({
-              ...task,
-              using_boost: task.using_boost || existingBoostStates[task.task_id] || false
-            }));
-          });
-          setMode(response.mode || 'unknown');
-        }
-      } catch (error) {
-        console.debug('Failed to fetch updated predictions after task completion:', error);
-      }
-    };
-
-    const handleTaskStarted = (data) => {
-      setTasks(prevTasks => 
-        prevTasks.map(task => ({
-          ...task,
-          active: task.task_id === data.task_id
-        }))
-      );
-    };
-
-    const handleBoostToggled = (data) => {
-      setTasks(prevTasks => 
-        prevTasks.map(task => 
-          task.task_id === data.task_id 
-            ? { ...task, using_boost: data.boosted }
-            : task
-        )
-      );
-    };
-
-    const handleFallback = (data) => {
-      // Update tasks to show fallback state
-      console.log('OpenRouter fallback:', data);
-    };
-
-    // NEW: Handle boost count updates
     const handleBoostNextCountUpdated = (data) => {
       setBoostNextCount(data.count || 0);
     };
 
-    // NEW: Handle category boost toggle
     const handleCategoryBoostToggled = (data) => {
       setBoostedCategories(data.all_categories || []);
     };
 
-    // NEW: Handle boost enabled/disabled
     const handleBoostEnabled = () => {
       setBoostEnabled(true);
       expandPanel();
@@ -357,60 +199,28 @@ export default function WorkflowPanel({ isRunning }) {
       setBoostEnabled(false);
       setBoostNextCount(0);
       setBoostedCategories([]);
+      setBoostAlwaysPrefer(false);
+    };
+
+    const handleAlwaysPreferUpdated = (data) => {
+      setBoostAlwaysPrefer(data.enabled || false);
     };
 
-    websocket.on('workflow_updated', handleWorkflowUpdated);
-    websocket.on('task_completed', handleTaskCompleted);
-    websocket.on('task_started', handleTaskStarted);
-    websocket.on('task_boost_toggled', handleBoostToggled);
-    websocket.on('openrouter_fallback', handleFallback);
     websocket.on('boost_next_count_updated', handleBoostNextCountUpdated);
     websocket.on('category_boost_toggled', handleCategoryBoostToggled);
     websocket.on('boost_enabled', handleBoostEnabled);
     websocket.on('boost_disabled', handleBoostDisabled);
+    websocket.on('boost_always_prefer_updated', handleAlwaysPreferUpdated);
 
     return () => {
-      websocket.off('workflow_updated', handleWorkflowUpdated);
-      websocket.off('task_completed', handleTaskCompleted);
-      websocket.off('task_started', handleTaskStarted);
-      websocket.off('task_boost_toggled', handleBoostToggled);
-      websocket.off('openrouter_fallback', handleFallback);
       websocket.off('boost_next_count_updated', handleBoostNextCountUpdated);
       websocket.off('category_boost_toggled', handleCategoryBoostToggled);
       websocket.off('boost_enabled', handleBoostEnabled);
       websocket.off('boost_disabled', handleBoostDisabled);
+      websocket.off('boost_always_prefer_updated', handleAlwaysPreferUpdated);
     };
   }, [isRunning, fetchBoostStatus, expandPanel]);
 
-  const handleTaskClick = async (task) => {
-    if (task.completed) return; // Can't toggle completed tasks
-
-    try {
-      // Optimistically update local state immediately for better UX
-      const newBoostState = !task.using_boost;
-      setTasks(prevTasks => 
-        prevTasks.map(t => 
-          t.task_id === task.task_id 
-            ? { ...t, using_boost: newBoostState }
-            : t
-        )
-      );
-      
-      // Call API (backend will broadcast event, but we already updated locally)
-      await boostAPI.toggleTask(task.task_id);
-    } catch (error) {
-      console.error('Failed to toggle task boost:', error);
-      // Revert on error
-      setTasks(prevTasks => 
-        prevTasks.map(t => 
-          t.task_id === task.task_id 
-            ? { ...t, using_boost: task.using_boost }
-            : t
-        )
-      );
-    }
-  };
-
   // Load collapsed state from localStorage
   useEffect(() => {
     const savedState = localStorage.getItem('workflow_panel_collapsed');
@@ -448,26 +258,35 @@ export default function WorkflowPanel({ isRunning }) {
           <div className="boost-controls">
             {!boostEnabled && (
               <div className="boost-disabled-notice">
-                Boost not enabled - Enable in API Boost button above
+                Boost not enabled - Enable in API Boost button above. This is a great way to use your free, daily OpenRouter credits.
               </div>
             )}
             
-            <div className="boost-section">
-              <label className="boost-label">Boost Next:</label>
+            <div className={`boost-section ${boostedCategories.length > 0 || boostAlwaysPrefer ? 'boost-mode-inactive' : ''}`}>
+              <label className="boost-label">Boost Next # of Tasks:</label>
               <div className="boost-next-row">
                 <input
                   type="number"
                   min="0"
                   value={boostNextInput}
                   onChange={(e) => setBoostNextInput(e.target.value)}
-                  placeholder={boostNextCount.toString()}
+                  onFocus={() => setIsEditingBoostNext(true)}
+                  onBlur={() => setIsEditingBoostNext(false)}
+                  onKeyDown={(e) => {
+                    if (e.key === 'Enter') {
+                      handleSetBoostNextCount();
+                    }
+                  }}
+                  placeholder="0"
                   className="boost-next-input"
-                  disabled={!boostEnabled}
+                  disabled={!boostEnabled || boostedCategories.length > 0 || boostAlwaysPrefer}
+                  title={boostedCategories.length > 0 ? 'Disable category boost first' : boostAlwaysPrefer ? 'Disable "always prefer" first' : 'Replace the remaining boosted-call count immediately'}
                 />
                 <button 
                   onClick={handleSetBoostNextCount}
                   className="boost-apply-btn"
-                  disabled={!boostEnabled || !boostNextInput}
+                  disabled={!boostEnabled || boostNextInput.trim() === '' || boostedCategories.length > 0 || boostAlwaysPrefer}
+                  title={boostedCategories.length > 0 ? 'Disable category boost first' : boostAlwaysPrefer ? 'Disable "always prefer" first' : 'Apply a new remaining count immediately'}
                 >
                   Apply
                 </button>
@@ -477,31 +296,53 @@ export default function WorkflowPanel({ isRunning }) {
               </div>
             </div>
 
+            <div className={`boost-section boost-always-prefer-row ${boostNextCount > 0 || boostedCategories.length > 0 ? 'boost-mode-inactive' : ''}`}>
+              <label className="boost-always-prefer-label">
+                <input
+                  type="checkbox"
+                  checked={boostAlwaysPrefer}
+                  onChange={handleAlwaysPreferToggle}
+                  disabled={!boostEnabled || boostNextCount > 0 || boostedCategories.length > 0}
+                  className="boost-always-prefer-checkbox"
+                />
+                <span>Use boost as next API call when available</span>
+              </label>
+              {boostAlwaysPrefer && (
+                <div className="boost-always-prefer-hint">Boost attempted first every call — falls back on failure</div>
+              )}
+            </div>
+
             {availableCategories.length > 0 && (
-              <div className="boost-section">
-                <label className="boost-label">Categories:</label>
-                <div className="boost-categories">
-                  {availableCategories
-                    .filter(cat => {
-                      // Filter categories based on current mode
-                      if (mode === 'aggregator') return cat.group === 'Aggregator';
-                      if (mode === 'compiler') return cat.group === 'Compiler';
-                      if (mode === 'autonomous') return true; // Show all for autonomous
-                      return true;
-                    })
-                    .map(cat => (
-                      <button
-                        key={cat.id}
-                        className={`category-btn ${boostedCategories.includes(cat.id) ? 'active' : ''}`}
-                        onClick={() => handleCategoryToggle(cat.id)}
-                        disabled={!boostEnabled}
-                        title={`Toggle boost for ${cat.label}`}
-                      >
-                        {cat.label}
-                      </button>
-                    ))}
+              <>
+                <div className="boost-or-divider">— OR —</div>
+                <div className={`boost-section ${boostNextCount > 0 || boostAlwaysPrefer ? 'boost-mode-inactive' : ''}`}>
+                  <label className="boost-label">Boost by Category:</label>
+                  <div className="boost-categories">
+                    {['Aggregator', 'Compiler', 'Autonomous'].map(group => {
+                      const groupCats = availableCategories.filter(cat => cat.group === group);
+                      if (!groupCats.length) return null;
+                      return (
+                        <div key={group} className="boost-category-group">
+                          <span className="boost-group-label">{group}</span>
+                          <div className="boost-category-row">
+                            {groupCats.map(cat => (
+                              <button
+                                key={cat.id}
+                                className={`category-btn ${boostedCategories.includes(cat.id) ? 'active' : ''}`}
+                                onClick={() => handleCategoryToggle(cat.id)}
+                                disabled={!boostEnabled || boostNextCount > 0 || boostAlwaysPrefer}
+                                title={boostNextCount > 0 ? 'Set Boost Next to 0 first' : boostAlwaysPrefer ? 'Disable "always prefer" first' : `Toggle boost for ${cat.label}`}
+                              >
+                                {cat.label}
+                              </button>
+                            ))}
+                          </div>
+                        </div>
+                      );
+                    })}
+                  </div>
                 </div>
-              </div>
+              </>
             )}
           </div>
 
@@ -553,57 +394,6 @@ export default function WorkflowPanel({ isRunning }) {
               </div>
             )}
           </div>
-
-          <div className="workflow-tasks">
-            {tasks.length === 0 ? (
-              <div className="no-tasks">Loading workflow...</div>
-            ) : (
-              // Filter to show only non-completed tasks (up to 20)
-              // This ensures the panel shows upcoming work, not past work
-              tasks
-                .filter(task => !task.completed)
-                .slice(0, 20)
-                .map((task, index) => (
-                <div
-                  key={task.task_id}
-                  className={`task-card ${task.completed ? 'completed' : ''} ${task.active ? 'active' : ''} ${task.using_boost ? 'boosted' : ''}`}
-                  onClick={() => handleTaskClick(task)}
-                  style={{ cursor: task.completed ? 'default' : 'pointer' }}
-                >
-                  <div className="task-number">#{index + 1}</div>
-                  <div className="task-info">
-                    <div className="task-role">{task.role}</div>
-                    {task.mode && <div className="task-mode">{task.mode}</div>}
-                  </div>
-                  <div className="task-badges">
-                    {task.using_boost && <span className="boost-icon" title="Using API Boost">✨</span>}
-                    {task.completed && <span className="completed-icon">✓</span>}
-                    {task.active && <span className="active-icon">⟳</span>}
-                  </div>
-                  <div className="task-provider">{task.provider === 'openrouter' ? 'OR' : 'LMS'}</div>
-                </div>
-              ))
-            )}
-          </div>
-
-          <div className="workflow-legend">
-            <div className="legend-item">
-              <span className="legend-color default"></span>
-              <span>Pending</span>
-            </div>
-            <div className="legend-item">
-              <span className="legend-color boosted"></span>
-              <span>Boosted</span>
-            </div>
-            <div className="legend-item">
-              <span className="legend-color active"></span>
-              <span>Active</span>
-            </div>
-            <div className="legend-item">
-              <span className="legend-color completed"></span>
-              <span>Done</span>
-            </div>
-          </div>
         </>
       )}
     </div>
diff --git a/frontend/src/components/autonomous/AutonomousResearch.css b/frontend/src/components/autonomous/AutonomousResearch.css
index ebbf347..f05d2d4 100644
--- a/frontend/src/components/autonomous/AutonomousResearch.css
+++ b/frontend/src/components/autonomous/AutonomousResearch.css
@@ -31,7 +31,7 @@
 
 .api-stats {
   display: grid;
-  grid-template-columns: repeat(4, 1fr);
+  grid-template-columns: repeat(auto-fit, minmax(150px, 1fr));
   gap: 1rem;
   margin-bottom: 1rem;
 }
@@ -102,6 +102,35 @@
   font-weight: 600;
 }
 
+.log-source-badge {
+  padding: 0.15rem 0.4rem;
+  border-radius: var(--radius-sm);
+  font-size: 0.7rem;
+  font-weight: 600;
+  text-transform: uppercase;
+}
+
+.log-source-badge.standard {
+  background: var(--surface-4);
+  color: var(--text-secondary);
+}
+
+.log-source-badge.boosted {
+  background: #f59e0b;
+  color: #111827;
+}
+
+.log-boost-mode-badge {
+  background: rgba(245, 158, 11, 0.15);
+  border: 1px solid rgba(245, 158, 11, 0.35);
+  color: #fbbf24;
+  padding: 0.15rem 0.4rem;
+  border-radius: var(--radius-sm);
+  font-size: 0.7rem;
+  font-weight: 600;
+  text-transform: uppercase;
+}
+
 .log-tokens {
   color: var(--gold);
 }
@@ -844,8 +873,9 @@
 
 .settings-left-sidebar {
   width: 322px;
-  background: linear-gradient(180deg, rgba(52, 152, 219, 0.1), rgba(52, 152, 219, 0.05));
-  border-right: 2px solid rgba(52, 152, 219, 0.2);
+  background: linear-gradient(180deg, rgba(15, 19, 16, 0.98) 0%, rgba(20, 29, 22, 0.96) 100%);
+  border-right: 2px solid rgba(76, 175, 80, 0.16);
+  box-shadow: inset -1px 0 0 rgba(170, 245, 181, 0.04);
   flex-shrink: 0;
   padding: 1.5rem 0;
 }
@@ -854,11 +884,14 @@
   display: flex;
   flex-direction: column;
   height: 100%;
+  --leaderboard-label-color: rgba(161, 244, 178, 0.78);
+  --leaderboard-accent-border: rgba(76, 175, 80, 0.24);
+  --leaderboard-accent-hover: rgba(76, 175, 80, 0.16);
 }
 
 .known-models-sidebar h3 {
   margin: 0 1rem 1rem 1rem;
-  color: #3498db;
+  color: var(--leaderboard-label-color);
   font-size: 1rem;
   font-weight: 600;
   display: flex;
@@ -866,6 +899,7 @@
   justify-content: center;
   gap: 0.5rem;
   text-align: center;
+  text-shadow: 0 0 10px rgba(76, 175, 80, 0.14);
 }
 
 .models-list {
@@ -875,39 +909,47 @@
   padding: 0 0.75rem;
 }
 
-.models-podium {
-  background: linear-gradient(180deg, rgba(30, 255, 28, 0.06) 0%, rgba(24, 204, 23, 0.04) 100%);
-  border: 1px solid rgba(30, 255, 28, 0.15);
+.known-models-sidebar .models-podium {
+  background: linear-gradient(180deg, rgba(76, 175, 80, 0.14) 0%, rgba(37, 94, 44, 0.08) 100%);
+  border: 1px solid rgba(125, 223, 147, 0.18);
   border-radius: 8px;
   padding: 0.6rem 0.5rem 0.5rem;
   margin-bottom: 0.6rem;
   display: flex;
   flex-direction: column;
   gap: 0.5rem;
+  box-shadow:
+    inset 0 1px 0 rgba(201, 255, 212, 0.06),
+    0 10px 24px rgba(9, 20, 10, 0.18);
 }
 
-.models-podium-label {
+.known-models-sidebar .models-podium-label {
   text-align: center;
   font-size: 0.65rem;
   font-weight: 700;
   text-transform: uppercase;
   letter-spacing: 1.5px;
-  color: rgba(30, 255, 28, 0.55);
+  color: var(--leaderboard-label-color);
   margin-bottom: 0.1rem;
+  text-shadow: 0 0 10px rgba(76, 175, 80, 0.16);
 }
 
-.model-item {
-  background: var(--bg-secondary, #252525);
-  border: 1px solid rgba(52, 152, 219, 0.2);
+.known-models-sidebar .model-item {
+  background: linear-gradient(180deg, rgba(32, 36, 33, 0.96) 0%, rgba(24, 28, 25, 0.98) 100%);
+  border: 1px solid var(--leaderboard-accent-border);
   border-radius: 6px;
   padding: 0.75rem;
   transition: all 0.2s ease;
   margin: 0 0.25rem;
+  box-shadow: 0 4px 12px rgba(0, 0, 0, 0.14);
 }
 
-.model-item:hover {
-  background: rgba(52, 152, 219, 0.1);
-  border-color: #3498db;
+.known-models-sidebar .model-item:hover {
+  background: linear-gradient(180deg, var(--leaderboard-accent-hover) 0%, rgba(76, 175, 80, 0.08) 100%);
+  border-color: rgba(125, 223, 147, 0.66);
+  box-shadow:
+    0 10px 20px rgba(9, 20, 10, 0.2),
+    0 0 0 1px rgba(125, 223, 147, 0.08);
   transform: translateX(4px);
 }
 
@@ -919,14 +961,35 @@
   word-break: break-word;
 }
 
-.model-item-badge {
-  background: #3498db;
+.known-models-sidebar .model-item-badge {
+  background: linear-gradient(135deg, rgba(76, 175, 80, 0.95), rgba(110, 208, 129, 0.88));
   color: #ffffff;
   padding: 0.25rem 0.5rem;
   border-radius: 3px;
   font-size: 0.7rem;
   font-style: italic;
   display: inline-block;
+  border: 1px solid rgba(214, 255, 222, 0.12);
+  box-shadow: inset 0 1px 0 rgba(255, 255, 255, 0.08);
+}
+
+.known-models-sidebar .model-item--ranked {
+  border-color: rgba(125, 223, 147, 0.22);
+  box-shadow:
+    0 0 0 1px rgba(125, 223, 147, 0.06),
+    0 8px 18px rgba(9, 20, 10, 0.18);
+}
+
+.known-models-sidebar .model-item--gold {
+  background: linear-gradient(180deg, rgba(76, 175, 80, 0.16) 0%, rgba(255, 214, 92, 0.1) 58%, rgba(255, 194, 57, 0.04) 100%);
+}
+
+.known-models-sidebar .model-item--silver {
+  background: linear-gradient(180deg, rgba(76, 175, 80, 0.14) 0%, rgba(192, 192, 192, 0.09) 100%);
+}
+
+.known-models-sidebar .model-item--bronze {
+  background: linear-gradient(180deg, rgba(76, 175, 80, 0.14) 0%, rgba(205, 127, 50, 0.1) 100%);
 }
 
 .model-item-note {
@@ -2524,7 +2587,7 @@
   .settings-left-sidebar {
     width: 100%;
     border-right: none;
-    border-bottom: 2px solid rgba(52, 152, 219, 0.2);
+    border-bottom: 2px solid rgba(76, 175, 80, 0.16);
     max-height: 300px;
   }
   
diff --git a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
index fd3c03e..e5a37bb 100644
--- a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
@@ -12,9 +12,12 @@ const EMPTY_API_STATS = Object.freeze({
   successful_calls: 0,
   failed_calls: 0,
   success_rate: 0,
+  boosted_calls: 0,
   by_phase: {},
   by_model: {},
   by_provider: {},
+  by_source: {},
+  by_boost_mode: {},
 });
 
 const AutonomousResearchLogs = ({ stats, events }) => {
@@ -152,10 +155,36 @@ const AutonomousResearchLogs = ({ stats, events }) => {
       case 'brainstorm': return 'Brainstorm';
       case 'paper_compilation': return 'Paper';
       case 'tier3': return 'Tier 3';
+      case 'boost': return 'Boost';
       default: return phase || 'Unknown';
     }
   };
 
+  const getSourceLabel = (source) => {
+    switch (source) {
+      case 'api+boost': return 'Boosted';
+      case 'boost': return 'Boost Only';
+      default: return 'Standard';
+    }
+  };
+
+  const getBoostModeLabel = (mode) => {
+    switch (mode) {
+      case 'next_count': return 'Next X';
+      case 'category': return 'Category';
+      case 'task_id': return 'Task ID';
+      default: return mode || 'Unknown';
+    }
+  };
+
+  const getProviderLabel = (provider) => {
+    switch (provider) {
+      case 'openrouter': return 'OR';
+      case 'lm_studio': return 'LMS';
+      default: return provider || 'UNK';
+    }
+  };
+
   // Calculate per-submitter statistics from individual events
   // These come from the aggregator's direct 'submission_accepted'/'submission_rejected' events
   const submitterStats = useMemo(() => {
@@ -170,7 +199,8 @@ const AutonomousResearchLogs = ({ stats, events }) => {
         const submitterId = data.submitter_id;
         const isAccepted = event.event === 'submission_accepted';
         
-        if (submitterId) {
+        // Use explicit check for submitter_id to handle edge cases (0 is valid but falsy)
+        if (submitterId !== undefined && submitterId !== null) {
           const key = `${submitterId}`;
           
           if (!stats[key]) {
@@ -482,6 +512,10 @@ const AutonomousResearchLogs = ({ stats, events }) => {
               </span>
               <span className="stat-label">Success Rate</span>
             </div>
+            <div className="stat-card">
+              <span className="stat-value">{apiStats.boosted_calls || 0}</span>
+              <span className="stat-label">Boosted Calls</span>
+            </div>
           </div>
         )}
 
@@ -497,6 +531,28 @@ const AutonomousResearchLogs = ({ stats, events }) => {
           </div>
         )}
 
+        {apiStats && apiStats.by_source && Object.keys(apiStats.by_source).length > 0 && (
+          <div className="phase-stats">
+            <span className="phase-stats-label">By Source:</span>
+            {Object.entries(apiStats.by_source).map(([source, count]) => (
+              <span key={source} className="phase-stat-badge">
+                {getSourceLabel(source)}: {count}
+              </span>
+            ))}
+          </div>
+        )}
+
+        {apiStats && apiStats.by_boost_mode && Object.keys(apiStats.by_boost_mode).length > 0 && (
+          <div className="phase-stats">
+            <span className="phase-stats-label">Boost Modes:</span>
+            {Object.entries(apiStats.by_boost_mode).map(([mode, count]) => (
+              <span key={mode} className="phase-stat-badge">
+                {getBoostModeLabel(mode)}: {count}
+              </span>
+            ))}
+          </div>
+        )}
+
         {/* API Logs List */}
         <div className="api-logs-list">
           {apiLogsLoading ? (
@@ -505,7 +561,7 @@ const AutonomousResearchLogs = ({ stats, events }) => {
             <div className="logs-empty">
               <p>No API calls logged yet.</p>
               <p className="logs-empty-hint">
-                Start autonomous research to see API call logs here.
+                Run a workflow and make API calls to see the combined logs here.
               </p>
             </div>
           ) : (
@@ -525,10 +581,16 @@ const AutonomousResearchLogs = ({ stats, events }) => {
                     <div className="log-task">
                       <span className="log-task-id">{log.task_id}</span>
                       <span className="log-phase-badge">{getPhaseLabel(log.phase)}</span>
+                      <span className={`log-source-badge ${log.boosted ? 'boosted' : 'standard'}`}>
+                        {getSourceLabel(log.source)}
+                      </span>
+                      {log.boost_mode && (
+                        <span className="log-boost-mode-badge">{getBoostModeLabel(log.boost_mode)}</span>
+                      )}
                     </div>
                     <div className="log-meta">
                       <span className="log-model">{log.model}</span>
-                      <span className="log-provider-badge">{log.provider === 'openrouter' ? 'OR' : 'LMS'}</span>
+                      <span className="log-provider-badge">{getProviderLabel(log.provider)}</span>
                       <span className="log-duration">{formatDuration(log.duration_ms)}</span>
                       {log.tokens_used && (
                         <span className="log-tokens">{log.tokens_used} tokens</span>
@@ -546,6 +608,11 @@ const AutonomousResearchLogs = ({ stats, events }) => {
                       <pre>{log.role_id}</pre>
                     </div>
 
+                    <div className="log-detail-section">
+                      <h4>Source</h4>
+                      <pre>{getSourceLabel(log.source)}{log.boost_mode ? ` (${getBoostModeLabel(log.boost_mode)})` : ''}</pre>
+                    </div>
+
                     {log.error && (
                       <div className="log-detail-section error">
                         <h4>Error</h4>
@@ -559,7 +626,7 @@ const AutonomousResearchLogs = ({ stats, events }) => {
                         <button 
                           onClick={(e) => {
                             e.stopPropagation();
-                            copyToClipboard(log.prompt_full);
+                            copyToClipboard(log.prompt_full || log.prompt_preview || '');
                           }}
                           className="copy-btn"
                           title="Copy full prompt to clipboard"
@@ -576,7 +643,7 @@ const AutonomousResearchLogs = ({ stats, events }) => {
                         <button 
                           onClick={(e) => {
                             e.stopPropagation();
-                            copyToClipboard(log.response_full);
+                            copyToClipboard(log.response_full || log.response_preview || '');
                           }}
                           className="copy-btn"
                           title="Copy full response to clipboard"
diff --git a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
index e053eee..5bf898e 100644
--- a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
@@ -1479,7 +1479,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
               <h4 className="form-group--compact">Wolfram Alpha Integration (Optional)</h4>
               <small className="hint-text">
-                Enable Wolfram Alpha API for computational verification in rigor mode. Shared with manual compiler mode.
+                Enable Wolfram Alpha API for computational verification in rigor mode. When selecting your key select "full results" for your key type, then copy your APP ID and save it here. This key is also shared with the manual compiler mode.
                 Get your API key from <a href="https://products.wolframalpha.com/api" target="_blank" rel="noopener noreferrer">developer.wolframalpha.com</a>
               </small>
 
@@ -1672,9 +1672,9 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                   }}
                 />
                 <span className="settings-option-copy">
-                  <span className="settings-option-title">Enable banner shimmer</span>
+                  <span className="settings-option-title">Enable shimmer accents</span>
                   <span className="settings-option-description">
-                    Keeps the animated banner shimmer on. Disable this when recording video to reduce motion and visual noise.
+                    Keeps the animated banner shimmer and subtle active-tab border sheen on. Disable this when recording video to reduce motion and visual noise.
                   </span>
                 </span>
               </label>
diff --git a/frontend/src/components/autonomous/BrainstormList.jsx b/frontend/src/components/autonomous/BrainstormList.jsx
index 40183b2..27f6447 100644
--- a/frontend/src/components/autonomous/BrainstormList.jsx
+++ b/frontend/src/components/autonomous/BrainstormList.jsx
@@ -162,7 +162,7 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
         </button>
       </div>
       <div className="brainstorm-list-warning">
-        (WARNING: Any given brainstorm idea may be pruned/deleted if the AI deems it to hurt the collective database quality.)
+        (WARNING: Any given brainstorm idea may be pruned/deleted if the AI deems it to hurt the collective database quality. These brainstorms are the real powerhouse behind the ASI creativity! The brainstorms themselves often contain many great ideas that get turned into the stage 2 papers.)
       </div>
 
       {brainstorms.map((brainstorm) => (
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.css b/frontend/src/components/autonomous/FinalAnswerLibrary.css
index 013721b..84fa075 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.css
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.css
@@ -491,12 +491,23 @@
    LOADING / ERROR
    ============================================================================ */
 
-.loading-spinner {
-  text-align: center;
+.library-loading {
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  gap: 0.5rem;
   padding: 40px;
   color: #1eff1c;
   font-size: 1.2rem;
-  animation: spin 2s linear infinite;
+}
+
+.library-loading__icon {
+  display: inline-block;
+  animation: spin 1s linear infinite;
+}
+
+.library-loading__text {
+  display: inline-block;
 }
 
 @keyframes spin {
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
index e39a523..398072f 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
@@ -261,7 +261,10 @@ function FinalAnswerLibrary() {
           <h2>Stage 3 Final Answers History</h2>
           <p>Loading completed Stage 3 final answers...</p>
         </div>
-        <div className="loading-spinner">⟳ Loading...</div>
+        <div className="library-loading">
+          <span className="library-loading__icon" aria-hidden="true">⟳</span>
+          <span className="library-loading__text">Loading...</span>
+        </div>
       </div>
     );
   }
diff --git a/frontend/src/components/autonomous/Stage2PaperHistory.jsx b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
index bb02d89..4d53aa5 100644
--- a/frontend/src/components/autonomous/Stage2PaperHistory.jsx
+++ b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
@@ -246,7 +246,10 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
           <h2>Stage 2 Final Answer History</h2>
           <p>Loading completed Stage 2 papers from all sessions...</p>
         </div>
-        <div className="loading-spinner">⟳ Loading...</div>
+        <div className="library-loading">
+          <span className="library-loading__icon" aria-hidden="true">⟳</span>
+          <span className="library-loading__text">Loading...</span>
+        </div>
       </div>
     );
   }
diff --git a/frontend/src/index.css b/frontend/src/index.css
index 1df006f..d27e9cc 100644
--- a/frontend/src/index.css
+++ b/frontend/src/index.css
@@ -163,6 +163,10 @@ code {
     0 0 20px rgba(30, 255, 28, 0.2);
   letter-spacing: 3px;
   font-weight: 800;
+  display: inline-flex;
+  align-items: center;
+  user-select: none;
+  -webkit-user-select: none;
 }
 
 .banner-subtitle {
@@ -295,31 +299,12 @@ code {
   box-shadow: 0 6px 20px rgba(30, 255, 28, 0.35);
 }
 
-.boost-logs-btn {
-  background: linear-gradient(135deg, var(--accent-orange) 0%, #ffb74d 100%);
-  color: #000;
-  border: none;
-  padding: 0.4rem 0.8rem;
-  border-radius: var(--radius-sm);
-  font-size: 0.85rem;
-  font-weight: 600;
-  cursor: pointer;
-  box-shadow: 0 3px 10px rgba(255, 152, 0, 0.25);
-  transition: all var(--transition-fast);
-  white-space: nowrap;
-  width: fit-content;
-}
-
-.boost-logs-btn:hover {
-  transform: translateY(-2px);
-  box-shadow: 0 5px 14px rgba(255, 152, 0, 0.35);
-}
-
 .tabs {
   display: flex;
   gap: 4px;
   background: var(--surface-1);
   padding: 0.75rem 1rem;
+  padding-left: calc(1rem + 84px);
   padding-right: 150px;
   border-bottom: 1px solid var(--border-subtle);
   flex-wrap: nowrap;
@@ -331,7 +316,8 @@ code {
 }
 
 .tab {
-  padding: 0.65rem 1.25rem;
+  padding: 0.8rem 1.25rem;
+  min-height: 58px;
   background: var(--surface-3);
   border: 1px solid transparent;
   color: var(--text-secondary);
@@ -343,8 +329,8 @@ code {
 
 /* Tab with subtext - increase height to accommodate two lines */
 .tab-with-subtext {
-  padding: 0.45rem 1.25rem;
-  min-height: 56px;
+  padding: 0.55rem 1.25rem;
+  min-height: 60px;
   display: flex;
   align-items: center;
 }
@@ -655,6 +641,7 @@ button.danger:hover {
   
   .tabs {
     flex-wrap: wrap;
+    padding-left: 1rem;
   }
   
   .tab {
diff --git a/frontend/src/services/api.js b/frontend/src/services/api.js
index ce8573d..c878b51 100644
--- a/frontend/src/services/api.js
+++ b/frontend/src/services/api.js
@@ -813,9 +813,22 @@ export const boostAPI = {
   // NEW: Boost Next X Calls (Counter-based mode)
   // ============================================================
   
+  // Enable or disable always-prefer-boost mode
+  async setAlwaysPrefer(enabled) {
+    const response = await fetch(`${API_BASE}/boost/set-always-prefer`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify({ enabled }),
+    });
+    if (!response.ok) {
+      const errorData = await response.json();
+      throw new Error(errorData.detail || 'Failed to set always-prefer boost');
+    }
+    return response.json();
+  },
+
   // Set the number of next API calls to boost
-  async setNextCount(count) {
-    const response = await fetch(`${API_BASE}/boost/set-next-count`, {
+  async setNextCount(count) {    const response = await fetch(`${API_BASE}/boost/set-next-count`, {
       method: 'POST',
       headers: { 'Content-Type': 'application/json' },
       body: JSON.stringify({ count }),
@@ -849,33 +862,6 @@ export const boostAPI = {
     if (!response.ok) throw new Error('Failed to get boost categories');
     return response.json();
   },
-
-  // ============================================================
-  // NEW: Boost Logs
-  // ============================================================
-
-  // Get boost API call logs
-  async getLogs(limit = 100) {
-    const response = await fetch(`${API_BASE}/boost/logs?limit=${limit}`);
-    if (!response.ok) throw new Error('Failed to get boost logs');
-    return response.json();
-  },
-
-  // Get a specific log entry with full response
-  async getLogEntry(index) {
-    const response = await fetch(`${API_BASE}/boost/logs/${index}`);
-    if (!response.ok) throw new Error('Failed to get log entry');
-    return response.json();
-  },
-
-  // Clear all boost logs
-  async clearLogs() {
-    const response = await fetch(`${API_BASE}/boost/clear-logs`, {
-      method: 'POST',
-    });
-    if (!response.ok) throw new Error('Failed to clear boost logs');
-    return response.json();
-  },
 };
 
 // Workflow API
diff --git a/frontend/src/services/websocket.js b/frontend/src/services/websocket.js
index de94171..5db9688 100644
--- a/frontend/src/services/websocket.js
+++ b/frontend/src/services/websocket.js
@@ -35,7 +35,11 @@ class WebSocketService {
       
       try {
         const message = JSON.parse(event.data);
-        this.emit(message.type, message.data);
+        // Include server timestamp in the data if available
+        const dataWithTimestamp = message.timestamp 
+          ? { ...message.data, _serverTimestamp: message.timestamp }
+          : message.data;
+        this.emit(message.type, dataWithTimestamp);
       } catch (e) {
         console.error('Failed to parse WebSocket message:', e);
       }
diff --git a/frontend/src/utils/autonomousProfiles.js b/frontend/src/utils/autonomousProfiles.js
index b3d998c..9895087 100644
--- a/frontend/src/utils/autonomousProfiles.js
+++ b/frontend/src/utils/autonomousProfiles.js
@@ -4,11 +4,11 @@ export const AUTONOMOUS_SETTINGS_STORAGE_KEY = 'autonomous_research_settings';
 export const AUTONOMOUS_PROFILES_STORAGE_KEY = 'autonomous_research_profiles';
 export const STARTUP_PROVIDER_CHOICE_STORAGE_KEY = 'startup_provider_choice';
 export const LM_STUDIO_STARTUP_CHOICE = 'lm_studio';
-export const RECOMMENDED_PROFILE_KEY = 'recommended_fast_affordable_mid';
-export const RECOMMENDED_CHEAPER_PROFILE_KEY = 'recommended_cheaper_lower_knowledge';
+export const RECOMMENDED_PROFILE_KEY = 'recommended_slower_affordable_higher_knowledge';
+export const RECOMMENDED_ALTERNATE_PROFILE_KEY = 'recommended_fast_affordable_mid';
 export const RECOMMENDED_PROFILE_KEYS = [
   RECOMMENDED_PROFILE_KEY,
-  RECOMMENDED_CHEAPER_PROFILE_KEY,
+  RECOMMENDED_ALTERNATE_PROFILE_KEY,
 ];
 
 const DEFAULT_SUBMITTER_CONFIG = {
@@ -127,24 +127,24 @@ const DEFAULT_AUTONOMOUS_SETTINGS = {
 
 export const RECOMMENDED_PROFILES = {
   [RECOMMENDED_PROFILE_KEY]: {
-    name: 'Fast, affordable, mid-tier knowledge',
+    name: 'Slower, less affordable, higher knowledge',
     numSubmitters: 3,
     submitters: [
       {
-        modelId: 'moonshotai/kimi-k2.5',
+        modelId: 'google/gemini-3.1-pro-preview',
         provider: 'openrouter',
-        openrouterProvider: 'SiliconFlow',
+        openrouterProvider: null,
         lmStudioFallbackId: null,
-        contextWindow: 262000,
-        maxOutputTokens: 40000,
+        contextWindow: 1048576,
+        maxOutputTokens: 65500,
       },
       {
-        modelId: 'openai/gpt-oss-120b',
+        modelId: 'moonshotai/kimi-k2.5',
         provider: 'openrouter',
-        openrouterProvider: 'Groq',
+        openrouterProvider: null,
         lmStudioFallbackId: null,
-        contextWindow: 131072,
-        maxOutputTokens: 25000,
+        contextWindow: 262000,
+        maxOutputTokens: 40000,
       },
       {
         modelId: 'deepseek/deepseek-v3.2',
@@ -156,20 +156,20 @@ export const RECOMMENDED_PROFILES = {
       },
     ],
     validator: {
-      modelId: 'x-ai/grok-4.1-fast',
+      modelId: 'moonshotai/kimi-k2.5',
       provider: 'openrouter',
       openrouterProvider: null,
       lmStudioFallbackId: null,
-      contextWindow: 2000000,
-      maxOutputTokens: 30000,
+      contextWindow: 262000,
+      maxOutputTokens: 40000,
     },
     highContext: {
-      modelId: 'moonshotai/kimi-k2.5',
+      modelId: 'google/gemini-3.1-pro-preview',
       provider: 'openrouter',
-      openrouterProvider: 'SiliconFlow',
+      openrouterProvider: null,
       lmStudioFallbackId: null,
-      contextWindow: 262000,
-      maxOutputTokens: 40000,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
     },
     highParam: {
       modelId: 'google/gemini-3.1-pro-preview',
@@ -180,16 +180,16 @@ export const RECOMMENDED_PROFILES = {
       maxOutputTokens: 65500,
     },
     critique: {
-      modelId: 'google/gemini-3.1-pro-preview',
+      modelId: 'z-ai/glm-5.1',
       provider: 'openrouter',
       openrouterProvider: null,
       lmStudioFallbackId: null,
-      contextWindow: 1048576,
+      contextWindow: 202752,
       maxOutputTokens: 65500,
     },
   },
-  [RECOMMENDED_CHEAPER_PROFILE_KEY]: {
-    name: 'Cheaper, lower-knowledge validator',
+  [RECOMMENDED_ALTERNATE_PROFILE_KEY]: {
+    name: 'Fast, affordable, mid-tier knowledge',
     numSubmitters: 3,
     submitters: [
       {
diff --git a/package-lock.json b/package-lock.json
index 5db1f59..9bea5f7 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "moto-math-variant",
-  "version": "1.0.5",
+  "version": "1.0.6",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "moto-math-variant",
-      "version": "1.0.5",
+      "version": "1.0.6",
       "license": "MIT"
     }
   }
diff --git a/package.json b/package.json
index 3e7b153..3687c44 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "moto-math-variant",
-  "version": "1.0.5",
+  "version": "1.0.6",
   "description": "MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "scripts": {
     "dev:backend": "cd backend && uvicorn api.main:app --reload --host 0.0.0.0 --port 8000",

From d352090d687bd3475acfee17f29f7f0cfb17264e Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Sun, 19 Apr 2026 20:14:13 -0500
Subject: [PATCH 06/32] MOTO v1.0.6

---
 frontend/src/components/WorkflowPanel.jsx | 11 -----------
 1 file changed, 11 deletions(-)

diff --git a/frontend/src/components/WorkflowPanel.jsx b/frontend/src/components/WorkflowPanel.jsx
index f4dd2ea..fd868e7 100644
--- a/frontend/src/components/WorkflowPanel.jsx
+++ b/frontend/src/components/WorkflowPanel.jsx
@@ -36,17 +36,6 @@ export default function WorkflowPanel({ isRunning }) {
     localStorage.setItem('workflow_panel_collapsed', 'false');
   }, []);
 
-  // Token tracking & timer state
-  const [tokenStats, setTokenStats] = useState({ total_input: 0, total_output: 0, by_model: {}, elapsed_seconds: 0 });
-  const [showPerModel, setShowPerModel] = useState(false);
-  const [localElapsed, setLocalElapsed] = useState(0);
-  const lastSyncRef = useRef(Date.now());
-
-  const expandPanel = useCallback(() => {
-    setCollapsed(false);
-    localStorage.setItem('workflow_panel_collapsed', 'false');
-  }, []);
-
   // Fetch boost status and categories when running
   const fetchBoostStatus = useCallback(async () => {
     try {

From 76f8622a3b2d6e83bbf85e145a1656747d8629ec Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Thu, 30 Apr 2026 18:30:32 -0500
Subject: [PATCH 07/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed a GUI status bug that showed LM Studio as "offline" when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added UI/UX optimizations to the GUI, proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 .cursor/rules/api-key-controls.mdc            |   55 +-
 .cursor/rules/json-prompt-design.mdc          |  233 ++-
 .cursor/rules/latex-renderer.mdc              |    3 +
 ...interaction-and-rule-interaction-rules.mdc |   20 +-
 ...-aggregator-tool-design-specifications.mdc |   10 +-
 ...-and-part-2-cointeraction-architecture.mdc |    9 +-
 ...t-2-compiler-tool-design-specification.mdc |   32 +-
 .../rules/part-3-autonomous-research-mode.mdc |  140 +-
 ...program-directory-and-file-definitions.mdc |  167 +-
 .../rules/rag-design-for-overall-program.mdc  |   24 +-
 .cursor/rules/workflow-runtime-updates.mdc    |   11 -
 .dockerignore                                 |   39 +
 .gitignore                                    |   13 +
 Click To Launch MOTO.bat                      |  327 +---
 Dockerfile                                    |   40 +
 LICENSE                                       |   12 -
 Launch MOTO.sh                                |   44 +
 README.md                                     |   58 +-
 _moto_internal_launcher.ps1                   |  332 ----
 backend/aggregator/agents/submitter.py        |   30 +-
 backend/aggregator/agents/validator.py        |    3 +-
 backend/aggregator/core/coordinator.py        |   21 +-
 backend/aggregator/core/queue_manager.py      |    7 +-
 backend/aggregator/core/rag_manager.py        |   63 +-
 backend/api/main.py                           |  209 ++-
 backend/api/middleware.py                     |   34 +-
 backend/api/proxy_auth.py                     |  115 ++
 backend/api/routes/__init__.py                |    4 +-
 backend/api/routes/aggregator.py              |    2 +-
 backend/api/routes/autonomous.py              |    4 +-
 backend/api/routes/boost.py                   |   10 +-
 backend/api/routes/compiler.py                |   23 +-
 backend/api/routes/download.py                |    8 +
 backend/api/routes/features.py                |   48 +
 backend/api/routes/health.py                  |   22 +
 backend/api/routes/openrouter.py              |   83 +-
 backend/api/routes/proofs.py                  |  483 +++++
 backend/api/routes/websocket.py               |   22 +-
 .../autonomous/agents/lemma_search_agent.py   |  303 +++
 .../agents/proof_formalization_agent.py       |  473 +++++
 .../agents/proof_identification_agent.py      |  192 ++
 .../autonomous/core/autonomous_coordinator.py |  696 ++++++-
 .../core/proof_dependency_extractor.py        |  208 +++
 backend/autonomous/core/proof_novelty.py      |   99 +
 .../core/proof_verification_stage.py          |  997 ++++++++++
 .../memory/autonomous_api_logger.py           |   22 +-
 .../autonomous/memory/brainstorm_memory.py    |   53 +
 .../autonomous/memory/final_answer_memory.py  |  121 +-
 backend/autonomous/memory/paper_library.py    |  100 +-
 .../autonomous/memory/paper_model_tracker.py  |    2 +-
 backend/autonomous/memory/proof_database.py   |  633 +++++++
 .../autonomous/memory/research_metadata.py    |   61 +
 backend/autonomous/memory/session_manager.py  |   36 +-
 backend/autonomous/prompts/proof_prompts.py   |  515 ++++++
 backend/compiler/README.md                    |   14 +-
 .../compiler/agents/high_context_submitter.py |  388 +++-
 .../compiler/agents/high_param_submitter.py   | 1522 ++++++++-------
 backend/compiler/core/compiler_coordinator.py |  545 ++++--
 backend/compiler/memory/paper_memory.py       |  282 ++-
 .../compiler/prompts/construction_prompts.py  |   68 +-
 backend/compiler/prompts/review_prompts.py    |   11 +-
 backend/compiler/prompts/rigor_prompts.py     |  718 +++-----
 .../compiler/validation/compiler_validator.py |  181 +-
 backend/data/proofs/.gitkeep                  |    0
 backend/scripts/cache_openrouter_models.py    |    4 +-
 backend/shared/api_client_manager.py          |   32 +-
 backend/shared/boost_logger.py                |   22 +-
 backend/shared/boost_manager.py               |   20 +-
 backend/shared/build_info.py                  |  120 ++
 backend/shared/config.py                      |  218 ++-
 backend/shared/critique_memory.py             |    2 +-
 backend/shared/fastembed_provider.py          |   63 +
 backend/shared/lean4_client.py                | 1635 +++++++++++++++++
 backend/shared/lm_studio_client.py            |  119 +-
 backend/shared/models.py                      |  159 +-
 backend/shared/openrouter_client.py           |  191 +-
 backend/shared/secret_store.py                |   28 +-
 backend/shared/smt_client.py                  |  133 ++
 docker/entrypoint.sh                          |   20 +
 frontend/package-lock.json                    |    4 +-
 frontend/package.json                         |    2 +-
 frontend/src/App.jsx                          |  725 ++++++--
 frontend/src/components/BoostControlModal.jsx |   72 +-
 .../CreditExhaustionNotificationStack.jsx     |    8 +-
 .../components/CritiqueNotificationStack.jsx  |   62 +-
 frontend/src/components/HelpTooltip.jsx       |  129 ++
 .../src/components/OpenRouterApiKeyModal.jsx  |   30 +-
 .../OpenRouterPrivacyWarningModal.jsx         |   18 +-
 .../components/StartupProviderSetupModal.jsx  |  125 +-
 frontend/src/components/WorkflowPanel.jsx     |   42 +
 .../aggregator/AggregatorInterface.jsx        |   16 +-
 .../components/aggregator/AggregatorLogs.jsx  |    6 +-
 .../aggregator/AggregatorSettings.jsx         |  348 +++-
 .../autonomous/ArchiveViewerModal.css         |   10 +-
 .../autonomous/AutonomousResearch.css         |  323 ++--
 .../AutonomousResearchInterface.jsx           |   89 +-
 .../autonomous/AutonomousResearchLogs.jsx     |   69 +-
 .../autonomous/AutonomousResearchSettings.jsx |  753 +++++++-
 .../components/autonomous/BrainstormList.jsx  |   68 +-
 .../autonomous/FinalAnswerLibrary.jsx         |    2 +-
 .../components/autonomous/FinalAnswerView.jsx |    7 +-
 .../autonomous/LiveTier3Progress.jsx          |    4 +-
 .../autonomous/MathematicalProofs.css         |  400 ++++
 .../autonomous/MathematicalProofs.jsx         |  694 +++++++
 .../components/autonomous/PaperLibrary.jsx    |   92 +-
 .../src/components/autonomous/ProofGraph.css  |  155 ++
 .../src/components/autonomous/ProofGraph.jsx  |  355 ++++
 .../autonomous/ProofNotificationStack.jsx     |  128 ++
 .../autonomous/Stage2PaperHistory.jsx         |   52 +-
 frontend/src/components/autonomous/index.js   |    1 +
 .../components/compiler/CompilerInterface.jsx |   59 +-
 .../src/components/compiler/CompilerLogs.jsx  |   21 +-
 .../components/compiler/CompilerSettings.jsx  |  319 +++-
 frontend/src/components/critique-modal.css    |    4 +-
 frontend/src/components/settings-common.css   |   96 +-
 frontend/src/hooks/useProofCheckRuntime.js    |  153 ++
 frontend/src/index.css                        |  363 +++-
 frontend/src/index.jsx                        |    3 +
 frontend/src/services/api.js                  |  220 ++-
 frontend/src/services/websocket.js            |    3 +-
 frontend/src/utils/autonomousProfiles.js      |  315 +++-
 frontend/src/utils/disclaimerHelper.js        |    4 +-
 frontend/src/utils/openRouterSelection.js     |  121 ++
 frontend/src/utils/researchRunHistory.js      |   55 +-
 frontend/src/utils/runtimeConfig.js           |   59 +
 frontend/vite.config.js                       |   68 +-
 moto-update-manifest.json                     |    7 +
 moto_launcher.py                              | 1563 ++++++++++++++++
 moto_updater.py                               |  924 ++++++++++
 package.json                                  |   10 +-
 requirements-generic.txt                      |    3 +
 tests/test_compiler_marker_visibility.py      |  251 +++
 tests/test_compiler_wolfram_tracking.py       |   51 +
 tests/test_lean4_client.py                    |  142 ++
 tests/test_moto_launcher.py                   |  263 +++
 tests/test_moto_updater.py                    |  204 ++
 tests/test_paper_memory_appendix.py           |   78 +
 tests/test_rigor_lean_placement_validator.py  |   76 +
 tests/test_wolfram_tool_loop.py               |  122 ++
 139 files changed, 20466 insertions(+), 3646 deletions(-)
 delete mode 100644 .cursor/rules/workflow-runtime-updates.mdc
 create mode 100644 .dockerignore
 create mode 100644 Dockerfile
 create mode 100644 Launch MOTO.sh
 delete mode 100644 _moto_internal_launcher.ps1
 create mode 100644 backend/api/proxy_auth.py
 create mode 100644 backend/api/routes/features.py
 create mode 100644 backend/api/routes/health.py
 create mode 100644 backend/api/routes/proofs.py
 create mode 100644 backend/autonomous/agents/lemma_search_agent.py
 create mode 100644 backend/autonomous/agents/proof_formalization_agent.py
 create mode 100644 backend/autonomous/agents/proof_identification_agent.py
 create mode 100644 backend/autonomous/core/proof_dependency_extractor.py
 create mode 100644 backend/autonomous/core/proof_novelty.py
 create mode 100644 backend/autonomous/core/proof_verification_stage.py
 create mode 100644 backend/autonomous/memory/proof_database.py
 create mode 100644 backend/autonomous/prompts/proof_prompts.py
 create mode 100644 backend/data/proofs/.gitkeep
 create mode 100644 backend/shared/build_info.py
 create mode 100644 backend/shared/fastembed_provider.py
 create mode 100644 backend/shared/lean4_client.py
 create mode 100644 backend/shared/smt_client.py
 create mode 100644 docker/entrypoint.sh
 create mode 100644 frontend/src/components/HelpTooltip.jsx
 create mode 100644 frontend/src/components/autonomous/MathematicalProofs.css
 create mode 100644 frontend/src/components/autonomous/MathematicalProofs.jsx
 create mode 100644 frontend/src/components/autonomous/ProofGraph.css
 create mode 100644 frontend/src/components/autonomous/ProofGraph.jsx
 create mode 100644 frontend/src/components/autonomous/ProofNotificationStack.jsx
 create mode 100644 frontend/src/hooks/useProofCheckRuntime.js
 create mode 100644 frontend/src/utils/openRouterSelection.js
 create mode 100644 frontend/src/utils/runtimeConfig.js
 create mode 100644 moto-update-manifest.json
 create mode 100644 moto_launcher.py
 create mode 100644 moto_updater.py
 create mode 100644 requirements-generic.txt
 create mode 100644 tests/test_compiler_marker_visibility.py
 create mode 100644 tests/test_compiler_wolfram_tracking.py
 create mode 100644 tests/test_lean4_client.py
 create mode 100644 tests/test_moto_launcher.py
 create mode 100644 tests/test_moto_updater.py
 create mode 100644 tests/test_paper_memory_appendix.py
 create mode 100644 tests/test_rigor_lean_placement_validator.py
 create mode 100644 tests/test_wolfram_tool_loop.py

diff --git a/.cursor/rules/api-key-controls.mdc b/.cursor/rules/api-key-controls.mdc
index 83e40ac..5817784 100644
--- a/.cursor/rules/api-key-controls.mdc
+++ b/.cursor/rules/api-key-controls.mdc
@@ -1,21 +1,34 @@
 ---
 alwaysApply: false
 ---
+
 # API Key Controls & Workflow Management System
 
 ## Overview
 
-Enables OpenRouter integration with automatic LM Studio fallback, plus boost controls and research metrics in the workflow panel.
+Enables OpenRouter integration with automatic LM Studio fallback (default mode) or OpenRouter-only operation (generic mode), plus boost controls and research metrics in the workflow panel.
 
 **Key Features:**
-- **Per-Role OpenRouter Selection**: Each role independently uses LM Studio or OpenRouter
-- **Global OpenRouter API Key**: Single key for all per-role OpenRouter selections. Boost can reuse it when no explicit boost-only override key is provided.
-- **LM Studio Fallback**: Optional fallback per role on credit exhaustion
+- **Per-Role OpenRouter Selection**: Each role independently uses LM Studio or OpenRouter (default mode); all roles use OpenRouter in generic mode
+- **Global OpenRouter API Key**: Single key for all per-role OpenRouter selections within one running backend instance. Boost can reuse it when no explicit boost-only override key is provided.
+- **OpenRouter Auto-Fill**: OpenRouter selectors auto-fill context window from model `context_length` and auto-fill max output tokens as `min(20% of model context_length, smallest available host max_completion_tokens)`
+- **LM Studio Fallback** (default mode only): Optional fallback per role on credit exhaustion
 - **Free Model Cooldown Handling**: SERIAL BOTTLENECK pause, free model looping, and auto-selector backup (see below)
 - **Boost Mode**: Selective task acceleration via two modes, using either an explicit boost override key or the active global OpenRouter key:
   - **Boost Next X Calls**: Counter-based, next X API calls regardless of task ID
   - **Category Boost**: Role-based, boosts all calls for specific role categories (Aggregator and Compiler only; Autonomous agents inherit from their parent roles automatically)
-- **System works without LM Studio**: Defaults to OpenRouter when LM Studio unavailable
+- **System works without LM Studio**: Defaults to OpenRouter when LM Studio unavailable; generic mode never attempts LM Studio
+
+## Mode-Specific Behavior
+
+| Behavior | Default Mode | Generic Mode |
+|----------|-------------|--------------|
+| LLM provider | LM Studio + OpenRouter + fallback | OpenRouter only |
+| Embeddings | LM Studio → OpenRouter fallback | FastEmbed (in-process) |
+| LM Studio UI | Shown (provider toggle per role) | Hidden (frontend checks `/api/features`) |
+| Secret persistence | OS keyring via `secret_store.py` | Env-injected/in-memory; keyring bypassed |
+| `Authorization` header | Used for OpenRouter key passthrough | Same; NOT reused for sandbox proxy auth |
+| API key on startup | Restored from keyring | Loaded from `OPENROUTER_API_KEY` env var if present |
 
 ---
 
@@ -36,9 +49,11 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus boost con
 - Credit exhaustion detection: HTTP 402 OR error messages containing "credit", "insufficient", "balance", "quota", "key limit", "limit exceeded"
 - Raises `CreditExhaustionError` on exhaustion (no retries). Retries transient errors (max 3).
 - Temperature=0.0 default. No stop sequences (removed — caused premature truncation with certain models).
+- Exposes both model-level metadata (`/models`) and provider endpoint metadata (`/models/{author}/{slug}/endpoints`) so the UI can compute safe host-aware OpenRouter auto-fill values.
 
 #### APIClientManager (`backend/shared/api_client_manager.py`)
-- Central router for all API calls: boost check → role's OpenRouter (with resettable fallback) → LM Studio
+- Central router for all API calls: boost check → role's OpenRouter (with resettable fallback) → LM Studio (default mode) or OpenRouter-only (generic mode)
+- Generic mode: `get_embeddings()` early-returns to `FastEmbedProvider` before the LM Studio → OpenRouter fallback chain
 - Tracks fallback state per role: `_role_fallback_state: Dict[str, str]`
 - `reset_openrouter_fallbacks()`: Resets all roles originally configured for OpenRouter back from LM Studio fallback. Called automatically on API key set, or manually via reset endpoint.
 - Lazy initialization: OpenRouter client initializes from `rag_config.openrouter_api_key` when first needed
@@ -46,6 +61,7 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus boost con
 **CRITICAL REQUIREMENT - Role Configuration:**
 - **EVERY role calling `api_client_manager.generate_completion()` MUST be configured via `api_client_manager.configure_role()`**
 - This includes: aggregator submitters/validator, compiler submitters/validator/critique, autonomous agents, Tier 3 final answer agents
+- **Proof agents (Part 3, optional)** do NOT have standalone role configs. `ProofVerificationStage` reuses the stored `ProofRuntimeConfigSnapshot` (brainstorm submitter, high-context submitter, validator) captured by `autonomous_coordinator._build_proof_runtime_config_snapshot()` and persisted via `research_metadata.set_proof_runtime_config()`. Manual `POST /api/proofs/check` requires `lean4_enabled=True` AND a seeded snapshot — start autonomous research once to seed it.
 
 **Boost Mode Priority** (`should_use_boost(task_id)`):
 1. Boost Next X: `boost_next_count > 0` → True
@@ -53,7 +69,7 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus boost con
 
 **Counter Decrement:** `boost_next_count` decrements ONLY on successful boost API calls. Failed/exhausted calls do NOT decrement.
 
-**Resettable Fallback:** When a role hits credit exhaustion, it falls back to LM Studio for subsequent calls. User can reset all fallen-back roles via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key (auto-resets). Each role has independent fallback state. If no fallback configured: raises RuntimeError.
+**Resettable Fallback:** In default mode, when a role hits credit exhaustion it falls back to LM Studio for subsequent calls; if no fallback is configured, it raises RuntimeError. Generic mode has no LM Studio fallback and raises RuntimeError on credit exhaustion. User can reset all fallen-back roles via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key (auto-resets). Each role has independent fallback state.
 
 **Categories from role_id:**
 - `aggregator_submitter_*` → "Aggregator Submitters"
@@ -66,10 +82,10 @@ Enables OpenRouter integration with automatic LM Studio fallback, plus boost con
 #### BoostManager (`backend/shared/boost_manager.py`)
 - Singleton. Key methods: `set_boost_config`, `clear_boost`, `set_boost_next_count`, `toggle_category_boost`, `should_use_boost` (main check for coordinators), `consume_boost_count` (only after successful boost call)
 - Boost can use an **explicit override** OpenRouter API key, or it falls back to the active global OpenRouter key. A temporary `OpenRouterClient` is created per boosted task and closed immediately after.
-- **Autonomous agent task ID inheritance**: All autonomous orchestration agents use parent role task ID prefixes — Topic Selector/Completion Reviewer/Reference Selector/Paper Title Selector/Tier 3 agents use `agg_sub1_*`; Topic Validator/Redundancy Checker use `agg_val_*`. Boosting a parent role automatically covers all autonomous agents that run on that model.
+- **Autonomous agent task ID inheritance**: All autonomous orchestration agents use parent role task ID prefixes — Topic Selector/Completion Reviewer/Reference Selector/Paper Title Selector/Tier 3 agents use `agg_sub1_*`; Topic Validator/Redundancy Checker use `agg_val_*`. Boosting a parent role automatically covers all autonomous agents that run on that model. **Proof agents are the exception**: they use their own prefixes (`proof_id_*`, `proof_lemma_*`, `proof_form_*`, `proof_novelty_*`, `proof_framing_gate_*`) because they run under the `autonomous_proof_*` role IDs with distinct runtime-snapshot configs; Aggregator/Validator category boosts do NOT cover proof agents.
 
 #### BoostLogger (`backend/shared/boost_logger.py`)
-- Singleton. Log file: `backend/data/boost_api_log.txt`
+- Singleton. Log file resolves under the active instance data root (default desktop path: `backend/data/boost_api_log.txt`)
 - Methods: `log_api_call`, `get_logs(limit)`, `clear_logs`, `get_stats`
 - Boost logs are merged into the main API call log view; boost endpoints remain available for boost-only debugging.
 
@@ -78,6 +94,7 @@ Coordinators track task IDs internally for boost routing. The frontend does NOT
 - Aggregator: `agg_sub{N}_{seq:03d}`, `agg_val_{seq:03d}`
 - Compiler: `comp_hc_{seq:03d}`, `comp_hp_{seq:03d}`, `comp_val_{seq:03d}`
 - Autonomous: `auto_te_{seq:03d}`, `auto_tev_{seq:03d}`, `auto_ts_{seq:03d}`, `auto_tv_{seq:03d}`
+- Autonomous proof (optional, when `lean4_enabled`): `proof_framing_gate_{seq:03d}`, `proof_id_{seq:03d}`, `proof_lemma_{seq:03d}`, `proof_form_{seq:03d}`, `proof_novelty_{seq:03d}`
 
 ---
 
@@ -117,7 +134,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - `POST /api/boost/toggle-category/{category}` — Toggle category boost
 - `GET /api/boost/categories?mode=` — All categories (mode param ignored, always returns all)
 - `GET /api/boost/openrouter-models` — Fetch OpenRouter models (Bearer key header)
-- `GET /api/boost/model-providers?model_id=` — Providers for a model
+- `GET /api/boost/model-providers?model_id=` — Providers + endpoint metadata for a model
 - `GET /api/boost/logs?limit=` — Recent boost-only logs (debug)
 - `POST /api/boost/clear-logs` — Clear logs
 
@@ -128,7 +145,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - `DELETE /api/openrouter/api-key` — Clear key
 - `GET /api/openrouter/api-key-status` — `{ has_key, enabled }`
 - `GET /api/openrouter/models` — Available models (also caches free models for rotation)
-- `GET /api/openrouter/providers/{model_id}` — Providers for model
+- `GET /api/openrouter/providers/{model_id}` — Providers + endpoint metadata for model
 - `GET /api/openrouter/free-model-settings` — `{ looping_enabled, auto_selector_enabled, ... }`
 - `POST /api/openrouter/free-model-settings` — Update free model settings (body: `FreeModelSettings`)
 - `POST /api/openrouter/test-connection` — Test key without storing
@@ -143,7 +160,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 
 ## Error Handling
 
-**Credit Exhaustion:** HTTP 402 or keywords "credit"/"insufficient"/"balance"/"quota"/"key limit"/"limit exceeded" → `CreditExhaustionError` → LM Studio fallback for that role (or RuntimeError if no fallback). Fallback is resettable via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key.
+**Credit Exhaustion:** HTTP 402 or keywords "credit"/"insufficient"/"balance"/"quota"/"key limit"/"limit exceeded" → `CreditExhaustionError` → default mode: LM Studio fallback for that role; generic mode: RuntimeError (no LM Studio). Fallback is resettable via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key.
 
 **Boost Exhaustion:** Falls back to primary for that task; boost stays enabled; counter NOT decremented.
 
@@ -162,7 +179,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 **Rotation chain** (in `api_client_manager._try_free_model_rotation()` called from RateLimitError handler):
 1. If `looping_enabled`: **iterate through ALL** non-rate-limited free models (highest context first) using `tried_models` set to avoid re-trying. On each `RateLimitError`, refresh rate-limited dict and continue to next model. On `CreditExhaustionError`, stop looping.
 2. If all looping candidates exhausted and `auto_selector_enabled`: try `openrouter/free`
-3. If still failed: check LM Studio fallback (fall-through to LM Studio)
+3. If still failed: check LM Studio fallback (default mode only; generic mode skips this)
 4. If no fallback: raise `FreeModelExhaustedError(soonest_retry=...)`
 
 `get_alternative_free_model()` accepts optional `skip_models: set` parameter to skip already-tried models.
@@ -185,14 +202,18 @@ Predictions refresh: after initialization, each task completion, mode switches,
 
 **WebSocket Events:** `free_model_rotated`, `free_model_auto_selector_used`, `serial_bottleneck_paused`, `serial_bottleneck_resumed`, `all_free_models_exhausted`, `account_credits_exhausted`
 
-**Frontend:** Two checkboxes in all settings panels (Aggregator, Compiler, Autonomous) near "Show free models only". Both default checked, persist to localStorage, control same backend singleton.
+**Frontend:** Two checkboxes in all settings panels (Aggregator, Compiler, Autonomous) near "Show free models only". Both default checked, persist to localStorage (namespaced automatically when a storage prefix is active), control the same backend singleton for that running backend instance.
 
 ---
 
 ## Configuration Persistence
 
-**Secure backend storage (OS keyring):** OpenRouter global API key and Wolfram Alpha API key persist via `backend/shared/secret_store.py` using the OS keychain/keyring. Restored into backend memory on startup in `backend/api/main.py`.
+**Secure backend storage (OS keyring — default mode):** OpenRouter global API key and Wolfram Alpha API key persist via `backend/shared/secret_store.py` using the OS keychain/keyring. The keyring service name is derived from `MOTO_SECRET_NAMESPACE`; `None` means the shared desktop service `MOTO-Autonomous-ASI`. `moto_launcher.py` MUST keep `.moto_last_instance.json` stable across normal relaunches (including `instance_id="default"`) so the backend reads the same keyring service every startup. Never let port availability, Windows `TIME_WAIT`, or Lean/LM startup timing create a new namespace for a plain relaunch.
+
+**Startup key detection:** `backend/api/main.py` restores desktop credentials before serving `/api/openrouter/api-key-status`. Expensive optional startup work (Lean 4 warm start, Mathlib cache, etc.) must not block the FastAPI lifespan; run it in the background and clean up subprocesses on cancellation. Frontend startup state must treat unreachable key-status as `unknown`, not `has_key=false`, so it never opens the setup modal or shows a missing-key state over a persisted key.
+
+**Hosted generic mode (no keyring):** Provider keys are env-injected at sandbox launch and/or set via proxied MOTO API routes. `secret_store` persistence is bypassed; keys live in sandbox memory only. Re-injection required after sandbox recreation. `OPENROUTER_API_KEY` env var auto-loaded during lifespan if present.
 
-**localStorage:** `workflow_panel_collapsed`, `aggregatorConfig`, `compiler_settings`, `autonomousConfig` (includes `freeModelLooping`, `freeModelAutoSelector`)
+**localStorage:** `workflow_panel_collapsed`, `aggregatorConfig`, `compiler_settings`, `autonomousConfig` (includes `freeModelLooping`, `freeModelAutoSelector`). When `MOTO_FRONTEND_STORAGE_PREFIX` / `VITE_MOTO_STORAGE_PREFIX` is active, these keys are automatically namespaced per instance.
 
-**Session (in-memory):** fallback state per role, boosted task IDs, boost next count, boosted categories, completed task IDs, free model manager state. Boost logs persist to file (`boost_api_log.txt`) and are merged into the main API call log view.
+**Session (in-memory):** fallback state per role, boosted task IDs, boost next count, boosted categories, completed task IDs, free model manager state. Boost logs and boost state persist under the active instance data root (`boost_api_log.txt`, `boost_state.json`) and are merged into the main API call log view.
diff --git a/.cursor/rules/json-prompt-design.mdc b/.cursor/rules/json-prompt-design.mdc
index ee05f4d..5fdd74a 100644
--- a/.cursor/rules/json-prompt-design.mdc
+++ b/.cursor/rules/json-prompt-design.mdc
@@ -1,6 +1,7 @@
 ---
 alwaysApply: false
 ---
+
 # Enhance AI Role Prompts with Complete Context Assembly
 
 **VARIANT: MOTO - Math Variant V1**  
@@ -932,9 +933,9 @@ REJECT if: Update is unnecessary, harmful, breaks required section structure, or
 
 ### 3B. DOCUMENT VALIDATOR PROMPT
 
-**Function:** `_get_paper_validation_system_prompt(mode)` (modes: construction, review, rigor)
+**Function:** `_get_paper_validation_system_prompt(mode)` (modes: construction, review, rigor, rigor_lean_placement)
 
-**Base prompt for DOCUMENT modes (construction, review, rigor):**
+**Base prompt for DOCUMENT modes (construction, review, rigor, rigor_lean_placement):**
 
 ```python
 base_prompt = """You are validating a mathematical document construction submission. Your role is to decide if this submission should be ACCEPTED or REJECTED.
@@ -1968,115 +1969,193 @@ The loop continues until `more_edits_needed=false` or max iterations (20) reache
 
 ---
 
-## 9. COMPILER RIGOR PROMPTS (2-STEP PROCESS)
+## 9. COMPILER RIGOR PROMPTS (LEAN 4 THEOREM FLOW)
 
 **File:** `backend/compiler/prompts/rigor_prompts.py`
 
-**BODY-ONLY MODE**: Rigor enhancement is ONLY performed during body construction phase. Once body is complete (Conclusion exists in paper, or in autonomous mode when `autonomous_section_phase != "body"`), rigor mode is skipped entirely. The coordinator handles this check via `_is_body_complete()` before invoking the rigor loop.
+**BODY-ONLY MODE**: The rigor loop runs only during body construction. Once body is complete (Conclusion exists in paper, or autonomous mode `autonomous_section_phase != "body"`), rigor mode is skipped. Gated by `_is_body_complete()` in the coordinator.
+
+**CONFIG GATE**: When `system_config.lean4_enabled = false`, every rigor cycle declines immediately (no Lean calls, no theorem proposals). The Lean 4 toolchain + Mathlib workspace is a hard prerequisite.
+
+### Four-Stage Architecture
 
-### Two-Step Architecture
+The rigor loop no longer edits paper text. Each rigor cycle runs four stages, with the coordinator owning the validator loop and the appendix fallback:
 
-The rigor submitter uses a **2-step planning-then-execution process**:
+**Stage 1: Theorem discovery (unvalidated)** — `build_rigor_theorem_discovery_prompt`
+- High-param submitter reads the full writing context (outline direct-injected, paper direct-injected when it fits, RAG for the rest per the offload priority excluding `compiler_outline.txt` + `compiler_paper.txt`).
+- Sees `EXISTING VERIFIED PROOFS` block (from `proof_database.get_all_proofs()`) so it does not re-propose already-verified theorems.
+- Sees `OPEN LEMMA TARGETS` block (from `proof_database.get_recent_failure_hints()`) as optional retry candidates.
+- Decides whether a theorem is worth attempting. Decline ends the rigor cycle.
 
-**Step 1: Planning (unvalidated)**
-- LLM reviews full paper and decides if rigor work is needed
-- Chooses mode: standard_enhancement, rewrite_focus, or wolfram_verification (if enabled)
-- Specifies target_section as guidance for Step 2 (reminder label, NOT context limitation)
-- This decision is NOT validated - LLM has full autonomy
+**Stage 2: Lean 4 formalization** — reuses `ProofFormalizationAgent.prove_candidate(max_attempts=5)` from autonomous mode
+- Up to 5 Lean 4 attempts with error-feedback chaining (failing tactic + goal states + raw Lean diagnostics fed back into each retry).
+- Broadcasts `proof_check_started` / `proof_attempt_started` / `proof_verified` / `proof_attempt_failed` / `proof_check_complete` events with `source_type="compiler_rigor"` so the existing autonomous-mode proof UI lights up for free.
+- All-5-fail: candidate is recorded via `proof_database.record_failed_candidate` (becomes a future open lemma target) and the cycle ends as a decline.
 
-**Step 2: Execution (with self-refusal option)**
-- LLM receives FULL paper (same RAG retrieval as Step 1)
-- Receives target_section from Step 1 as guidance reminder
-- Can REFUSE if Step 1 made a mistake (refusal not validated)
-- If proceeds with changes: submission goes to validator
-- Validator checks actual paper modifications
+**Stage 3: Novelty classification + persistence** — shared `assess_proof_novelty` helper from `backend/autonomous/core/proof_novelty.py`
+- Classifies the verified proof as novel or known.
+- `proof_database.add_proof(record)` stores it with `source_type="paper"`, `source_id=f"compiler_rigor:{session}"`.
+- Novel proofs automatically enter the highest-priority direct-injection block on the next submitter instantiation (via `proof_database.inject_into_prompt`).
+- Non-novel proofs stay in the database, visible through `/api/proofs/*` for future reference-selection UI flows.
 
-**Wolfram Alpha Integration (Optional)**:
-- If enabled and Step 1 chooses wolfram_verification mode
-- System makes Wolfram Alpha API call between steps
-- Step 2 receives query result and decides whether to incorporate it
-- Accepted Wolfram calls tracked in model credits separately from LLM API calls
+**Stage 4: Placement (2 attempts + appendix fallback)** — `build_rigor_placement_prompt`
+- Submitter proposes an inline edit that introduces the theorem with an explicit "verified in Lean 4, see Appendix A, <proof_id>" marker.
+- Validator uses the new `rigor_lean_placement` mode: judges placement and narrative only; `rigor_check` is **forced to True** regardless of LLM output (Lean 4 is the source of mathematical truth).
+- Up to 2 placement attempts; attempt 2 receives the validator's rejection feedback via `validator_rejection_feedback` field.
+- On double rejection (or when attempt 1 is not produced), the theorem is appended to the **Theorems Appendix** via `paper_memory.append_to_theorems_appendix(...)`. Counts as a `rigor_acceptance` because the math is preserved.
 
-### Step 1: Planning JSON Schema
+### Stage 1 JSON Schema (discovery)
 
 ```json
 {
-  "needs_rigor_work": true or false,
-  "mode": "standard_enhancement | rewrite_focus | wolfram_verification | null",
-  "target_section": "text snippet from paper (200-500 chars, guidance label for Step 2)",
-  "wolfram_query": "natural language query for Wolfram Alpha (only if mode=wolfram_verification)",
-  "preliminary_reasoning": "explanation of chosen approach"
+  "needs_theorem_work": true,
+  "theorem_statement": "precise statement with explicit hypotheses",
+  "formal_sketch": "concrete Mathlib tactics / lemmas that look promising",
+  "source_excerpt": "2-6 sentences from the paper that motivate this theorem",
+  "retry_existing_failure_id": "theorem_id from OPEN LEMMA TARGETS if retrying, empty otherwise",
+  "reasoning": "why this theorem is the best target right now OR why no theorem"
 }
 ```
 
-**Field Definitions:**
-- `needs_rigor_work`: Whether any rigor work should be attempted
-- `mode`: Approach to use (required if needs_rigor_work=true)
-  - `standard_enhancement`: Normal rigor improvements
-  - `rewrite_focus`: Significant rewriting needed
-  - `wolfram_verification`: Verify claim with Wolfram Alpha (only if enabled in system config)
-- `target_section`: Text snippet identifying which section to work on (provides continuity to Step 2, NOT a context limitation)
-- `wolfram_query`: Natural language query (e.g., "Is pi algebraic?", "Solve x^2 + 2x + 1 = 0")
-- `preliminary_reasoning`: Explanation of chosen approach
-
-**Example (Wolfram Verification)**:
+Decline form:
 ```json
 {
-  "needs_rigor_work": true,
-  "mode": "wolfram_verification",
-  "target_section": "Theorem 4.1: π is transcendental. Proof: By Lindemann-Weierstrass theorem...",
-  "wolfram_query": "Is pi algebraic?",
-  "preliminary_reasoning": "Computational verification would strengthen the π transcendence claim by providing independent confirmation"
+  "needs_theorem_work": false,
+  "theorem_statement": "",
+  "formal_sketch": "",
+  "source_excerpt": "",
+  "retry_existing_failure_id": "",
+  "reasoning": "why declining"
 }
 ```
 
-### Step 2: Execution JSON Schemas
+### Stage 4 JSON Schema (placement)
 
-**For standard_enhancement or rewrite_focus:**
 ```json
 {
-  "proceed": true or false,
-  "needs_enhancement": true or false,
+  "proceed": true,
   "operation": "replace | insert_after",
-  "old_string": "exact text from document (empty if proceed=false or needs_enhancement=false)",
-  "new_string": "enhanced text (empty if proceed=false or needs_enhancement=false)",
-  "content": "full content for logging",
-  "reasoning": "explanation OR refusal reason"
+  "old_string": "exact anchor text in current paper",
+  "new_string": "inline theorem intro with Lean 4 marker + appendix reference (NO Lean code inline)",
+  "reasoning": "why this placement"
+}
+```
+
+### Placement Rules (enforced by the validator prompt)
+
+The validator rejects placement submissions that:
+- Omit the "verified in Lean 4" marker or the appendix cross-reference.
+- Paste the full Lean 4 source code into the paper body (the Lean proof lives in the appendix only).
+- Place the theorem in a nonsensical location (outside the relevant section).
+- Break surrounding narrative coherence.
+
+The validator MUST NOT re-evaluate:
+- Mathematical correctness (Lean 4 already verified it).
+- Proof soundness.
+- Edge cases / hypotheses.
+
+### Theorems Appendix format
+
+Each entry is written by `format_theorem_appendix_entry(...)` (helper in `backend/compiler/agents/high_param_submitter.py`) in this format:
+
+```
+Theorem (proof_XXX) [Novel | Known] - <theorem_name or proof_id>
+Status: verified by Lean 4 (<inline | appendix_fallback>)
+Statement: <natural-language theorem statement>
+Lean 4 proof:
+<full Lean 4 source>
+---
+```
+
+### Context layout
+
+- Outline: always direct-injected.
+- Paper: direct-injected when it fits; otherwise RAG'd under `mode="rigor"` excluding `compiler_outline.txt` + `compiler_paper.txt`.
+- RAG evidence: follows the offload priority (Shared Training DB → Local Submitter DB → Rejection Log → User Upload Files).
+- EXISTING VERIFIED PROOFS block: compact `(proof_id, novel, statement)` tuples from `proof_database.get_all_proofs()`.
+- OPEN LEMMA TARGETS block: recent failure hints from `proof_database.get_recent_failure_hints(limit=5)` (`theorem_id`, statement, Lean error summary, suggested lemma names).
+
+### Websocket events surfaced by the rigor flow
+
+Autonomous-mode proof UI already handles these; the compiler rigor flow broadcasts them with `source_type="compiler_rigor"`:
+
+- `proof_check_started` - at the start of stage 2 (before the first Lean 4 call).
+- `proof_attempt_started` - one per Lean 4 attempt.
+- `proof_attempt_failed` - per failing attempt.
+- `proof_verified` - per successful attempt + a final one once the proof is stored.
+- `proof_check_complete` - on all-5-fail (as a decline).
+- `compiler_submission` / `compiler_acceptance` / `compiler_rejection` / `compiler_decline` - standard compiler stream for placement and the overall rigor cycle.
+
+---
+
+## 10. WOLFRAM ALPHA TOOL (CONSTRUCTION MODE)
+
+**File:** `backend/compiler/agents/high_context_submitter.py`
+
+Wolfram Alpha is exposed to the main writer as a real OpenAI-compatible tool only during `HighContextSubmitter.submit_construction` (body / conclusion / introduction / abstract). It is NOT available in `outline_create`, `outline_update`, `review`, or the rigor loop. When `system_config.wolfram_alpha_enabled=false` (or the Wolfram client failed to initialize), the tool is not registered on the LLM call at all and construction collapses to the pre-Build-4 single-shot call.
+
+### Tool Schema
+
+```python
+WOLFRAM_TOOL_SCHEMA = {
+    "type": "function",
+    "function": {
+        "name": "wolfram_alpha_query",
+        "description": "Query Wolfram Alpha to verify a mathematical or computational claim before writing it into the paper. ...",
+        "parameters": {
+            "type": "object",
+            "properties": {
+                "query": {"type": "string", "description": "Natural-language Wolfram Alpha query, e.g. 'Is pi algebraic?'"},
+                "purpose": {"type": "string", "description": "Brief note on how the result will be used in the paper (audit trail)."}
+            },
+            "required": ["query", "purpose"]
+        }
+    }
 }
 ```
 
-**For wolfram_verification:**
+### Budget + Loop Semantics
+
+- **20 Wolfram calls per construction submission**, defined by `WOLFRAM_MAX_CALLS_PER_SUBMISSION` in `high_context_submitter.py`.
+- The submitter loop: call LLM with tools attached → execute each `tool_calls[]` entry via `wolfram_client.query(...)` → append a `role=tool` turn per call → re-call LLM. Repeat until (a) the LLM returns a non-tool message (final JSON construction submission) or (b) the 20-call budget is exhausted.
+- On budget exhaustion, the coordinator appends a one-time user-role reminder ("You have used all 20 Wolfram Alpha calls for this submission. Finalize your JSON response now.") and re-calls the LLM with `tools=None` so the model must produce a final JSON response.
+- Fallback: if the tool-loop raises, construction falls back to a plain single-shot `generate_completion` call so forward progress is never blocked by tool-loop failures.
+
+### Audit Trail
+
+The full list of Wolfram calls is attached to the `CompilerSubmission.metadata["wolfram_calls"]` field as:
+```json
+[
+  {"query": "integral of x^2 from 0 to 1", "purpose": "verifying closed form for section 3", "result": "1/3"},
+  ...
+]
+```
+
+The validator sees the audit trail but does NOT re-query Wolfram. Its job is unchanged — it simply has more confidence in factual claims the writer made after a Wolfram check.
+
+### Websocket Event
+
+Per Wolfram call, the submitter broadcasts:
 ```json
 {
-  "proceed": true or false,
-  "verification_result_interpretation": "how to interpret Wolfram Alpha result",
-  "needs_enhancement": true or false,
-  "operation": "insert_after",
-  "old_string": "exact text after which to insert remark (empty if proceed=false or needs_enhancement=false)",
-  "new_string": "verification remark incorporating Wolfram result (empty if proceed=false or needs_enhancement=false)",
-  "content": "full content for logging",
-  "reasoning": "explanation OR refusal reason"
+  "type": "compiler_wolfram_call",
+  "data": {
+    "task_id": "comp_hc_007",
+    "query": "...",
+    "purpose": "...",
+    "result_preview": "first 200 chars of result",
+    "calls_used": 3,
+    "calls_remaining": 17,
+    "max_calls": 20
+  }
 }
 ```
 
-**Self-Refusal Mechanism:**
-- Step 2 can set `proceed=false` if Step 1 made a mistake
-- Refusals are NOT validated (no penalty)
-- Logged as declines, rigor loop ends
-- Allows LLM to self-correct without rejection feedback
-
-**Context:**
-- **Step 1**: Sees FULL paper (RAG retrieval), full outline, user prompt, rejection history
-- **Step 2**: Sees FULL paper (same RAG retrieval as Step 1), full outline, user prompt, rejection history, PLUS target_section as guidance label
-- For Wolfram mode Step 2: Also receives wolfram_query and wolfram_result
-- **CRITICAL**: Both steps see FULL paper via RAG - target_section is guidance only, NOT a context limitation
+The frontend's `CompilerLogs.jsx` renders this as `[Wolfram 3/20] <query> - <preview>`.
 
-**Wolfram Alpha Tracking:**
-- Only ACCEPTED Wolfram calls tracked (full chain: API success → proceed=true → needs_enhancement=true → validator accept → paper updated)
-- Tracked in `PaperModelTracker._wolfram_calls` (separate from LLM API calls)
-- Displayed in MODEL CREDITS as: "Wolfram Alpha Verifications: N queries"
+### Backend Tool-Call Plumbing
 
-**Note**: The outline is always fully injected for rigor mode. If outline + system prompts exceed available context, RAG budget is automatically reduced to fit. The outline provides the structural framework for document construction and validation.
+`api_client_manager.generate_completion`, `OpenRouterClient.generate_completion`, and `LMStudioClient.generate_completion` all accept OpenAI-compatible `tools=[...]` and `tool_choice` kwargs. When a model ignores the tools entirely (returns no `tool_calls`), the submitter's loop cleanly terminates on the first iteration — identical to the single-shot path.
 
 ---
 
diff --git a/.cursor/rules/latex-renderer.mdc b/.cursor/rules/latex-renderer.mdc
index 6fc03ba..608cc05 100644
--- a/.cursor/rules/latex-renderer.mdc
+++ b/.cursor/rules/latex-renderer.mdc
@@ -1,6 +1,7 @@
 ---
 alwaysApply: false
 ---
+
 # LaTeX Renderer System
 
 ## 🔒 CRITICAL SECURITY REQUIREMENTS
@@ -165,6 +166,8 @@ Ratings: Novelty, Correctness, Impact (1-10 scale). Up to 10 history entries. Re
 - `autonomous_critique_custom_prompt` — PaperLibrary + FinalAnswerView
 - `compiler_critique_custom_prompt` — LivePaper
 
+When a frontend storage prefix is active for multi-instance shared-origin use, these keys are automatically namespaced by the runtime layer rather than stored as one global browser-wide bucket.
+
 ---
 
 ## System Invariants
diff --git a/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc b/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc
index 4ae4dc7..312e9ca 100644
--- a/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc
+++ b/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc
@@ -2,12 +2,22 @@
 alwaysApply: true
 ---
 
-# Three Code and Rule Interaction Rules
+# Code and Rule Interaction Rules
 
-1.) The code is a product actively in development but is LARGELY a perfectly functioning program. When making fixes, corrections, etc. DO NOT OVER BUILD, keep the code elegant, simple and optimized for future edits and readability. Always remove and cleanup old code, do not comment out code or leave broken/unused code in this program unless specifically directed by the user.
+1.) Never introduce a new way to halt the program unless specifically directed by the user. The program is designed to run until its goal completion or the operator presses stop. Infinite loops are probabilistically avoided due to the feedback mechanics.
 
-1.) Always obey the rules in regards to how the code should work. The only time you should deviate from the rules is if there is a fix required in the code or the user is requesting an edit that should change the code and any accompanying rules. The rules should always be brought back in line with the code however the rules should guide the code development and navigation.
+2.) Always remove and cleanup old code, do not comment out code or leave broken/unused code in this program unless specifically directed by the user.
 
-2.) The rule(s) should always be updated if any code changes reflect on the rule(s).
+3.) Always obey the rules in regards to how the code should work. The only time you should deviate from the rules is if there is a fix required in the code or the user is requesting an edit that should change the code and any accompanying rules. The rules should always be brought back in line with the code however the rules should guide the code development and navigation.
 
-3.) Any rule addition(s) and rule content addition(s) should be clear, very concise, very high level overview only. The rules are extensive and we must conserve token-count to maintain efficient direct injection usage. 
\ No newline at end of file
+4.) The rule(s) should always be updated if any code changes reflect on the rule(s).
+
+5.) Any rule addition(s) and rule content addition(s) should be clear, very concise, very high level overview only. The rules are extensive and we must conserve token-count to maintain efficient direct injection usage. 
+
+6.) For config/preset files with repeated literal values, never patch by replacing a shared literal alone. Anchor edits to the exact object/block being changed and verify the diff only touches the intended target.
+
+7.) Any REST shape, auth contract, WebSocket event, or `/api/features` capability change that affects the web wrapper must update **code, the relevant rule(s), and `api_contract_version` in `/api/features`** in the same approved merge. The live backend's `GET /openapi.json` is the machine-readable REST schema contract.
+
+8.) Only ONE workflow mode may be active at a time (Aggregator, Compiler, or Autonomous Research). This constraint applies identically in both default mode and generic mode.
+
+9.) Lean 4 and SMT features are always gated on the `lean4_enabled`, `lean4_lsp_enabled`, and `smt_enabled` runtime flags. All three default to false; the gated features must stay silent and side-effect-free when disabled, and Lean or Z3 toolchains or Python wheels must never ship in `requirements-generic.txt`, `Dockerfile`, or `docker/entrypoint.sh` (hosted image stays Lean-free and Z3-free). Lean 4 is authoritative for every stored proof; SMT contributes hints only.
diff --git a/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc b/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
index e89f88e..f0b5171 100644
--- a/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
+++ b/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
@@ -22,6 +22,8 @@ Validator processes up to 3 submissions at once (batch validation). Takes whatev
 
 **Queue Overflow Threshold**: ≥10 submissions in queue → submitters paused until queue drops below 10.
 
+**Per-Submitter Fairness Cap**: When more than one submitter is configured, any individual submitter with >4 of its own submissions already waiting in the queue is paused; other submitters keep running. Skipped when only one submitter is configured. Defaults live in `SystemConfig.queue_overflow_threshold` and `SystemConfig.per_submitter_queue_threshold`.
+
 ## Batch Validation
 
 Validator processes 1, 2, or 3 submissions simultaneously using batch-specific prompts.
@@ -44,6 +46,8 @@ Validator processes 1, 2, or 3 submissions simultaneously using batch-specific p
 
 **Submission context injection**: Direct inject if fits. If too large: RAG the submission as file, keep user prompt direct. If user prompt + RAG'd submission still too large: RAG all user-prompt files. If user prompt itself too large after all RAG: halt with error + diagnostic.
 
+**Hosted upload enforcement (generic mode)**: Server-side validation of `.txt` only, 5 MB max, filename sanitization, path traversal rejection. Applied in both modes but critical for hosted sandboxes where the control plane proxies uploads.
+
 ## Context Allocation
 
 User prompt ALWAYS direct injected. Use as much context as possible in every prompt.
@@ -71,9 +75,11 @@ When ALL submitters AND validator use the same model → single-model mode:
 
 ## Multi-Submitter Configuration
 
-Per-submitter: provider (LM Studio / OpenRouter), model, OpenRouter host provider, LM Studio fallback, context window, max output tokens. UI: "Number of Submitters" selector (1-10), "Copy Main to All" button.
+Per-submitter: provider (LM Studio / OpenRouter in default mode; OpenRouter only in generic mode), model, OpenRouter host provider, LM Studio fallback (default mode only), context window, max output tokens. UI: "Number of Submitters" selector (1-10), "Copy Main to All" button.
+
+OpenRouter auto-fill rule: selecting an OpenRouter model auto-fills from endpoint metadata only. Context window uses the smallest relevant host `context_length`; max output tokens use `min(20% of that host context, smallest relevant host max_completion_tokens)`. If `max_prompt_tokens` is available, shrink usable context to respect it. If endpoint caps are incomplete, preserve current values (no guessing).
 
-Embeddings for RAG: LM Studio first, falls back to OpenRouter (`openai/text-embedding-3-small`) if LM Studio unavailable.
+Embeddings for RAG: Default mode uses LM Studio first, falls back to OpenRouter (`openai/text-embedding-3-small`) if LM Studio unavailable. Generic mode uses in-process FastEmbed (see `rag-design-for-overall-program.mdc`).
 
 ## Database Management
 
diff --git a/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc b/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
index 04a0207..b50a2d5 100644
--- a/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
+++ b/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
@@ -4,7 +4,7 @@ alwaysApply: true
 
 ## The Unified Mode Design:
 
- This describes additional architecture for the synergy between the part 1 database aggregator tool and part 2 aggregator-compiler tool.
+ This describes additional architecture for the synergy between the part 1 database aggregator tool and part 2 aggregator-compiler tool. Both modes operate identically in default and generic deployment — the only difference is provider availability (see `hosted-web-contract.mdc` for details on generic mode).
 
  NOTE: This is a continuously-running program that does not stop itself, the user selects the aggregator to start, then starts the compiler when they desire, and then the user choses when to turn off each selective mode by turning the off switch. There is no "solution stop token" as in normal AI solution generation.
  
@@ -21,6 +21,8 @@ The live-constructing aggregation results should be viewable in one tab and also
 
 The live-constructing compiler-written paper should be viewable in one tab and also a save function that allows the user to save the whole current aggregation database to a .txt file. This paper should be viewable in real-time as the compiler constructs it.
 
+**Generic mode frontend note**: In generic mode the MOTO sandbox is API-only — the React frontend is served by the Web Team's separate website, not from the sandbox. The frontend calls `GET /api/features` on mount and hides LM Studio UI options when `generic_mode=True`. All other frontend functionality is identical.
+
 
 ## Autonomous Research Mode (Part 3) - User Controls
 
@@ -52,8 +54,8 @@ The live-constructing compiler-written paper should be viewable in one tab and a
 
 ### Compiler Single-Submitter (Part 2)
 - Fixed 2-submitter architecture (NOT configurable):
-  - **High-Context Submitter**: Handles outline_create, outline_update, construction, review modes
-  - **High-Parameter Submitter**: Handles rigor enhancement mode
+  - **High-Context Submitter**: Handles outline_create, outline_update, construction, review modes. During construction, may invoke the Wolfram Alpha tool up to 20 times per submission when `system_config.wolfram_alpha_enabled=true`.
+  - **High-Parameter Submitter**: Handles rigor mode. Rigor is the **Lean-4-verified-theorem flow**: discovery → up to 5 Lean 4 formalization attempts (with error feedback) → novelty classification → placement (2 attempts, validator uses `rigor_lean_placement` mode forcing `rigor_check=True`) → Theorems Appendix fallback. The compiler writes verified proofs directly into the shared `proof_database` (same database used by autonomous mode); novel proofs automatically enter the highest-priority direct-injection block on the next submitter instantiation.
 - Sequential Markov chain workflow (only one submission at a time)
 - Each compiler submitter has its own model, context, and max token settings (separate from aggregator)
 - UI shows these as separate "High-Context Submitter" and "High-Parameter Submitter" sections
@@ -66,6 +68,7 @@ The live-constructing compiler-written paper should be viewable in one tab and a
 
 ## API Call Output Notes (User-Configurable)
 - **All `max_tokens` limits are user-configurable via GUI settings** (like context window sizes). Users can adjust these per model role based on their specific models' capabilities.
+- **OpenRouter GUI auto-fill**: When an OpenRouter model is selected, the UI auto-fills context window from the model `context_length` and auto-fills max output tokens as `min(20% of model context_length, smallest available host max_completion_tokens)`. Choosing a specific OpenRouter host recalculates from that host's smallest available `max_completion_tokens`.
 - **Aggregator defaults**: submitter=25000 tokens, validator=25000 tokens (reasoning models need 15K-25K for internal reasoning + output)
 - **Compiler defaults**: validator=25000, high-context=25000 (for outline_create/outline_update/construction/review), high-param=25000 (for rigor mode)
 - **GUI tooltips** provide recommended minimums: Submitter "25000+ for reasoning models", Validator "25000+", High-context "25000+ (outline needs 15K+)", High-param "25000+"
diff --git a/.cursor/rules/part-2-compiler-tool-design-specification.mdc b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
index dfabd4f..b397819 100644
--- a/.cursor/rules/part-2-compiler-tool-design-specification.mdc
+++ b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
@@ -22,14 +22,16 @@ Aggregator/brainstorm database material is high-priority optional source context
 - `[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS COMPLETE]`
 - `[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]`
 
-Placeholders are STRUCTURAL MARKERS ONLY. Submissions must never include them — any that appear will be silently stripped before validation.
+Placeholders and theorem appendix brackets are STRUCTURAL MARKERS ONLY. The compiler prompt must show the same marker-bearing paper that validation/apply uses. Models should use editable prose for `old_string` anchors; protected markers must not appear in insert/delete anchors. Replace targets may be trimmed if a protected marker is accidentally included as trailing context. Generated content (`new_string`/`content`) must not include markers — any that appear are stripped before validation.
 
 **Marker Integrity System (Automatic Repair)**:
 Before every `_pre_validate_exact_string_match()`, system calls `paper_memory.ensure_markers_intact()` (or `outline_memory.ensure_anchor_intact()` for outline_update). If markers were missing, they are added and document is re-fetched before validation. Mode-aware: paper operations check placeholders + anchor; outline operations check outline anchor only.
 
 **Outline is ALWAYS fully injected (never RAGed)** into all compiler mode prompts.
 
-**Provider Selection**: Each compiler role (validator, high-context, high-param, critique submitter) can independently use LM Studio or OpenRouter with optional host provider and LM Studio fallback.
+**Provider Selection**: Each compiler role (validator, high-context, high-param, critique submitter) can independently use LM Studio or OpenRouter with optional host provider and LM Studio fallback (default mode). In generic mode, all roles use OpenRouter only; LM Studio options are hidden in the frontend.
+
+**Export Behavior**: Raw text export available in both modes. PDF export (`POST /api/download/pdf`) is desktop-only — generic mode returns `501` (Playwright/Chromium not installed in hosted image).
 
 **Aggregator RAG refresh**: Every 10 accepted aggregator submissions (not immediate like aggregator).
 
@@ -97,17 +99,23 @@ Body content is ALWAYS inserted BEFORE CONCLUSION_PLACEHOLDER. `_apply_edit()` a
 - 2× HC review → validator
 - 1× HP rigor → validator *(skipped if body complete)*
 
-**Rigor Mode (2-Step):**
-- Step 1 (unvalidated): HP model chooses mode (standard_enhancement, rewrite_focus, wolfram_verification) and target_section
-- Step 2 (with self-refusal): sees full paper + target_section reminder, can set `proceed=false` to refuse
-- Wolfram mode: system makes API call between steps, passes result to Step 2. Accepted Wolfram calls tracked in model credits separately.
-- Loop 2 ends on first rigor rejection/decline → return to Loop 1
+**Rigor Mode (Lean 4 verified theorems, 4-stage)**:
+The rigor loop no longer rewrites prose. Each rigor cycle:
+- Stage 1 (HP, unvalidated): theorem discovery - using the full writing context, decide if a theorem worth formalizing exists that is not already verified; return `needs_theorem_work=false` to decline and end the rigor loop.
+- Stage 2: `ProofFormalizationAgent.prove_candidate(max_attempts=5)` - up to 5 Lean 4 attempts with error-feedback chaining. On 5 failures: record the candidate via `proof_database.record_failed_candidate` so future cycles see it as an open lemma target; end the rigor cycle as a decline.
+- Stage 3: novelty classification via the shared `assess_proof_novelty` helper; `proof_database.add_proof` persists the verified proof. Novel proofs automatically enter the highest-priority direct-injection block (`proof_database.inject_into_prompt`) on the next submitter instantiation. Non-novel proofs remain available through `/api/proofs` for future user-driven reference selection.
+- Stage 4: placement - HP model proposes an inline edit that introduces the theorem with an explicit "verified in Lean 4" marker and an appendix cross-reference. Validator uses the new `rigor_lean_placement` mode which forces `rigor_check=True` (Lean 4 is the source of mathematical truth) and judges placement/narrative only. Up to 2 placement attempts (attempt 2 gets validator rejection feedback).
+- Appendix fallback: if both placement attempts fail, the verified theorem is appended to the **Theorems Appendix** block (`THEOREMS_APPENDIX_START` / `THEOREMS_APPENDIX_END` bracket markers in `paper_memory.py`). Still counts as a `rigor_acceptance` because the math is preserved.
+- Loop 2 ends on first **decline** (no theorem found OR 5 Lean attempts failed OR Lean 4 disabled). Every verified theorem lands somewhere so there is no "rejection" outcome at the loop level.
+- Config gate: `system_config.lean4_enabled=false` → every rigor cycle declines immediately.
 
+**Decline Mechanisms:**
+- `outline_update`: `needs_update: boolean`
 **Decline Mechanisms:**
 - `outline_update`: `needs_update: boolean`
 - `construction`: `needs_construction: boolean`
 - `review`: `needs_edit: boolean`
-- `rigor`: `needs_enhancement: boolean`
+- `rigor`: `needs_theorem_work: boolean` (Stage 1 decline) OR all 5 Lean 4 formalization attempts fail (Stage 2 decline)
 
 Declines logged to `compiler_last_10_declines.txt`.
 
@@ -115,7 +123,7 @@ Declines logged to `compiler_last_10_declines.txt`.
 
 ## Body-Only Modes
 
-Outline updates and rigor enhancements are skipped once body is complete:
+Outline updates and Lean 4 theorem-search rigor cycles run only while the body is still under construction. Once the body is complete, the compiler advances to conclusion / introduction / abstract drafting and skips these body-only loops:
 - **Autonomous mode**: `autonomous_section_phase == "body"`
 - **Manual mode**: Conclusion section exists in paper
 
@@ -200,8 +208,10 @@ Prevents models' fake placeholder text (e.g., "XI. Conclusion\n*placeholder*") f
 Per-role context windows (all user-configurable, default 131072):
 - Validator, High-Context Submitter, High-Parameter Submitter: 131072 tokens each
 - **Settings flow**: All compiler modules read from `system_config.compiler_*` at runtime. The caller that creates `CompilerCoordinator` MUST write settings to `system_config` before init (manual mode: `/api/compiler/start`; autonomous mode: `autonomous_coordinator.py` before `CompilerCoordinator()` creation).
+- **OpenRouter auto-fill**: Selecting an OpenRouter model auto-fills from endpoint metadata only. Context window uses the smallest relevant host `context_length`; max output tokens use `min(20% of that host context, smallest relevant host max_completion_tokens)`. If `max_prompt_tokens` is available, shrink usable context to respect it. If endpoint caps are incomplete, preserve current values (no guessing).
 - Rigor mode dynamically adjusts RAG budget if outline + system prompts exceed available context
-- Construction mode (autonomous) dynamically adjusts RAG budget when brainstorm content is present: `rag_budget = max(5000, max_allowed - outline_tokens - paper_tokens - brainstorm_tokens - 5000_overhead)`. Brainstorm always direct-injected at full fidelity; RAG evidence scales to fit remaining budget.
+- Construction mode dynamically adjusts RAG budget when brainstorm content is present: `rag_budget = max(5000, max_allowed - outline_tokens - paper_tokens - brainstorm_tokens - 5000_overhead)`. Brainstorm always direct-injected at full fidelity; RAG evidence scales to fit remaining budget.
+- **Wolfram Alpha as a construction tool**: During `HighContextSubmitter.submit_construction` (body / conclusion / introduction / abstract), when `system_config.wolfram_alpha_enabled=true`, the writer may invoke the `wolfram_alpha_query` OpenAI-compatible tool up to **20 times per submission** to verify factual / computational claims before writing them. On budget exhaustion, the loop forces finalization with tools disabled. Tool audit trail lives in `CompilerSubmission.metadata["wolfram_calls"]`. The validator does not re-invoke Wolfram; it only sees the audit trail. The Wolfram tool is NOT available in `outline_create`, `outline_update`, `review`, or the rigor loop.
 
 **Context rules:** User prompt ALWAYS direct injected. Direct injection first; RAG only when doesn't fit. ~85% RAG retrieval, ~15% direct injections. Halt with error if user prompt exceeds context_window - minimum_RAG_allocation.
 
@@ -209,7 +219,7 @@ Per-role context windows (all user-configurable, default 131072):
 - `outline_create`, `outline_update`, `rigor`, `construction`, `review`: raises ValueError if exceeds
 - `validator`: rejects submission if exceeds
 
-**Rigor Mode context**: no aggregator database; outline fully injected; paper content RAG-retrieved. RAG excludes `compiler_outline.txt` (already direct-injected).
+**Rigor Mode context**: no aggregator database; outline fully injected; paper content RAG-retrieved. RAG excludes `compiler_outline.txt` AND `compiler_paper.txt` (both direct-injected where they fit, otherwise RAG'd per the offload priority). Rigor prompts live in `backend/compiler/prompts/rigor_prompts.py` - the pre-Build-4 `standard_enhancement` / `rewrite_focus` / `wolfram_verification` prompts were replaced by `build_rigor_theorem_discovery_prompt` (Stage 1) and `build_rigor_placement_prompt` (Stage 4).
 
 **RAG source exclusion (anti-duplication)**: All compiler RAG calls pass `exclude_sources` to skip chunks from content already direct-injected. Construction excludes outline + paper + brainstorm sources; outline_update excludes outline + paper; rigor excludes outline. See `rag-design-for-overall-program.mdc` for full table.
 
diff --git a/.cursor/rules/part-3-autonomous-research-mode.mdc b/.cursor/rules/part-3-autonomous-research-mode.mdc
index cb93bcb..ba58356 100644
--- a/.cursor/rules/part-3-autonomous-research-mode.mdc
+++ b/.cursor/rules/part-3-autonomous-research-mode.mdc
@@ -39,7 +39,7 @@ The Autonomous Research Mode is Part 3 of the MOTO Math Variant system. It is a
 ### Part 1 Aggregator Integration (Tier 1)
 The autonomous coordinator USES actual Part 1 aggregator infrastructure for brainstorm aggregation:
 - Creates separate `Coordinator` instance per brainstorm topic
-- Configures with topic-specific database path (`data/auto_brainstorms/brainstorm_{topic_id}.txt`)
+- Configures with topic-specific database path (`auto_brainstorms/brainstorm_{topic_id}.txt` under the active instance data root; default desktop path: `backend/data/auto_brainstorms/brainstorm_{topic_id}.txt`)
 - Runs configurable 1-10 submitters + 1 validator workflow (default 3 submitters)
 - Each submitter can have its own model, context window, and max output tokens for multi-model exploration
 - SINGLE validator maintains coherent Markov chain evolution (same constraint as Part 1)
@@ -200,7 +200,7 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `decision` (accept/reje
 ### Rejection Feedback
 When rejected, the validator's reasoning is added to the topic submitter's rolling feedback cache (last 5 rejections), similar to aggregator submitter rejection logs.
 
-**File**: `data/auto_research_topic_rejections.txt`
+**File**: `auto_research_topic_rejections.txt` under the active instance data root (default desktop path: `backend/data/auto_research_topic_rejections.txt`)
 
 ---
 
@@ -312,7 +312,7 @@ The autonomous brainstorm aggregator inherits batch validation from Part 1 infra
 - **Accelerated brainstorm exploration**: Batch validation increases throughput while maintaining quality through redundancy checks
 
 ### Key Differences from Part 1 Aggregator
-1. **Topic-Specific Database**: Writes to `data/auto_brainstorms/brainstorm_{topic_id}.txt` instead of `rag_shared_training.txt`
+1. **Topic-Specific Database**: Writes to `auto_brainstorms/brainstorm_{topic_id}.txt` under the active instance data root (default desktop path: `backend/data/auto_brainstorms/brainstorm_{topic_id}.txt`) instead of `rag_shared_training.txt`
 2. **No User-Provided Topic Prompt**: Uses the AI-generated brainstorm topic prompt
 3. **Completion Tracking**: Tracks acceptance count (including removals) for completion review trigger
 4. **Hard Limit**: 30 accepted submissions (FORCE transition to paper writing, no completion review)
@@ -434,7 +434,7 @@ JSON schemas defined in `json-prompt-design.mdc`. Completion submitter: `decisio
 ### Feedback on Non-Completion
 If the decision is CONTINUE_BRAINSTORM, the `suggested_additions` field provides direction for future submissions. This feedback goes to a rolling cache (last 5) that is passed to the brainstorm aggregation submitters.
 
-**File**: `data/auto_brainstorms/completion_feedback_{topic_id}.txt`
+**File**: `auto_brainstorms/completion_feedback_{topic_id}.txt` under the active instance data root (default desktop path: `backend/data/auto_brainstorms/completion_feedback_{topic_id}.txt`)
 
 ---
 
@@ -711,7 +711,7 @@ The autonomous RAG manager follows the same "no truncation" principle as Part 1
 ### Rejection Feedback
 
 Compiler validator rejections are logged to:
-- `data/auto_papers/paper_{paper_id}_last_10_rejections.txt`
+- `auto_papers/paper_{paper_id}_last_10_rejections.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}_last_10_rejections.txt`)
 - Follows same structure as Part 2 compiler rejection logs
 
 ---
@@ -725,23 +725,23 @@ When abstract is written and validated, the paper is considered COMPLETE. Additi
 **Actions on Completion**:
 
 1. **Save Final Paper**:
-   - File: `data/auto_papers/paper_{paper_id}.txt`
+   - File: `auto_papers/paper_{paper_id}.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}.txt`)
    - Contains: Full paper with all sections
 
 2. **Save Outline**:
-   - File: `data/auto_papers/paper_{paper_id}_outline.txt`
+   - File: `auto_papers/paper_{paper_id}_outline.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}_outline.txt`)
    - Contains: Paper outline for structural reference
 
 3. **Extract and Save Abstract**:
-   - File: `data/auto_papers/paper_{paper_id}_abstract.txt`
+   - File: `auto_papers/paper_{paper_id}_abstract.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}_abstract.txt`)
    - Contains: Abstract text only
 
 4. **Cache Brainstorm Database**:
-   - File: `data/auto_papers/paper_{paper_id}_source_brainstorm.txt`
+   - File: `auto_papers/paper_{paper_id}_source_brainstorm.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}_source_brainstorm.txt`)
    - Contains: Complete brainstorm database that sourced this paper
 
 5. **Update Metadata**:
-   - File: `data/auto_research_metadata.json`
+   - File: `auto_research_metadata.json` under the active instance data root (default desktop path: `backend/data/auto_research_metadata.json`)
    - Add paper entry with:
      - paper_id
      - paper_title
@@ -794,7 +794,7 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `should_remove` (bool),
    - Maximum 1 removal per review cycle
 
 5. **Execution**:
-   - If removal validated: Move paper to `data/auto_papers/archive/`
+   - If removal validated: Move paper to `auto_papers/archive/` under the active instance data root (default desktop path: `backend/data/auto_papers/archive/`)
    - Update metadata to mark as "archived"
    - Update statistics
 
@@ -975,11 +975,11 @@ The system implements **two tiers of model tracking**:
 ================================================================================
 AUTONOMOUS AI SOLUTION
 
-Disclaimer: This content is provided for informational and experimental purposes
-only. This paper was autonomously generated with the novelty-seeking MOTO
-harness without peer review or user oversight beyond the original prompt. It
-may contain incorrect, incomplete, misleading, or fabricated claims presented
-with high confidence. Use of this content is at your own risk. You are solely
+Disclaimer: This content is provided for informational purposes only. This
+paper was autonomously generated with the novelty-seeking MOTO harness without
+peer review or user oversight beyond the original prompt. It may contain
+incorrect, incomplete, misleading, or fabricated claims presented with high
+confidence. Use of this content is at your own risk. You are solely
 responsible for reviewing and independently verifying any output before relying
 on it, and the developers, operators, and contributors are not responsible for
 errors, omissions, decisions made from this content, or any resulting loss,
@@ -1072,11 +1072,11 @@ Tier 3 tracks all models used during final answer generation for author attribut
 ================================================================================
 AUTONOMOUS AI SOLUTION
 
-Disclaimer: This content is provided for informational and experimental purposes
-only. This paper was autonomously generated with the novelty-seeking MOTO
-harness without peer review or user oversight beyond the original prompt. It
-may contain incorrect, incomplete, misleading, or fabricated claims presented
-with high confidence. Use of this content is at your own risk. You are solely
+Disclaimer: This content is provided for informational purposes only. This
+paper was autonomously generated with the novelty-seeking MOTO harness without
+peer review or user oversight beyond the original prompt. It may contain
+incorrect, incomplete, misleading, or fabricated claims presented with high
+confidence. Use of this content is at your own risk. You are solely
 responsible for reviewing and independently verifying any output before relying
 on it, and the developers, operators, and contributors are not responsible for
 errors, omissions, decisions made from this content, or any resulting loss,
@@ -1116,7 +1116,7 @@ Total API Calls: 188
 
 ### Tier 3 Data Persistence
 
-**Directory**: `data/auto_final_answer/` (or `auto_sessions/{session_id}/final_answer/`)
+**Directory**: `auto_final_answer/` under the active instance data root (default desktop path: `backend/data/auto_final_answer/`) or `auto_sessions/{session_id}/final_answer/`
 
 | File | Purpose |
 |------|---------|
@@ -1241,39 +1241,94 @@ Main component for displaying Tier 3 status and content:
 
 ---
 
+## Proof Verification Stage (Optional, Part 3 Checkpoint)
+
+Runs automatically after every completed brainstorm (Tier 1) and every completed paper (Tier 2 / Tier 3 chapter), gated on `system_config.lean4_enabled`. Silent no-op when disabled.
+
+**Proof Framing Gate (one-shot, at autonomous start)**: When `lean4_enabled`, the coordinator runs `_run_proof_framing_gate()` before research begins. A single LLM call on the user prompt decides `is_proof_amenable` (`build_proof_framing_gate_prompt` → `autonomous_proof_framing_gate` role). If true, `PROOF_FRAMING_CONTEXT` is appended to every subsequent submitter prompt via `_append_proof_framing()` and persisted to workflow state for crash recovery. Decision is broadcast via `proof_framing_decided`. Silent no-op when disabled or when the prompt is not proof-amenable.
+
+**Pipeline** (`backend/autonomous/core/proof_verification_stage.py`):
+1. **Candidate identification** — `ProofIdentificationAgent` extracts theorem/lemma candidates from brainstorm or paper content
+2. **Optional Mathlib lemma search** — `MathlibLemmaSearchAgent` surfaces relevant existing lemmas into the formalization prompt
+3. **Optional SMT early-exit** — when `smt_enabled`, `SmtClient` classifies candidates conservatively; successful SMT results become Lean tactic hints (`native_decide` / `omega` / `decide` style) and are never stored as standalone proofs
+4. **Lean 4 formalization attempts** — two-phase retry: up to 3 full-proof attempts via `ProofFormalizationAgent.prove_candidate`, then up to 2 multi-tactic script attempts via `prove_candidate_tactic_script` (5 total per candidate). Prior `FailedProofCandidate` failure hints from `proof_database.inject_failure_hints_into_prompt()` thread into each retry.
+5. **Novelty check** — `autonomous_proof_novelty` role compares verified proof against existing proof library
+6. **Storage** — `proof_database.add_proof()` persists novel and known proofs as session-aware records (`proofs_index.json`, `proof_<id>.json`, `proof_<id>_lean.lean`) with extracted `ProofDependency` records and reverse Mathlib usage index. Verified proofs are also appended as a "Verified Proofs" section at the bottom of the source brainstorm DB and/or paper file via `append_proofs_section()`.
+
+**Parallelism (two-phase execution per stage run)**: Steps 2–4 above (the per-candidate "Phase A" Lean pipeline: lemma search → optional SMT hint → `prove_candidate` → `prove_candidate_tactic_script` → `proof_attempts_exhausted` broadcast on failure) run concurrently across *all* identified candidates inside a single `ProofVerificationStage.run()` invocation, bounded by `system_config.proof_max_parallel_candidates` (default 6, env: `MOTO_PROOF_MAX_PARALLEL_CANDIDATES` / `PROOF_MAX_PARALLEL_CANDIDATES`) via an `asyncio.Semaphore`. Completed candidates are consumed by the driver loop through `asyncio.as_completed`, and steps 5–6 (the "Phase B" post-processing: novelty assessment, `add_proof`, dependency extraction via `ProofDependencyExtractor`, `append_proofs_section`, `novel_proof_discovered` / `known_proof_verified` broadcast, `record_failed_candidate` for brainstorm failures) are performed strictly **one-at-a-time** in Phase-A completion order inside that driver loop so later candidates can observe earlier stored proofs as MOTO dependencies. Every identified candidate is attempted — no cutoff. Each Phase-A task instantiates its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` so the per-agent `task_sequence` counter cannot collide across concurrent candidates. If any Phase-A task raises `FreeModelExhaustedError` (or any other exception), the driver cancels all still-running sibling tasks and re-raises so the coordinator's recovery path runs with no orphaned background API calls. `should_stop` is plumbed into each Phase-A pipeline and checked before each Phase-B pass, so a stop-request short-circuits cleanly without leaking tasks.
+
+**Rigor mode is NOT parallelized** (compiler Part 2): `submit_rigor_lean_theorem()` runs one candidate per rigor cycle by design (discovery → 5 Lean attempts → novelty → placement) and the outer `_rigor_loop` drives cycles serially so each proven theorem can land in the paper before the next discovery sees updated context. The parallel candidate pipeline lives only in `ProofVerificationStage`.
+
+**Per-Source Reservation**: `ProofVerificationStage` maintains a class-level `{source_type}:{source_id}` active set behind an asyncio lock so the same brainstorm or paper cannot be verified twice concurrently (required for autonomous + manual proof-check interleaving).
+
+**Lean 4 is authoritative**: SMT results never substitute for Lean verification. The `Lean4Result` contract is the only path to a stored proof. SMT contributes hints only.
+
+**Subprocess vs LSP**: `lean4_client` runs Lean via subprocess by default. When `lean4_lsp_enabled`, a persistent LSP-style process reduces cold-start overhead; the subprocess path remains the fallback and must keep working when LSP is disabled.
+
+**Manual proof checks** (Build 5): `POST /api/proofs/check` reuses `ProofVerificationStage.run_manual()` with the stored `ProofRuntimeConfigSnapshot` (brainstorm / paper / validator role configs captured during autonomous startup). Readiness is surfaced via `/api/proofs/status.manual_check_ready` + `manual_check_message`. Required state: `lean4_enabled=True` AND a runtime snapshot must exist (start autonomous research once to seed it).
+
+**Proof runtime config snapshot** (`research_metadata.set_proof_runtime_config`): Captures a `ProofRuntimeConfigSnapshot` with three `ProofRoleConfigSnapshot` entries — `brainstorm` (from first aggregator submitter config), `paper` (from high-context submitter config), `validator` (from validator config). Each holds provider, model_id, openrouter_provider, lm_studio_fallback_id, context_window, and max_output_tokens. Lets manual checks run without an active autonomous session.
+
+**Proof WebSocket events** (all broadcast through the standard `/api/ws` stream):
+- `proof_framing_decided`
+- `proof_check_started`, `proof_check_complete`, `proof_check_no_candidates`
+- `proof_check_candidates_found`, `mathlib_lemmas_suggested`
+- `proof_attempt_started`, `proof_verified`, `proof_attempt_failed`, `proof_attempts_exhausted`
+- `proof_retry_started`, `proof_retry_scheduled`
+- `novel_proof_discovered`, `known_proof_verified`
+- `proof_dependency_added` (Build 5 — live graph updates)
+- `smt_check_started`, `smt_check_complete`
+
+**Proof Stage Critical Invariants**:
+1. Proof stage is silent and skipped when `lean4_enabled=False` — never blocks brainstorm or paper completion
+2. Lean 4 is authoritative — SMT results are hints only, never stored as standalone proofs, `Lean4Result` contract is unchanged by SMT
+3. Subprocess checker must continue to work when `lean4_lsp_enabled=False`; LSP path must not regress subprocess behavior when enabled
+4. Proof storage is session-aware (`session_manager` → `get_proofs_dir()`) and falls back to the legacy `backend/data/proofs/` layout when no session is active
+5. Per-source reservation lock prevents concurrent proof checks on the same `{source_type}:{source_id}` (autonomous vs manual interleaving)
+6. Novel proofs become highest-priority direct-injection context for subsequent brainstorm/paper submitters (via `proof_database.inject_into_prompt()` and stored `ProofRecord` summaries)
+7. Proof certificates stay text-based (`.lean` source + JSON metadata) — no binary artifacts
+8. Hosted/generic mode keeps `lean4_enabled` and `smt_enabled` default false and the hosted image stays Lean-free and Z3-free (no proof binaries in the `python:3.12-slim` runtime)
+9. Proof framing gate runs once per autonomous start and only when `lean4_enabled`; the resulting `proof_framing_active` flag and `PROOF_FRAMING_CONTEXT` are persisted in workflow state for crash recovery
+10. Every identified theorem candidate must be attempted — Phase A is bounded by `proof_max_parallel_candidates` but never truncates the candidate list; Phase A runs concurrently across candidates while Phase B (novelty / `add_proof` / dependency extraction / brainstorm+paper `append_proofs_section` / novel/known broadcasts / `record_failed_candidate`) remains strictly serialized in Phase-A completion order so intra-batch MOTO dependencies and per-source proof appending stay coherent
+11. Each Phase-A task owns its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` instance to keep per-agent `task_sequence` counters collision-free; any Phase-A exception (including `FreeModelExhaustedError`) must cancel all sibling tasks and re-raise so the coordinator's recovery path runs without orphaned background API calls
+12. `should_stop` propagates into Phase A and is re-checked before each Phase-B pass so stop-requests short-circuit without leaking tasks or partially-applied Phase-B writes
+13. Compiler rigor mode (`submit_rigor_lean_theorem`, `_rigor_loop`) is NOT parallelized — rigor cycles discover, verify, and place one theorem per cycle so each verified theorem lands in the paper before the next discovery; the parallel candidate pipeline lives only in `ProofVerificationStage`
+
+---
+
 ## Data Persistence
 
 ### Brainstorm Databases
 
-**File Pattern**: `data/auto_brainstorms/brainstorm_{topic_id}.txt`
+**File Pattern**: `auto_brainstorms/brainstorm_{topic_id}.txt` under the active instance data root (default desktop path: `backend/data/auto_brainstorms/brainstorm_{topic_id}.txt`)
 
 Each brainstorm has its own database file containing accepted submissions, formatted identically to Part 1's `rag_shared_training.txt`.
 
-**Metadata File**: `data/auto_brainstorms/brainstorm_{topic_id}_metadata.json` — Fields: topic_id, topic_prompt, status, submission_count, timestamps, papers_generated.
+**Metadata File**: `auto_brainstorms/brainstorm_{topic_id}_metadata.json` under the active instance data root (default desktop path: `backend/data/auto_brainstorms/brainstorm_{topic_id}_metadata.json`) — Fields: topic_id, topic_prompt, status, submission_count, timestamps, papers_generated.
 
 ### Paper Files
 
-**File Pattern**: `data/auto_papers/paper_{paper_id}.txt`
+**File Pattern**: `auto_papers/paper_{paper_id}.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}.txt`)
 
 Contains full paper content.
 
-**Abstract File**: `data/auto_papers/paper_{paper_id}_abstract.txt`
+**Abstract File**: `auto_papers/paper_{paper_id}_abstract.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}_abstract.txt`)
 
 Contains abstract only.
 
-**Source Brainstorm Cache**: `data/auto_papers/paper_{paper_id}_source_brainstorm.txt`
+**Source Brainstorm Cache**: `auto_papers/paper_{paper_id}_source_brainstorm.txt` under the active instance data root (default desktop path: `backend/data/auto_papers/paper_{paper_id}_source_brainstorm.txt`)
 
 Contains complete brainstorm database that sourced this paper.
 
 ### Research Metadata File
 
-**File**: `data/auto_research_metadata.json`
+**File**: `auto_research_metadata.json` under the active instance data root (default desktop path: `backend/data/auto_research_metadata.json`)
 
 ```
 
 ### Workflow State File (Crash Recovery / Resume)
 
-**File**: `data/auto_workflow_state.json`
+**File**: `auto_workflow_state.json` under the active instance data root (default desktop path: `backend/data/auto_workflow_state.json`)
 
 This file persists the current workflow state to enable **automatic resume** after program restart or crash. The system automatically saves this state at key checkpoints:
 
@@ -1335,6 +1390,8 @@ All memory modules (`brainstorm_memory`, `paper_library`, `final_answer_memory`,
 
 The autonomous research system maintains backward compatibility through a dual-path architecture:
 
+**Runtime root note:** The examples below are shown with the default desktop root `backend/data/`. In multi-launch or hosted environments, these same relative paths resolve under the active `MOTO_DATA_ROOT`. Per-instance isolation comes from the runtime root; session isolation happens inside that instance root.
+
 **Legacy Paths (backward compatibility):**
 ```
 backend/data/auto_brainstorms/      # Brainstorm databases
@@ -1363,9 +1420,10 @@ backend/data/auto_sessions/{session_id}/final_answer/    # Session final answers
 
 **Important for New Features:**
 - Always use memory module methods (e.g., `paper_library.get_paper_path()`) to get paths
-- Never hardcode paths like `data/auto_papers/` directly
+- Never hardcode fixed-root paths like `data/auto_papers/` or `backend/data/auto_papers/` directly
 - Pass resolved paths to any persistence layer that needs session awareness
 - Config paths (`system_config.auto_papers_dir`, etc.) are legacy-only references
+- Session-aware storage does not replace instance-aware storage; separate running MOTO instances must also keep separate `MOTO_DATA_ROOT` values
 
 ---
 
@@ -1426,8 +1484,8 @@ Paper library component:
 - Expandable to show full paper content
 - Word count, source brainstorm links
 - Download/export options:
-  - **Download PDF**: Generates PDF from rendered LaTeX content (same functionality as LivePaper and FinalAnswerView)
-  - **Download Raw**: Downloads raw text with outline
+  - **Download PDF** (default mode only): Generates PDF from rendered LaTeX content (same functionality as LivePaper and FinalAnswerView); returns 501 in generic mode
+  - **Download Raw**: Downloads raw text with outline (available in both modes)
 - Search and filter functionality
 - **Delete button**: Removes paper and all associated files (shown when paper is expanded)
   - Shows inline confirmation dialog before deletion
@@ -1552,16 +1610,17 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 
 ### Running Modes
 - **Part 1, Part 2, and Part 3 remain user-selectable modes**
-- **Only ONE workflow mode may be active at a time** — Aggregator, Compiler, and Autonomous Research are now mutually exclusive at runtime
+- **Only ONE workflow mode may be active at a time** — Aggregator, Compiler, and Autonomous Research are mutually exclusive at runtime (applies identically in both default and generic deployment)
 - **Part 3 internally controls Part 1 and Part 2 components** during autonomous execution
 - Starting any mode while another mode is running must be blocked until the active mode is stopped
+- In generic mode, all API routes and WebSocket events are identical to default mode — the only differences are in provider and feature availability (OpenRouter-only, FastEmbed embeddings, no PDF download)
 
 ---
 
 ## Prerequisites
 
-- Either an OpenRouter API key or at least one LM Studio model must be available to begin
-- LM Studio is highly recommended even with OpenRouter enabled because local embeddings/RAG are free and faster
+- Either an OpenRouter API key or at least one LM Studio model must be available to begin (default mode). Generic mode requires an OpenRouter API key only.
+- LM Studio is recommended in default mode for free local embeddings/RAG; generic mode uses in-process FastEmbed for embeddings (no LM Studio dependency)
 - User must provide high-level research prompt
 - No dependency on prior Part 1 or Part 2 usage
 - Fresh start with empty brainstorm/paper libraries
@@ -1662,6 +1721,7 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 37. **Paper title exploration runs before EVERY title selection** — Uses full Part 1 aggregator to collect 5 candidate titles before every paper creation (Tier 2 papers 1/2/3, Tier 3 short-form, Tier 3 gap/intro/conclusion chapters). No exceptions.
 38. **Title exploration uses standard aggregator (cleanup disabled)** — Same parallel submitters, batch validation, queue management. Cleanup/pruning is disabled because the phase is capped at 5 candidates and the temp DB is deleted afterwards.
 39. **Final title selection sees candidate titles** — The 6th selection can choose a candidate, synthesize, or propose new. Must justify divergence from all candidates.
+40. **Proof verification is an optional post-brainstorm and post-paper checkpoint** — Gated on `lean4_enabled`; silent when disabled. Lean 4 is authoritative; SMT (when `smt_enabled`) contributes hints only. See "Proof Verification Stage" section for the full invariant list.
 
 ---
 
@@ -1689,14 +1749,16 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 Each role in autonomous research mode supports OpenRouter model selection with host/provider choice:
 
 **Per-Role Configuration** (for each brainstorm submitter, validator, high-context, high-param, critique submitter):
-- **Provider Toggle**: "Use OpenRouter" button switches role to OpenRouter model selection
+- **Provider Toggle** (default mode): "Use OpenRouter" button switches role to OpenRouter model selection. In generic mode, all roles use OpenRouter only and the provider toggle is hidden.
 - **OpenRouter Model Selector**: When OpenRouter enabled, dropdown shows available OpenRouter models
 - **Provider/Host Selector**: Specific provider selection (e.g., "Anthropic", "Google AI", "AWS Bedrock") or "Default (OpenRouter chooses)"
-- **LM Studio Fallback**: Optional fallback model if OpenRouter fails (credit exhaustion, errors)
+- **OpenRouter Auto-Fill**: Selecting an OpenRouter model auto-fills the context window and max output tokens from endpoint metadata only. Context window uses the smallest relevant host `context_length`; max output tokens use `min(20% of that host context, smallest relevant host max_completion_tokens)`. If `max_prompt_tokens` is available, shrink usable context to respect it. If endpoint caps are incomplete, preserve current values (no guessing).
+- **LM Studio Fallback** (default mode only): Optional fallback model if OpenRouter fails (credit exhaustion, errors)
 
 **Fallback Behavior**:
-- If OpenRouter is selected and has a fallback configured: Automatically falls back to LM Studio on credit exhaustion
-- If no LM Studio available: OpenRouter-only operation (system works without LM Studio)
+- Default mode with fallback configured: Automatically falls back to LM Studio on credit exhaustion
+- Default mode without LM Studio: OpenRouter-only operation (system works without LM Studio)
+- Generic mode: OpenRouter-only; no LM Studio fallback available. Credit exhaustion raises `RuntimeError` when no alternative is available.
 - Fallback is per-role and resettable via `POST /api/openrouter/reset-exhaustion` or by re-setting the API key
 
 ## Other Notes
diff --git a/.cursor/rules/program-directory-and-file-definitions.mdc b/.cursor/rules/program-directory-and-file-definitions.mdc
index b0eb31e..dd67a34 100644
--- a/.cursor/rules/program-directory-and-file-definitions.mdc
+++ b/.cursor/rules/program-directory-and-file-definitions.mdc
@@ -1,22 +1,36 @@
 ---
 alwaysApply: true
 ---
-## LM Studio Server Information
-LM Studio and its pre-loaded models can be reached at "http://127.0.0.1:1234".
-**NOTE:** The system works without LM Studio. If LM Studio is unavailable, users can configure OpenRouter for all roles.
+
+## LM Studio Server Information (Default Mode Only)
+LM Studio and its pre-loaded models can be reached at "http://127.0.0.1:1234" (overridable via `MOTO_LM_STUDIO_BASE_URL`).
+**NOTE:** The system works without LM Studio. If LM Studio is unavailable, users can configure OpenRouter for all roles. In generic mode (`generic_mode=True`), LM Studio is entirely bypassed — embeddings use FastEmbed and all LLM inference routes through OpenRouter.
+
+## Runtime Root Note
+
+`backend/data/` and `backend/logs/` are the **default desktop roots**, not immutable global paths.
+
+- The active backend instance may override mutable roots with `MOTO_DATA_ROOT` and `MOTO_LOG_ROOT`
+- Secret persistence may be isolated per instance with `MOTO_SECRET_NAMESPACE`
+- Frontend browser persistence may be isolated on shared origins with `MOTO_FRONTEND_STORAGE_PREFIX` / `VITE_MOTO_STORAGE_PREFIX`
+- Additional local launches may create generated instance folders such as `.moto_instances/{instance_id}/data` and `.moto_instances/{instance_id}/logs`
 
 ## Complete Project Directory Structure and File Descriptions
 project-root/
 ├── .github/                            # GitHub community health files
 │   ├── ISSUE_TEMPLATE/                 # Public issue forms + security contact routing
 │   └── pull_request_template.md        # Default pull request template
+├── .moto_instances/                    # Generated local multi-instance runtime roots (not source-controlled)
+│   └── {instance_id}/
+│       ├── data/                       # Instance-specific mutable data root
+│       └── logs/                       # Instance-specific mutable log root
 ├── backend/
 │   ├── shared/                          # SHARED RESOURCES
 │   │   ├── __init__.py                  # Package initialization
-│   │   ├── config.py                    # RAGConfig, SystemConfig
+│   │   ├── config.py                    # RAGConfig, SystemConfig (instance runtime contract, ports, data/log roots, secret namespace, generic_mode)
 │   │   ├── models.py                    # Pydantic models (includes ModelConfig, BoostConfig, WorkflowTask)
 │   │   ├── lm_studio_client.py          # LM Studio HTTP API client
-│   │   ├── openrouter_client.py         # OpenRouter HTTP API client (credit exhaustion detection)
+│   │   ├── openrouter_client.py         # OpenRouter HTTP API client (credit exhaustion detection + model/endpoint metadata)
 │   │   ├── api_client_manager.py        # Unified API router (OpenRouter/LM Studio fallback + boost)
 │   │   ├── boost_manager.py             # Singleton boost manager (tracks boost modes: next-count, always-prefer, category)
 │   │   ├── boost_logger.py              # Boost API call logger (persists to boost_api_log.txt)
@@ -29,8 +43,12 @@ project-root/
 │   │   ├── json_parser.py               # JSON parsing with sanitization for LLM quirks
 │   │   ├── critique_memory.py           # Paper critique persistence (saves up to 10 validator critiques per paper)
 │   │   ├── critique_prompts.py          # Default critique prompt and builder function for validator critiques
-│   │   ├── secret_store.py              # Secure API key persistence via OS keyring (OpenRouter, Wolfram Alpha)
-│   │   └── path_safety.py               # Safe path resolution helpers (realpath/normpath containment checks)
+│   │   ├── secret_store.py              # Secure API key persistence via OS keyring (OpenRouter, Wolfram Alpha); bypassed in generic mode (env-injected/in-memory)
+│   │   ├── build_info.py                # Build identity resolver (loads version/build_commit/update_channel/api_contract_version from moto-update-manifest.json + env overrides)
+│   │   ├── path_safety.py               # Safe path resolution helpers (realpath/normpath containment checks)
+│   │   ├── fastembed_provider.py        # FastEmbed embedding wrapper (generic mode only, lazy-imported; ~30 lines)
+│   │   ├── lean4_client.py              # Lean 4 proof checker client (subprocess + optional LSP persistent mode; gated on `lean4_enabled` / `lean4_lsp_enabled`)
+│   │   └── smt_client.py                # Z3/SMT launcher-managed subprocess wrapper (gated on `smt_enabled`; never authoritative on its own)
 │   ├── aggregator/                      # AGGREGATOR 
 │   │   ├── __init__.py
 │   │   ├── core/
@@ -76,17 +94,17 @@ project-root/
 │   │   │   └── critique_submitter.py    # Critique phase submitter (peer review)
 │   │   ├── validation/
 │   │   │   ├── __init__.py              # Package initialization
-│   │   │   └── compiler_validator.py    # Validates coherence, rigor, placement
+│   │   │   └── compiler_validator.py    # Validates coherence, rigor, placement (plus rigor_lean_placement mode for Lean-4 theorem placement)
 │   │   ├── prompts/
 │   │   │   ├── __init__.py              # Package initialization
 │   │   │   ├── outline_prompts.py       # Outline generation & update prompts
 │   │   │   ├── construction_prompts.py  # Paper construction prompts
 │   │   │   ├── review_prompts.py        # Paper review/cleanup prompts
-│   │   │   └── rigor_prompts.py         # Rigor enhancement prompts
+│   │   │   └── rigor_prompts.py         # Rigor theorem-discovery + placement prompts (Lean-4-verified flow)
 │   │   └── memory/
 │   │       ├── __init__.py              # Package initialization
 │   │       ├── outline_memory.py        # Current outline state (direct inject/RAG)
-│   │       ├── paper_memory.py          # Current paper state (direct inject/RAG)
+│   │       ├── paper_memory.py          # Current paper state (direct inject/RAG). Skeleton markers: ABSTRACT_PLACEHOLDER, INTRO_PLACEHOLDER, CONCLUSION_PLACEHOLDER, THEOREMS_APPENDIX_START/END (wraps Lean-4-verified theorem entries), PAPER_ANCHOR.
 │   │       ├── critique_memory.py       # Accepted critiques database for peer review phase
 │   │       ├── critique_rejection_memory.py # Last 5 critique rejection feedback logs
 │   │       └── compiler_rejection_log.py # Last 10 rejections & acceptances
@@ -95,8 +113,10 @@ project-root/
 │   │   ├── __init__.py                  # Package initialization
 │   │   ├── core/
 │   │   │   ├── __init__.py              # Package initialization
-│   │   │   ├── autonomous_coordinator.py # Orchestrates the Tier 1 → Tier 2 → Tier 3 autonomous workflow
-│   │   │   └── autonomous_rag_manager.py # Autonomous-specific RAG wrapper
+│   │   │   ├── autonomous_coordinator.py # Orchestrates the Tier 1 → Tier 2 → Tier 3 autonomous workflow (invokes proof verification checkpoint after brainstorm/paper completion when `lean4_enabled`)
+│   │   │   ├── autonomous_rag_manager.py # Autonomous-specific RAG wrapper
+│   │   │   ├── proof_verification_stage.py # Orchestrates proof identification → Lean 4 attempts (5-try loop) → novelty check → proof storage; optional SMT early-exit + Mathlib lemma search; per-source reservation lock
+│   │   │   └── proof_dependency_extractor.py # Parses verified Lean 4 code to extract `ProofDependency` records (imports, Mathlib lemmas, MOTO-origin refs)
 │   │   ├── agents/
 │   │   │   ├── __init__.py              # Package initialization
 │   │   │   ├── topic_selector.py        # Topic selection submitter (new/continue/combine)
@@ -104,6 +124,9 @@ project-root/
 │   │   │   ├── completion_reviewer.py   # Brainstorm completion review (SPECIAL SELF-VALIDATION)
 │   │   │   ├── reference_selector.py    # Reference paper selection workflow
 │   │   │   ├── paper_title_selector.py  # Paper title selection
+│   │   │   ├── proof_identification_agent.py # Extracts theorem/lemma candidates from brainstorms and papers
+│   │   │   ├── proof_formalization_agent.py  # Generates Lean 4 proof scripts for candidates (consumes Mathlib hints + SMT hints when enabled)
+│   │   │   ├── lemma_search_agent.py    # Mathlib lemma search agent (Build 2) — surfaces relevant existing lemmas for formalization prompts
 │   │   │   └── final_answer/            # TIER 3 - Final Answer Generation Agents
 │   │   │       ├── __init__.py          # Package initialization
 │   │   │       ├── certainty_assessor.py  # Assesses "known certainties" from Tier 2 papers
@@ -122,16 +145,18 @@ project-root/
 │   │   │   ├── paper_title_prompts.py   # Paper title selection prompts
 │   │   │   ├── paper_redundancy_prompts.py # Paper redundancy review prompts
 │   │   │   ├── paper_continuation_prompts.py # Brainstorm multi-paper continuation decision prompts
+│   │   │   ├── proof_prompts.py         # Proof identification/formalization/novelty prompts + failure-hint direct injection helper
 │   │   │   └── final_answer_prompts.py  # TIER 3 - Final answer assessment/selection/volume prompts
 │   │   └── memory/
 │   │       ├── __init__.py              # Package initialization
 │   │       ├── brainstorm_memory.py     # Per-brainstorm database management (includes retroactive edit/remove/add during paper compilation)
 │   │       ├── paper_library.py         # Paper library management (Tier 2)
-│   │       ├── research_metadata.py     # Research metadata (brainstorms + papers associations)
+│   │       ├── research_metadata.py     # Research metadata (brainstorms + papers associations, proof runtime config snapshot)
 │   │       ├── autonomous_rejection_logs.py # Topic selection & completion feedback logs
 │   │       ├── topic_exploration_memory.py # In-memory candidate DB for topic exploration phase
 │   │       ├── paper_model_tracker.py   # Per-paper model usage tracking and author attribution
 │   │       ├── autonomous_api_logger.py # Autonomous API call logger singleton
+│   │       ├── proof_database.py        # Session-aware Lean 4 verified-proof storage (records, Lean sources, novelty index, reverse Mathlib index)
 │   │       ├── final_answer_memory.py   # TIER 3 - Final answer state & volume management
 │   │       └── session_manager.py       # Prompt-based session folder organization
 │   │
@@ -140,18 +165,22 @@ project-root/
 │   │
 │   ├── api/
 │   │   ├── __init__.py
-│   │   ├── main.py                      # FastAPI app entry point 
-│   │   ├── middleware.py                # CORS, error handling 
+│   │   ├── main.py                      # FastAPI app entry point (lifespan reads generic_mode from env, fail-closes hosted startup when proxy auth env is missing, skips LM Studio test in generic mode)
+│   │   ├── middleware.py                # CORS, error handling, proxy auth validation (X-Moto-* headers in generic mode)
+│   │   ├── proxy_auth.py                # Shared generic-mode proxy auth helpers (allowlist + HMAC signature validation for REST/WebSocket)
 │   │   └── routes/
 │   │       ├── __init__.py
 │   │       ├── aggregator.py            # Aggregator API endpoints (includes /events)
 │   │       ├── compiler.py              # Compiler API endpoints
 │   │       ├── autonomous.py            # Autonomous Research API endpoints
-│   │       ├── boost.py                 # Boost API endpoints (enable/disable/toggle/status)
+│   │       ├── boost.py                 # Boost API endpoints (enable/disable/toggle/status + OpenRouter provider endpoint metadata)
 │   │       ├── workflow.py              # Workflow API endpoints (predictions/history)
-│   │       ├── download.py              # PDF generation endpoint via Playwright (POST /api/download/pdf)
-│   │       ├── openrouter.py            # OpenRouter API endpoints (global key, models, providers, LM Studio availability, **GET /api/model-cache** for model ID caching, **POST /api/openrouter/reset-exhaustion** to reset credit exhaustion mid-session)
-│   │       └── websocket.py             # WebSocket for real-time updates
+│   │       ├── download.py              # PDF generation endpoint via Playwright (POST /api/download/pdf); returns 501 in generic mode
+│   │       ├── openrouter.py            # OpenRouter API endpoints (global key, models, providers + endpoint metadata, LM Studio availability, **GET /api/model-cache** for model ID caching, **POST /api/openrouter/reset-exhaustion** to reset credit exhaustion mid-session)
+│   │       ├── websocket.py             # WebSocket for real-time updates (proxy auth validation in generic mode before accept)
+│   │       ├── features.py              # GET /api/features — shared build identity plus stable capability flags (`generic_mode`, `lm_studio_enabled`, `pdf_download_available`)
+│   │       ├── proofs.py                # Proof database + Lean 4/SMT runtime + manual proof-check + certificate export + dependency graph routes (all gated on `lean4_enabled`)
+│   │       └── health.py                # GET /api/health — readiness/liveness probe with instance/build metadata
 │   │
 │   ├── data/                            # Persistent data storage
 │   │   ├── user_uploads/                # User-uploaded files
@@ -190,9 +219,11 @@ project-root/
 │   │   │       ├── brainstorms/                           # Tier 1 brainstorm databases
 │   │   │       ├── papers/                                # Tier 2 completed papers
 │   │   │       ├── final_answer/                          # Tier 3 final answer data
+│   │   │       ├── proofs/                                # Lean 4 verified-proof records (proofs_index.json, proof_<id>.json, proof_<id>_lean.lean)
 │   │   │       ├── session_metadata.json                  # Session info (prompt, created_at, status)
 │   │   │       ├── session_stats.json                     # Session statistics
 │   │   │       └── workflow_state.json                    # Workflow state for crash recovery
+│   │   ├── proofs/                      # Legacy (non-session) Lean 4 proof storage (mirrors per-session proofs/ layout)
 │   │   ├── auto_research_metadata.json  # Autonomous Research metadata (LEGACY - now in session folders)
 │   │   ├── auto_research_stats.json     # Autonomous Research statistics (LEGACY - now in session folders)
 │   │   ├── auto_workflow_state.json     # Autonomous Research workflow state (LEGACY - now in session folders)
@@ -206,13 +237,13 @@ project-root/
 │   │   ├── components/
 │   │   │   ├── aggregator/              # AGGREGATOR
 │   │   │   │   ├── AggregatorInterface.jsx  # User prompt, file upload, start/stop
-│   │   │   │   ├── AggregatorSettings.jsx   # Model selection, context sizes
+│   │   │   │   ├── AggregatorSettings.jsx   # Model selection, context sizes, capability-gated LM/OpenRouter UI
 │   │   │   │   ├── AggregatorLogs.jsx       # Metrics, acceptance rates, queue; loads persisted events on mount
 │   │   │   │   └── LiveResults.jsx          # Real-time accepted submissions view
 │   │   │   │
 │   │   │   ├── compiler/                # COMPILER
 │   │   │   │   ├── CompilerInterface.jsx    # Replace placeholder: prompt input, start/stop, status
-│   │   │   │   ├── CompilerSettings.jsx     # 3 model selections (validator, high-context, high-param)
+│   │   │   │   ├── CompilerSettings.jsx     # 3 model selections (validator, high-context, high-param), capability-gated LM/OpenRouter UI
 │   │   │   │   ├── CompilerLogs.jsx         # Metrics: construction vs rigor, miniscule edits
 │   │   │   │   └── LivePaper.jsx            # Real-time paper viewing, save draft, word count
 │   │   │   │
@@ -221,7 +252,7 @@ project-root/
 │   │   │       ├── AutonomousResearch.css     # Autonomous research styles
 │   │   │       ├── BrainstormList.jsx       # List all brainstorm topics with status
 │   │   │       ├── PaperLibrary.jsx         # Grid view of completed papers (title + abstract)
-│   │   │       ├── AutonomousResearchSettings.jsx  # Model configs for all roles
+│   │   │       ├── AutonomousResearchSettings.jsx  # Model configs for all roles, capability-gated LM/OpenRouter UI
 │   │   │       ├── AutonomousResearchLogs.jsx      # Metrics, graphs, event log, combined API call logs
 │   │   │       ├── LivePaperProgress.jsx    # Real-time Tier 2 paper display (embedded in interface)
 │   │   │       ├── LiveTier3Progress.jsx    # Real-time Tier 3 final answer display (embedded in interface)
@@ -229,67 +260,109 @@ project-root/
 │   │   │       ├── FinalAnswerLibrary.jsx   # All sessions final answer library viewer
 │   │   │       ├── FinalAnswerLibrary.css   # Final answer library styles
 │   │   │       ├── ArchiveViewerModal.jsx   # Research lineage archive viewer (papers + brainstorms)
-│   │   │       └── ArchiveViewerModal.css   # Archive viewer styles
+│   │   │       ├── ArchiveViewerModal.css   # Archive viewer styles
+│   │   │       ├── MathematicalProofs.jsx   # Proof library tab (lists verified novel/non-novel proofs from `/api/proofs`)
+│   │   │       ├── MathematicalProofs.css   # Proof library styles
+│   │   │       ├── ProofGraph.jsx           # Proof dependency graph view (hand-rolled SVG; Build 4, may escalate to reactflow in Build 5 if needed)
+│   │   │       ├── ProofGraph.css           # Proof graph styles
+│   │   │       ├── ProofNotificationStack.jsx # Persistent popup notifications for novel proof discoveries
+│   │   │       ├── Stage2PaperHistory.jsx   # Tier 2 paper history list (grouped per research run; used inside FinalAnswerLibrary)
+│   │   │       └── Stage2PaperHistory.css   # Tier 2 paper history styles
 │   │   │
-│   │   ├── StartupProviderSetupModal.jsx # Post-disclaimer startup chooser for OpenRouter vs LM Studio setup
-│   │   ├── OpenRouterApiKeyModal.jsx    # Modal for global OpenRouter API key configuration
+│   │   ├── StartupProviderSetupModal.jsx # Post-disclaimer startup chooser for OpenRouter vs LM Studio setup (OpenRouter-only in generic mode)
+│   │   ├── OpenRouterApiKeyModal.jsx    # Modal for global OpenRouter API key configuration with mode-aware persistence messaging
 │   │   ├── PaperCritiqueModal.jsx       # Modal for displaying validator paper critiques (ratings, feedback, history)
 │   │   ├── CritiqueNotificationStack.jsx # Persistent popup notifications for high-scoring critiques (≥7.0 avg)
 │   │   ├── CreditExhaustionNotificationStack.jsx # Persistent red notifications for OpenRouter credit exhaustion with "Retry OpenRouter" reset button
 │   │   ├── HungConnectionNotificationStack.jsx # Persistent amber notifications for API calls exceeding 15 minutes (possible hung connections)
-│   │   ├── BoostControlModal.jsx        # Modal for boost configuration (next-X, category, always-prefer)
+│   │   ├── BoostControlModal.jsx        # Modal for boost configuration (next-X, category, always-prefer) with mode-aware copy
 │   │   ├── BoostControlModal.css        # Boost control modal styles
 │   │   ├── WorkflowPanel.jsx            # Boost controls panel (Boost Next X, Always Prefer, Category Boost, token stats, research timer)
 │   │   ├── WorkflowPanel.css            # Boost controls panel styles
 │   │   ├── TextFileUploader.jsx         # User file upload component
 │   │   ├── TextFileUploader.css         # File uploader styles
-│   │   ├── OpenRouterPrivacyWarningModal.jsx # Privacy policy error modal (OpenRouter data sharing)
+│   │   ├── OpenRouterPrivacyWarningModal.jsx # Privacy policy error modal (OpenRouter data sharing, capability-aware alternatives)
+│   │   ├── HelpTooltip.jsx              # Shared portal-based help tooltip component (used across settings/interfaces)
 │   │   ├── settings-common.css          # Shared settings panel styles
 │   │   ├── critique-modal.css           # Paper critique modal styles
 │   │   │
 │   │   ├── services/
-│   │   │   ├── api.js                   # Backend API calls (includes openRouterAPI)
+│   │   │   ├── api.js                   # Backend API calls (includes openRouterAPI, `/api/features` capability bootstrap helper, and proof routes under `/api/proofs/*`)
 │   │   │   └── websocket.js             # WebSocket connection 
 │   │   │
+│   │   ├── hooks/
+│   │   │   └── useProofCheckRuntime.js  # Reads `/api/proofs/status` + proof runtime config so UI can enable/disable manual proof-check controls
+│   │   │
 │   │   ├── utils/
 │   │   │   ├── downloadHelpers.js       # PDF/raw download helpers (Playwright backend PDF)
 │   │   │   ├── modelCache.js            # Frontend model cache utilities (display_name → api_id lookup)
+│   │   │   ├── openRouterSelection.js   # Shared OpenRouter selector auto-fill helpers (context/output from model + host metadata)
 │   │   │   ├── autonomousProfiles.js    # Shared autonomous recommended-profile definitions and persistence helpers
+│   │   │   ├── runtimeConfig.js         # Frontend runtime helpers (instance storage prefix, active data-root display, instance ID)
+│   │   │   ├── researchRunHistory.js    # Groups Tier 2 papers + final answers into per-run history entries for Stage2PaperHistory/FinalAnswerLibrary
 │   │   │   └── disclaimerHelper.js      # Frontend-only disclaimer injection for brainstorm/paper views
 │   │   │
-│   │   ├── App.jsx                      # Main app shell with top-level mode switch (Autonomous ASI S.T.E.M. / Advanced Manual ASI S.T.E.M.) and tab navigation
+│   │   ├── App.jsx                      # Main app shell with top-level mode switch, `/api/features` capability bootstrap, and capability propagation into settings/interfaces/modals
 │   │   ├── index.css                    # Styles
 │   │   └── index.jsx                    # React entry point
 │   │
 │   ├── package.json
 │   └── vite.config.js
 │
-├── requirements.txt                     # Python dependencies
+├── requirements.txt                     # Python dependencies (default mode)
+├── requirements-generic.txt             # Additive deps for generic mode (-r requirements.txt + fastembed + onnxruntime)
+├── Dockerfile                           # Canonical hosted generic-mode container contract (`python:3.12-slim`, API-only backend image)
+├── .dockerignore                        # Hosted image build-context exclusions (desktop/frontend/dev artifacts stay out of the container)
+├── docker/
+│   └── entrypoint.sh                    # Hosted backend startup wrapper (defaults hosted envs, creates runtime dirs, delegates to `backend.api.main`)
 ├── package.json                         # Root scripts
+├── moto-update-manifest.json            # Build 0 updater/build identity manifest committed on main
 ├── SECURITY.md                          # Security policy and private vulnerability reporting
-├── Click To Launch MOTO.bat             # The user's one-click program launcher.
-└── _moto_internal_launcher.ps1          # Internal PowerShell launcher (not for direct user use)
+├── Click To Launch MOTO.bat             # The authoritative Windows launcher entrypoint (thin wrapper that delegates to moto_launcher.py)
+├── Launch MOTO.sh                       # Linux/Ubuntu launcher entrypoint (thin bash wrapper that delegates to moto_launcher.py)
+├── moto_launcher.py                     # Internal Python launcher orchestration (update check, runtime resolution, dependency install, service startup)
+├── moto_updater.py                      # Build 1 updater helper (manifest fetch, install classification, ZIP/git apply flow, launcher state tracking)
+└── .moto_launcher_state.json            # Gitignored local launcher state (tracks active service-window PIDs and runtime roots to block unsafe update-apply)
 
 ## File Purpose Descriptions
 
+### Launcher and Updater
+
+- `Click To Launch MOTO.bat`: The only Windows consumer entrypoint. It stays thin and always delegates to the Python launcher.
+- `Launch MOTO.sh`: The Linux/Ubuntu consumer entrypoint. Same thin-wrapper contract as the `.bat`; delegates to `moto_launcher.py`.
+- `moto_launcher.py`: Orchestrates the launcher flow in order: update check, runtime resolution, dependency install, LM Studio detection, detached backend/frontend startup, and browser launch.
+- `moto_updater.py`: Owns Build 1 updater behavior, including GitHub `main` manifest fetch, install-state classification, clean-git fast-forward apply, ZIP overlay apply, rollback-aware relaunch, and launcher-managed instance safety checks.
+- `.moto_launcher_state.json`: Local-only state written by the launcher so future launches can detect still-open backend/frontend windows from the same install and skip update-apply until those windows are closed.
+
+### Hosted Runtime
+
+- `Dockerfile`: Canonical hosted generic-mode image definition. Uses the Debian/glibc `python:3.12-slim` baseline, installs `requirements-generic.txt`, preloads the FastEmbed model, and starts the API-only backend contract.
+- `.dockerignore`: Keeps desktop launchers, frontend assets, tests, local runtime data/logs, and dev-only metadata out of the hosted image build context.
+- `docker/entrypoint.sh`: Minimal hosted startup wrapper. Defaults `MOTO_GENERIC_MODE=true`, `HOST=0.0.0.0`, `PORT=8000`, `MOTO_DATA_ROOT=/app/backend/data`, creates runtime directories, and then delegates to `python -m backend.api.main`.
+
 ### Shared Resources
 
-- `config.py`: RAGConfig, SystemConfig (context windows, chunk sizes, max output tokens)
+- `config.py`: RAGConfig, SystemConfig (context windows, chunk sizes, max output tokens, `generic_mode` flag)
 - `models.py`: Pydantic models (ModelConfig, BoostConfig, WorkflowTask, ModelUsageTracker, FinalAnswerState)
-- `lm_studio_client.py`: LM Studio HTTP client (completions, embeddings, model listing)
-- `openrouter_client.py`: OpenRouter HTTP client (credit exhaustion detection, fallback)
-- `api_client_manager.py`: Unified API router (OpenRouter/LM Studio fallback + boost + model tracking)
+- `lm_studio_client.py`: LM Studio HTTP client (completions, embeddings, model listing); unused in generic mode
+- `openrouter_client.py`: OpenRouter HTTP client (credit exhaustion detection, fallback, model/provider endpoint metadata)
+- `api_client_manager.py`: Unified API router (OpenRouter/LM Studio fallback + boost + model tracking); in generic mode, embedding requests return early via FastEmbed
 - `boost_manager.py`: Singleton boost manager (three modes: Boost Next X Calls, Always Prefer Boost, Category Boost; broadcasts events)
 - `boost_logger.py`: Boost API call logger (persists boost-routed calls for the combined API log view)
 - `workflow_predictor.py`: Predicts next 20 API calls for internal boost routing (not displayed in UI)
 - `free_model_manager.py`: Free model rotation/cooldown singleton (looping, auto-selector `openrouter/free`, account exhaustion detection)
-- `wolfram_alpha_client.py`: Wolfram Alpha API client for rigor verification
-- `rag_lock.py`: Global RAG operation lock (prevents collision, retry logic for reads)
+- `wolfram_alpha_client.py`: Wolfram Alpha API client. Exposed to the `HighContextSubmitter.submit_construction` loop as the `wolfram_alpha_query` tool (up to 20 calls per construction submission).
+- `rag_lock.py`: Global RAG operation lock (prevents collision, retry logic for reads); the embedding lock is skipped in generic mode (FastEmbed is in-process/thread-safe)
 - `token_tracker.py`: Cumulative input/output token tracker singleton with per-model breakdown and research timer. Reset on session start, timer start/stop tied to coordinator lifecycle. Stats broadcast via `token_usage_updated` WebSocket event after each successful LLM call.
 - `utils.py`: Token counting, text compression, file I/O
 - `json_parser.py`: JSON parsing with sanitization for LLM responses; sanitizes reasoning tokens, markdown blocks, control tokens, LaTeX escapes, control characters; **rejects truncated JSON** (raises ValueError with diagnostics) to prevent corrupted content from passing validation
 - `critique_memory.py`: Paper critique persistence (ratings, feedback, history, session-aware)
 - `critique_prompts.py`: Default critique prompt and builder function
+- `secret_store.py`: Secure API key persistence via OS keyring; bypassed in generic mode (keys are env-injected/in-memory only)
+- `build_info.py`: Build identity helper that reads the committed `moto-update-manifest.json` contract and applies optional env overrides for runtime version/build stamping
+- `fastembed_provider.py`: FastEmbed embedding wrapper (generic mode only); lazy-imported so default installs are unaffected
+- `lean4_client.py`: Lean 4 proof checker client. Subprocess mode by default; optional persistent LSP mode when `lean4_lsp_enabled`. Silent no-op when `lean4_enabled=False`. Never bundled into the hosted image.
+- `smt_client.py`: Optional Z3/SMT launcher-managed subprocess wrapper. Silent no-op when `smt_enabled=False`. SMT results are hint-only; Lean 4 remains authoritative. Never bundled into the hosted image.
 
 ### Compiler Components
 
@@ -304,24 +377,28 @@ project-root/
 
 ### Autonomous Research Components
 
-- `autonomous_coordinator.py`: Three-tier workflow orchestrator (Tier 1→2→3, triggers, crash recovery)
+- `autonomous_coordinator.py`: Three-tier workflow orchestrator (Tier 1→2→3, triggers, crash recovery, invokes `ProofVerificationStage` after brainstorm/paper completion when `lean4_enabled`)
 - `autonomous_rag_manager.py`: Autonomous RAG wrapper
-- Agents: `topic_selector.py`, `topic_validator.py`, `completion_reviewer.py`, `reference_selector.py`, `paper_title_selector.py`
+- `proof_verification_stage.py`: Proof pipeline orchestrator — candidate identification → per-candidate Phase A (Mathlib lemma search → optional SMT early-exit → Lean 4 formalization attempts, 5 retries per candidate) runs concurrently across all identified candidates bounded by `proof_max_parallel_candidates` (default 6) → Phase B (novelty check → `add_proof` → `ProofDependency` extraction → brainstorm/paper `append_proofs_section`) remains strictly serialized in Phase-A completion order. Per-source reservation lock prevents duplicate concurrent checks for the same `{source_type}:{source_id}`; `FreeModelExhaustedError` (or any Phase-A exception) cancels sibling tasks before the coordinator's recovery path runs.
+- `proof_dependency_extractor.py`: Parses verified Lean 4 code into `ProofDependency` records (imports, Mathlib lemmas, MOTO-origin proof ancestry).
+- Agents: `topic_selector.py`, `topic_validator.py`, `completion_reviewer.py`, `reference_selector.py`, `paper_title_selector.py`, `proof_identification_agent.py`, `proof_formalization_agent.py`, `lemma_search_agent.py`
 - Tier 3 Agents: `certainty_assessor.py`, `answer_format_selector.py`, `volume_organizer.py`
 - `paper_redundancy_checker.py`: Library quality maintenance (every 3 papers)
-- Prompts: `topic_prompts.py`, `topic_exploration_prompts.py`, `completion_prompts.py`, `paper_reference_prompts.py`, `paper_title_exploration_prompts.py`, `paper_title_prompts.py`, `paper_redundancy_prompts.py`, `paper_continuation_prompts.py`, `final_answer_prompts.py`
-- Memory: `brainstorm_memory.py`, `paper_library.py`, `research_metadata.py`, `session_manager.py`, `autonomous_rejection_logs.py`, `topic_exploration_memory.py` (in-memory candidate DB), `paper_model_tracker.py` (per-paper model usage tracking and author attribution), `autonomous_api_logger.py` (API call logging singleton), `final_answer_memory.py` (model tracking, archival)
+- Prompts: `topic_prompts.py`, `topic_exploration_prompts.py`, `completion_prompts.py`, `paper_reference_prompts.py`, `paper_title_exploration_prompts.py`, `paper_title_prompts.py`, `paper_redundancy_prompts.py`, `paper_continuation_prompts.py`, `proof_prompts.py`, `final_answer_prompts.py`
+- Memory: `brainstorm_memory.py`, `paper_library.py`, `research_metadata.py` (also stores the proof runtime config snapshot), `session_manager.py`, `autonomous_rejection_logs.py`, `topic_exploration_memory.py` (in-memory candidate DB), `paper_model_tracker.py` (per-paper model usage tracking and author attribution), `autonomous_api_logger.py` (API call logging singleton), `proof_database.py` (session-aware Lean 4 proof storage + novelty index + reverse Mathlib index), `final_answer_memory.py` (model tracking, archival)
 
 ### API Routes
 
 - `compiler.py`: Compiler control (start/stop/status), paper/outline access, critique management
 - `autonomous.py`: Autonomous research control (start/stop/clear/status), brainstorm/paper access, Tier 3 endpoints
+- `proofs.py`: Proof database listing, `/status` runtime readiness, `POST /settings` runtime flag updates, `POST /check` manual proof check, `/{id}/certificate[.lean]` certificate export, `/{id}/dependencies` + `/graph` + `/mathlib/{lemma}/dependents` graph/lineage queries. All routes gated on `lean4_enabled`.
 
 ### Frontend Components
 
-- `App.jsx`: Top-level GUI shell. Default mode is `Autonomous ASI S.T.E.M.` for Part 3 screens; `Advanced Manual ASI S.T.E.M.` contains the manual Part 1 Aggregator + Part 2 Compiler workspace. Shared utility controls (Boost, OpenRouter, WorkflowPanel) remain global.
+- `App.jsx`: Top-level GUI shell. Default mode is `Autonomous ASI S.T.E.M.` for Part 3 screens; `Advanced Manual ASI S.T.E.M.` contains the manual Part 1 Aggregator + Part 2 Compiler workspace. Shared utility controls (Boost, OpenRouter, WorkflowPanel) remain global, and Build 3C bootstraps `/api/features` here so hosted mode can hide LM Studio-only UI and copy.
 - **Aggregator**: `AggregatorInterface.jsx`, `AggregatorSettings.jsx`, `AggregatorLogs.jsx`, `LiveResults.jsx`
 - **Compiler**: `CompilerInterface.jsx`, `CompilerSettings.jsx`, `CompilerLogs.jsx`, `LivePaper.jsx`
-- **Autonomous**: `AutonomousResearchInterface.jsx`, `BrainstormList.jsx`, `PaperLibrary.jsx`, `AutonomousResearchSettings.jsx`, `AutonomousResearchLogs.jsx`, `LivePaperProgress.jsx`, `LiveTier3Progress.jsx`, `FinalAnswerView.jsx`, `FinalAnswerLibrary.jsx`, `ArchiveViewerModal.jsx`
+- **Autonomous**: `AutonomousResearchInterface.jsx`, `BrainstormList.jsx`, `PaperLibrary.jsx`, `AutonomousResearchSettings.jsx`, `AutonomousResearchLogs.jsx`, `LivePaperProgress.jsx`, `LiveTier3Progress.jsx`, `FinalAnswerView.jsx`, `FinalAnswerLibrary.jsx`, `ArchiveViewerModal.jsx`, `MathematicalProofs.jsx` (proof library), `ProofGraph.jsx` (dependency graph), `ProofNotificationStack.jsx` (novel-proof popups)
 - **Shared**: `StartupProviderSetupModal.jsx`, `OpenRouterApiKeyModal.jsx`, `PaperCritiqueModal.jsx`, `CritiqueNotificationStack.jsx`, `CreditExhaustionNotificationStack.jsx`, `HungConnectionNotificationStack.jsx`, `BoostControlModal.jsx`, `WorkflowPanel.jsx`, `TextFileUploader.jsx`, `OpenRouterPrivacyWarningModal.jsx`, `LatexRenderer.jsx` (dual view, KaTeX, theorem parsing), `LatexRenderer.css`
-- **Utils**: `downloadHelpers.js` (PDF/raw download), `modelCache.js` (display_name → api_id lookup), `autonomousProfiles.js` (shared recommended-profile definitions + persistence helpers), `disclaimerHelper.js` (frontend-only disclaimer injection), `api.js`, `websocket.js`
+- **Hooks**: `useProofCheckRuntime.js` (reads `/api/proofs/status` + runtime config so UI can enable/disable manual proof-check controls)
+- **Utils**: `downloadHelpers.js` (PDF/raw download), `modelCache.js` (display_name → api_id lookup), `openRouterSelection.js` (shared OpenRouter selector auto-fill helpers using model context and provider endpoint caps), `autonomousProfiles.js` (shared recommended-profile definitions + persistence helpers; when editing a preset, anchor to the exact profile block and exact nested role such as `validator` or `highContext`, never to a shared literal alone, then verify the diff only touched that intended profile/role), `disclaimerHelper.js` (frontend-only disclaimer injection), `api.js`, `websocket.js`
diff --git a/.cursor/rules/rag-design-for-overall-program.mdc b/.cursor/rules/rag-design-for-overall-program.mdc
index d3095b1..6057269 100644
--- a/.cursor/rules/rag-design-for-overall-program.mdc
+++ b/.cursor/rules/rag-design-for-overall-program.mdc
@@ -1,6 +1,7 @@
 ---
 alwaysApply: false
 ---
+
 ## Important Notes When Editing RAG Systems
 The RAG system in this program is very advanced, be certain that any changes you make to the RAG system are correct changes.
 
@@ -35,7 +36,16 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Core Principle**: Direct injection first, RAG semantic search only when content doesn't fit.
 
-**Embedding**: `text-embedding-nomic-embed-text-v1.5` via LM Studio, or `openai/text-embedding-3-small` via OpenRouter fallback. Routing via `APIClientManager.get_embeddings()`.
+**Embedding**: Dual-contract routing via `APIClientManager.get_embeddings()`:
+
+| Mode | Primary | Fallback | Lock |
+|------|---------|----------|------|
+| Default (`generic_mode=False`) | `text-embedding-nomic-embed-text-v1.5` via LM Studio | `openai/text-embedding-3-small` via OpenRouter | Global RAG lock acquired |
+| Generic (`generic_mode=True`) | `FastEmbedProvider` (in-process ONNX, `nomic-embed-text-v1.5` INT8) | None (fail fast if fastembed missing) | Embedding lock SKIPPED (thread-safe); ChromaDB write lock still acquired |
+
+`get_embeddings()` in generic mode early-returns to `FastEmbedProvider` before the LM Studio → OpenRouter fallback chain.
+
+**Batch query optimization**: `_vector_search()` batches all query embeddings into one `get_embeddings()` call (benefits both modes).
 
 **Key files:**
 - `aggregator/core/rag_manager.py` — 4-stage pipeline orchestrator
@@ -48,9 +58,10 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 ## Architecture: Concurrency
 
-- **Global RAG Lock**: ChromaDB write operations + embedding API calls acquire lock to prevent race conditions
+- **Global RAG Lock**: ChromaDB write operations acquire the lock to prevent race conditions. Embedding API calls also acquire the lock in default mode.
+- **Generic mode lock skip**: FastEmbed is in-process and thread-safe — embedding calls skip the global RAG lock. ChromaDB write locking remains in both modes.
 - **Read retry**: Vector search auto-retries with exponential backoff (0.5s → 1s → 2s, max 3 attempts) on HNSW index errors during concurrent writes
-- **Embedding rate limiting**: Semaphore limits concurrent embedding requests to 2
+- **Embedding rate limiting**: Semaphore limits concurrent embedding requests to 2 (default mode only; generic mode uses in-process FastEmbed)
 
 ---
 
@@ -149,7 +160,11 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Autonomous (Part 3)**: Per-topic brainstorm databases; reference paper content always RAG'd; same no-truncation principle; all agents validate prompt size before LLM calls.
 
-**Training DB files**: `data/rag_shared_training.txt` (accepted submissions only, no validator reasoning); `data/Summary_Of_Last_5_Validator_Rejections_For_Submitter_{num}.txt` (max 5).
+**Proof Verification Stage (optional, gated on `lean4_enabled`)**: Proof identification, formalization, and lemma search agents operate outside the RAG pipeline. Verified `ProofRecord` summaries and `FailedProofCandidate` hints (from `proof_prompts.format_failure_hints_for_injection`) are **highest-priority direct injections** into subsequent brainstorm/paper submitter prompts when present — never RAG'd. Lean source files under the session `proofs/` directory are not indexed into Chroma.
+
+**Embedding provider routing**: See dual-contract table above. Default mode uses LM Studio with OpenRouter fallback. Generic mode uses in-process FastEmbed. Both modes produce compatible vector dimensions for the same ChromaDB collections.
+
+**Training DB files**: `rag_shared_training.txt` and `Summary_Of_Last_5_Validator_Rejections_For_Submitter_{num}.txt` live under the active instance data root (default desktop paths: `backend/data/rag_shared_training.txt` and `backend/data/Summary_Of_Last_5_Validator_Rejections_For_Submitter_{num}.txt`).
 
 ---
 
@@ -167,6 +182,7 @@ These agents use ONLY direct injection (no RAG fallback) by design. Each operate
 | Volume organizer | Paper summaries, certainty assessment, volume state | Chapter ordering uses paper-level metadata, not full content |
 | Compiler review mode | Outline + paper only | Evaluates paper on its own merits without external source bias |
 | Brainstorm continuation | Brainstorm summary, prior paper titles/abstracts | "Write another or move on" uses summary, not full DB |
+| Proof identification / formalization / lemma search | Candidate theorem text, Lean error output, targeted Mathlib lemma metadata | Operates on compact Lean source + structured hints; proof agents consume `ProofRecord` direct-injection summaries and do not route through the RAG pipeline |
 
 **Known oversight**: Certainty assessor Step 2 drops expanded papers when they don't fit instead of RAG'ing them. Should use RAG fallback like reference_selector does.
 
diff --git a/.cursor/rules/workflow-runtime-updates.mdc b/.cursor/rules/workflow-runtime-updates.mdc
deleted file mode 100644
index 116fcae..0000000
--- a/.cursor/rules/workflow-runtime-updates.mdc
+++ /dev/null
@@ -1,11 +0,0 @@
----
-alwaysApply: true
----
-
-## Workflow Runtime Updates
-
-- Aggregator, Compiler, and Autonomous Research are mutually exclusive runtime modes. Only one workflow mode may be active at a time, and starting any mode while another is running must be blocked.
-- This rule explicitly supersedes any older wording in `part-1-and-part-2-cointeraction-architecture.mdc` that describes Aggregator and Compiler as concurrently runnable.
-
-- Compiler critique skip and autonomous critique skip both support pre-emptive use during active paper-writing. If critique is already active, the skip happens immediately. If critique has not started yet, the skip is queued and auto-applies when critique is reached.
-- This rule explicitly supersedes any older wording in `part-2-compiler-tool-design-specification.mdc` that describes compiler critique skip as active-critique-only.
diff --git a/.dockerignore b/.dockerignore
new file mode 100644
index 0000000..765032d
--- /dev/null
+++ b/.dockerignore
@@ -0,0 +1,39 @@
+.git
+.github
+.cursor
+
+__pycache__/
+*.py[cod]
+.pytest_cache/
+.coverage
+htmlcov/
+
+.env
+.env.*
+.venv/
+venv/
+env/
+ENV/
+
+node_modules/
+frontend/
+frontend/dist/
+
+backend/data/
+backend/logs/
+.moto_instances/
+.moto_launcher_state.json
+.moto_update_notice.json
+
+tests/
+web conversion plans/
+commits_pending.txt
+proof-integration-build*-plan.md
+
+Click To Launch MOTO.bat
+Launch MOTO.sh
+moto_launcher.py
+moto_updater.py
+
+dist/
+build/
diff --git a/.gitignore b/.gitignore
index 4aee7fb..7f4b9d8 100644
--- a/.gitignore
+++ b/.gitignore
@@ -72,6 +72,15 @@ backend/data/auto_final_answer/*
 
 backend/data/auto_sessions/
 
+# Proof verification artifacts (Lean 4 / Z3 hybrid mode)
+backend/data/proofs/*
+!backend/data/proofs/.gitkeep
+backend/data/lean4_workspace/
+backend/data/z3/
+
+# Elan / Lean 4 toolchain installer (platform-specific binaries)
+backend/data/elan/
+
 backend/data/auto_research_metadata.json
 backend/data/auto_research_stats.json
 backend/data/auto_workflow_state.json
@@ -107,6 +116,10 @@ htmlcov/
 *.tmp
 *.bak
 *.swp
+.moto_launcher_state.json
+.moto_last_instance.json
+.moto_update_notice.json
+.moto_instances/
 final_volume.txt
 RANDOM LOG.txt
 commits_pending.txt
diff --git a/Click To Launch MOTO.bat b/Click To Launch MOTO.bat
index 0b6b42c..42db875 100644
--- a/Click To Launch MOTO.bat	
+++ b/Click To Launch MOTO.bat	
@@ -1,325 +1,12 @@
 @echo off
 setlocal
 
-cls
-echo ================================================================
-echo   MOTO SYSTEM LAUNCHER
-echo ================================================================
-echo.
-
-REM ================================================================
-REM STEP 1: Check Python Installation
-REM ================================================================
-echo [1/8] Checking Python installation...
-where python >nul 2>&1
-if errorlevel 1 (
-    echo.
-    echo ============================================================
-    echo ERROR: Python is not installed or not in PATH
-    echo ============================================================
-    echo.
-    echo Please install Python 3.8+ from: https://www.python.org/downloads/
-    echo IMPORTANT: Check 'Add Python to PATH' during installation
-    echo.
-    pause
-    exit /b 1
-)
-python --version
-echo Python found!
-echo.
-
-REM ================================================================
-REM STEP 2: Check Node.js Installation
-REM ================================================================
-echo [2/8] Checking Node.js installation...
-where node >nul 2>&1
-if errorlevel 1 (
-    echo.
-    echo ============================================================
-    echo ERROR: Node.js is not installed or not in PATH
-    echo ============================================================
-    echo.
-    echo Please install Node.js 16+ from: https://nodejs.org/
-    echo.
-    pause
-    exit /b 1
-)
-call node --version
-if errorlevel 1 (
-    echo ERROR: node --version failed
-    pause
-    exit /b 1
-)
-call npm --version
-if errorlevel 1 (
-    echo ERROR: npm --version failed
-    pause
-    exit /b 1
-)
-echo Node.js found!
-echo.
-
-REM ================================================================
-REM STEP 3: Create Necessary Directories & Clean ChromaDB
-REM ================================================================
-echo [3/8] Creating necessary directories...
-if not exist "backend\data" mkdir "backend\data"
-if not exist "backend\data\user_uploads" mkdir "backend\data\user_uploads"
-if not exist "backend\logs" mkdir "backend\logs"
-
-REM Clean ChromaDB on startup to prevent corruption issues
-if exist "backend\data\chroma_db" (
-    echo Cleaning ChromaDB database...
-    rmdir /s /q "backend\data\chroma_db"
-    echo ChromaDB cleaned!
-)
-
-echo Directories created successfully!
-echo.
-
-REM ================================================================
-REM STEP 4: Install Python Dependencies
-REM ================================================================
-echo [4/8] Installing Python dependencies...
-echo This may take a few minutes if this is your first time...
-echo.
-python -m pip install --upgrade pip >nul 2>&1
-pip install --upgrade -r requirements.txt
-if errorlevel 1 (
-    echo.
-    echo ============================================================
-    echo ERROR: Failed to install Python dependencies
-    echo ============================================================
-    echo.
-    echo Please check:
-    echo - Internet connection is working
-    echo - You have permission to install packages
-    echo - requirements.txt exists in the current directory
-    echo.
-    pause
-    exit /b 1
-)
-echo Python dependencies installed successfully!
-echo.
-
-REM ================================================================
-REM STEP 4b: Install Playwright Chromium (for PDF generation)
-REM ================================================================
-echo [4b/8] Installing Playwright Chromium browser for PDF generation...
-echo This is a one-time ~150MB download and may take a few minutes...
-echo.
-python -m playwright install chromium
-if errorlevel 1 (
-    echo.
-    echo WARNING: Playwright Chromium install failed.
-    echo PDF generation will not be available until this is resolved.
-    echo You can retry manually: python -m playwright install chromium
-    echo.
-    echo Continuing startup anyway...
-    echo.
-) else (
-    echo Playwright Chromium ready!
-    echo.
-)
-
-REM ================================================================
-REM STEP 5: Install Node.js Dependencies
-REM ================================================================
-echo [5/8] Installing Node.js dependencies...
-echo This may take a few minutes if this is your first time...
-echo.
-if not exist "frontend" (
-    echo.
-    echo ============================================================
-    echo ERROR: frontend directory not found!
-    echo ============================================================
-    echo.
-    echo Make sure you're running this from the project root directory.
-    echo.
-    pause
-    exit /b 1
-)
-pushd frontend
-set "SHOW_VULN_RESTART_HINT="
-set "NPM_INSTALL_LOG=%TEMP%\moto_npm_install_%RANDOM%_%RANDOM%.log"
-call npm install >"%NPM_INSTALL_LOG%" 2>&1
-set "NPM_INSTALL_EXIT=%ERRORLEVEL%"
-type "%NPM_INSTALL_LOG%"
-findstr /i /c:"vulnerabilities found" "%NPM_INSTALL_LOG%" >nul 2>&1
-if not errorlevel 1 set "SHOW_VULN_RESTART_HINT=1"
-del "%NPM_INSTALL_LOG%" >nul 2>&1
-if not "%NPM_INSTALL_EXIT%"=="0" (
-    echo.
-    echo ============================================================
-    echo ERROR: Failed to install Node.js dependencies
-    echo ============================================================
-    echo.
-    echo Please check:
-    echo - Internet connection is working
-    echo - package.json exists in frontend directory
-    echo.
-    popd
-    pause
-    exit /b 1
-)
-if defined SHOW_VULN_RESTART_HINT (
-    echo.
-    echo NOTE: npm reported vulnerability warnings during install.
-    echo MOTO is running npm audit fix automatically right now.
-    echo After startup finishes, restart this terminal / launcher once to check whether the warning is gone.
-    echo.
-)
-echo Fixing known vulnerabilities automatically...
-call npm audit fix >nul 2>&1
-popd
-echo Node.js dependencies installed successfully!
-echo.
-
-REM ================================================================
-REM STEP 6: Check LM Studio (optional - OpenRouter is an alternative)
-REM ================================================================
-echo [6/8] Checking LM Studio...
-echo.
-
-REM Check if LM Studio is responding
-powershell -Command "try { $response = Invoke-WebRequest -Uri 'http://127.0.0.1:1234/v1/models' -TimeoutSec 3 -UseBasicParsing; exit 0 } catch { exit 1 }" >nul 2>&1
-if errorlevel 1 (
-    echo ================================================================
-    echo NOTE: LM Studio is not detected on http://127.0.0.1:1234
-    echo ================================================================
-    echo.
-    echo This is OK! You have two options for AI models:
-    echo.
-    echo   Option 1: LM Studio (Local)
-    echo     - Download from: https://lmstudio.ai/
-    echo     - Load a model and start the Local Server
-    echo.
-    echo   Option 2: OpenRouter (Cloud API)
-    echo     - Get an API key from: https://openrouter.ai/
-    echo     - Configure in Settings tab after launch
+set "SCRIPT_DIR=%~dp0"
+python "%SCRIPT_DIR%moto_launcher.py" %*
+set "EXIT_CODE=%ERRORLEVEL%"
+if %EXIT_CODE% NEQ 0 (
     echo.
-    echo The system will start - configure your preferred provider in Settings.
-) else (
-    echo LM Studio is running and responding!
-)
-echo.
-
-REM ================================================================
-REM STEP 7: Clean Up Existing Processes
-REM ================================================================
-echo [7/8] Cleaning up existing processes on ports 8000 and 5173...
-echo.
-
-REM Kill any process using port 8000 (backend)
-for /f "tokens=5" %%a in ('netstat -ano ^| findstr :8000 ^| findstr LISTENING') do (
-    echo Found process %%a using port 8000, terminating...
-    taskkill /F /PID %%a >nul 2>&1
-)
-
-REM Kill any process using port 5173 (frontend)
-for /f "tokens=5" %%a in ('netstat -ano ^| findstr :5173 ^| findstr LISTENING') do (
-    echo Found process %%a using port 5173, terminating...
-    taskkill /F /PID %%a >nul 2>&1
-)
-
-REM Wait a moment for ports to be released
-timeout /t 2 /nobreak >nul
-
-echo Ports cleaned successfully!
-echo.
-
-REM Verify ports are now available
-netstat -ano | findstr :8000 | findstr LISTENING >nul 2>&1
-if not errorlevel 1 (
-    echo.
-    echo ============================================================
-    echo ERROR: Port 8000 is still in use after cleanup attempt!
-    echo ============================================================
-    echo.
-    echo Please manually close any applications using port 8000.
-    echo You can check with: netstat -ano ^| findstr :8000
-    echo.
-    pause
-    exit /b 1
-)
-
-netstat -ano | findstr :5173 | findstr LISTENING >nul 2>&1
-if not errorlevel 1 (
-    echo.
-    echo ============================================================
-    echo ERROR: Port 5173 is still in use after cleanup attempt!
-    echo ============================================================
-    echo.
-    echo Please manually close any applications using port 5173.
-    echo You can check with: netstat -ano ^| findstr :5173
-    echo.
-    pause
-    exit /b 1
-)
-
-echo Ports 8000 and 5173 are available!
-echo.
-
-REM ================================================================
-REM STEP 8: Start Services
-REM ================================================================
-echo [8/8] Starting services...
-echo.
-echo ================================================================
-echo   SYSTEM STARTING
-echo ================================================================
-echo.
-echo Backend API will run on: http://localhost:8000
-echo Frontend UI will run on: http://localhost:5173
-echo.
-echo Two windows will open:
-echo   - ASI Backend (Keep this window open)
-echo   - ASI Frontend (Keep this window open)
-echo.
-echo Starting services automatically in 3 seconds... (Ctrl+C to cancel)
-timeout /t 3 /nobreak >nul
-echo.
-
-REM Start backend in separate window with proper path
-echo Starting backend server...
-start "ASI Backend" cmd /k "cd /d "%~dp0" && python -m uvicorn backend.api.main:app --host 0.0.0.0 --port 8000 --no-access-log"
-
-REM Wait a few seconds for backend to start
-echo Waiting for backend to initialize...
-timeout /t 5 /nobreak >nul
-
-REM Start frontend in separate window
-echo Starting frontend server...
-start "ASI Frontend" cmd /k "cd /d "%~dp0frontend" && npm run dev"
-
-REM Wait for frontend to initialize
-echo Waiting for frontend to initialize...
-timeout /t 8 /nobreak >nul
-
-REM Open browser automatically
-echo Opening browser...
-start http://localhost:5173
-
-echo.
-echo ================================================================
-echo   SYSTEM STARTED!
-echo ================================================================
-echo.
-echo Two windows have opened:
-echo   - ASI Backend (running on port 8000)
-echo   - ASI Frontend (running on port 5173)
-echo.
-echo Browser opened automatically to: http://localhost:5173
-echo If it didn't open, open that URL manually.
-echo.
-if defined SHOW_VULN_RESTART_HINT (
-echo If you saw npm vulnerability warnings earlier, restart this terminal / launcher once now that startup is complete.
-echo.
+    echo Press Enter to close...
+    pause >nul
 )
-echo To stop the system: Close both service windows
-echo.
-echo This launcher window can now be closed.
-echo.
-echo Closing launcher window automatically in 3 seconds...
-timeout /t 3 /nobreak >nul
-exit /b 0
+exit /b %EXIT_CODE%
diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 0000000..a07ae6a
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,40 @@
+FROM python:3.12-slim
+
+ENV PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1 \
+    PIP_DISABLE_PIP_VERSION_CHECK=1 \
+    PIP_NO_CACHE_DIR=1 \
+    MOTO_GENERIC_MODE=true \
+    HOST=0.0.0.0 \
+    PORT=8000 \
+    MOTO_DATA_ROOT=/app/backend/data
+
+WORKDIR /app
+
+RUN apt-get update \
+    && apt-get install -y --no-install-recommends libgomp1 \
+    && rm -rf /var/lib/apt/lists/*
+
+COPY requirements.txt requirements-generic.txt ./
+
+RUN pip install --upgrade pip \
+    && pip install -r requirements-generic.txt
+
+COPY package.json moto-update-manifest.json ./
+COPY backend ./backend
+COPY docker ./docker
+
+RUN sed -i 's/\r$//' /app/docker/entrypoint.sh \
+    && chmod +x /app/docker/entrypoint.sh \
+    && mkdir -p /app/backend/data \
+    && python - <<'PY'
+from fastembed import TextEmbedding
+
+from backend.shared.fastembed_provider import FASTEMBED_MODEL_NAME
+
+TextEmbedding(model_name=FASTEMBED_MODEL_NAME)
+PY
+
+EXPOSE 8000
+
+ENTRYPOINT ["/app/docker/entrypoint.sh"]
diff --git a/LICENSE b/LICENSE
index 767b08e..4939de1 100644
--- a/LICENSE
+++ b/LICENSE
@@ -20,15 +20,3 @@ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.
 
----
-
-DISCLAIMER FOR AI-GENERATED CONTENT:
-
-This software generates autonomous AI solutions that have not been peer-reviewed.
-Papers and content generated by this system are created without direct human
-oversight beyond initial prompts. All generated content should be viewed with
-extreme scrutiny and independently verified before use in any critical context.
-
-The authors and contributors make no warranties about the accuracy, completeness,
-or validity of AI-generated mathematical content, proofs, or claims.
-
diff --git a/Launch MOTO.sh b/Launch MOTO.sh
new file mode 100644
index 0000000..7c3dd23
--- /dev/null
+++ b/Launch MOTO.sh	
@@ -0,0 +1,44 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+VENV_DIR="$SCRIPT_DIR/.venv"
+PYTHON_BIN="$VENV_DIR/bin/python"
+
+resolve_bootstrap_python() {
+    if command -v python3 >/dev/null 2>&1; then
+        command -v python3
+        return 0
+    fi
+    if command -v python >/dev/null 2>&1; then
+        command -v python
+        return 0
+    fi
+    return 1
+}
+
+if [[ ! -x "$PYTHON_BIN" ]]; then
+    BOOTSTRAP_PYTHON="$(resolve_bootstrap_python || true)"
+    if [[ -z "${BOOTSTRAP_PYTHON:-}" ]]; then
+        echo "ERROR: Python 3.8+ is required to launch MOTO on Ubuntu 24.04."
+        echo "Install Python 3 and python3-venv, then run this launcher again."
+        echo "Example: sudo apt install python3 python3-venv"
+        exit 1
+    fi
+
+    echo "Creating repo-local Python environment in .venv ..."
+    if ! "$BOOTSTRAP_PYTHON" -m venv "$VENV_DIR"; then
+        echo "ERROR: Failed to create the repo-local Python environment."
+        echo "On Ubuntu 24.04, ensure python3-venv is installed:"
+        echo "  sudo apt install python3-venv"
+        exit 1
+    fi
+fi
+
+if [[ ! -x "$PYTHON_BIN" ]]; then
+    echo "ERROR: Expected launcher interpreter at $PYTHON_BIN"
+    exit 1
+fi
+
+export MOTO_LAUNCHER_ENTRYPOINT="$SCRIPT_DIR/Launch MOTO.sh"
+exec "$PYTHON_BIN" "$SCRIPT_DIR/moto_launcher.py" "$@"
diff --git a/README.md b/README.md
index 7e2b85c..f53fc18 100644
--- a/README.md
+++ b/README.md
@@ -1,12 +1,12 @@
 # MOTO Autonomous ASI - Novel S.T.E.M. Solution Variant for ASI Automated Theory Generation
 # Autonomous Superintelligence Deep Research Harness
-**Version: 1.0.6**
+**Version: 1.0.7**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
 [![Node.js 16+](https://img.shields.io/badge/node-16+-green.svg)](https://nodejs.org/)
 
-**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assist in decyphering how we explore AI weights, a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. This is useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
+**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assists in deciphering how we explore AI weights; a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. This exact version of MOTO is customized to be useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
 
 ### The Core Discovery: Top-P Exploration 
 
@@ -18,9 +18,9 @@ The brainstorming phase runs **multiple submitters in parallel**, each independe
 
 Once a brainstorm is sufficiently explored, MOTO writes a research paper from it. This step then repeats — papers become a new "Tier 2" brainstorm. Previous papers are referenced in future brainstorms and future papers. This set of Tier 2 papers is another higher-order brainstorm-like database, which also self-prunes newly discovered incorrect or redundant papers just like the Tier 1 short-hand idea brainstorm does. A third tier generates the final answer, capable of producing book-length volumes.
 
-MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its experimental mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models over 131,000 token context limits, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is an experimental system; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
+MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its long-form synthesis mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models over 131,000 token context limits, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is a research prototype; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
 
-Give the program a try, MOTO is as cool as it sounds – there is a one-click installer. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green “< > Code” drop-down menu on the top right of this GitHub page, download the zip file, extract it to your desktop then double-click "Click To Launch MOTO.bat". Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), select your agents in the settings profile – if desired and you are unsure you may use the preselected “fastest” profile.
+Give the program a try; MOTO is as cool as it sounds. Windows has a one-click launcher, and Ubuntu 24.04 now has a repo-root launcher too. Use the two links below to download Python and Node.js; they should install automatically in seconds. Once those are downloaded, click the green "< > Code" drop-down menu on the top right of this GitHub page and download the zip file. On Windows, extract it to your desktop and double-click `Click To Launch MOTO.bat`. On Ubuntu 24.04, extract it and run `bash "Launch MOTO.sh"`. Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), then select your agents in the settings profile. If you are unsure which agents to choose, you may use the preselected "fastest" profile.
 
 ***Now you are set up and every time you press launch your home lab is ready for your prompt!*** **Give MOTO the toughest question you can think of and press start to begin YOUR creations!**
 
@@ -70,10 +70,47 @@ Before installation, you need:
    - Check all prerequisites
    - Install Python and Node.js dependencies automatically
    - Create necessary directories
+   - Check the official GitHub `main` build manifest before startup
+   - Offer a prompted update flow for supported installs when `main` is ahead
    - Start backend and frontend servers
    - Open the UI in your browser
 
-**That's it!** The system will be running at `http://localhost:5173`
+**That's it!** The system will usually be running at `http://localhost:5173`. If another local MOTO instance already owns the default ports, the launcher now opens an isolated second instance on the next free backend/frontend port pair instead of stopping the first instance.
+
+#### Ubuntu 24.04 (Launcher + Updater Parity)
+
+1. Clone or download this repository
+2. Start LM Studio and load your models and `nomic-embed-text-v1.5` **and/or** have your OpenRouter API key ready
+3. From the repo root, run:
+
+```bash
+bash "Launch MOTO.sh"
+```
+
+4. The Ubuntu launcher will:
+   - Create and reuse a repo-local `.venv` so package installs do not mutate the system Python
+   - Check Python, Node.js, Playwright, and desktop keyring readiness
+   - Check the official GitHub `main` build manifest before startup
+   - Offer the same prompted update flow used by Windows for supported installs
+   - Reuse the same multi-instance runtime contract and preservation rules as Windows
+   - Start backend and frontend services in separate desktop terminals when available, or fall back to background logs under the active log root if no desktop terminal emulator is available
+   - Open the UI in your browser
+
+**Ubuntu note:** If Playwright or the desktop keyring is unavailable, the launcher stays runnable and explains the limitation. Saved provider keys will only persist when a Linux desktop keyring backend is available.
+
+### Build Identity and Update Contract
+
+- `moto-update-manifest.json` is the authoritative Build 0 updater/build identity manifest for the `main` branch.
+- `GET /api/features` exposes the public build-comparison fields `version`, `build_commit`, `update_channel`, and `api_contract_version`.
+- Official update comparisons target GitHub `main`, not GitHub Releases.
+- `Click To Launch MOTO.bat` is the authoritative Windows launcher entrypoint and delegates to `moto_launcher.py`.
+- `Launch MOTO.sh` is the authoritative Ubuntu 24.04 launcher entrypoint; it bootstraps the repo-local `.venv`, delegates to `moto_launcher.py`, and is used again for relaunch after an update when MOTO was started from that wrapper.
+- Clean extracted ZIP installs and clean `main`-tracking git clones are the supported automatic update-apply targets.
+- Dirty or locally mutated repos remain runnable, but they are update-detection-only and are not eligible for automatic update-apply behavior.
+- If launcher-managed backend/frontend services from this install are still running, the updater warns and skips update-apply until those services are closed.
+- If GitHub `main` is reachable but `moto-update-manifest.json` is not published there yet, the launcher falls back to branch-head comparison and keeps update-apply disabled until the manifest is present.
+- Clean git updateability is preserved by avoiding silent tracked-file mutations during normal startup; for example, the launcher no longer auto-runs `npm audit fix`.
+- Preservation is defined against the active runtime roots, not only the default folders. The launcher may use `backend/data`, `backend/logs`, or instance-scoped `.moto_instances/<instance_id>/...` roots, and browser storage prefixes plus OS-keyring namespaces are part of that same preserved state boundary.
 
 ---
 
@@ -156,6 +193,8 @@ moto-math-variant/
 ├── .cursor/
 │   └── rules/               # AI agent design specifications (full system documentation)
 ├── Click To Launch MOTO.bat  # One-click Windows launcher
+├── moto_launcher.py          # Internal Python launcher orchestration
+├── moto_updater.py           # Build 1 updater helper and launcher state manager
 ├── requirements.txt         # Python dependencies
 └── package.json             # Node.js dependencies
 ```
@@ -222,7 +261,8 @@ All configurable per role:
 - Load embedding model: `nomic-ai/nomic-embed-text-v1.5`
 
 **"Port already in use"**
-- Close other apps using ports 8000 or 5173
+- MOTO now preserves the first local instance and launches a second isolated instance on the next free port pair when needed
+- Close other apps using ports 8000 or 5173 only if you specifically want the default instance to reclaim those ports
 - Restart computer if needed
 - Use different ports in config
 
@@ -242,8 +282,8 @@ All configurable per role:
 ### Common Error Messages
 
 **"ChromaDB corruption detected"**
-- Delete `backend/data/chroma_db` folder
-- Restart the system (launcher cleans ChromaDB automatically)
+- Delete the active instance data root's `chroma_db` folder (for the default desktop instance this is `backend/data/chroma_db`)
+- Restart the system (the launcher preserves runtime roots; it does not automatically clean ChromaDB)
 
 **"Context window exceeded"**
 - Reduce context size in settings
@@ -268,6 +308,8 @@ All configurable per role:
 
 #### Manual Installation (All Platforms)
 
+If you want the consumer launcher experience on Ubuntu 24.04, prefer `bash "Launch MOTO.sh"` instead of the manual steps below. The manual flow remains the fallback path when you intentionally want full terminal-level control.
+
 ```bash
 # Clone the repository
 git clone https://github.com/Intrafere/MOTO-Autonomous-ASI
diff --git a/_moto_internal_launcher.ps1 b/_moto_internal_launcher.ps1
deleted file mode 100644
index 7d45baa..0000000
--- a/_moto_internal_launcher.ps1
+++ /dev/null
@@ -1,332 +0,0 @@
-# MOTO Internal Launcher (PowerShell)
-# This is an internal script. Use "Click To Launch MOTO.bat" instead.
-# If needed manually: powershell -ExecutionPolicy Bypass -File _moto_internal_launcher.ps1
-
-# ================================================================
-# CRITICAL: This prevents the window from closing on errors
-# ================================================================
-$ErrorActionPreference = "Stop"
-
-function Exit-WithPause {
-    param([int]$ExitCode = 0)
-    Write-Host ""
-    Write-Host "Press Enter to close..." -ForegroundColor Yellow
-    Read-Host
-    exit $ExitCode
-}
-
-try {
-    Clear-Host
-    Write-Host "================================================================" -ForegroundColor Cyan
-    Write-Host "  ASI Aggregator-Compiler System - One-Click Launcher" -ForegroundColor Cyan
-    Write-Host "================================================================" -ForegroundColor Cyan
-    Write-Host ""
-
-    # Function to check if command exists
-    function Test-Command($cmdname) {
-        return [bool](Get-Command -Name $cmdname -ErrorAction SilentlyContinue)
-    }
-
-    # Check for Python
-    Write-Host "[1/8] Checking Python installation..." -ForegroundColor Yellow
-    if (-not (Test-Command python)) {
-        Write-Host ""
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host "ERROR: Python is not installed or not in PATH" -ForegroundColor Red
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host ""
-        Write-Host "Please install Python 3.8+ from:" -ForegroundColor Yellow
-        Write-Host "https://www.python.org/downloads/" -ForegroundColor Yellow
-        Write-Host ""
-        Write-Host "IMPORTANT: Check 'Add Python to PATH' during installation" -ForegroundColor Yellow
-        Exit-WithPause -ExitCode 1
-    }
-    $pythonVersion = python --version
-    Write-Host $pythonVersion -ForegroundColor Green
-    Write-Host ""
-
-    # Check for Node.js
-    Write-Host "[2/8] Checking Node.js installation..." -ForegroundColor Yellow
-    if (-not (Test-Command node)) {
-        Write-Host ""
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host "ERROR: Node.js is not installed or not in PATH" -ForegroundColor Red
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host ""
-        Write-Host "Please install Node.js 16+ from:" -ForegroundColor Yellow
-        Write-Host "https://nodejs.org/" -ForegroundColor Yellow
-        Exit-WithPause -ExitCode 1
-    }
-    $nodeVersion = node --version
-    $npmVersion = npm --version
-    Write-Host "Node: $nodeVersion" -ForegroundColor Green
-    Write-Host "npm: $npmVersion" -ForegroundColor Green
-    Write-Host ""
-
-    # Create necessary directories & clean ChromaDB
-    Write-Host "[3/8] Creating necessary directories..." -ForegroundColor Yellow
-    $directories = @(
-        "backend\data",
-        "backend\data\user_uploads",
-        "backend\logs"
-    )
-    foreach ($dir in $directories) {
-        if (-not (Test-Path $dir)) {
-            New-Item -ItemType Directory -Path $dir -Force | Out-Null
-            Write-Host "Created: $dir" -ForegroundColor Green
-        }
-    }
-    Write-Host "Directories ready!" -ForegroundColor Green
-    
-    # Clean ChromaDB on startup to prevent corruption issues
-    $chromaPath = "backend\data\chroma_db"
-    if (Test-Path $chromaPath) {
-        Write-Host "Cleaning ChromaDB database..." -ForegroundColor Yellow
-        Remove-Item -Path $chromaPath -Recurse -Force
-        Write-Host "ChromaDB cleaned!" -ForegroundColor Green
-    }
-    Write-Host ""
-
-    # Install/Update Python dependencies
-    Write-Host "[4/8] Installing Python dependencies..." -ForegroundColor Yellow
-    Write-Host "Upgrading pip and checking packages..." -ForegroundColor Yellow
-    Write-Host ""
-    python -m pip install --upgrade pip 2>&1 | Out-Null
-    pip install --upgrade -r requirements.txt
-    if ($LASTEXITCODE -ne 0) {
-        Write-Host ""
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host "ERROR: Failed to install Python dependencies" -ForegroundColor Red
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host ""
-        Write-Host "Please check:" -ForegroundColor Yellow
-        Write-Host "- Internet connection is working" -ForegroundColor Yellow
-        Write-Host "- You have permission to install packages" -ForegroundColor Yellow
-        Exit-WithPause -ExitCode 1
-    }
-    Write-Host "Python dependencies up to date" -ForegroundColor Green
-    Write-Host ""
-
-    # Install Playwright Chromium browser (one-time ~150MB download for PDF generation)
-    Write-Host "[4b/8] Installing Playwright Chromium browser for PDF generation..." -ForegroundColor Yellow
-    Write-Host "This is a one-time download (~150MB) and may take a few minutes..." -ForegroundColor Yellow
-    Write-Host ""
-    python -m playwright install chromium 2>&1
-    if ($LASTEXITCODE -ne 0) {
-        Write-Host ""
-        Write-Host "WARNING: Playwright Chromium install failed." -ForegroundColor Yellow
-        Write-Host "PDF generation will not be available until resolved." -ForegroundColor Yellow
-        Write-Host "Retry manually: python -m playwright install chromium" -ForegroundColor Yellow
-        Write-Host "Continuing startup anyway..." -ForegroundColor Yellow
-    } else {
-        Write-Host "Playwright Chromium ready!" -ForegroundColor Green
-    }
-    Write-Host ""
-
-    # Check/Install Node.js dependencies
-    Write-Host "[5/8] Checking Node.js dependencies..." -ForegroundColor Yellow
-    if (-not (Test-Path "frontend")) {
-        Write-Host ""
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host "ERROR: frontend directory not found!" -ForegroundColor Red
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host ""
-        Write-Host "Make sure you're running this from the project root directory." -ForegroundColor Yellow
-        Exit-WithPause -ExitCode 1
-    }
-    
-    Set-Location frontend
-    $showVulnerabilityRestartHint = $false
-    if (-not (Test-Path "node_modules")) {
-        Write-Host "Installing Node.js dependencies..." -ForegroundColor Yellow
-        Write-Host "This may take a few minutes..." -ForegroundColor Yellow
-    } else {
-        Write-Host "Updating Node.js dependencies..." -ForegroundColor Yellow
-    }
-    Write-Host ""
-    $npmInstallLog = Join-Path $env:TEMP ("moto_npm_install_{0}.log" -f ([guid]::NewGuid().ToString("N")))
-    npm install 2>&1 | Tee-Object -FilePath $npmInstallLog
-    $npmInstallExit = $LASTEXITCODE
-    if (Test-Path $npmInstallLog) {
-        $showVulnerabilityRestartHint = Select-String -Path $npmInstallLog -Pattern "vulnerabilities found" -Quiet
-        Remove-Item -Path $npmInstallLog -Force -ErrorAction SilentlyContinue
-    }
-    if ($npmInstallExit -ne 0) {
-        Write-Host ""
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host "ERROR: Failed to install Node.js dependencies" -ForegroundColor Red
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host ""
-        Write-Host "Please check:" -ForegroundColor Yellow
-        Write-Host "- Internet connection is working" -ForegroundColor Yellow
-        Write-Host "- package.json exists in frontend directory" -ForegroundColor Yellow
-        Set-Location ..
-        Exit-WithPause -ExitCode 1
-    }
-    Write-Host "Node.js dependencies up to date" -ForegroundColor Green
-    if ($showVulnerabilityRestartHint) {
-        Write-Host "" 
-        Write-Host "NOTE: npm reported vulnerability warnings during install." -ForegroundColor Yellow
-        Write-Host "MOTO is running npm audit fix automatically right now." -ForegroundColor Yellow
-        Write-Host "After startup finishes, restart this terminal / launcher once to check whether the warning is gone." -ForegroundColor Yellow
-    }
-    Write-Host "Fixing known vulnerabilities automatically..." -ForegroundColor Yellow
-    npm audit fix 2>&1 | Out-Null
-    Set-Location ..
-    Write-Host ""
-
-    # Check for LM Studio (optional - OpenRouter is an alternative)
-    Write-Host "[6/8] Checking LM Studio..." -ForegroundColor Yellow
-    Write-Host ""
-    
-    # Check if LM Studio is responding
-    $lmStudioAvailable = $false
-    try {
-        $response = Invoke-WebRequest -Uri "http://127.0.0.1:1234/v1/models" -TimeoutSec 3 -UseBasicParsing -ErrorAction Stop
-        $lmStudioAvailable = $true
-    } catch {
-        $lmStudioAvailable = $false
-    }
-    
-    if ($lmStudioAvailable) {
-        Write-Host "LM Studio is running and responding!" -ForegroundColor Green
-    } else {
-        Write-Host "================================================================" -ForegroundColor Cyan
-        Write-Host "NOTE: LM Studio is not detected on http://127.0.0.1:1234" -ForegroundColor Cyan
-        Write-Host "================================================================" -ForegroundColor Cyan
-        Write-Host ""
-        Write-Host "This is OK! You have two options for AI models:" -ForegroundColor Yellow
-        Write-Host ""
-        Write-Host "  Option 1: LM Studio (Local)" -ForegroundColor Yellow
-        Write-Host "    - Download from: https://lmstudio.ai/" -ForegroundColor White
-        Write-Host "    - Load a model and start the Local Server" -ForegroundColor White
-        Write-Host ""
-        Write-Host "  Option 2: OpenRouter (Cloud API)" -ForegroundColor Yellow
-        Write-Host "    - Get an API key from: https://openrouter.ai/" -ForegroundColor White
-        Write-Host "    - Configure in Settings tab after launch" -ForegroundColor White
-        Write-Host ""
-        Write-Host "The system will start - configure your preferred provider in Settings." -ForegroundColor Green
-    }
-    Write-Host ""
-
-    # Clean up any existing processes on ports 8000 and 5173
-    Write-Host "[7/8] Cleaning up existing processes on ports 8000 and 5173..." -ForegroundColor Yellow
-    Write-Host ""
-    
-    # Kill processes on port 8000
-    $port8000 = Get-NetTCPConnection -LocalPort 8000 -State Listen -ErrorAction SilentlyContinue
-    if ($port8000) {
-        foreach ($conn in $port8000) {
-            Write-Host "Found process $($conn.OwningProcess) using port 8000, terminating..." -ForegroundColor Yellow
-            Stop-Process -Id $conn.OwningProcess -Force -ErrorAction SilentlyContinue
-        }
-    }
-    
-    # Kill processes on port 5173
-    $port5173 = Get-NetTCPConnection -LocalPort 5173 -State Listen -ErrorAction SilentlyContinue
-    if ($port5173) {
-        foreach ($conn in $port5173) {
-            Write-Host "Found process $($conn.OwningProcess) using port 5173, terminating..." -ForegroundColor Yellow
-            Stop-Process -Id $conn.OwningProcess -Force -ErrorAction SilentlyContinue
-        }
-    }
-    
-    # Wait for ports to be released
-    Start-Sleep -Seconds 2
-    
-    # Verify ports are available
-    $port8000Check = Get-NetTCPConnection -LocalPort 8000 -State Listen -ErrorAction SilentlyContinue
-    if ($port8000Check) {
-        Write-Host ""
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host "ERROR: Port 8000 is still in use after cleanup attempt!" -ForegroundColor Red
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host ""
-        Write-Host "Please manually close any applications using port 8000." -ForegroundColor Yellow
-        Write-Host "You can check with: Get-NetTCPConnection -LocalPort 8000" -ForegroundColor Yellow
-        Exit-WithPause -ExitCode 1
-    }
-    
-    $port5173Check = Get-NetTCPConnection -LocalPort 5173 -State Listen -ErrorAction SilentlyContinue
-    if ($port5173Check) {
-        Write-Host ""
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host "ERROR: Port 5173 is still in use after cleanup attempt!" -ForegroundColor Red
-        Write-Host "============================================================" -ForegroundColor Red
-        Write-Host ""
-        Write-Host "Please manually close any applications using port 5173." -ForegroundColor Yellow
-        Write-Host "You can check with: Get-NetTCPConnection -LocalPort 5173" -ForegroundColor Yellow
-        Exit-WithPause -ExitCode 1
-    }
-    
-    Write-Host "Ports 8000 and 5173 are available!" -ForegroundColor Green
-    Write-Host ""
-
-    # Start the system
-    Write-Host "[8/8] Starting services..." -ForegroundColor Yellow
-    Write-Host ""
-    Write-Host "================================================================" -ForegroundColor Cyan
-    Write-Host "  All checks passed! Starting system..." -ForegroundColor Cyan
-    Write-Host "================================================================" -ForegroundColor Cyan
-    Write-Host ""
-    Write-Host "Backend API will run on: http://localhost:8000" -ForegroundColor Green
-    Write-Host "Frontend UI will run on: http://localhost:5173" -ForegroundColor Green
-    Write-Host ""
-    Write-Host "Press any key to start the services..." -ForegroundColor Yellow
-    $null = $Host.UI.RawUI.ReadKey("NoEcho,IncludeKeyDown")
-    Write-Host ""
-
-    # Start backend in new window
-    $backendPath = Join-Path $PSScriptRoot "backend"
-    Start-Process powershell -ArgumentList "-NoExit", "-Command", "cd '$backendPath'; Write-Host 'Starting Backend...' -ForegroundColor Cyan; python -m api.main"
-
-    # Wait for backend to start
-    Write-Host "Waiting for backend to start..." -ForegroundColor Yellow
-    Start-Sleep -Seconds 5
-
-    # Start frontend in new window
-    $frontendPath = Join-Path $PSScriptRoot "frontend"
-    Start-Process powershell -ArgumentList "-NoExit", "-Command", "cd '$frontendPath'; Write-Host 'Starting Frontend...' -ForegroundColor Cyan; npm run dev"
-
-    # Wait for frontend to initialize
-    Write-Host "Waiting for frontend to initialize..." -ForegroundColor Yellow
-    Start-Sleep -Seconds 8
-
-    # Open browser automatically
-    Write-Host "Opening browser..." -ForegroundColor Green
-    Start-Process "http://localhost:5173"
-
-    Write-Host ""
-    Write-Host "================================================================" -ForegroundColor Cyan
-    Write-Host "  SYSTEM STARTED!" -ForegroundColor Cyan
-    Write-Host "================================================================" -ForegroundColor Cyan
-    Write-Host ""
-    Write-Host "Two windows have opened:" -ForegroundColor Green
-    Write-Host "  - ASI Backend (running on port 8000)" -ForegroundColor Green
-    Write-Host "  - ASI Frontend (running on port 5173)" -ForegroundColor Green
-    Write-Host ""
-    Write-Host "Browser opened automatically to:" -ForegroundColor Green
-    Write-Host "  http://localhost:5173" -ForegroundColor Cyan
-    Write-Host ""
-    Write-Host "If it didn't open, open that URL manually." -ForegroundColor Yellow
-    Write-Host ""
-    if ($showVulnerabilityRestartHint) {
-        Write-Host "If you saw npm vulnerability warnings earlier, restart this terminal / launcher once now that startup is complete." -ForegroundColor Yellow
-        Write-Host ""
-    }
-    Write-Host "To stop the system: Close both service windows" -ForegroundColor Yellow
-    Write-Host ""
-    Write-Host "This launcher window can now be closed." -ForegroundColor Green
-    Write-Host ""
-    Exit-WithPause -ExitCode 0
-
-} catch {
-    Write-Host ""
-    Write-Host "============================================================" -ForegroundColor Red
-    Write-Host "FATAL ERROR: $($_.Exception.Message)" -ForegroundColor Red
-    Write-Host "============================================================" -ForegroundColor Red
-    Write-Host ""
-    Write-Host "Stack Trace:" -ForegroundColor Yellow
-    Write-Host $_.ScriptStackTrace -ForegroundColor Yellow
-    Exit-WithPause -ExitCode 1
-}
diff --git a/backend/aggregator/agents/submitter.py b/backend/aggregator/agents/submitter.py
index 12123ec..0ca5646 100644
--- a/backend/aggregator/agents/submitter.py
+++ b/backend/aggregator/agents/submitter.py
@@ -15,6 +15,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.json_parser import parse_json
+from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.core.context_allocator import context_allocator
 from backend.aggregator.core.queue_manager import queue_manager
 from backend.aggregator.memory.shared_training import shared_training_memory
@@ -45,7 +46,7 @@ def __init__(
     ):
         self.submitter_id = submitter_id
         self.model_name = model_name
-        self.user_prompt = user_prompt
+        self.user_prompt = proof_database.inject_into_prompt(user_prompt)
         self.user_files_content = user_files_content
         self.websocket_broadcaster = websocket_broadcaster
         self.coordinator = coordinator
@@ -115,9 +116,9 @@ async def _run_loop(self) -> None:
         
         while self.is_running:
             try:
-                # Check if we should pause due to queue overflow
-                if self.coordinator and self.coordinator.should_pause_submitters:
-                    logger.debug(f"Submitter {self.submitter_id} paused (queue overflow)")
+                # Check if we should pause due to queue overflow or per-submitter fairness cap
+                if self.coordinator and await self.coordinator.should_pause_submitter(self.submitter_id):
+                    logger.debug(f"Submitter {self.submitter_id} paused (queue overflow or per-submitter cap)")
                     await asyncio.sleep(2)  # Wait before checking again
                     continue
                 
@@ -127,12 +128,23 @@ async def _run_loop(self) -> None:
                 submission = await self._generate_submission()
                 if submission:
                     # Hold submission until queue has capacity (prevents overflow when
-                    # the LLM call was already in-flight when the queue filled up)
+                    # the LLM call was already in-flight when the queue filled up).
+                    # Also respect the per-submitter fairness cap so a fast submitter
+                    # that just finished a call doesn't push itself over its personal limit.
                     while self.is_running:
-                        queue_size = await queue_manager.size()
-                        if queue_size < system_config.queue_overflow_threshold:
-                            break
-                        logger.debug(f"Submitter {self.submitter_id}: Queue full ({queue_size}), holding submission")
+                        if self.coordinator:
+                            if not await self.coordinator.should_pause_submitter(self.submitter_id):
+                                break
+                            queue_size = await queue_manager.size()
+                            logger.debug(
+                                f"Submitter {self.submitter_id}: Holding submission "
+                                f"(queue={queue_size}, own>{system_config.per_submitter_queue_threshold} possible)"
+                            )
+                        else:
+                            queue_size = await queue_manager.size()
+                            if queue_size < system_config.queue_overflow_threshold:
+                                break
+                            logger.debug(f"Submitter {self.submitter_id}: Queue full ({queue_size}), holding submission")
                         await asyncio.sleep(2)
 
                     if self.submission_callback and self.is_running:
diff --git a/backend/aggregator/agents/validator.py b/backend/aggregator/agents/validator.py
index 5eff887..5551f25 100644
--- a/backend/aggregator/agents/validator.py
+++ b/backend/aggregator/agents/validator.py
@@ -13,6 +13,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.json_parser import parse_json
+from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.core.context_allocator import context_allocator
 from backend.aggregator.memory.shared_training import shared_training_memory
 from backend.aggregator.prompts.validator_prompts import (
@@ -52,7 +53,7 @@ def __init__(
         websocket_broadcaster: Optional[Callable] = None
     ):
         self.model_name = model_name
-        self.user_prompt = user_prompt
+        self.user_prompt = proof_database.inject_into_prompt(user_prompt)
         self.user_files_content = user_files_content
         self.chunk_size = rag_config.validator_chunk_size  # Always 512
         self.websocket_broadcaster = websocket_broadcaster
diff --git a/backend/aggregator/core/coordinator.py b/backend/aggregator/core/coordinator.py
index 344065a..522c28b 100644
--- a/backend/aggregator/core/coordinator.py
+++ b/backend/aggregator/core/coordinator.py
@@ -486,7 +486,7 @@ async def _check_and_update_pause_state(self) -> None:
         if should_pause != self.should_pause_submitters:
             self.should_pause_submitters = should_pause
             if should_pause:
-                logger.warning(f"Queue size ({queue_size}) >= threshold ({system_config.queue_overflow_threshold}). Pausing submitters.")
+                logger.info(f"Queue size ({queue_size}) >= threshold ({system_config.queue_overflow_threshold}). Pausing submitters.")
                 await self._broadcast("submitters_paused", {
                     "queue_size": queue_size,
                     "threshold": system_config.queue_overflow_threshold
@@ -497,6 +497,25 @@ async def _check_and_update_pause_state(self) -> None:
                     "queue_size": queue_size
                 })
     
+    async def should_pause_submitter(self, submitter_id: int) -> bool:
+        """
+        Per-submitter fairness gate.
+        
+        Returns True if:
+          - the global queue-overflow pause is active (queue >= queue_overflow_threshold), OR
+          - this specific submitter already has more than per_submitter_queue_threshold
+            of its own submissions waiting in the queue.
+        
+        The per-submitter cap is skipped when only one submitter is configured
+        (no one else to be fair to - the global cap alone governs throughput).
+        """
+        if self.should_pause_submitters:
+            return True
+        if len(self.submitters) <= 1:
+            return False
+        own_count = await queue_manager.count_for_submitter(submitter_id)
+        return own_count > system_config.per_submitter_queue_threshold
+    
     async def start(self) -> None:
         """Start the aggregator system."""
         if self.is_running:
diff --git a/backend/aggregator/core/queue_manager.py b/backend/aggregator/core/queue_manager.py
index bb82b25..e7a7b50 100644
--- a/backend/aggregator/core/queue_manager.py
+++ b/backend/aggregator/core/queue_manager.py
@@ -69,6 +69,11 @@ async def size(self) -> int:
         """Get current queue size."""
         async with self._lock:
             return len(self.queue)
+
+    async def count_for_submitter(self, submitter_id: int) -> int:
+        """Count how many pending submissions were produced by a specific submitter."""
+        async with self._lock:
+            return sum(1 for s in self.queue if s.submitter_id == submitter_id)
     
     async def clear(self) -> None:
         """Clear the queue."""
@@ -103,7 +108,7 @@ async def dequeue_batch(self, max_count: int = 3) -> List[Submission]:
             
             # Check for overflow (for monitoring/logging only - coordinator handles pausing)
             if len(self.queue) >= self.overflow_threshold:
-                logger.warning(
+                logger.debug(
                     f"Queue size ({len(self.queue)}) >= overflow threshold ({self.overflow_threshold}). "
                     f"Submitters should be paused by coordinator."
                 )
diff --git a/backend/aggregator/core/rag_manager.py b/backend/aggregator/core/rag_manager.py
index 156a046..4e1e35c 100644
--- a/backend/aggregator/core/rag_manager.py
+++ b/backend/aggregator/core/rag_manager.py
@@ -212,39 +212,42 @@ async def _add_chunks(self, chunks: List[DocumentChunk], chunk_size: int) -> Non
             return
         
         texts = [chunk.text for chunk in chunks]
-        
-        # ACQUIRE GLOBAL LOCK FOR EMBEDDINGS
-        await rag_operation_lock.acquire(f"RAGManager add_chunks (size={chunk_size})")
-        try:
+
+        generic_mode = system_config.generic_mode
+        if generic_mode:  # generic mode embeds before taking the global RAG lock
+            embeddings = await api_client_manager.get_embeddings(texts)
+        lock_label = "add_chunks write" if generic_mode else "add_chunks"
+        await rag_operation_lock.acquire(f"RAGManager {lock_label} (size={chunk_size})")
+        try:
+            if not generic_mode:  # embed under the lock; `finally` releases it on failure
+                embeddings = await api_client_manager.get_embeddings(texts)
+            # Update chunks with embeddings and tokens
+            for chunk, embedding in zip(chunks, embeddings):
+                chunk.embedding = embedding
+                chunk.tokens = chunk.text.lower().split()
+
+            # ChromaDB writes stay under the global RAG lock in both modes.
+            collection = self.collections[chunk_size]
+            try:
+                collection.add(
+                    ids=[chunk.chunk_id for chunk in chunks],
+                    embeddings=embeddings,
+                    documents=texts,
+                    metadatas=[chunk.metadata for chunk in chunks]
+                )
+                logger.debug(f"Added {len(chunks)} chunks to ChromaDB collection (size={chunk_size})")
+            except Exception as e:
+                logger.error(f"CRITICAL: ChromaDB add failed for chunk_size={chunk_size}: {type(e).__name__}: {e}")
+                logger.error(f"Attempting to add {len(chunks)} chunks with IDs: {[c.chunk_id for c in chunks][:5]}...")
+                raise
+
+            # Add to memory
+            self.chunks_by_size[chunk_size].extend(chunks)
+
+            # Invalidate BM25 index for this size
+            self.bm25_index[chunk_size] = None
         finally:
             rag_operation_lock.release()
-        
-        # Update chunks with embeddings and tokens
-        for chunk, embedding in zip(chunks, embeddings):
-            chunk.embedding = embedding
-            chunk.tokens = chunk.text.lower().split()
-        
-        # Add to ChromaDB (no lock needed - writes are local)
-        collection = self.collections[chunk_size]
-        try:
-            collection.add(
-                ids=[chunk.chunk_id for chunk in chunks],
-                embeddings=embeddings,
-                documents=texts,
-                metadatas=[chunk.metadata for chunk in chunks]
-            )
-            logger.debug(f"Added {len(chunks)} chunks to ChromaDB collection (size={chunk_size})")
-        except Exception as e:
-            logger.error(f"CRITICAL: ChromaDB add failed for chunk_size={chunk_size}: {type(e).__name__}: {e}")
-            logger.error(f"Attempting to add {len(chunks)} chunks with IDs: {[c.chunk_id for c in chunks][:5]}...")
-            raise
-        
-        # Add to memory
-        self.chunks_by_size[chunk_size].extend(chunks)
-        
-        # Invalidate BM25 index for this size
-        self.bm25_index[chunk_size] = None
     
     async def _rewrite_query(self, query: str) -> List[str]:
         """Stage A: Expand query into semantic variants."""
diff --git a/backend/api/main.py b/backend/api/main.py
index f716228..b7f41bf 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -1,14 +1,32 @@
 """
 FastAPI main application.
 """
+import asyncio
+import os
+from pathlib import Path
+from typing import Optional
 from fastapi import FastAPI
 from contextlib import asynccontextmanager
 import logging
 
 from backend.api.middleware import setup_middleware
-from backend.api.routes import aggregator, websocket, compiler, autonomous, boost, workflow, openrouter, download
+from backend.api.routes import (
+    aggregator,
+    websocket,
+    compiler,
+    autonomous,
+    boost,
+    workflow,
+    openrouter,
+    download,
+    features,
+    health,
+    proofs,
+)
+from backend.shared.build_info import get_build_info
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.config import rag_config, system_config
+from backend.shared.lean4_client import clear_lean4_client, close_lean4_client, initialize_lean4_client
 from backend.aggregator.core.coordinator import coordinator
 from backend.compiler.core.compiler_coordinator import compiler_coordinator
 from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
@@ -25,29 +43,83 @@
 logging.getLogger("httpx").setLevel(logging.WARNING)
 logging.getLogger("urllib3").setLevel(logging.WARNING)
 
+build_info = get_build_info()
 
-@asynccontextmanager
-async def lifespan(app: FastAPI):
-    """Lifespan events for the FastAPI app."""
-    # Startup
-    logger.info("Starting ASI Aggregator System...")
+_TRUTHY_ENV_VALUES = {"1", "true", "yes", "on"}
 
-    # Restore securely persisted provider credentials before the UI checks status.
-    from backend.shared.api_client_manager import api_client_manager
-    try:
-        from backend.shared.secret_store import (
-            SecretStoreError,
-            load_openrouter_api_key,
-            load_wolfram_api_key,
+
+def _env_flag_enabled(name: str) -> bool:
+    """Return True when an environment flag is set to a truthy value."""
+    return os.environ.get(name, "").strip().lower() in _TRUTHY_ENV_VALUES
+
+
+def _apply_generic_mode_from_env() -> None:
+    """Enable generic mode from the explicit hosted deployment env var."""
+    if _env_flag_enabled("MOTO_GENERIC_MODE"):
+        system_config.generic_mode = True
+
+
+def _validate_generic_mode_startup_env() -> None:
+    """Fail closed when hosted runtime auth inputs are missing."""
+    if not system_config.generic_mode:
+        return
+
+    missing: list[str] = []
+
+    if not any(os.environ.get(name, "").strip() for name in ("MOTO_INSTANCE_ID", "INSTANCE_ID")):
+        missing.append("MOTO_INSTANCE_ID")
+    if not system_config.internal_proxy_secret:
+        missing.append("MOTO_INTERNAL_PROXY_SECRET")
+
+    if missing:
+        joined = ", ".join(missing)
+        raise RuntimeError(
+            f"Generic mode requires the following environment variables before startup: {joined}."
+        )
+
+
+def _apply_generic_mode_openrouter_env(api_client_manager) -> None:
+    """Load the hosted OpenRouter key from env without using the desktop keyring."""
+    api_key = os.environ.get("OPENROUTER_API_KEY", "").strip()
+    if not api_key:
+        logger.info(
+            "Generic mode started without OPENROUTER_API_KEY; OpenRouter can be configured later via proxied API routes."
         )
-        from backend.shared.wolfram_alpha_client import initialize_wolfram_client
+        return
 
+    rag_config.openrouter_api_key = api_key
+    rag_config.openrouter_enabled = True
+    api_client_manager.set_openrouter_api_key(api_key)
+    logger.info("Loaded OpenRouter API key from OPENROUTER_API_KEY for generic-mode startup")
+
+
+def _restore_desktop_provider_credentials(api_client_manager) -> None:
+    """Restore persisted desktop credentials from the OS-backed keyring."""
+    from backend.shared.secret_store import (
+        SecretStoreError,
+        get_active_service_name,
+        load_openrouter_api_key,
+        load_wolfram_api_key,
+    )
+    from backend.shared.wolfram_alpha_client import initialize_wolfram_client
+
+    logger.info(
+        "Secret store active: service_name='%s', namespace=%s",
+        get_active_service_name(),
+        system_config.secret_namespace or "<default>",
+    )
+
+    try:
         openrouter_api_key = load_openrouter_api_key()
         if openrouter_api_key:
             rag_config.openrouter_api_key = openrouter_api_key
             rag_config.openrouter_enabled = True
             api_client_manager.set_openrouter_api_key(openrouter_api_key)
             logger.info("Restored OpenRouter API key from secure backend storage")
+        else:
+            logger.info(
+                "No OpenRouter API key found in secure backend storage for this namespace"
+            )
 
         wolfram_api_key = load_wolfram_api_key()
         if wolfram_api_key:
@@ -55,15 +127,48 @@ async def lifespan(app: FastAPI):
             system_config.wolfram_alpha_api_key = wolfram_api_key
             system_config.wolfram_alpha_enabled = True
             logger.info("Restored Wolfram Alpha API key from secure backend storage")
-    except SecretStoreError as e:
-        logger.warning(f"Secure credential storage unavailable on startup: {e}")
-    except Exception as e:
-        logger.warning(f"Failed to restore provider credentials on startup: {e}")
-    
-    # Test LM Studio connection (non-blocking - system works without it)
-    connected = await lm_studio_client.test_connection()
-    if not connected:
-        logger.warning("LM Studio not available. System will default to OpenRouter when configured.")
+        else:
+            logger.info(
+                "No Wolfram Alpha API key found in secure backend storage for this namespace"
+            )
+    except SecretStoreError as exc:
+        logger.warning("Secure credential storage unavailable on startup: %s", exc)
+    except Exception as exc:
+        logger.warning("Failed to restore provider credentials on startup: %s", exc)
+
+
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    """Lifespan events for the FastAPI app."""
+    _apply_generic_mode_from_env()
+    _validate_generic_mode_startup_env()
+
+    # Startup
+    logger.info(
+        "Starting ASI Aggregator System instance '%s' (data_dir=%s, logs_dir=%s)",
+        system_config.instance_id,
+        system_config.data_dir,
+        system_config.logs_dir,
+    )
+
+    # Ensure per-instance mutable directories exist before subsystems touch them.
+    Path(system_config.data_dir).mkdir(parents=True, exist_ok=True)
+    Path(system_config.logs_dir).mkdir(parents=True, exist_ok=True)
+    Path(system_config.user_uploads_dir).mkdir(parents=True, exist_ok=True)
+
+    from backend.shared.api_client_manager import api_client_manager
+
+    if system_config.generic_mode:
+        logger.info("Generic mode enabled - LM Studio and OS keyring restore are bypassed")
+        _apply_generic_mode_openrouter_env(api_client_manager)
+    else:
+        # Restore securely persisted provider credentials before the UI checks status.
+        _restore_desktop_provider_credentials(api_client_manager)
+
+        # Test LM Studio connection (non-blocking - system works without it)
+        connected = await lm_studio_client.test_connection()
+        if not connected:
+            logger.warning("LM Studio not available. System will default to OpenRouter when configured.")
     
     # CRITICAL: Restore session context on startup to display existing data
     # This ensures brainstorms and papers are loaded from the correct session directory
@@ -74,25 +179,30 @@ async def lifespan(app: FastAPI):
         from backend.autonomous.memory.paper_library import paper_library
         from backend.autonomous.memory.research_metadata import research_metadata
         from backend.autonomous.memory.final_answer_memory import final_answer_memory
+        from backend.autonomous.memory.proof_database import proof_database
         
         # Check for a resumable session
-        interrupted_session = await session_manager.find_interrupted_session()
+        interrupted_session = await session_manager.find_interrupted_session(system_config.auto_sessions_base_dir)
         if interrupted_session:
             session_id = interrupted_session["session_id"]
             logger.info(f"Found resumable session on startup: {session_id}")
             
             # Resume the session to set the correct path context
-            await session_manager.resume_session(session_id)
+            await session_manager.resume_session(session_id, system_config.auto_sessions_base_dir)
             
             # Set session manager on all memory modules so they use session paths
             brainstorm_memory.set_session_manager(session_manager)
             paper_library.set_session_manager(session_manager)
             research_metadata.set_session_manager(session_manager)
             final_answer_memory.set_session_manager(session_manager)
+            proof_database.set_session_manager(session_manager)
             
             logger.info(f"Session context restored - brainstorms and papers will load from session: {session_id}")
         else:
             logger.info("No resumable session found - using legacy paths")
+            proof_database.set_session_manager(None)
+
+        await proof_database.initialize()
     except Exception as e:
         logger.warning(f"Failed to restore session context on startup: {e}")
         # Non-fatal - continue with legacy paths
@@ -108,16 +218,47 @@ async def lifespan(app: FastAPI):
     
     # Set API client manager broadcaster (token tracking, rate limits, fallbacks)
     api_client_manager.set_broadcast_callback(websocket.broadcast_event)
-    
+
+    # Lean 4 warm start must NEVER block the FastAPI lifespan. A cold Mathlib
+    # workspace can spend many minutes inside `lake update` / `lake exe cache
+    # get`, during which the backend would otherwise refuse every HTTP request
+    # (including `/api/openrouter/api-key-status`). Users then see the UI
+    # report "no OpenRouter key" even though the key is persisted in the OS
+    # keyring, until they happen to poll again after the bootstrap finishes.
+    # We fire-and-forget the warm start on a background task so the rest of
+    # the API is reachable the moment uvicorn is ready to accept connections.
+    lean4_warm_start_task: Optional[asyncio.Task] = None
+    if system_config.lean4_enabled:
+        try:
+            lean4_client = initialize_lean4_client()
+        except Exception as exc:
+            logger.warning("Lean 4 client initialization failed: %s", exc)
+        else:
+            async def _warm_start_lean4() -> None:
+                try:
+                    await lean4_client.warm_start()
+                except Exception as exc:  # pragma: no cover - defensive
+                    logger.warning("Lean 4 client warm start failed: %s", exc)
+
+            lean4_warm_start_task = asyncio.create_task(_warm_start_lean4())
+
     logger.info("ASI Aggregator System ready")
-    
+
     yield
     
     # Shutdown
     logger.info("Shutting down ASI Aggregator System...")
+    if lean4_warm_start_task is not None and not lean4_warm_start_task.done():
+        lean4_warm_start_task.cancel()
+        try:
+            await lean4_warm_start_task
+        except (asyncio.CancelledError, Exception):
+            pass
     await coordinator.stop()
     await compiler_coordinator.stop()
     await autonomous_coordinator.stop()
+    await close_lean4_client()
+    clear_lean4_client()
     await lm_studio_client.close()
     logger.info("Shutdown complete")
 
@@ -126,7 +267,7 @@ async def lifespan(app: FastAPI):
 app = FastAPI(
     title="ASI Aggregator System",
     description="AI-powered aggregator with RAG and multi-agent validation",
-    version="1.0.6",
+    version=build_info.version,
     lifespan=lifespan
 )
 
@@ -139,6 +280,9 @@ async def lifespan(app: FastAPI):
 app.include_router(autonomous.router)
 app.include_router(boost.router)
 app.include_router(workflow.router)
+app.include_router(features.router)
+app.include_router(health.router)
+app.include_router(proofs.router)
 app.include_router(openrouter.router)
 app.include_router(download.router)
 app.include_router(websocket.router)
@@ -149,7 +293,7 @@ async def root():
     """Root endpoint."""
     return {
         "name": "ASI Aggregator System",
-        "version": "1.0.6",
+        "version": build_info.version,
         "status": "running"
     }
 
@@ -162,5 +306,10 @@ async def health():
 
 if __name__ == "__main__":
     import uvicorn
-    uvicorn.run(app, host="0.0.0.0", port=8000, access_log=False)
+    uvicorn.run(
+        app,
+        host=system_config.backend_host,
+        port=system_config.backend_port,
+        access_log=False,
+    )
 
diff --git a/backend/api/middleware.py b/backend/api/middleware.py
index 8b052d5..357f160 100644
--- a/backend/api/middleware.py
+++ b/backend/api/middleware.py
@@ -2,18 +2,22 @@
 Middleware for CORS and error handling.
 """
 import os
-from fastapi import FastAPI
+from fastapi import FastAPI, Request
 from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import JSONResponse
 import logging
 
+from backend.api.proxy_auth import ProxyAuthError, validate_proxy_headers
+from backend.shared.config import system_config
+
 logger = logging.getLogger(__name__)
 
 # Default allowed origins for local development
 DEFAULT_ORIGINS = [
-    "http://localhost:5173",
-    "http://127.0.0.1:5173",
-    "http://localhost:8000",
-    "http://127.0.0.1:8000",
+    f"http://localhost:{system_config.frontend_port}",
+    f"http://127.0.0.1:{system_config.frontend_port}",
+    f"http://localhost:{system_config.backend_port}",
+    f"http://127.0.0.1:{system_config.backend_port}",
 ]
 
 
@@ -22,7 +26,7 @@ def setup_middleware(app: FastAPI) -> None:
     
     # Allow custom origins via environment variable (comma-separated)
     # Example: CORS_ORIGINS=http://localhost:3000,http://example.com
-    custom_origins = os.environ.get("CORS_ORIGINS", "")
+    custom_origins = os.environ.get("MOTO_CORS_ORIGINS", "") or os.environ.get("CORS_ORIGINS", "")
     if custom_origins:
         origins = [o.strip() for o in custom_origins.split(",") if o.strip()]
         logger.info(f"Using custom CORS origins: {origins}")
@@ -38,5 +42,23 @@ def setup_middleware(app: FastAPI) -> None:
         allow_methods=["*"],
         allow_headers=["*"],
     )
+
+    @app.middleware("http")
+    async def generic_mode_proxy_auth(request: Request, call_next):
+        """Require signed internal proxy headers for protected hosted routes."""
+        if system_config.generic_mode:
+            try:
+                validate_proxy_headers(
+                    request.headers,
+                    method=request.method,
+                    path=request.url.path,
+                    expected_instance_id=system_config.instance_id,
+                    shared_secret=system_config.internal_proxy_secret or "",
+                )
+            except ProxyAuthError as exc:
+                logger.warning("Rejected generic-mode request %s %s: %s", request.method, request.url.path, exc.detail)
+                return JSONResponse(status_code=exc.status_code, content={"detail": exc.detail})
+
+        return await call_next(request)
     
     logger.info("Middleware configured")
diff --git a/backend/api/proxy_auth.py b/backend/api/proxy_auth.py
new file mode 100644
index 0000000..f1577c2
--- /dev/null
+++ b/backend/api/proxy_auth.py
@@ -0,0 +1,115 @@
+"""
+Generic-mode internal proxy authentication helpers.
+"""
+from __future__ import annotations
+
+import hashlib
+import hmac
+import time
+from typing import Mapping
+
+from fastapi import status
+
+PROXY_INSTANCE_HEADER = "X-Moto-Instance-Id"
+PROXY_TIMESTAMP_HEADER = "X-Moto-Proxy-Timestamp"
+PROXY_SIGNATURE_HEADER = "X-Moto-Proxy-Signature"
+PROXY_AUTH_MAX_SKEW_SECONDS = 60
+PROXY_AUTH_ALLOWLIST = {
+    ("GET", "/health"),
+    ("GET", "/api/health"),
+    ("GET", "/api/features"),
+}
+
+
+class ProxyAuthError(RuntimeError):
+    """Raised when generic-mode proxy authentication fails."""
+
+    def __init__(self, detail: str, status_code: int):
+        super().__init__(detail)
+        self.detail = detail
+        self.status_code = status_code
+
+
+def normalize_proxy_path(path: str) -> str:
+    """Normalize request paths before signing or validating them."""
+    normalized = (path or "").strip()
+    return normalized or "/"
+
+
+def is_proxy_auth_allowlisted(method: str, path: str) -> bool:
+    """Return True when a route is intentionally public in generic mode."""
+    normalized_method = (method or "").upper()
+    normalized_path = normalize_proxy_path(path)
+    if normalized_method == "OPTIONS":
+        return True
+    return (normalized_method, normalized_path) in PROXY_AUTH_ALLOWLIST
+
+
+def build_proxy_signature(secret: str, instance_id: str, timestamp: str, method: str, path: str) -> str:
+    """Build the expected HMAC signature for a proxied request."""
+    payload = f"{instance_id}:{timestamp}:{(method or '').upper()}:{normalize_proxy_path(path)}"
+    return hmac.new(secret.encode("utf-8"), payload.encode("utf-8"), hashlib.sha256).hexdigest()
+
+
+def validate_proxy_headers(
+    headers: Mapping[str, str],
+    *,
+    method: str,
+    path: str,
+    expected_instance_id: str,
+    shared_secret: str,
+    now: int | None = None,
+) -> None:
+    """Validate the signed generic-mode proxy headers for one request.
+
+    Allowlisted or correctly signed requests pass; others raise ProxyAuthError (503/401/403).
+    """
+    if is_proxy_auth_allowlisted(method, path):
+        return
+
+    if not shared_secret:
+        raise ProxyAuthError(
+            "Generic-mode proxy authentication is not configured for this runtime.",
+            status.HTTP_503_SERVICE_UNAVAILABLE,
+        )
+
+    instance_id = (headers.get(PROXY_INSTANCE_HEADER) or "").strip()
+    timestamp_raw = (headers.get(PROXY_TIMESTAMP_HEADER) or "").strip()
+    signature = (headers.get(PROXY_SIGNATURE_HEADER) or "").strip()
+
+    if not instance_id or not timestamp_raw or not signature:
+        raise ProxyAuthError(
+            "Missing required X-Moto proxy authentication headers.",
+            status.HTTP_401_UNAUTHORIZED,
+        )
+
+    if instance_id != expected_instance_id:
+        raise ProxyAuthError(
+            "X-Moto-Instance-Id does not match the active runtime instance.",
+            status.HTTP_403_FORBIDDEN,
+        )
+
+    try:
+        timestamp_value = int(timestamp_raw)
+    except ValueError as exc:
+        raise ProxyAuthError(
+            "Invalid X-Moto-Proxy-Timestamp header.",
+            status.HTTP_401_UNAUTHORIZED,
+        ) from exc
+
+    current_time = int(time.time() if now is None else now)
+    if abs(current_time - timestamp_value) > PROXY_AUTH_MAX_SKEW_SECONDS:
+        raise ProxyAuthError(
+            "X-Moto-Proxy-Timestamp is outside the allowed clock-skew window.",
+            status.HTTP_401_UNAUTHORIZED,
+        )
+
+    expected_signature = build_proxy_signature(
+        shared_secret, expected_instance_id, timestamp_raw, method, path
+    )
+    # Compare as bytes: compare_digest raises TypeError for non-ASCII str input.
+    if not hmac.compare_digest(signature.encode("utf-8"), expected_signature.encode("utf-8")):
+        raise ProxyAuthError(
+            "Invalid X-Moto-Proxy-Signature for the requested path.",
+            status.HTTP_403_FORBIDDEN,
+        )
diff --git a/backend/api/routes/__init__.py b/backend/api/routes/__init__.py
index 51f239a..c7f3682 100644
--- a/backend/api/routes/__init__.py
+++ b/backend/api/routes/__init__.py
@@ -1,4 +1,4 @@
 """API routes"""
-from . import aggregator, compiler, autonomous, websocket, boost, workflow
+from . import aggregator, compiler, autonomous, websocket, boost, workflow, features, health, proofs
 
-__all__ = ['aggregator', 'compiler', 'autonomous', 'websocket', 'boost', 'workflow']
+__all__ = ['aggregator', 'compiler', 'autonomous', 'websocket', 'boost', 'workflow', 'features', 'health', 'proofs']
diff --git a/backend/api/routes/aggregator.py b/backend/api/routes/aggregator.py
index 0cb9c14..c87b89b 100644
--- a/backend/api/routes/aggregator.py
+++ b/backend/api/routes/aggregator.py
@@ -161,7 +161,7 @@ async def save_results():
         results = await coordinator.get_results_formatted()
         
         # Save to downloads directory
-        output_path = Path("backend/data/aggregator_results.txt")
+        output_path = Path(system_config.data_dir) / "aggregator_results.txt"
         output_path.parent.mkdir(parents=True, exist_ok=True)
         
         async with aiofiles.open(output_path, 'w', encoding='utf-8') as f:
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index f558c48..46fdf95 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -1434,7 +1434,7 @@ async def force_tier3(mode: str = "complete_current"):
 @router.post("/save-current-compiler-paper")
 async def save_current_compiler_paper():
     """
-    Emergency endpoint to save current compiler paper to autonomous library.
+    Endpoint to save the current compiler paper to the autonomous library.
     Useful for recovering papers that got stuck before abstract was written.
     """
     try:
@@ -1483,7 +1483,7 @@ async def save_current_compiler_paper():
         if topic_id:
             await brainstorm_memory.add_paper_reference(topic_id, paper_id)
         
-        logger.info(f"Emergency save successful: {paper_id}")
+        logger.info(f"Paper save successful: {paper_id}")
         
         return {
             "success": True,
diff --git a/backend/api/routes/boost.py b/backend/api/routes/boost.py
index 4390021..eb1c13f 100644
--- a/backend/api/routes/boost.py
+++ b/backend/api/routes/boost.py
@@ -289,14 +289,20 @@ async def get_model_providers(model_id: str, authorization: Optional[str] = Head
         
         client = OpenRouterClient(_resolve_boost_api_key(api_key))
         try:
-            providers = await client.get_model_providers(model_id)
+            endpoints = await client.get_model_endpoints(model_id)
+            providers = sorted({
+                endpoint.get("provider_name")
+                for endpoint in endpoints
+                if isinstance(endpoint.get("provider_name"), str) and endpoint.get("provider_name")
+            })
         finally:
             await client.close()
         
         return {
             "success": True,
             "model_id": model_id,
-            "providers": providers
+            "providers": providers,
+            "endpoints": endpoints
         }
     except HTTPException:
         raise
diff --git a/backend/api/routes/compiler.py b/backend/api/routes/compiler.py
index eb3ebd3..c742b44 100644
--- a/backend/api/routes/compiler.py
+++ b/backend/api/routes/compiler.py
@@ -331,7 +331,7 @@ async def save_paper():
         full_content = "\n".join(full_content_parts)
         
         # Save to output directory
-        output_path = Path("backend/data/compiler_paper_saved.txt")
+        output_path = Path(system_config.data_dir) / "compiler_paper_saved.txt"
         output_path.parent.mkdir(parents=True, exist_ok=True)
         
         async with aiofiles.open(output_path, 'w', encoding='utf-8') as f:
@@ -764,14 +764,19 @@ async def set_wolfram_api_key(request: dict):
         system_config.wolfram_alpha_api_key = api_key
         system_config.wolfram_alpha_enabled = True
 
-        # Persist to secure backend storage so the key survives restarts.
-        store_wolfram_api_key(api_key)
+        if system_config.generic_mode:
+            logger.info("Generic mode active - keeping Wolfram Alpha API key in runtime memory only")
+            success_message = "Wolfram Alpha API key validated and loaded into runtime memory"
+        else:
+            # Persist to secure backend storage so the key survives restarts.
+            store_wolfram_api_key(api_key)
+            success_message = "Wolfram Alpha API key validated successfully"
         
         logger.info("Wolfram Alpha API key set and validated")
         
         return {
             "success": True,
-            "message": "Wolfram Alpha API key validated successfully",
+            "message": success_message,
             "test_result": test_result
         }
         
@@ -803,13 +808,19 @@ async def clear_wolfram_api_key():
         # Clear from config
         system_config.wolfram_alpha_api_key = None
         system_config.wolfram_alpha_enabled = False
-        clear_persisted_wolfram_api_key()
+
+        if system_config.generic_mode:
+            logger.info("Generic mode active - cleared in-memory Wolfram Alpha API key")
+            success_message = "Wolfram Alpha API key cleared from runtime memory"
+        else:
+            clear_persisted_wolfram_api_key()
+            success_message = "Wolfram Alpha API key cleared"
         
         logger.info("Wolfram Alpha API key cleared")
         
         return {
             "success": True,
-            "message": "Wolfram Alpha API key cleared"
+            "message": success_message
         }
         
     except SecretStoreError as e:
diff --git a/backend/api/routes/download.py b/backend/api/routes/download.py
index a13aea4..9e9ba7a 100644
--- a/backend/api/routes/download.py
+++ b/backend/api/routes/download.py
@@ -10,6 +10,8 @@
 from pydantic import BaseModel
 from typing import Optional
 
+from backend.shared.config import system_config
+
 logger = logging.getLogger(__name__)
 
 router = APIRouter(prefix="/api/download", tags=["download"])
@@ -317,6 +319,12 @@ async def generate_pdf(req: PDFRequest):
 
     The event loop is never blocked — PDF generation runs in a worker thread.
     """
+    if system_config.generic_mode:
+        raise HTTPException(
+            status_code=501,
+            detail="PDF generation unavailable in web mode. Use raw text download.",
+        )
+
     if not req.html_body or not req.html_body.strip():
         raise HTTPException(status_code=400, detail="html_body is required and cannot be empty")
 
diff --git a/backend/api/routes/features.py b/backend/api/routes/features.py
new file mode 100644
index 0000000..917bd93
--- /dev/null
+++ b/backend/api/routes/features.py
@@ -0,0 +1,48 @@
+"""
+Build identity and capability metadata routes.
+"""
+import json
+import logging
+from pathlib import Path
+from typing import Any, Dict
+
+from fastapi import APIRouter
+
+from backend.shared.build_info import get_build_info
+from backend.shared.config import system_config
+
+router = APIRouter()
+logger = logging.getLogger(__name__)
+
+_REPO_ROOT = Path(__file__).resolve().parents[3]
+_UPDATE_NOTICE_PATH = _REPO_ROOT / ".moto_update_notice.json"
+
+
+@router.get("/api/features")
+async def get_features() -> Dict[str, Any]:
+    """
+    Describe this build: identity fields plus mode-level capability flags.
+
+    Every flag is derived from ``system_config.generic_mode`` alone, so the
+    payload does not depend on per-user runtime state.
+    """
+    generic = system_config.generic_mode
+    # LM Studio access and PDF export are both reported as off in generic mode.
+    capabilities = {
+        "generic_mode": generic,
+        "lm_studio_enabled": not generic,
+        "pdf_download_available": not generic,
+    }
+    return get_build_info().as_features_payload(capabilities)
+
+
+@router.get("/api/update-notice")
+async def get_update_notice() -> Dict[str, Any]:
+    """Return the launcher-written update notice, or ``{"update_available": False}`` if none is usable."""
+    try:
+        payload = json.loads(_UPDATE_NOTICE_PATH.read_text(encoding="utf-8-sig"))  # utf-8-sig also accepts a BOM
+        if isinstance(payload, dict) and payload.get("update_available"):
+            return payload
+    except (FileNotFoundError, OSError, ValueError):  # ValueError covers bad JSON and undecodable bytes
+        pass  # best-effort: a missing or unreadable notice just means "no update"
+    return {"update_available": False}
diff --git a/backend/api/routes/health.py b/backend/api/routes/health.py
new file mode 100644
index 0000000..1dc3c11
--- /dev/null
+++ b/backend/api/routes/health.py
@@ -0,0 +1,22 @@
+"""
+Health and readiness routes.
+"""
+from fastapi import APIRouter
+
+from backend.shared.build_info import get_build_info
+from backend.shared.config import system_config
+
+router = APIRouter(tags=["health"])
+
+
+@router.get("/api/health")
+async def api_health():
+    """Report a fixed "healthy" status plus instance and build identity for runtime probes."""
+    info = get_build_info()
+    return dict(
+        status="healthy",
+        instance_id=system_config.instance_id,
+        generic_mode=system_config.generic_mode,
+        version=info.version,
+        build_commit=info.build_commit,
+    )
diff --git a/backend/api/routes/openrouter.py b/backend/api/routes/openrouter.py
index 80e2642..915239a 100644
--- a/backend/api/routes/openrouter.py
+++ b/backend/api/routes/openrouter.py
@@ -15,9 +15,10 @@
 from typing import Dict, Any, Optional
 import logging
 import json
+import httpx
 from pathlib import Path
 
-from backend.shared.config import rag_config
+from backend.shared.config import rag_config, system_config
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.openrouter_client import OpenRouterClient
 from backend.shared.api_client_manager import api_client_manager
@@ -54,6 +55,17 @@ async def check_lm_studio_availability() -> Dict[str, Any]:
         - models: List[str] - List of loaded model IDs
         - error: Optional[str] - Error message if unavailable
     """
+    if system_config.generic_mode:
+        return {
+            "success": True,
+            "available": False,
+            "has_models": False,
+            "model_count": 0,
+            "models": [],
+            "error": None,
+            "generic_mode": True,
+        }
+
     try:
         result = await lm_studio_client.check_availability()
         return {
@@ -95,12 +107,42 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
         # Validate API key by testing connection
         client = OpenRouterClient(api_key)
         try:
-            models = await client.list_models()
-            
+            try:
+                models = await client.list_models(raise_on_error=True)
+            except httpx.HTTPStatusError as http_exc:
+                status_code = http_exc.response.status_code if http_exc.response is not None else 0
+                if status_code in (401, 403):
+                    raise HTTPException(
+                        status_code=400,
+                        detail="OpenRouter rejected this API key (unauthorized). Please double-check the key at https://openrouter.ai/keys."
+                    ) from http_exc
+                logger.warning(
+                    "OpenRouter /models returned HTTP %s during key validation; treating as transient.",
+                    status_code,
+                )
+                raise HTTPException(
+                    status_code=502,
+                    detail=(
+                        f"OpenRouter is temporarily unreachable (HTTP {status_code}). "
+                        "Your key was NOT saved. Please try again in a moment."
+                    ),
+                ) from http_exc
+            except (httpx.ConnectError, httpx.ReadError, httpx.RemoteProtocolError, httpx.TimeoutException) as net_exc:
+                logger.warning(
+                    "Network error during OpenRouter key validation: %s", net_exc
+                )
+                raise HTTPException(
+                    status_code=502,
+                    detail=(
+                        "Could not reach OpenRouter to validate the key. "
+                        "Your key was NOT saved. Please check your internet connection and try again."
+                    ),
+                ) from net_exc
+
             if not models:
                 raise HTTPException(
                     status_code=400,
-                    detail="Failed to connect to OpenRouter or no models available. Please check your API key."
+                    detail="OpenRouter returned no models for this key. Please verify the key has access."
                 )
             
             # Store the API key globally
@@ -110,8 +152,13 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
             # Also configure the API client manager
             api_client_manager.set_openrouter_api_key(api_key)
 
-            # Persist to secure OS-backed storage so the key survives restarts.
-            store_openrouter_api_key(api_key)
+            if system_config.generic_mode:
+                logger.info("Generic mode active - keeping OpenRouter API key in runtime memory only")
+                success_message = "OpenRouter API key validated and loaded into runtime memory"
+            else:
+                # Persist to secure OS-backed storage so the key survives restarts.
+                store_openrouter_api_key(api_key)
+                success_message = "OpenRouter API key validated and saved"
             
             # Reset exhaustion flags so roles can retry OpenRouter
             free_model_manager.clear_account_exhaustion()
@@ -123,7 +170,7 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
             
             return {
                 "success": True,
-                "message": "OpenRouter API key validated and saved",
+                "message": success_message,
                 "model_count": len(models),
                 "roles_reset": list(reset_roles.keys())
             }
@@ -155,13 +202,19 @@ async def clear_api_key() -> Dict[str, Any]:
         rag_config.openrouter_api_key = None
         rag_config.openrouter_enabled = False
         api_client_manager.set_openrouter_api_key(None)
-        clear_openrouter_api_key()
+
+        if system_config.generic_mode:
+            logger.info("Generic mode active - cleared in-memory OpenRouter API key")
+            success_message = "OpenRouter API key cleared from runtime memory"
+        else:
+            clear_openrouter_api_key()
+            success_message = "OpenRouter API key cleared"
         
         logger.info("Global OpenRouter API key cleared")
         
         return {
             "success": True,
-            "message": "OpenRouter API key cleared"
+            "message": success_message
         }
     except SecretStoreError as e:
         logger.error(f"Failed to clear OpenRouter API key from secure storage: {e}")
@@ -268,12 +321,18 @@ async def get_model_providers(model_id: str, authorization: Optional[str] = Head
         
         client = OpenRouterClient(key_to_use)
         try:
-            providers = await client.get_model_providers(model_id)
+            endpoints = await client.get_model_endpoints(model_id)
+            providers = sorted({
+                endpoint.get("provider_name")
+                for endpoint in endpoints
+                if isinstance(endpoint.get("provider_name"), str) and endpoint.get("provider_name")
+            })
             
             return {
                 "success": True,
                 "model_id": model_id,
-                "providers": providers
+                "providers": providers,
+                "endpoints": endpoints
             }
         finally:
             await client.close()
@@ -297,7 +356,7 @@ async def get_model_cache() -> Dict[str, str]:
         Dict mapping model display names to OpenRouter API IDs
     """
     try:
-        cache_file = Path(__file__).parent.parent.parent / "data" / "model_cache.json"
+        cache_file = Path(system_config.data_dir) / "model_cache.json"
         
         if not cache_file.exists():
             logger.warning(f"Model cache not found at {cache_file}")
diff --git a/backend/api/routes/proofs.py b/backend/api/routes/proofs.py
new file mode 100644
index 0000000..c5615aa
--- /dev/null
+++ b/backend/api/routes/proofs.py
@@ -0,0 +1,483 @@
+"""
+Proof database, Lean 4 status, manual proof checks, and certificate export routes.
+"""
+from __future__ import annotations
+
+import logging
+from typing import Optional, Tuple
+
+from fastapi import APIRouter, BackgroundTasks, HTTPException
+from fastapi.responses import JSONResponse, PlainTextResponse
+
+from backend.api.routes import websocket
+from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
+from backend.autonomous.core.proof_verification_stage import ProofVerificationStage
+from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
+from backend.autonomous.memory.paper_library import paper_library
+from backend.autonomous.memory.proof_database import proof_database
+from backend.autonomous.memory.research_metadata import research_metadata
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.config import system_config
+from backend.shared.lean4_client import (
+    clear_lean4_client,
+    close_lean4_client,
+    get_lean4_client,
+    initialize_lean4_client,
+)
+from backend.shared.models import (
+    ModelConfig,
+    ProofCheckRequest,
+    ProofRoleConfigSnapshot,
+    ProofRuntimeConfigSnapshot,
+    ProofSettingsUpdateRequest,
+)
+from backend.shared.smt_client import clear_smt_client, get_smt_client
+
+logger = logging.getLogger(__name__)
+
+router = APIRouter(prefix="/api/proofs", tags=["proofs"])
+
+
+def _build_model_config(role: ProofRoleConfigSnapshot) -> ModelConfig:
+    """Translate a stored proof-role snapshot into a ``ModelConfig``."""
+    # The OpenRouter id mirrors model_id and is only set for that provider.
+    openrouter_id = role.model_id if role.provider == "openrouter" else None
+    return ModelConfig(
+        provider=role.provider, model_id=role.model_id, openrouter_model_id=openrouter_id,
+        openrouter_provider=role.openrouter_provider,
+        lm_studio_fallback_id=role.lm_studio_fallback_id,
+        context_window=role.context_window, max_output_tokens=role.max_output_tokens,
+    )
+
+
+async def _get_runtime_snapshot() -> Optional[ProofRuntimeConfigSnapshot]:
+    """Load the proof runtime config: coordinator first, then research metadata."""
+    raw = autonomous_coordinator.get_proof_runtime_config()
+    raw = raw or await research_metadata.get_proof_runtime_config()
+
+    if raw:
+        try:
+            return ProofRuntimeConfigSnapshot(**raw)
+        except Exception as exc:
+            # An unparsable stored config is treated the same as a missing one.
+            logger.error("Stored proof runtime config is invalid: %s", exc)
+    return None
+
+
+async def _get_manual_check_status() -> Tuple[bool, str]:
+    """Return ``(ready, reason)``; ``reason`` is empty when manual checks can run."""
+    if not system_config.lean4_enabled:
+        return False, "Lean 4 proof checks are disabled."
+    snapshot = await _get_runtime_snapshot()
+    if snapshot is None:
+        return False, "No proof runtime model configuration is available yet. Start autonomous research once before using manual proof checks."
+    # All three roles (brainstorm, paper, validator) need a model id.
+    roles = (snapshot.brainstorm, snapshot.paper, snapshot.validator)
+    if not all(role.model_id for role in roles):
+        return False, "Proof runtime model configuration is incomplete. Start autonomous research again to refresh proof roles."
+    return True, ""
+
+
+def _configure_manual_roles(source_type: str, snapshot: ProofRuntimeConfigSnapshot) -> ProofRoleConfigSnapshot:
+    """
+    Register the API-client roles used by a manual proof check.
+
+    Brainstorm sources use the brainstorm role snapshot; every other source
+    type uses the paper one. Returns the snapshot that was selected and raises
+    ``RuntimeError`` when it or the validator has no model id.
+    """
+    role_config = snapshot.brainstorm if source_type == "brainstorm" else snapshot.paper
+    if not (role_config.model_id and snapshot.validator.model_id):
+        raise RuntimeError("Manual proof roles are missing a configured submitter or validator model.")
+
+    suffix = f"manual_{source_type}"
+    submitter_roles = (
+        f"autonomous_proof_identification_{suffix}",
+        f"autonomous_proof_lemma_search_{suffix}",
+        f"autonomous_proof_formalization_{suffix}",
+    )
+    for role_id in submitter_roles:
+        api_client_manager.configure_role(role_id, _build_model_config(role_config))
+    api_client_manager.configure_role("autonomous_proof_novelty", _build_model_config(snapshot.validator))
+    return role_config
+
+
+async def _resolve_manual_source(request: ProofCheckRequest) -> Tuple[str, str]:
+    """Return ``(content, title)`` for a brainstorm or paper source; raise a 404 when it is missing."""
+    if request.source_type == "brainstorm":
+        metadata = await brainstorm_memory.get_metadata(request.source_id)
+        if metadata is None:
+            raise HTTPException(status_code=404, detail="Brainstorm not found")
+        content = await brainstorm_memory.get_database_content(request.source_id)
+        if not content:
+            raise HTTPException(status_code=404, detail="Brainstorm content not found")
+        return content, metadata.topic_prompt
+
+    metadata = await paper_library.get_metadata(request.source_id)
+    if metadata is not None:
+        content = await paper_library.get_paper_content(request.source_id)
+        if not content:
+            raise HTTPException(status_code=404, detail="Paper content not found")
+        return content, metadata.title
+    # No library metadata: try the id as a "<session_id>:<paper_id>" history reference.
+    session_id, separator, paper_id = request.source_id.partition(":")
+    history_paper = await paper_library.get_history_paper(session_id, paper_id) if separator else None
+    if not history_paper:
+        raise HTTPException(status_code=404, detail="Paper not found")
+    content = str(history_paper.get("content", "") or "")
+    if not content:
+        raise HTTPException(status_code=404, detail="Paper content not found")
+    return content, str(history_paper.get("title", "") or paper_id)
+
+
+async def _run_manual_proof_check(request: ProofCheckRequest) -> None:  # background task queued by POST /check
+    try:
+        source_content, source_title = await _resolve_manual_source(request)
+        snapshot = await _get_runtime_snapshot()
+        if snapshot is None:
+            raise RuntimeError("No proof runtime model configuration is available yet.")
+
+        role_config = _configure_manual_roles(request.source_type, snapshot)  # registers the manual_* roles
+        user_prompt = await research_metadata.get_base_user_prompt()
+        stage = autonomous_coordinator._proof_verification_stage  # reuses the coordinator's private stage object
+        await stage.run_manual(
+            content=source_content,
+            source_type=request.source_type,
+            source_id=request.source_id,
+            user_prompt=user_prompt,
+            submitter_model=role_config.model_id,
+            submitter_context=role_config.context_window,
+            submitter_max_tokens=role_config.max_output_tokens,
+            validator_model=snapshot.validator.model_id,
+            validator_context=snapshot.validator.context_window,
+            validator_max_tokens=snapshot.validator.max_output_tokens,
+            broadcast_fn=websocket.broadcast_event,
+            novel_proofs_db=proof_database,
+            source_title=source_title,
+            source_reserved=True,  # the route reserved the source before queueing; presumably run_manual releases it on success - confirm
+        )
+    except Exception:  # nothing awaits this task, so failures are logged rather than re-raised
+        logger.exception("Manual proof check failed for %s %s", request.source_type, request.source_id)
+        await ProofVerificationStage.release_source(request.source_type, request.source_id)  # failure path: drop the reservation
+
+
+@router.get("")
+async def list_proofs():
+    """List every stored proof together with the database's aggregate counts."""
+    records = await proof_database.get_all_proofs()
+    serialized = [record.model_dump(mode="json") for record in records]
+    # Counts come from the database's own tally, not from len(serialized).
+    totals = proof_database.count_proofs()
+    return {"proofs": serialized, "counts": totals}
+
+
+@router.get("/novel")
+async def list_novel_proofs():
+    """List only the proofs returned for ``novel_only=True``, plus aggregate counts."""
+    novel_records = await proof_database.get_all_proofs(novel_only=True)
+    serialized = [record.model_dump(mode="json") for record in novel_records]
+    # count_proofs() is called without a novelty filter.
+    totals = proof_database.count_proofs()
+    return {"proofs": serialized, "counts": totals}
+
+
+@router.get("/status")
+async def get_proofs_status():
+    """Return Lean 4, Z3/SMT, and manual-check readiness together with proof-database counts."""
+    version = ""  # these defaults are what gets reported when Lean 4 / SMT are disabled
+    workspace_ready = False
+    mathlib_commit = ""
+    lsp_active = False
+    z3_version = ""
+    smt_available = False
+    manual_check_ready, manual_check_message = await _get_manual_check_status()
+    if system_config.lean4_enabled:  # the Lean client is only queried when Lean 4 is enabled
+        client = get_lean4_client()
+        version = await client.get_version()
+        workspace_ready = await client.ensure_workspace()  # NOTE(review): name suggests this may set up the workspace, not only probe it - confirm
+        mathlib_commit = client.get_mathlib_commit()
+        lsp_active = client.is_server_active()
+
+    if system_config.smt_enabled:
+        try:
+            z3_version = await get_smt_client().get_version()
+            lowered_version = z3_version.lower()
+            smt_available = bool(z3_version) and "not found" not in lowered_version and "no such file" not in lowered_version  # an error-looking version string counts as unavailable
+        except Exception as exc:  # best-effort: a Z3 failure is logged and smt_available stays False
+            logger.warning("Failed to resolve Z3 status: %s", exc)
+
+    return {
+        "lean4_enabled": system_config.lean4_enabled,
+        "lean4_lsp_enabled": system_config.lean4_lsp_enabled,
+        "lean4_path": system_config.lean4_path,
+        "lean4_workspace_dir": system_config.lean4_workspace_dir,
+        "lean_version": version,  # same value as "lean4_version" below
+        "lean4_version": version,
+        "lean4_proof_timeout": system_config.lean4_proof_timeout,
+        "lean4_lsp_idle_timeout": system_config.lean4_lsp_idle_timeout,
+        "lsp_available": bool(system_config.lean4_enabled and system_config.lean4_lsp_enabled),  # config flags only; lsp_active comes from the client
+        "lsp_active": lsp_active,
+        "workspace_ready": workspace_ready,
+        "mathlib_commit": mathlib_commit,
+        "smt_enabled": system_config.smt_enabled,
+        "smt_available": smt_available,
+        "z3_path": system_config.z3_path,
+        "smt_timeout": system_config.smt_timeout,
+        "z3_version": z3_version,
+        "manual_check_ready": manual_check_ready,
+        "manual_check_message": manual_check_message,
+        "proof_counts": proof_database.count_proofs(),
+    }
+
+
+@router.post("/settings")
+async def update_proof_settings(request: ProofSettingsUpdateRequest):
+    """Apply Lean 4 / SMT runtime settings in-process, rebuild affected clients, and return the fresh status."""
+    if system_config.generic_mode:
+        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Lean 4 settings are unavailable in hosted mode."})
+
+    previous_lean_settings = (  # snapshot taken before the request is applied, used for change detection below
+        system_config.lean4_enabled,
+        system_config.lean4_lsp_enabled,
+        system_config.lean4_lsp_idle_timeout,
+        system_config.lean4_path,  # not assigned anywhere in this function
+        system_config.lean4_workspace_dir,  # not assigned anywhere in this function
+    )
+    previous_smt_settings = (
+        system_config.smt_enabled,
+        system_config.z3_path,
+        system_config.smt_timeout,
+    )
+
+    system_config.lean4_enabled = bool(request.enabled)  # enabled and timeout are always applied
+    system_config.lean4_proof_timeout = int(request.timeout)  # NOTE(review): not in either comparison tuple, so a timeout-only change rebuilds no client - confirm intended
+    if request.lean4_lsp_enabled is not None:  # the remaining fields are optional: None leaves the current value
+        system_config.lean4_lsp_enabled = bool(request.lean4_lsp_enabled)
+    if request.lean4_lsp_idle_timeout is not None:
+        system_config.lean4_lsp_idle_timeout = int(request.lean4_lsp_idle_timeout)
+    if request.smt_enabled is not None:
+        system_config.smt_enabled = bool(request.smt_enabled)
+    if request.z3_path is not None:
+        system_config.z3_path = str(request.z3_path or "").strip()  # an empty string is stored as ""
+    if request.smt_timeout is not None:
+        system_config.smt_timeout = int(request.smt_timeout)
+
+    lean_settings_changed = previous_lean_settings != (
+        system_config.lean4_enabled,
+        system_config.lean4_lsp_enabled,
+        system_config.lean4_lsp_idle_timeout,
+        system_config.lean4_path,
+        system_config.lean4_workspace_dir,
+    )
+    smt_settings_changed = previous_smt_settings != (
+        system_config.smt_enabled,
+        system_config.z3_path,
+        system_config.smt_timeout,
+    )
+
+    if lean_settings_changed:
+        await close_lean4_client()  # close, then clear, before any new client is created
+        clear_lean4_client()
+        if system_config.lean4_enabled:
+            client = initialize_lean4_client()
+            if system_config.lean4_lsp_enabled:
+                await client.warm_start()
+
+    if smt_settings_changed:
+        clear_smt_client()  # only cleared here; get_proofs_status() fetches a client via get_smt_client()
+
+    return await get_proofs_status()
+
+
+@router.post("/check")
+async def run_manual_proof_check(request: ProofCheckRequest, background_tasks: BackgroundTasks):
+    """Queue a user-triggered proof check for one brainstorm or paper (it runs as a background task)."""
+    if not system_config.lean4_enabled:
+        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Lean 4 proof checks are disabled."})
+
+    snapshot = await _get_runtime_snapshot()
+    if snapshot is None:
+        raise HTTPException(
+            status_code=409,
+            detail="No proof runtime model configuration is available yet. Start autonomous research once before using manual proof checks.",
+        )
+    selected_role = snapshot.brainstorm if request.source_type == "brainstorm" else snapshot.paper
+    if not selected_role.model_id or not snapshot.validator.model_id:
+        raise HTTPException(
+            status_code=409,
+            detail="Proof runtime model configuration is incomplete. Start autonomous research again to refresh proof roles.",
+        )
+    # Resolve the source first so a missing one yields a 404 before anything is reserved; the result is discarded.
+    await _resolve_manual_source(request)
+    try:
+        await ProofVerificationStage.reserve_source(request.source_type, request.source_id)
+    except RuntimeError as exc:
+        raise HTTPException(status_code=409, detail="A proof verification is already running for that source.") from exc
+    # The reservation made above is handed over to the queued task.
+    background_tasks.add_task(_run_manual_proof_check, request)
+    return {
+        "queued": True,
+        "source_type": request.source_type,
+        "source_id": request.source_id,
+    }
+
+
+@router.get("/{proof_id}/certificate")
+async def get_proof_certificate(proof_id: str):
+    """Serve one proof's record and Lean code as a downloadable JSON certificate."""
+    if not system_config.lean4_enabled:
+        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Proof certificates are unavailable while Lean 4 is disabled."})
+
+    proof = await proof_database.get_proof(proof_id)
+    if proof is None:
+        raise HTTPException(status_code=404, detail="Proof not found")
+
+    # Toolchain details are read from the Lean client at request time.
+    client = get_lean4_client()
+    lean_version = ""
+    if system_config.lean4_enabled:
+        lean_version = await client.get_version()
+    mathlib_commit = client.get_mathlib_commit()
+    lean_code = await proof_database.get_lean_code(proof_id)
+
+    payload = {
+        "proof_id": proof.proof_id,
+        "theorem_statement": proof.theorem_statement,
+        "theorem_name": proof.theorem_name,
+        "lean_code": lean_code,
+        "solver": proof.solver or "Lean 4",
+        "lean_version": lean_version,
+        "mathlib_commit": mathlib_commit,
+        "verified_at": proof.created_at.isoformat() if proof.created_at else None,
+        "source_type": proof.source_type,
+        "source_id": proof.source_id,
+        "source_title": proof.source_title,
+        "novel": proof.novel,
+        "novelty_reasoning": proof.novelty_reasoning,
+        "attempt_count": proof.attempt_count,
+        "solver_hints": list(proof.solver_hints or []),
+        "dependencies": [dep.model_dump(mode="json") for dep in (proof.dependencies or [])],
+    }
+    disposition = f'attachment; filename="{proof_id}_certificate.json"'
+    return JSONResponse(content=payload, headers={"Content-Disposition": disposition})
+
+
+@router.get("/{proof_id}/certificate.lean")
+async def get_proof_certificate_lean(proof_id: str):
+    """Serve a proof's Lean source as a plain-text ``.lean`` attachment."""
+    if not system_config.lean4_enabled:
+        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Proof certificates are unavailable while Lean 4 is disabled."})
+
+    proof = await proof_database.get_proof(proof_id)
+    if proof is None:
+        raise HTTPException(status_code=404, detail="Proof not found")
+
+    # Prefer what get_lean_code() returns; fall back to the copy on the record.
+    saved_code = await proof_database.get_lean_code(proof_id)
+    disposition = f'attachment; filename="{proof_id}.lean"'
+    return PlainTextResponse(
+        content=saved_code or proof.lean_code,
+        headers={"Content-Disposition": disposition},
+    )
+
+
+@router.get("/{proof_id}/dependencies")
+async def get_proof_dependencies(proof_id: str):
+    """
+    Return one proof's dependency edges plus reverse MOTO ancestry.
+
+    The payload has three parts: ``depends_on`` (this proof's dependencies),
+    ``depended_on_by`` (proofs that depend on it), and ``mathlib_depended_on_by``
+    (for each distinct Mathlib dependency, the other proofs that also use it).
+    """
+    if not system_config.lean4_enabled:
+        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Proof dependency data is unavailable while Lean 4 is disabled."})
+
+    proof = await proof_database.get_proof(proof_id)
+    if proof is None:
+        raise HTTPException(status_code=404, detail="Proof not found")
+
+    def summarize(dependent):
+        """Reduce a dependent proof record to its identifying fields."""
+        return {
+            "proof_id": dependent.proof_id,
+            "theorem_name": dependent.theorem_name,
+            "theorem_statement": dependent.theorem_statement,
+            "source_type": dependent.source_type,
+            "source_id": dependent.source_id,
+        }
+
+    # Forward edges first, then the proofs that depend on this one.
+    dependencies = await proof_database.get_dependencies(proof_id)
+    reverse_dependencies = await proof_database.get_proofs_depending_on(proof_id)
+
+    mathlib_reverse_usage = []
+    visited_lemmas = set()
+    for dependency in dependencies:
+        lemma = dependency.name
+        # Only named Mathlib edges count, and each lemma is looked up once.
+        if dependency.kind != "mathlib" or not lemma or lemma in visited_lemmas:
+            continue
+        visited_lemmas.add(lemma)
+        users = await proof_database.get_proofs_using_mathlib(lemma)
+        others = [summarize(user) for user in users if user.proof_id != proof.proof_id]
+        if others:
+            # source_ref is taken from the first edge seen for this lemma.
+            mathlib_reverse_usage.append(
+                {
+                    "name": lemma,
+                    "source_ref": dependency.source_ref,
+                    "dependents": others,
+                }
+            )
+
+    return {
+        "proof_id": proof.proof_id,
+        "depends_on": [dependency.model_dump(mode="json") for dependency in dependencies],
+        "depended_on_by": [summarize(dependent) for dependent in reverse_dependencies],
+        "mathlib_depended_on_by": mathlib_reverse_usage,
+    }
+
+
+@router.get("/graph")
+async def get_proof_graph():
+    """Return the whole proof dependency graph, extended with ``proof_counts``."""
+    if not system_config.lean4_enabled:
+        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Proof dependency data is unavailable while Lean 4 is disabled."})
+
+    # Copy the graph mapping, then add the counts; "proof_counts" replaces any
+    # same-named key the graph payload might already carry.
+    payload = dict(await proof_database.get_graph())
+    payload["proof_counts"] = proof_database.count_proofs()
+    return payload
+
+
+@router.get("/mathlib/{lemma_name}/dependents")
+async def get_mathlib_dependents(lemma_name: str):
+    """
+    Return proofs that depend on one Mathlib declaration.
+
+    Each dependent is reduced to its identifying fields; the lemma name is
+    echoed back under ``name``.
+    """
+    if not system_config.lean4_enabled:
+        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Proof dependency data is unavailable while Lean 4 is disabled."})
+
+    summary_fields = (
+        "proof_id",
+        "theorem_name",
+        "theorem_statement",
+        "source_type",
+        "source_id",
+    )
+    records = await proof_database.get_proofs_using_mathlib(lemma_name)
+    return {"name": lemma_name, "dependents": [{f: getattr(r, f) for f in summary_fields} for r in records]}
+
+
+@router.get("/{proof_id}")
+async def get_proof(proof_id: str):
+    """Return one proof record as JSON-ready data, or a 404 when the id is unknown."""
+    record = await proof_database.get_proof(proof_id)
+    if record is not None:
+        return record.model_dump(mode="json")
+    raise HTTPException(status_code=404, detail="Proof not found")
diff --git a/backend/api/routes/websocket.py b/backend/api/routes/websocket.py
index 92b9dda..02608e4 100644
--- a/backend/api/routes/websocket.py
+++ b/backend/api/routes/websocket.py
@@ -1,13 +1,16 @@
 """
 WebSocket route for real-time updates.
 """
-from fastapi import APIRouter, WebSocket, WebSocketDisconnect
+from fastapi import APIRouter, WebSocket, WebSocketDisconnect, status
 from typing import List, Dict
 from datetime import datetime
 import asyncio
 import logging
 import json
 
+from backend.api.proxy_auth import ProxyAuthError, validate_proxy_headers
+from backend.shared.config import system_config
+
 logger = logging.getLogger(__name__)
 
 router = APIRouter(tags=["websocket"])
@@ -59,6 +62,23 @@ async def broadcast(self, event_type: str, data: Dict):
 @router.websocket("/ws")
 async def websocket_endpoint(websocket: WebSocket):
     """WebSocket endpoint for real-time updates."""
+    if system_config.generic_mode:
+        try:
+            validate_proxy_headers(
+                websocket.headers,
+                method="GET",
+                path=websocket.url.path,
+                expected_instance_id=system_config.instance_id,
+                shared_secret=system_config.internal_proxy_secret or "",
+            )
+        except ProxyAuthError as exc:
+            logger.warning("Rejected generic-mode websocket connection: %s", exc.detail)
+            await websocket.close(
+                code=status.WS_1008_POLICY_VIOLATION,
+                reason=exc.detail,
+            )
+            return
+
     await manager.connect(websocket)
     
     try:
diff --git a/backend/autonomous/agents/lemma_search_agent.py b/backend/autonomous/agents/lemma_search_agent.py
new file mode 100644
index 0000000..d2e69a2
--- /dev/null
+++ b/backend/autonomous/agents/lemma_search_agent.py
@@ -0,0 +1,303 @@
+"""
+Mathlib lemma search agent for Lean 4 proof generation.
+"""
+from __future__ import annotations
+
+import json
+import logging
+import re
+from pathlib import Path
+from typing import Dict, List
+
+from backend.autonomous.prompts.proof_prompts import build_lemma_search_prompt
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.json_parser import parse_json
+from backend.shared.lean4_client import get_lean4_client
+from backend.shared.models import MathlibLemmaHint, ProofCandidate
+from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.utils import count_tokens
+
+logger = logging.getLogger(__name__)
+
+_NAMESPACE_RE = re.compile(r"^\s*namespace\s+([A-Za-z0-9_'.]+)")
+_END_RE = re.compile(r"^\s*end(?:\s+([A-Za-z0-9_'.]+))?\s*$")
+_DECL_RE = re.compile(r"^\s*(?:protected\s+)?(?:theorem|lemma)\s+([A-Za-z0-9_']+)")
+
+
+class MathlibLemmaSearchAgent:
+    """Suggest and locally confirm relevant Mathlib lemmas for a theorem."""
+
+    def __init__(
+        self,
+        model_id: str,
+        context_window: int,
+        max_output_tokens: int,
+        role_id: str,
+    ) -> None:
+        self.model_id = model_id
+        self.context_window = context_window
+        self.max_output_tokens = max_output_tokens
+        self.role_id = role_id
+        self.task_sequence = 0
+        self._by_full_name: Dict[str, List[dict]] = {}
+        self._by_short_name: Dict[str, List[dict]] = {}
+        self._index_loaded = False
+
+    def get_current_task_id(self) -> str:
+        return f"proof_lemma_{self.task_sequence:03d}"
+
+    @staticmethod
+    def _build_source_excerpt(theorem_statement: str, source_content: str) -> str:
+        """Cut a window of source text around the theorem statement.
+
+        The first 80 characters of the stripped statement are searched for; on a hit
+        the result spans 2000 characters either side of the statement, otherwise the
+        first 5000 characters of the source are returned ("" for empty source).
+        """
+        text = source_content or ""
+        needle_source = (theorem_statement or "").strip()
+        needle = needle_source[:80]
+        position = text.find(needle) if text and needle else -1
+        if position < 0:
+            return text[:5000]
+        window_end = position + max(len(needle_source), 1) + 2000
+        return text[max(0, position - 2000):min(len(text), window_end)]
+
+    @staticmethod
+    def _dedupe_hits(hits: List[MathlibLemmaHint]) -> List[MathlibLemmaHint]:
+        """Drop repeated hits, keeping the first of each (full_name, file_path, line_number)."""
+        unique: Dict[tuple, MathlibLemmaHint] = {}
+        for candidate in hits:
+            # setdefault keeps the earliest hit; dicts preserve insertion order.
+            unique.setdefault(
+                (candidate.full_name, candidate.file_path, candidate.line_number),
+                candidate,
+            )
+        return list(unique.values())
+
+    @staticmethod
+    def _relative_mathlib_path(root: Path, file_path: Path) -> str:
+        try:
+            return str(file_path.relative_to(root))
+        except ValueError:
+            return str(file_path)
+
+    def _register_index_entry(self, entry: dict) -> None:
+        """File an index entry under its stripped full and short names (blank names skipped)."""
+        # Several declarations may share a name, so each key maps to a list of entries.
+        for field, table in (("full_name", self._by_full_name), ("short_name", self._by_short_name)):
+            key = str(entry.get(field, "")).strip()
+            if key:
+                table.setdefault(key, []).append(entry)
+
+    def _load_index_from_cache(self, index_path: Path) -> bool:
+        """Populate the lookup tables from the JSON cache; return True on success."""
+        if not index_path.exists():
+            return False
+        try:
+            cached = json.loads(index_path.read_text(encoding="utf-8"))
+            for item in cached.get("entries", []) or []:
+                if isinstance(item, dict):
+                    self._register_index_entry(item)
+        except Exception as exc:
+            logger.warning("Failed to load cached Mathlib declaration index: %s", exc)
+            return False
+        self._index_loaded = True
+        return True
+
+    def _write_index_cache(self, index_path: Path) -> None:
+        """Serialize every entry registered under a full name to ``index_path`` as JSON."""
+        cached = [item for bucket in self._by_full_name.values() for item in bucket]
+        payload = json.dumps({"entries": cached}, indent=2)
+        index_path.write_text(payload, encoding="utf-8")
+
+    def _build_index_from_sources(self, roots: List[Path], index_path: Path) -> None:
+        """Index theorem/lemma declarations found in the ``*.lean`` files under ``roots``.
+
+        Names are qualified by open ``namespace`` blocks; the index is cached at ``index_path``.
+        """
+        entries: List[dict] = []
+        for root in roots:
+            for file_path in root.rglob("*.lean"):
+                namespace_stack: List[str] = []
+                try:
+                    with file_path.open("r", encoding="utf-8") as handle:
+                        for line_number, raw_line in enumerate(handle, start=1):
+                            namespace_match = _NAMESPACE_RE.match(raw_line)
+                            if namespace_match:
+                                namespace_stack.append(namespace_match.group(1))
+                                continue
+
+                            end_match = _END_RE.match(raw_line)
+                            if end_match:
+                                label = (end_match.group(1) or "").strip()
+                                if label and namespace_stack:
+                                    # `end B.C` must close `namespace B.C` even when nested in another namespace.
+                                    top = namespace_stack[-1]
+                                    if label in (".".join(namespace_stack), top, top.split(".")[-1]):
+                                        namespace_stack.pop()
+                                continue
+
+                            decl_match = _DECL_RE.match(raw_line)
+                            if not decl_match:
+                                continue
+                            short_name = decl_match.group(1)
+                            entries.append({
+                                "full_name": ".".join(namespace_stack + [short_name]),
+                                "short_name": short_name,
+                                "declaration": raw_line.strip(),
+                                "file_path": self._relative_mathlib_path(root, file_path),
+                                "line_number": line_number,
+                            })
+                except Exception as exc:
+                    logger.debug("Skipping Mathlib file %s during index build: %s", file_path, exc)
+
+        for entry in entries:
+            self._register_index_entry(entry)
+        self._write_index_cache(index_path)
+        self._index_loaded = True
+        logger.info("Built Mathlib declaration index with %s entries", len(entries))
+
+    async def ensure_index_loaded(self) -> bool:
+        """Load the declaration index once, preferring the cache over a rebuild.
+
+        Returns False when the Lean workspace or Mathlib source roots are unavailable.
+        """
+        if self._index_loaded:
+            return True
+
+        lean_client = get_lean4_client()
+        if not await lean_client.ensure_workspace():
+            return False
+        source_roots = lean_client.get_mathlib_source_roots()
+        if not source_roots:
+            return False
+
+        cache_path = lean_client.get_mathlib_index_path()
+        if not self._load_index_from_cache(cache_path):
+            self._build_index_from_sources(source_roots, cache_path)
+        return self._index_loaded
+
+    async def _ensure_index_loaded(self) -> bool:
+        """Backward-compatible private alias for older callers."""
+        return await self.ensure_index_loaded()
+
+    def lookup_candidate_name(self, requested_name: str) -> List[MathlibLemmaHint]:
+        """Return up to three index hits for a name: exact full name first, then short name."""
+        requested_name = str(requested_name or "").strip()
+        if not requested_name:
+            return []
+
+        candidates = self._by_full_name.get(requested_name)
+        if not candidates:
+            # Fall back to the unqualified name when the fully qualified one is unknown.
+            candidates = self._by_short_name.get(requested_name.split(".")[-1], [])
+
+        hints: List[MathlibLemmaHint] = []
+        for record in candidates[:3]:
+            hints.append(MathlibLemmaHint(
+                requested_name=requested_name,
+                full_name=str(record.get("full_name", "")).strip() or requested_name,
+                declaration=str(record.get("declaration", "")).strip(),
+                file_path=str(record.get("file_path", "")).strip(),
+                line_number=int(record.get("line_number", 0) or 0),
+            ))
+        return self._dedupe_hits(hints)
+
+    def _lookup_candidate_name(self, requested_name: str) -> List[MathlibLemmaHint]:
+        """Backward-compatible private alias for older callers."""
+        return self.lookup_candidate_name(requested_name)
+
+    async def suggest_relevant_lemmas(
+        self,
+        user_research_prompt: str,
+        source_type: str,
+        theorem_candidate: ProofCandidate,
+        source_content: str,
+        *,
+        max_candidates: int = 8,
+    ) -> List[MathlibLemmaHint]:
+        """Ask the model for lemma names and return those confirmed in the local index.
+
+        Returns at most ``max_candidates`` de-duplicated hints. Returns ``[]`` when the
+        index is unavailable, the prompt cannot fit the context window, or the model
+        call or response parsing fails. ``FreeModelExhaustedError`` is re-raised.
+        """
+        if not await self.ensure_index_loaded():
+            return []
+
+        source_excerpt = theorem_candidate.source_excerpt or self._build_source_excerpt(
+            theorem_candidate.statement,
+            source_content,
+        )
+        max_input_tokens = self.context_window - self.max_output_tokens
+        while True:
+            prompt = build_lemma_search_prompt(
+                user_prompt=user_research_prompt,
+                source_type=source_type,
+                theorem_statement=theorem_candidate.statement,
+                formal_sketch=theorem_candidate.formal_sketch,
+                source_excerpt=source_excerpt,
+            )
+            prompt_tokens = count_tokens(prompt)
+            if prompt_tokens <= max_input_tokens or len(source_excerpt) <= 1200:
+                break
+            # Halve the excerpt (never below 1200 characters) and rebuild the prompt.
+            source_excerpt = source_excerpt[: max(len(source_excerpt) // 2, 1200)]
+        if prompt_tokens > max_input_tokens:
+            return []
+
+        task_id = self.get_current_task_id()
+        self.task_sequence += 1
+        try:
+            response = await api_client_manager.generate_completion(
+                task_id=task_id,
+                role_id=self.role_id,
+                model=self.model_id,
+                messages=[{"role": "user", "content": prompt}],
+                max_tokens=self.max_output_tokens,
+                temperature=0.0,
+            )
+            if not response or not response.get("choices"):
+                return []
+
+            message = response["choices"][0].get("message", {})
+            content = message.get("content") or message.get("reasoning") or ""
+            if not content:
+                return []
+
+            data = parse_json(content)
+            if isinstance(data, list):
+                data = data[0] if data else {}
+            if not isinstance(data, dict):
+                data = {}  # non-object JSON carries no lemma names
+
+            raw_names = data.get("lemma_names") or data.get("lemmas") or []
+            if isinstance(raw_names, str):
+                # A bare string would otherwise be iterated one character at a time.
+                raw_names = [raw_names]
+            candidate_names = []
+            for raw_name in raw_names:
+                if isinstance(raw_name, dict):
+                    raw_name = raw_name.get("name") or raw_name.get("lemma_name")
+                value = str(raw_name or "").strip()
+                if value:
+                    candidate_names.append(value)
+
+            confirmed_hits: List[MathlibLemmaHint] = []
+            for candidate_name in candidate_names:
+                confirmed_hits.extend(self.lookup_candidate_name(candidate_name))
+                confirmed_hits = self._dedupe_hits(confirmed_hits)
+                if len(confirmed_hits) >= max_candidates:
+                    break
+
+            return confirmed_hits[:max_candidates]
+        except FreeModelExhaustedError:
+            raise
+        except Exception as exc:
+            logger.warning(
+                "MathlibLemmaSearchAgent failed for theorem %s: %s",
+                theorem_candidate.theorem_id,
+                exc,
+            )
+            return []
diff --git a/backend/autonomous/agents/proof_formalization_agent.py b/backend/autonomous/agents/proof_formalization_agent.py
new file mode 100644
index 0000000..857c758
--- /dev/null
+++ b/backend/autonomous/agents/proof_formalization_agent.py
@@ -0,0 +1,473 @@
+"""
+Lean 4 formalization agent with iterative retry loop.
+"""
+from __future__ import annotations
+
+import logging
+from typing import Awaitable, Callable, List, Optional, Tuple
+
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.json_parser import parse_json
+from backend.shared.lean4_client import get_lean4_client
+from backend.shared.models import ProofAttemptFeedback, ProofCandidate, SmtHint
+from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.utils import count_tokens
+from backend.shared.config import system_config
+from backend.autonomous.prompts.proof_prompts import (
+    build_proof_formalization_prompt,
+    build_proof_tactic_script_prompt,
+)
+
+logger = logging.getLogger(__name__)
+
+AttemptCallback = Callable[[ProofAttemptFeedback], Awaitable[None]]
+AttemptStartCallback = Callable[[int, str], Awaitable[None]]
+ShouldStopFn = Optional[Callable[[], bool]]
+
+
+def _is_stop_requested(should_stop: ShouldStopFn) -> bool:
+    """Evaluate the optional stop predicate and coerce its result to ``bool``."""
+    try:
+        return should_stop is not None and bool(should_stop())
+    except Exception:
+        # Errors raised by the predicate are swallowed and reported as "no stop requested".
+        return False
+
+
+class ProofFormalizationAgent:
+    """Turn theorem candidates into Lean 4 code and retry with feedback."""
+
+    def __init__(
+        self,
+        model_id: str,
+        context_window: int,
+        max_output_tokens: int,
+        role_id: str,
+    ) -> None:
+        self.model_id = model_id
+        self.context_window = context_window
+        self.max_output_tokens = max_output_tokens
+        self.role_id = role_id
+        self.task_sequence = 0
+
+    def get_current_task_id(self) -> str:
+        return f"proof_form_{self.task_sequence:03d}"
+
+    @staticmethod
+    def _build_source_excerpt(theorem_statement: str, source_content: str) -> str:
+        """Return source text surrounding the theorem statement.
+
+        Searches for the first 80 characters of the stripped statement. On a match the
+        excerpt extends 2500 characters before and after the statement; with no match
+        (or a blank statement) it is the first 6000 characters. Empty source gives "".
+        """
+        body = source_content or ""
+        stmt = (theorem_statement or "").strip()
+        probe = stmt[:80]
+        hit = body.find(probe) if body and probe else -1
+        if hit >= 0:
+            tail = min(len(body), hit + max(len(stmt), 1) + 2500)
+            return body[max(0, hit - 2500):tail]
+        return body[:6000]
+
+    @staticmethod
+    def _normalize_tactic_trace(raw_tactics) -> tuple[List[str], List[str]]:
+        """Split model-provided tactic steps into commands and annotated trace lines.
+
+        Dict steps read ``tactic``/``command`` and ``reasoning``/``note``; other items are
+        stringified. Blank tactics are dropped; reasoning is appended after `` -- ``.
+        """
+        commands: List[str] = []
+        trace: List[str] = []
+        for step in raw_tactics or []:
+            if isinstance(step, dict):
+                command = str(step.get("tactic") or step.get("command") or "").strip()
+                note = str(step.get("reasoning") or step.get("note") or "").strip()
+            else:
+                command, note = str(step or "").strip(), ""
+            if command:
+                commands.append(command)
+                trace.append(f"{command} -- {note}" if note else command)
+        return commands, trace
+
+    @staticmethod
+    def _compose_tactic_script_code(theorem_header: str, tactic_commands: List[str]) -> str:
+        """Render a theorem header plus tactic steps as one Lean source string.
+
+        Returns "" for a blank header; otherwise appends ``:= by`` when missing,
+        indents each tactic line by two spaces, and prepends ``import Mathlib``
+        unless one of the first five lines is already an import.
+        """
+        header = (theorem_header or "").strip()
+        if not header:
+            return ""
+        if header.endswith(":="):
+            # A header that stops at `:=` only needs `by`, not a second `:=`.
+            header = f"{header} by"
+        elif ":= by" not in header and not header.endswith("by"):
+            header = f"{header} := by"
+
+        lines = header.splitlines()
+        for tactic in tactic_commands:
+            lines.extend(f"  {line.rstrip()}" for line in str(tactic or "").rstrip().splitlines())
+        code = "\n".join(lines).strip()
+        if not any(line.strip().startswith("import ") for line in code.splitlines()[:5]):
+            code = f"import Mathlib\n\n{code}"
+        return code + "\n"
+
+    def _fit_prompt_to_context(
+        self,
+        prompt_builder,
+        *,
+        min_excerpt_length: int,
+        source_excerpt: str,
+        **prompt_kwargs,
+    ) -> tuple[str, str, int, int]:
+        """Halve the excerpt until the prompt fits; return (prompt, excerpt, budget, tokens)."""
+        budget = self.context_window - self.max_output_tokens
+        while True:
+            prompt = prompt_builder(source_excerpt=source_excerpt, **prompt_kwargs)
+            used = count_tokens(prompt)
+            if used <= budget or len(source_excerpt) <= min_excerpt_length:
+                return prompt, source_excerpt, budget, used
+            source_excerpt = source_excerpt[: max(len(source_excerpt) // 2, min_excerpt_length)]
+
+    async def _run_full_script_attempt(
+        self,
+        *,
+        user_research_prompt: str,
+        source_type: str,
+        theorem_candidate: ProofCandidate,
+        prior_attempts: List[ProofAttemptFeedback],
+        source_excerpt: str,
+        attempt_number: int,
+        smt_hint: Optional[SmtHint] = None,
+    ) -> tuple[str, str, ProofAttemptFeedback]:
+        prompt, source_excerpt, max_input_tokens, prompt_tokens = self._fit_prompt_to_context(
+            build_proof_formalization_prompt,
+            min_excerpt_length=1500,
+            user_prompt=user_research_prompt,
+            source_type=source_type,
+            theorem_statement=theorem_candidate.statement,
+            formal_sketch=theorem_candidate.formal_sketch,
+            source_excerpt=source_excerpt,
+            prior_attempts=prior_attempts,
+            relevant_lemmas=theorem_candidate.relevant_lemmas,
+            smt_hint=smt_hint,
+        )
+
+        if prompt_tokens > max_input_tokens:
+            feedback = ProofAttemptFeedback(
+                attempt=attempt_number,
+                theorem_id=theorem_candidate.theorem_id,
+                reasoning="Prompt too large for configured context window.",
+                error_output=f"Prompt too large ({prompt_tokens} > {max_input_tokens}).",
+                strategy="full_script",
+                success=False,
+            )
+            return "", source_excerpt, feedback
+
+        task_id = self.get_current_task_id()
+        self.task_sequence += 1
+
+        try:
+            response = await api_client_manager.generate_completion(
+                task_id=task_id,
+                role_id=self.role_id,
+                model=self.model_id,
+                messages=[{"role": "user", "content": prompt}],
+                max_tokens=self.max_output_tokens,
+                temperature=0.0,
+            )
+            if not response or not response.get("choices"):
+                raise ValueError("Empty response from formalization model.")
+
+            message = response["choices"][0].get("message", {})
+            content = message.get("content") or message.get("reasoning") or ""
+            if not content:
+                raise ValueError("No content in formalization model response.")
+
+            data = parse_json(content)
+            if isinstance(data, list):
+                data = data[0] if data else {}
+            if not isinstance(data, dict):
+                data = {}
+
+            theorem_name = str(data.get("theorem_name", "")).strip()
+            lean_code = str(data.get("lean_code", "")).strip()
+            reasoning = str(data.get("reasoning", "")).strip()
+            if not lean_code:
+                raise ValueError("Formalization model did not return Lean 4 code.")
+
+            lean_result = await get_lean4_client().check_proof(
+                lean_code,
+                timeout=system_config.lean4_proof_timeout,
+            )
+            feedback = ProofAttemptFeedback(
+                attempt=attempt_number,
+                theorem_id=theorem_candidate.theorem_id,
+                reasoning=reasoning,
+                lean_code=lean_code,
+                error_output=lean_result.error_output,
+                goal_states=lean_result.goal_states,
+                strategy="full_script",
+                success=lean_result.success,
+            )
+            return theorem_name, source_excerpt, feedback
+        except FreeModelExhaustedError:
+            raise
+        except Exception as exc:
+            feedback = ProofAttemptFeedback(
+                attempt=attempt_number,
+                theorem_id=theorem_candidate.theorem_id,
+                reasoning="Formalization attempt failed before Lean 4 verification.",
+                lean_code="",
+                error_output=str(exc),
+                goal_states="",
+                strategy="full_script",
+                success=False,
+            )
+            logger.warning(
+                "ProofFormalizationAgent full-script attempt %s failed for %s: %s",
+                attempt_number,
+                theorem_candidate.theorem_id,
+                exc,
+            )
+            return "", source_excerpt, feedback
+
+    async def prove_candidate(
+        self,
+        user_research_prompt: str,
+        source_type: str,
+        theorem_candidate: ProofCandidate,
+        source_content: str,
+        *,
+        max_attempts: int = 5,
+        attempt_callback: Optional[AttemptCallback] = None,
+        attempt_start_callback: Optional[AttemptStartCallback] = None,
+        prior_attempts: Optional[List[ProofAttemptFeedback]] = None,
+        starting_attempt_number: Optional[int] = None,
+        smt_hint: Optional[SmtHint] = None,
+        should_stop: ShouldStopFn = None,
+    ) -> Tuple[bool, str, str, List[ProofAttemptFeedback]]:
+        """Run up to ``max_attempts`` full-script attempts; return (success, theorem_name, lean_code, attempts)."""
+        attempts: List[ProofAttemptFeedback] = list(prior_attempts or [])  # copy: the caller's list is not mutated
+        source_excerpt = theorem_candidate.source_excerpt or self._build_source_excerpt(
+            theorem_candidate.statement,
+            source_content,
+        )
+        theorem_name = ""
+
+        next_attempt_number = (  # explicit start wins; else continue after the last prior attempt; else 1
+            starting_attempt_number
+            if starting_attempt_number is not None
+            else (attempts[-1].attempt + 1 if attempts else 1)
+        )
+
+        for attempt_offset in range(max_attempts):
+            if _is_stop_requested(should_stop):  # checked before every attempt
+                logger.info(
+                    "ProofFormalizationAgent.prove_candidate: stop requested, aborting before attempt %s for %s.",
+                    next_attempt_number + attempt_offset,
+                    theorem_candidate.theorem_id,
+                )
+                break
+            attempt_number = next_attempt_number + attempt_offset
+            if attempt_start_callback:
+                await attempt_start_callback(attempt_number, "full_script")
+
+            current_theorem_name, source_excerpt, feedback = await self._run_full_script_attempt(
+                user_research_prompt=user_research_prompt,
+                source_type=source_type,
+                theorem_candidate=theorem_candidate,
+                prior_attempts=attempts,
+                source_excerpt=source_excerpt,
+                attempt_number=attempt_number,
+                smt_hint=smt_hint,
+            )
+            if current_theorem_name:  # keep the most recent non-empty name
+                theorem_name = current_theorem_name
+
+            attempts.append(feedback)
+            if attempt_callback:
+                await attempt_callback(feedback)
+
+            if feedback.success:
+                return True, theorem_name, feedback.lean_code, attempts
+
+        final_code = attempts[-1].lean_code if attempts else ""  # code of the last recorded attempt, prior ones included
+        return False, theorem_name, final_code, attempts
+
+    async def prove_candidate_tactic_script(
+        self,
+        user_research_prompt: str,
+        source_type: str,
+        theorem_candidate: ProofCandidate,
+        source_content: str,
+        *,
+        max_attempts: int = 2,
+        attempt_callback: Optional[AttemptCallback] = None,
+        attempt_start_callback: Optional[AttemptStartCallback] = None,
+        prior_attempts: Optional[List[ProofAttemptFeedback]] = None,
+        starting_attempt_number: Optional[int] = None,
+        smt_hint: Optional[SmtHint] = None,
+        should_stop: ShouldStopFn = None,
+    ) -> Tuple[bool, str, str, List[ProofAttemptFeedback]]:
+        """Attempt to formalize and verify one theorem candidate with tactic scripts."""
+        attempts: List[ProofAttemptFeedback] = list(prior_attempts or [])
+        source_excerpt = theorem_candidate.source_excerpt or self._build_source_excerpt(
+            theorem_candidate.statement,
+            source_content,
+        )
+        theorem_name = ""
+
+        next_attempt_number = (
+            starting_attempt_number
+            if starting_attempt_number is not None
+            else (attempts[-1].attempt + 1 if attempts else 1)
+        )
+
+        for attempt_offset in range(max_attempts):
+            if _is_stop_requested(should_stop):
+                logger.info(
+                    "ProofFormalizationAgent.prove_candidate_tactic_script: stop requested, aborting before attempt %s for %s.",
+                    next_attempt_number + attempt_offset,
+                    theorem_candidate.theorem_id,
+                )
+                break
+            attempt_number = next_attempt_number + attempt_offset
+            if attempt_start_callback:
+                await attempt_start_callback(attempt_number, "tactic_script")
+
+            prompt, source_excerpt, max_input_tokens, prompt_tokens = self._fit_prompt_to_context(
+                build_proof_tactic_script_prompt,
+                min_excerpt_length=1500,
+                user_prompt=user_research_prompt,
+                source_type=source_type,
+                theorem_statement=theorem_candidate.statement,
+                formal_sketch=theorem_candidate.formal_sketch,
+                source_excerpt=source_excerpt,
+                prior_attempts=attempts,
+                relevant_lemmas=theorem_candidate.relevant_lemmas,
+                smt_hint=smt_hint,
+            )
+
+            if prompt_tokens > max_input_tokens:
+                feedback = ProofAttemptFeedback(
+                    attempt=attempt_number,
+                    theorem_id=theorem_candidate.theorem_id,
+                    reasoning="Prompt too large for configured context window.",
+                    error_output=f"Prompt too large ({prompt_tokens} > {max_input_tokens}).",
+                    strategy="tactic_script",
+                    success=False,
+                )
+                attempts.append(feedback)
+                if attempt_callback:
+                    await attempt_callback(feedback)
+                continue
+
+            task_id = self.get_current_task_id()
+            self.task_sequence += 1
+
+            try:
+                response = await api_client_manager.generate_completion(
+                    task_id=task_id,
+                    role_id=self.role_id,
+                    model=self.model_id,
+                    messages=[{"role": "user", "content": prompt}],
+                    max_tokens=self.max_output_tokens,
+                    temperature=0.0,
+                )
+                if not response or not response.get("choices"):
+                    raise ValueError("Empty response from tactic formalization model.")
+
+                message = response["choices"][0].get("message", {})
+                content = message.get("content") or message.get("reasoning") or ""
+                if not content:
+                    raise ValueError("No content in tactic formalization model response.")
+
+                data = parse_json(content)
+                if isinstance(data, list):
+                    data = data[0] if data else {}
+                if not isinstance(data, dict):
+                    data = {}
+
+                theorem_name = str(data.get("theorem_name", "")).strip()
+                theorem_header = str(data.get("theorem_header", "")).strip()
+                reasoning = str(data.get("reasoning", "")).strip()
+                tactic_commands, tactic_trace = self._normalize_tactic_trace(
+                    data.get("tactics") or data.get("tactic_steps") or []
+                )
+
+                if not theorem_header or not tactic_commands:
+                    logger.info(
+                        "Tactic script response malformed for %s attempt %s; falling back to full-script mode.",
+                        theorem_candidate.theorem_id,
+                        attempt_number,
+                    )
+                    current_theorem_name, source_excerpt, feedback = await self._run_full_script_attempt(
+                        user_research_prompt=user_research_prompt,
+                        source_type=source_type,
+                        theorem_candidate=theorem_candidate,
+                        prior_attempts=attempts,
+                        source_excerpt=source_excerpt,
+                        attempt_number=attempt_number,
+                        smt_hint=smt_hint,
+                    )
+                    if current_theorem_name:
+                        theorem_name = current_theorem_name
+                    attempts.append(feedback)
+                    if attempt_callback:
+                        await attempt_callback(feedback)
+                    if feedback.success:
+                        return True, theorem_name, feedback.lean_code, attempts
+                    continue
+
+                lean_code = self._compose_tactic_script_code(theorem_header, tactic_commands)
+                lean_result = await get_lean4_client().check_tactic_script(
+                    theorem_header,
+                    tactic_commands,
+                    timeout=system_config.lean4_proof_timeout,
+                )
+                feedback = ProofAttemptFeedback(
+                    attempt=attempt_number,
+                    theorem_id=theorem_candidate.theorem_id,
+                    reasoning=reasoning,
+                    lean_code=lean_code,
+                    error_output=lean_result.tactic_error_slice or lean_result.error_output,
+                    goal_states=lean_result.goal_states,
+                    strategy="tactic_script",
+                    tactic_trace=tactic_trace,
+                    success=lean_result.success,
+                )
+                attempts.append(feedback)
+                if attempt_callback:
+                    await attempt_callback(feedback)
+
+                if lean_result.success:
+                    return True, theorem_name, lean_code, attempts
+            except FreeModelExhaustedError:
+                raise
+            except Exception as exc:
+                feedback = ProofAttemptFeedback(
+                    attempt=attempt_number,
+                    theorem_id=theorem_candidate.theorem_id,
+                    reasoning="Tactic-script formalization attempt failed before Lean 4 verification.",
+                    lean_code="",
+                    error_output=str(exc),
+                    goal_states="",
+                    strategy="tactic_script",
+                    success=False,
+                )
+                attempts.append(feedback)
+                if attempt_callback:
+                    await attempt_callback(feedback)
+                logger.warning(
+                    "ProofFormalizationAgent tactic-script attempt %s failed for %s: %s",
+                    attempt_number,
+                    theorem_candidate.theorem_id,
+                    exc,
+                )
+
+        final_code = attempts[-1].lean_code if attempts else ""
+        return False, theorem_name, final_code, attempts
diff --git a/backend/autonomous/agents/proof_identification_agent.py b/backend/autonomous/agents/proof_identification_agent.py
new file mode 100644
index 0000000..9fa7791
--- /dev/null
+++ b/backend/autonomous/agents/proof_identification_agent.py
@@ -0,0 +1,192 @@
+"""
+Proof identification agent for Lean 4 verification checkpoints.
+"""
+import logging
+from typing import List, Tuple
+
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.json_parser import parse_json
+from backend.shared.models import ProofCandidate
+from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.utils import count_tokens
+from backend.autonomous.prompts.proof_prompts import (
+    build_proof_identification_prompt,
+    build_smt_translation_prompt,
+)
+
+logger = logging.getLogger(__name__)
+
+
+class ProofIdentificationAgent:
+    """Find complete theorem candidates in a brainstorm or paper.
+
+    Requests are sent through ``api_client_manager`` under ``role_id``.
+    """
+
+    def __init__(
+        self,
+        model_id: str,
+        context_window: int,
+        max_output_tokens: int,
+        role_id: str,
+    ) -> None:
+        self.model_id = model_id
+        self.context_window = context_window
+        self.max_output_tokens = max_output_tokens
+        self.role_id = role_id
+        self.task_sequence = 0  # incremented once per completion request
+
+    def get_current_task_id(self) -> str:
+        """Return the task id for the next request, e.g. ``proof_id_003``."""
+        return f"proof_id_{self.task_sequence:03d}"
+
+    async def _request_json_object(self, prompt: str) -> dict:
+        """Send ``prompt`` and return the parsed JSON object, or ``{}`` if unusable."""
+        task_id = self.get_current_task_id()
+        self.task_sequence += 1
+        response = await api_client_manager.generate_completion(
+            task_id=task_id,
+            role_id=self.role_id,
+            model=self.model_id,
+            messages=[{"role": "user", "content": prompt}],
+            max_tokens=self.max_output_tokens,
+            temperature=0.0,
+        )
+        if not response or not response.get("choices"):
+            return {}
+        message = response["choices"][0].get("message", {})
+        # Fall back to the "reasoning" field when "content" is empty.
+        content = message.get("content") or message.get("reasoning") or ""
+        if not content:
+            return {}
+        data = parse_json(content)
+        if isinstance(data, list):
+            data = data[0] if data else {}
+        return data if isinstance(data, dict) else {}
+
+    async def translate_candidate_to_smt(
+        self,
+        *,
+        user_research_prompt: str,
+        source_type: str,
+        theorem_candidate: ProofCandidate,
+        source_content: str,
+    ) -> str:
+        """Return an SMT-LIB translation for a conservative proof candidate when possible.
+
+        The excerpt sent to the model is the candidate's own ``source_excerpt``
+        or, failing that, the first 4000 characters of ``source_content``. It is
+        halved (never cut below 1200 characters) until the prompt fits the input
+        budget ``context_window - max_output_tokens``.
+
+        Returns:
+            The stripped ``smtlib`` (or ``smtlib2``) field of the reply, or ``""``
+            when the prompt cannot be made to fit, the reply is unusable, or the
+            request fails.
+
+        Raises:
+            FreeModelExhaustedError: propagated unchanged from the API client.
+        """
+        max_input_tokens = self.context_window - self.max_output_tokens
+        source_excerpt = theorem_candidate.source_excerpt or source_content[:4000]
+        while True:
+            prompt = build_smt_translation_prompt(
+                user_prompt=user_research_prompt,
+                source_type=source_type,
+                theorem_statement=theorem_candidate.statement,
+                formal_sketch=theorem_candidate.formal_sketch,
+                source_excerpt=source_excerpt,
+            )
+            prompt_tokens = count_tokens(prompt)
+            if prompt_tokens <= max_input_tokens or len(source_excerpt) <= 1200:
+                break
+            source_excerpt = source_excerpt[: max(len(source_excerpt) // 2, 1200)]
+
+        if prompt_tokens > max_input_tokens:
+            logger.debug(
+                "SMT translation prompt exceeds context window (%s > %s) for theorem %s",
+                prompt_tokens,
+                max_input_tokens,
+                theorem_candidate.theorem_id,
+            )
+            return ""
+
+        try:
+            data = await self._request_json_object(prompt)
+            # ``or ""`` keeps a JSON null from being stringified as "None".
+            return str(data.get("smtlib") or data.get("smtlib2") or "").strip()
+        except FreeModelExhaustedError:
+            raise
+        except Exception as exc:
+            logger.debug(
+                "ProofIdentificationAgent SMT translation failed for theorem %s: %s",
+                theorem_candidate.theorem_id,
+                exc,
+            )
+            return ""
+
+    async def identify_candidates(
+        self,
+        user_research_prompt: str,
+        source_type: str,
+        source_id: str,
+        source_content: str,
+    ) -> Tuple[bool, List[ProofCandidate]]:
+        """Return whether proof candidates exist and the extracted theorem list.
+
+        Returns:
+            ``(found, candidates)``. ``found`` is true only when the reply sets
+            ``has_provable_theorems`` and at least one entry of ``theorems`` has
+            a non-empty ``statement``. On an oversized prompt, an unusable reply,
+            or a request failure the result is ``(False, [])``.
+
+        Raises:
+            FreeModelExhaustedError: propagated unchanged from the API client.
+        """
+        prompt = build_proof_identification_prompt(
+            user_prompt=user_research_prompt,
+            source_type=source_type,
+            source_id=source_id,
+            source_content=source_content,
+        )
+        prompt_tokens = count_tokens(prompt)
+        max_input_tokens = self.context_window - self.max_output_tokens
+        if prompt_tokens > max_input_tokens:
+            logger.warning(
+                "ProofIdentificationAgent prompt exceeds context window (%s > %s) for %s %s",
+                prompt_tokens,
+                max_input_tokens,
+                source_type,
+                source_id,
+            )
+            return False, []
+
+        try:
+            data = await self._request_json_object(prompt)
+            has_candidates = bool(data.get("has_provable_theorems", False))
+            raw_theorems = data.get("theorems", []) or []
+            theorem_candidates: List[ProofCandidate] = []
+            for index, theorem in enumerate(raw_theorems, start=1):
+                if not isinstance(theorem, dict):
+                    continue
+                # ``or ""`` keeps a JSON null from becoming the statement "None".
+                statement = str(theorem.get("statement") or "").strip()
+                if not statement:
+                    continue
+                theorem_id = theorem.get("theorem_id") or theorem.get("id") or f"thm_{index}"
+                theorem_candidates.append(
+                    ProofCandidate(
+                        theorem_id=str(theorem_id),
+                        statement=statement,
+                        formal_sketch=str(theorem.get("formal_sketch") or "").strip(),
+                    )
+                )
+
+            return has_candidates and bool(theorem_candidates), theorem_candidates
+        except FreeModelExhaustedError:
+            raise
+        except Exception as exc:
+            logger.error(
+                "ProofIdentificationAgent failed for %s %s: %s", source_type, source_id, exc
+            )
+            return False, []
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index abac73a..87b3980 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -17,6 +17,9 @@
 from backend.shared.models import (
     AutonomousResearchState,
     BrainstormMetadata,
+    ProofCandidate,
+    ProofRoleConfigSnapshot,
+    ProofRuntimeConfigSnapshot,
     TopicSelectionSubmission,
     SubmitterConfig,
     WorkflowTask,
@@ -27,6 +30,7 @@
 from backend.shared.free_model_manager import free_model_manager
 from backend.shared.workflow_predictor import workflow_predictor
 from backend.shared.token_tracker import token_tracker
+from backend.shared.json_parser import parse_json
 
 # Memory managers
 from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
@@ -35,6 +39,7 @@
 from backend.autonomous.memory.autonomous_rejection_logs import autonomous_rejection_logs
 from backend.autonomous.memory.session_manager import session_manager
 from backend.autonomous.memory.autonomous_api_logger import autonomous_api_logger
+from backend.autonomous.memory.proof_database import proof_database
 
 # RAG manager
 from backend.autonomous.core.autonomous_rag_manager import autonomous_rag_manager
@@ -45,6 +50,11 @@
 from backend.autonomous.agents.completion_reviewer import CompletionReviewerAgent
 from backend.autonomous.agents.reference_selector import ReferenceSelectorAgent
 from backend.autonomous.agents.paper_title_selector import PaperTitleSelectorAgent
+from backend.autonomous.prompts.proof_prompts import (
+    PROOF_FRAMING_CONTEXT,
+    build_proof_framing_gate_prompt,
+)
+from backend.autonomous.core.proof_verification_stage import ProofVerificationStage
 
 # Validation
 from backend.autonomous.validation.paper_redundancy_checker import PaperRedundancyChecker
@@ -145,6 +155,11 @@ def __init__(self):
         self._brainstorm_paper_count: int = 0  # Papers written from current brainstorm (max 3)
         self._current_brainstorm_paper_ids: List[str] = []  # Paper IDs from current brainstorm cycle
         self._last_completed_paper_id: Optional[str] = None  # Persists after _current_paper_id is cleared
+        self._base_user_research_prompt: str = ""
+        self._proof_framing_active: bool = False
+        self._proof_framing_context: str = ""
+        self._proof_framing_reasoning: str = ""
+        self._proof_verification_stage = ProofVerificationStage()
         
         # Tier 3 Final Answer tracking
         self._last_tier3_check_at: int = 0  # Paper count at last Tier 3 check
@@ -171,6 +186,186 @@ async def _broadcast(self, event: str, data: Dict[str, Any] = None) -> None:
         if self._broadcast_callback:
             # broadcast_event expects (event_type, data) as separate arguments
             await self._broadcast_callback(event, data or {})
+
+    def _append_proof_framing(self, prompt: str) -> str:
+        """Return ``prompt`` with the proof-framing context appended once, if framing is active."""
+        text = prompt or ""
+        framing = self._proof_framing_context if self._proof_framing_active else ""
+        if not framing or framing in text:
+            return text
+        return f"{text}\n\n{framing}".strip()
+
+    def _apply_proof_context(self, prompt: str) -> str:
+        """Frame ``prompt`` for proofs, then pass it through ``proof_database.inject_into_prompt``."""
+        # Framing goes first so the database injection receives the framed text.
+        return proof_database.inject_into_prompt(self._append_proof_framing(prompt))
+
+    def _get_effective_user_research_prompt(self) -> str:
+        """Return ``self._user_research_prompt`` passed through ``_apply_proof_context``."""
+        return self._apply_proof_context(self._user_research_prompt)
+
+    async def _get_effective_brainstorm_prompt(self, topic_prompt: str) -> str:
+        """Apply proof context to ``topic_prompt``, then add failure hints for the current topic."""
+        prompt_with_context = self._apply_proof_context(topic_prompt)
+        topic_id = self._current_topic_id or ""  # a falsy topic id is passed as ""
+        return await proof_database.inject_failure_hints_into_prompt(
+            prompt_with_context, topic_id
+        )
+
+    def _get_effective_compiler_prompt(self, paper_title: str) -> str:
+        """Build the paper-writing instruction for ``paper_title`` and apply proof context to it."""
+        # The full instruction text is what gets framed, not the bare title.
+        compiler_prompt = f"Write a mathematical research paper titled: {paper_title}"
+        return self._apply_proof_context(compiler_prompt)
+
+    def _build_proof_runtime_config_snapshot(self) -> Dict[str, Any]:
+        """Build the persisted runtime snapshot used by proof routes/manual checks.
+
+        Roles: ``brainstorm`` (first submitter), ``paper`` (high-context), ``validator``.
+        """
+        high_context = dict(
+            provider=self._high_context_provider,
+            model_id=self._high_context_model,
+            openrouter_provider=self._high_context_openrouter_provider,
+            lm_studio_fallback_id=self._high_context_lm_studio_fallback,
+            context_window=self._high_context_context,
+            max_output_tokens=self._high_context_max_tokens,
+        )
+        submitter = self._submitter_configs[0] if self._submitter_configs else None
+        if submitter:
+            brainstorm = {name: getattr(submitter, name) for name in high_context}
+        else:
+            # NOTE(review): no submitter -> high-context values but provider "lm_studio"; confirm.
+            brainstorm = {**high_context, "provider": "lm_studio"}
+        validator = dict(
+            provider=self._validator_provider,
+            model_id=self._validator_model,
+            openrouter_provider=self._validator_openrouter_provider,
+            lm_studio_fallback_id=self._validator_lm_studio_fallback,
+            context_window=self._validator_context,
+            max_output_tokens=self._validator_max_tokens,
+        )
+        return ProofRuntimeConfigSnapshot(
+            brainstorm=ProofRoleConfigSnapshot(**brainstorm),
+            paper=ProofRoleConfigSnapshot(**high_context),
+            validator=ProofRoleConfigSnapshot(**validator),
+        ).model_dump(mode="json")
+
+    async def _run_proof_framing_gate(self) -> None:
+        """Run the one-time proof-framing decision before fresh research begins.
+
+        Asks the first submitter model whether the base prompt is proof-amenable,
+        then stores, persists and broadcasts the decision. A failed request or
+        an unparseable reply leaves proof framing disabled.
+        """
+        if not self._submitter_configs:
+            logger.warning("Proof framing gate skipped: no submitter configuration available")
+            return
+
+        base_prompt = self._base_user_research_prompt or self._user_research_prompt
+        prompt = build_proof_framing_gate_prompt(base_prompt)
+        first_submitter = self._submitter_configs[0]
+        reasoning, is_proof_amenable = "", False
+        try:
+            response = await api_client_manager.generate_completion(
+                task_id="proof_framing_gate_000",
+                role_id="autonomous_proof_framing_gate",
+                model=first_submitter.model_id,
+                messages=[{"role": "user", "content": prompt}],
+                max_tokens=first_submitter.max_output_tokens,
+                temperature=0.0,
+            )
+            if response and response.get("choices"):
+                message = response["choices"][0].get("message", {})
+                content = message.get("content") or message.get("reasoning") or ""
+                parsed = parse_json(content) if content else {}
+                if isinstance(parsed, list):
+                    parsed = parsed[0] if parsed else {}
+                if isinstance(parsed, dict):
+                    verdict = parsed.get("is_proof_amenable", False)
+                    if isinstance(verdict, str):
+                        # bool("false") is True, so string verdicts are compared by value.
+                        verdict = verdict.strip().lower() in ("true", "yes", "1")
+                    is_proof_amenable = bool(verdict)
+                    # ``or ""`` keeps a JSON null from being stored as "None".
+                    reasoning = str(parsed.get("reasoning") or "").strip()
+        except Exception as exc:
+            logger.warning("Proof framing gate failed, continuing without proof framing: %s", exc)
+            reasoning = f"Proof framing gate failed: {exc}"
+
+        self._proof_framing_active = is_proof_amenable
+        self._proof_framing_context = PROOF_FRAMING_CONTEXT if is_proof_amenable else ""
+        self._proof_framing_reasoning = reasoning
+        self._user_research_prompt = (
+            self._append_proof_framing(base_prompt) if is_proof_amenable else base_prompt
+        )
+        await research_metadata.set_proof_framing_state(
+            base_user_prompt=base_prompt,
+            effective_user_prompt=self._user_research_prompt,
+            active=self._proof_framing_active,
+            context=self._proof_framing_context,
+            reasoning=self._proof_framing_reasoning,
+        )
+        await self._save_workflow_state()
+        decision = {"is_proof_amenable": self._proof_framing_active, "reasoning": self._proof_framing_reasoning}
+        await self._broadcast("proof_framing_decided", decision)
+
+    async def _run_proof_verification(
+        self,
+        content: str,
+        source_type: str,
+        source_id: str,
+        source_title: str = "",
+        theorem_candidates: Optional[List[ProofCandidate]] = None,
+        trigger: str = "automatic",
+        role_suffix_override: Optional[str] = None,
+    ) -> None:
+        """Run the Lean 4 proof verification stage; no-op when ``content`` or ``source_id`` is empty."""
+        if not (content and source_id):
+            return
+
+        # Brainstorms use the first submitter when one is configured; every
+        # other case falls back to the high-context model settings.
+        if source_type == "brainstorm" and self._submitter_configs:
+            primary = self._submitter_configs[0]
+            model_settings = (primary.model_id, primary.context_window, primary.max_output_tokens)
+        else:
+            model_settings = (self._high_context_model, self._high_context_context, self._high_context_max_tokens)
+        submitter_model, submitter_context, submitter_max_tokens = model_settings
+
+        await self._proof_verification_stage.run(
+            content=content,
+            source_type=source_type,
+            source_id=source_id,
+            user_prompt=self._get_effective_user_research_prompt(),
+            submitter_model=submitter_model,
+            submitter_context=submitter_context,
+            submitter_max_tokens=submitter_max_tokens,
+            validator_model=self._validator_model,
+            validator_context=self._validator_context,
+            validator_max_tokens=self._validator_max_tokens,
+            broadcast_fn=self._broadcast,
+            novel_proofs_db=proof_database,
+            source_title=source_title,
+            theorem_candidates=theorem_candidates,
+            role_suffix_override=role_suffix_override,
+            trigger=trigger,
+            should_stop=self._stop_event.is_set,
+        )
+
+    async def _run_brainstorm_completion_proofs(self) -> None:
+        """Run proof verification on the current brainstorm; no-op without a current topic."""
+        if self._current_topic_id:
+            metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
+            text = await brainstorm_memory.get_database_content(self._current_topic_id)
+            # Missing metadata yields an empty source title.
+            title = metadata.topic_prompt if metadata else ""
+            await self._run_proof_verification(
+                content=text,
+                source_type="brainstorm",
+                source_id=self._current_topic_id,
+                source_title=title,
+            )
     
     async def initialize(
         self,
@@ -276,6 +471,7 @@ async def initialize(
             paper_library.set_session_manager(session_manager)
             research_metadata.set_session_manager(session_manager)
             final_answer_memory.set_session_manager(session_manager)
+            proof_database.set_session_manager(session_manager)
             
             # Override the user_research_prompt with the one from the interrupted session
             # This ensures we continue with the same research goal
@@ -298,6 +494,7 @@ async def initialize(
                 # Don't set session manager - memory modules will use default legacy paths
                 # Clear any previous session manager state
                 await session_manager.clear()
+                proof_database.set_session_manager(None)
             else:
                 # PRIORITY 3: No interrupted session, no legacy data - create new session folder
                 await session_manager.initialize(user_research_prompt, system_config.auto_sessions_base_dir)
@@ -308,12 +505,18 @@ async def initialize(
                 paper_library.set_session_manager(session_manager)
                 research_metadata.set_session_manager(session_manager)
                 final_answer_memory.set_session_manager(session_manager)
+                proof_database.set_session_manager(session_manager)
         
         # Initialize memory systems
         await brainstorm_memory.initialize()
         await paper_library.initialize()
         await research_metadata.initialize(user_research_prompt)
+        await proof_database.initialize()
         await autonomous_rejection_logs.initialize()
+
+        self._base_user_research_prompt = await research_metadata.get_base_user_prompt()
+        if not self._base_user_research_prompt:
+            self._base_user_research_prompt = self._user_research_prompt
         
         # CRITICAL: Reset and clear all RAG state for fresh autonomous session
         # This prevents cross-contamination from Part 1 manual mode
@@ -473,6 +676,190 @@ async def initialize(
                 max_output_tokens=validator_max_tokens
             )
         )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_identification_brainstorm",
+            ModelConfig(
+                provider=first_config.provider if hasattr(first_config, 'provider') else "lm_studio",
+                model_id=first_submitter_model,
+                openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
+                openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
+                context_window=first_submitter_context,
+                max_output_tokens=first_submitter_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_lemma_search_brainstorm",
+            ModelConfig(
+                provider=first_config.provider if hasattr(first_config, 'provider') else "lm_studio",
+                model_id=first_submitter_model,
+                openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
+                openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
+                context_window=first_submitter_context,
+                max_output_tokens=first_submitter_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_framing_gate",
+            ModelConfig(
+                provider=first_config.provider if hasattr(first_config, 'provider') else "lm_studio",
+                model_id=first_submitter_model,
+                openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
+                openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
+                context_window=first_submitter_context,
+                max_output_tokens=first_submitter_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_formalization_brainstorm",
+            ModelConfig(
+                provider=first_config.provider if hasattr(first_config, 'provider') else "lm_studio",
+                model_id=first_submitter_model,
+                openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
+                openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
+                context_window=first_submitter_context,
+                max_output_tokens=first_submitter_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_identification_paper",
+            ModelConfig(
+                provider=high_context_provider,
+                model_id=self._high_context_model,
+                openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
+                openrouter_provider=high_context_openrouter_provider,
+                lm_studio_fallback_id=high_context_lm_studio_fallback,
+                context_window=self._high_context_context,
+                max_output_tokens=self._high_context_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_lemma_search_paper",
+            ModelConfig(
+                provider=high_context_provider,
+                model_id=self._high_context_model,
+                openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
+                openrouter_provider=high_context_openrouter_provider,
+                lm_studio_fallback_id=high_context_lm_studio_fallback,
+                context_window=self._high_context_context,
+                max_output_tokens=self._high_context_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_formalization_paper",
+            ModelConfig(
+                provider=high_context_provider,
+                model_id=self._high_context_model,
+                openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
+                openrouter_provider=high_context_openrouter_provider,
+                lm_studio_fallback_id=high_context_lm_studio_fallback,
+                context_window=self._high_context_context,
+                max_output_tokens=self._high_context_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_novelty",
+            ModelConfig(
+                provider=validator_provider,
+                model_id=validator_model,
+                openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
+                openrouter_provider=validator_openrouter_provider,
+                lm_studio_fallback_id=validator_lm_studio_fallback,
+                context_window=validator_context_window,
+                max_output_tokens=validator_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_identification_manual_brainstorm",
+            ModelConfig(
+                provider=first_config.provider if hasattr(first_config, 'provider') else "lm_studio",
+                model_id=first_submitter_model,
+                openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
+                openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
+                context_window=first_submitter_context,
+                max_output_tokens=first_submitter_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_lemma_search_manual_brainstorm",
+            ModelConfig(
+                provider=first_config.provider if hasattr(first_config, 'provider') else "lm_studio",
+                model_id=first_submitter_model,
+                openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
+                openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
+                context_window=first_submitter_context,
+                max_output_tokens=first_submitter_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_formalization_manual_brainstorm",
+            ModelConfig(
+                provider=first_config.provider if hasattr(first_config, 'provider') else "lm_studio",
+                model_id=first_submitter_model,
+                openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
+                openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
+                context_window=first_submitter_context,
+                max_output_tokens=first_submitter_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_identification_manual_paper",
+            ModelConfig(
+                provider=high_context_provider,
+                model_id=self._high_context_model,
+                openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
+                openrouter_provider=high_context_openrouter_provider,
+                lm_studio_fallback_id=high_context_lm_studio_fallback,
+                context_window=self._high_context_context,
+                max_output_tokens=self._high_context_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_lemma_search_manual_paper",
+            ModelConfig(
+                provider=high_context_provider,
+                model_id=self._high_context_model,
+                openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
+                openrouter_provider=high_context_openrouter_provider,
+                lm_studio_fallback_id=high_context_lm_studio_fallback,
+                context_window=self._high_context_context,
+                max_output_tokens=self._high_context_max_tokens
+            )
+        )
+
+        api_client_manager.configure_role(
+            "autonomous_proof_formalization_manual_paper",
+            ModelConfig(
+                provider=high_context_provider,
+                model_id=self._high_context_model,
+                openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
+                openrouter_provider=high_context_openrouter_provider,
+                lm_studio_fallback_id=high_context_lm_studio_fallback,
+                context_window=self._high_context_context,
+                max_output_tokens=self._high_context_max_tokens
+            )
+        )
+
+        await research_metadata.set_proof_runtime_config(self._build_proof_runtime_config_snapshot())
         
         # Configure Tier 3 Final Answer agents (certainty assessor, format selector, volume organizer)
         # These use the first submitter model configuration
@@ -572,6 +959,15 @@ async def _check_resume_state(self) -> None:
             # Restore brainstorm multi-paper continuation tracking
             self._brainstorm_paper_count = workflow_state.get("brainstorm_paper_count", 0)
             self._current_brainstorm_paper_ids = workflow_state.get("current_brainstorm_paper_ids", [])
+
+            # Restore proof framing state
+            self._proof_framing_active = workflow_state.get("proof_framing_active", False)
+            self._proof_framing_context = workflow_state.get("proof_framing_context", "")
+            self._proof_framing_reasoning = workflow_state.get("proof_framing_reasoning", "")
+            self._base_user_research_prompt = await research_metadata.get_base_user_prompt()
+            if not self._base_user_research_prompt:
+                self._base_user_research_prompt = self._user_research_prompt
+            self._user_research_prompt = self._append_proof_framing(self._base_user_research_prompt)
             
             # Restore Tier 3 flags for proper resume
             self._tier3_active = workflow_state.get("tier3_active", False)
@@ -717,12 +1113,14 @@ def _has_section(self, content: str, section_name: str) -> bool:
             rf"#\s*{section_name}",        # Markdown heading
             rf"\*\*{section_name}\*\*",    # Bold text
             rf"^{section_name}\s*$",       # Plain section name
+            rf"^\\(?:section|chapter)\*?\{{{section_name}\}}\s*$",  # LaTeX heading
         ]
         
         # Add section-specific patterns
         if section_name == "Introduction":
             # Introduction is always numbered as "I."
             base_patterns.append(rf"^I\.\s*{section_name}")
+            base_patterns.append(rf"^\\(?:section|chapter)\*?\{{I\.?\s*{section_name}\}}\s*$")
         elif section_name == "Conclusion":
             # Conclusion can have Roman numeral (variable position in paper)
             base_patterns.append(rf"^[IVXLC]+\.\s*{section_name}")
@@ -862,6 +1260,9 @@ async def _save_workflow_state(self, tier: str = None, phase: str = None) -> Non
             # Brainstorm multi-paper continuation tracking
             "brainstorm_paper_count": self._brainstorm_paper_count,
             "current_brainstorm_paper_ids": self._current_brainstorm_paper_ids,
+            "proof_framing_active": self._proof_framing_active,
+            "proof_framing_context": self._proof_framing_context,
+            "proof_framing_reasoning": self._proof_framing_reasoning,
             # Tier 3 Final Answer crash recovery fields
             "tier3_active": self._tier3_active,
             "tier3_enabled": self._tier3_enabled,
@@ -931,6 +1332,9 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
         
         # Check for interrupted workflow to resume
         resume_state = await self._get_resume_point()
+
+        if not resume_state:
+            await self._run_proof_framing_gate()
         
         try:
             # Main research loop
@@ -1788,6 +2192,12 @@ def get_validator_config(self) -> Optional[Dict[str, Any]]:
             "validator_provider": self._validator_provider,
             "validator_openrouter_provider": self._validator_openrouter_provider,
         }
+
+    def get_proof_runtime_config(self) -> Optional[Dict[str, Any]]:
+        """Return the current proof runtime config snapshot, or None when no validator model is set."""
+        if not self._validator_model:  # an unset validator model is treated as "not initialized yet"
+            return None
+        return self._build_proof_runtime_config_snapshot()
     
     async def skip_critique_phase(self) -> bool:
         """
@@ -1840,7 +2250,7 @@ async def _topic_exploration_phase(self) -> str:
         papers_summary = await autonomous_rag_manager.get_all_papers_summary()
         
         exploration_prompt = build_exploration_user_prompt(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             brainstorms_summary=brainstorms_summary,
             papers_summary=papers_summary
         )
@@ -2021,7 +2431,7 @@ async def _topic_selection_loop(self, candidate_questions: str = "") -> Optional
             papers_summary = await autonomous_rag_manager.get_all_papers_summary()
             
             submission = await self._topic_selector.select_topic(
-                user_research_prompt=self._user_research_prompt,
+                user_research_prompt=self._get_effective_user_research_prompt(),
                 brainstorms_summary=brainstorms_summary,
                 papers_summary=papers_summary,
                 candidate_questions=candidate_questions
@@ -2034,7 +2444,7 @@ async def _topic_selection_loop(self, candidate_questions: str = "") -> Optional
             
             validation = await self._topic_validator.validate(
                 submission=submission,
-                user_research_prompt=self._user_research_prompt,
+                user_research_prompt=self._get_effective_user_research_prompt(),
                 brainstorms_summary=brainstorms_summary,
                 papers_summary=papers_summary
             )
@@ -2196,7 +2606,7 @@ async def _brainstorm_continuation_decision(self) -> str:
             logger.info(f"Brainstorm continuation decision attempt {attempt}")
             
             prompt = build_continuation_decision_prompt(
-                user_research_prompt=self._user_research_prompt,
+                user_research_prompt=self._get_effective_user_research_prompt(),
                 topic_prompt=topic_prompt,
                 brainstorm_summary=brainstorm_summary,
                 papers_from_brainstorm=papers_context,
@@ -2244,11 +2654,11 @@ async def _brainstorm_continuation_decision(self) -> str:
                         topic_prompt=f"[CONTINUATION DECISION: {decision}]",
                         reasoning=reasoning[:200]
                     ),
-                    user_research_prompt=self._user_research_prompt,
+                    user_research_prompt=self._get_effective_user_research_prompt(),
                     brainstorms_summary=await autonomous_rag_manager.get_all_brainstorms_summary(),
                     papers_summary=await autonomous_rag_manager.get_all_papers_summary(),
                     override_prompt=build_continuation_validation_prompt(
-                        user_research_prompt=self._user_research_prompt,
+                        user_research_prompt=self._get_effective_user_research_prompt(),
                         topic_prompt=topic_prompt,
                         brainstorm_summary=brainstorm_summary,
                         papers_from_brainstorm=papers_context,
@@ -2318,7 +2728,7 @@ async def _pre_brainstorm_reference_selection(self) -> List[str]:
         
         # Run reference selection in "initial" mode (before brainstorm)
         selected_ids = await self._reference_selector.select_references(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_prompt=topic_prompt,
             brainstorm_summary=brainstorm_summary,
             available_papers=papers_summary,
@@ -2462,7 +2872,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
             # CRITICAL: Pass per-submitter configs for multi-submitter support
             # CRITICAL: Pass reference papers as user_files to enable compounding knowledge
             await self._brainstorm_aggregator.initialize(
-                user_prompt=metadata.topic_prompt,
+                user_prompt=await self._get_effective_brainstorm_prompt(metadata.topic_prompt),
                 submitter_configs=self._submitter_configs,  # Per-submitter configs (1-10 submitters)
                 validator_model=self._validator_model,
                 user_files=reference_paper_paths,  # Reference papers for compounding knowledge
@@ -2512,6 +2922,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
             if self._manual_paper_writing_triggered:
                 logger.info("Manual override detected during initialization - skipping aggregator start")
                 self._manual_paper_writing_triggered = False
+                await self._run_brainstorm_completion_proofs()
                 return True
             
             # Start aggregator
@@ -2605,6 +3016,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                         
                         # Stop aggregator
                         await self._brainstorm_aggregator.stop()
+                        await self._run_brainstorm_completion_proofs()
                         
                         # Force transition to paper writing (skip completion review)
                         return True
@@ -2622,6 +3034,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                         if write_paper:
                             # Stop aggregator
                             await self._brainstorm_aggregator.stop()
+                            await self._run_brainstorm_completion_proofs()
                             return True
                 
                 # Check for manual override trigger (before checking stop event)
@@ -2629,6 +3042,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                     logger.info("Manual override detected - transitioning to paper writing")
                     self._manual_paper_writing_triggered = False
                     await self._brainstorm_aggregator.stop()
+                    await self._run_brainstorm_completion_proofs()
                     return True
                 
                 # Track consecutive rejections and increment total rejections stat
@@ -2663,6 +3077,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                         
                         # Stop aggregator
                         await self._brainstorm_aggregator.stop()
+                        await self._run_brainstorm_completion_proofs()
                         
                         # Force transition to paper writing (skip completion review)
                         return True
@@ -2981,7 +3396,7 @@ async def _run_completion_review(self) -> bool:
         
         # Run completion review with self-validation
         result, is_validated = await self._completion_reviewer.review_completion(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_id=self._current_topic_id,
             topic_prompt=metadata.topic_prompt,
             brainstorm_database=brainstorm_content,
@@ -3247,7 +3662,7 @@ async def _reference_selection_workflow(self) -> List[str]:
         
         # Run reference selection in "additional" mode
         additional_ids = await self._reference_selector.select_references(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_prompt=topic_prompt,
             brainstorm_summary=brainstorm_summary,
             available_papers=available_for_selection,
@@ -3305,7 +3720,7 @@ async def _paper_title_selection(
         
         # Select title (pass stop_event so user stop is honoured mid-loop)
         title = await self._title_selector.select_title(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_prompt=metadata.topic_prompt,
             brainstorm_summary=brainstorm_summary,
             existing_papers_from_brainstorm=existing_papers,
@@ -3342,18 +3757,11 @@ async def _paper_title_exploration_phase(
         TARGET_CANDIDATES = 5
         MAX_CONSECUTIVE_REJECTIONS = 15
         
-        await self._broadcast("paper_title_exploration_started", {
-            "target": TARGET_CANDIDATES,
-            "resumed_count": 0
-        })
-        
-        logger.info(f"Starting paper title exploration phase (target: {TARGET_CANDIDATES} candidates)")
-        
         # Build the exploration user prompt for the aggregator
         from backend.autonomous.prompts.paper_title_exploration_prompts import build_title_exploration_user_prompt
         
         exploration_prompt = build_title_exploration_user_prompt(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_prompt=topic_prompt,
             brainstorm_summary=brainstorm_summary,
             existing_papers_from_brainstorm=existing_papers or [],
@@ -3365,84 +3773,117 @@ async def _paper_title_exploration_phase(
         title_db_path = brainstorm_memory._base_dir / f"title_candidates_{topic_suffix}.txt"
         title_db_path.parent.mkdir(parents=True, exist_ok=True)
         
-        # Clear any stale title candidates DB
-        if title_db_path.exists():
-            title_db_path.unlink()
-        
-        # Override shared training memory path for title exploration
+        # CRASH-RESUME: Preserve any prior validated candidates.
+        # If a previous run was interrupted mid-exploration, the finally-block cleanup
+        # never ran, so the file still contains accepted candidates. We reuse them and
+        # only top up to TARGET_CANDIDATES instead of restarting from zero.
+        # Override shared training memory path BEFORE counting so the reload reads this file.
         original_shared_path = system_config.shared_training_file
         system_config.shared_training_file = str(title_db_path)
         original_memory_path = shared_training_memory.file_path
         shared_training_memory.file_path = title_db_path
         await shared_training_memory.reload_insights_from_current_path()
         
+        resumed_count = len(shared_training_memory.insights)
+        if resumed_count > 0:
+            logger.info(
+                f"TitleExploration: Resuming with {resumed_count} previously-accepted "
+                f"candidate(s) from {title_db_path.name}"
+            )
+        
+        await self._broadcast("paper_title_exploration_started", {
+            "target": TARGET_CANDIDATES,
+            "resumed_count": resumed_count
+        })
+        
+        logger.info(
+            f"Starting paper title exploration phase (target: {TARGET_CANDIDATES} candidates, "
+            f"resumed: {resumed_count})"
+        )
+        
         exploration_aggregator = None
         
         try:
-            exploration_aggregator = AggregatorCoordinator()
-            
-            await exploration_aggregator.initialize(
-                user_prompt=exploration_prompt,
-                submitter_configs=self._submitter_configs,
-                validator_model=self._validator_model,
-                user_files=[],
-                skip_stats_load=True,
-                validator_context_window=self._validator_context,
-                validator_max_tokens=self._validator_max_tokens,
-                validator_provider=self._validator_provider,
-                validator_openrouter_provider=self._validator_openrouter_provider,
-                validator_lm_studio_fallback=self._validator_lm_studio_fallback,
-                enable_cleanup_review=False
-            )
-            
-            if self._broadcast_callback:
-                exploration_aggregator.websocket_broadcaster = self._broadcast_callback
-            
-            await exploration_aggregator.start()
-            logger.info("Title exploration aggregator started with parallel submitters")
-            
-            last_acceptances = 0
-            last_rejections = 0
-            consecutive_rejections = 0
-            
-            while self._running and not self._stop_event.is_set():
-                status = await exploration_aggregator.get_status()
-                current_acceptances = status.total_acceptances
-                current_rejections = status.total_rejections
+            # Short-circuit: if we already have enough candidates from a prior run,
+            # skip the aggregator entirely and proceed directly to reading them.
+            if resumed_count >= TARGET_CANDIDATES:
+                logger.info(
+                    f"TitleExploration: Already have {resumed_count} candidates from "
+                    f"prior run (>= target {TARGET_CANDIDATES}); skipping aggregator."
+                )
+                last_acceptances = resumed_count
+                last_rejections = 0
+            else:
+                exploration_aggregator = AggregatorCoordinator()
+                
+                await exploration_aggregator.initialize(
+                    user_prompt=exploration_prompt,
+                    submitter_configs=self._submitter_configs,
+                    validator_model=self._validator_model,
+                    user_files=[],
+                    skip_stats_load=True,
+                    validator_context_window=self._validator_context,
+                    validator_max_tokens=self._validator_max_tokens,
+                    validator_provider=self._validator_provider,
+                    validator_openrouter_provider=self._validator_openrouter_provider,
+                    validator_lm_studio_fallback=self._validator_lm_studio_fallback,
+                    enable_cleanup_review=False
+                )
                 
-                if current_acceptances > last_acceptances:
-                    consecutive_rejections = 0
-                    last_acceptances = current_acceptances
+                if self._broadcast_callback:
+                    exploration_aggregator.websocket_broadcaster = self._broadcast_callback
+                
+                await exploration_aggregator.start()
+                logger.info("Title exploration aggregator started with parallel submitters")
+                
+                # Aggregator starts at 0 acceptances even though the file may already
+                # contain resumed candidates. We track the aggregator's own counter for
+                # delta detection, but report the sum (resumed + new) as progress.
+                last_aggregator_acceptances = 0
+                last_acceptances = resumed_count
+                last_rejections = 0
+                consecutive_rejections = 0
+                
+                while self._running and not self._stop_event.is_set():
+                    status = await exploration_aggregator.get_status()
+                    current_aggregator_acceptances = status.total_acceptances
+                    current_acceptances = resumed_count + current_aggregator_acceptances
+                    current_rejections = status.total_rejections
                     
-                    await self._broadcast("paper_title_exploration_progress", {
-                        "accepted": current_acceptances,
-                        "target": TARGET_CANDIDATES,
-                        "total_attempts": current_acceptances + current_rejections
-                    })
-                    
-                    await self._save_workflow_state(
-                        tier=self._state.current_tier,
-                        phase="paper_title_exploration"
-                    )
-                    
-                    logger.info(f"TitleExploration: {current_acceptances}/{TARGET_CANDIDATES} candidates accepted")
+                    if current_aggregator_acceptances > last_aggregator_acceptances:
+                        consecutive_rejections = 0
+                        last_aggregator_acceptances = current_aggregator_acceptances
+                        last_acceptances = current_acceptances
+                        
+                        await self._broadcast("paper_title_exploration_progress", {
+                            "accepted": current_acceptances,
+                            "target": TARGET_CANDIDATES,
+                            "total_attempts": current_acceptances + current_rejections
+                        })
+                        
+                        await self._save_workflow_state(
+                            tier=self._state.current_tier,
+                            phase="paper_title_exploration"
+                        )
+                        
+                        logger.info(f"TitleExploration: {current_acceptances}/{TARGET_CANDIDATES} candidates accepted")
+                        
+                        if current_acceptances >= TARGET_CANDIDATES:
+                            logger.info(f"TitleExploration: Target of {TARGET_CANDIDATES} candidates reached")
+                            break
                     
-                    if current_acceptances >= TARGET_CANDIDATES:
-                        logger.info(f"TitleExploration: Target of {TARGET_CANDIDATES} candidates reached")
-                        break
-                
-                if current_rejections > last_rejections:
-                    new_rejections = current_rejections - last_rejections
-                    consecutive_rejections += new_rejections
-                    last_rejections = current_rejections
+                    if current_rejections > last_rejections:
+                        new_rejections = current_rejections - last_rejections
+                        consecutive_rejections += new_rejections
+                        last_rejections = current_rejections
+                        
+                        if consecutive_rejections >= MAX_CONSECUTIVE_REJECTIONS:
+                            logger.warning(f"TitleExploration: {consecutive_rejections} consecutive rejections - proceeding with {current_acceptances} candidates")
+                            break
                     
-                    if consecutive_rejections >= MAX_CONSECUTIVE_REJECTIONS:
-                        logger.warning(f"TitleExploration: {consecutive_rejections} consecutive rejections - proceeding with {current_acceptances} candidates")
-                        break
+                    await asyncio.sleep(2)
                 
-                await asyncio.sleep(2)
-            
-            await exploration_aggregator.stop()
+                await exploration_aggregator.stop()
             
             # Read accepted candidates from the title candidates database
             candidates_text = ""
@@ -3555,7 +3996,7 @@ async def _compile_paper(
             # CRITICAL: skip_aggregator_db=True prevents loading Part 1 aggregator database
             # Autonomous mode should ONLY use the brainstorm database for this topic
             await self._paper_compiler.initialize(
-                compiler_prompt=f"Write a mathematical research paper titled: {paper_title}",
+                compiler_prompt=self._get_effective_compiler_prompt(paper_title),
                 validator_model=self._validator_model,
                 high_context_model=self._high_context_model,
                 high_param_model=self._high_param_model,
@@ -3582,6 +4023,7 @@ async def _compile_paper(
             
             # Enable autonomous section order constraint
             self._paper_compiler.enable_autonomous_mode()
+            self._paper_compiler._current_paper_tracker = self._current_paper_tracker
             self._paper_compiler._current_topic_id = self._current_topic_id
             self._paper_compiler._current_reference_paper_ids = list(dict.fromkeys(
                 reference_paper_ids + self._current_brainstorm_paper_ids
@@ -3736,6 +4178,8 @@ def _has_abstract(self, paper_content: str) -> bool:
             r"##\s*Abstract",
             r"#\s*Abstract",
             r"\*\*Abstract\*\*",
+            r"\\(?:section|chapter)\*?\{Abstract\}",
+            r"\\begin\{abstract\}",
             r"Abstract\s*\n",
         ]
         
@@ -3752,6 +4196,8 @@ def _extract_abstract(self, paper_content: str) -> str:
             r"##\s*Abstract\s*\n(.*?)(?=\n##|\n#|\Z)",
             r"#\s*Abstract\s*\n(.*?)(?=\n##|\n#|\Z)",
             r"\*\*Abstract\*\*\s*\n(.*?)(?=\n##|\n#|\n\*\*|\Z)",
+            r"\\(?:section|chapter)\*?\{Abstract\}\s*\n(.*?)(?=\n\\(?:section|chapter)\*?\{|\Z)",
+            r"\\begin\{abstract\}\s*(.*?)\s*\\end\{abstract\}",
         ]
         
         for pattern in abstract_patterns:
@@ -3869,6 +4315,64 @@ async def _handle_paper_completion(
                 "word_count": paper_metadata.word_count
             })
 
+            await self._run_proof_verification(
+                content,
+                "paper",
+                paper_id,
+                source_title=title,
+            )
+
+            pending_retry_candidates: List[ProofCandidate] = []
+            retry_source_ids = paper_metadata.source_brainstorm_ids or ([self._current_topic_id] if self._current_topic_id else [])
+            for brainstorm_id in retry_source_ids:
+                pending_retries = await proof_database.get_pending_retries(
+                    brainstorm_id,
+                    retry_source_id=paper_id,
+                )
+                for pending_retry in pending_retries:
+                    combined_excerpt_parts = []
+                    if pending_retry.source_excerpt:
+                        combined_excerpt_parts.append(
+                            "ORIGINAL BRAINSTORM EXCERPT:\n" + pending_retry.source_excerpt
+                        )
+                    if content:
+                        combined_excerpt_parts.append(
+                            "REFINED PAPER CONTEXT:\n" + content[:6000]
+                        )
+
+                    retry_formal_sketch = pending_retry.formal_sketch
+                    if pending_retry.error_summary:
+                        retry_formal_sketch = (
+                            f"{retry_formal_sketch}\n\nPrior Lean 4 failure summary: {pending_retry.error_summary}"
+                        ).strip()
+
+                    pending_retry_candidates.append(
+                        ProofCandidate(
+                            theorem_id=pending_retry.theorem_id,
+                            statement=pending_retry.theorem_statement,
+                            formal_sketch=retry_formal_sketch,
+                            source_excerpt="\n\n".join(part for part in combined_excerpt_parts if part).strip(),
+                            origin_source_id=brainstorm_id,
+                        )
+                    )
+
+            if pending_retry_candidates:
+                await self._broadcast("proof_retry_scheduled", {
+                    "source_type": "paper",
+                    "source_id": paper_id,
+                    "source_title": title,
+                    "count": len(pending_retry_candidates),
+                    "brainstorm_ids": retry_source_ids,
+                })
+                await self._run_proof_verification(
+                    content,
+                    "paper",
+                    paper_id,
+                    source_title=title,
+                    theorem_candidates=pending_retry_candidates,
+                    trigger="retry",
+                )
+
             # Trigger auto-critique generation in background (only if marking as complete)
             asyncio.create_task(self._auto_generate_paper_critique(
                 paper_id=paper_id,
@@ -4078,7 +4582,7 @@ async def _check_paper_redundancy(self) -> None:
         
         # Check for redundancy
         result = await self._redundancy_checker.check_redundancy(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             papers_summary=papers_summary
         )
         
@@ -4284,7 +4788,7 @@ async def _resume_tier3_from_format_selection(self, tier3_state) -> bool:
                 })
                 
                 format_selection = await self._format_selector.select_format(
-                    user_research_prompt=self._user_research_prompt,
+                    user_research_prompt=self._get_effective_user_research_prompt(),
                     certainty_assessment=assessment,
                     all_papers=all_papers
                 )
@@ -4578,7 +5082,7 @@ async def tier3_model_tracking_callback(model_id: str) -> None:
             })
             
             assessment = await self._certainty_assessor.assess_certainty(
-                user_research_prompt=self._user_research_prompt,
+                user_research_prompt=self._get_effective_user_research_prompt(),
                 all_papers=all_papers
             )
             
@@ -4617,7 +5121,7 @@ async def tier3_model_tracking_callback(model_id: str) -> None:
             })
             
             format_selection = await self._format_selector.select_format(
-                user_research_prompt=self._user_research_prompt,
+                user_research_prompt=self._get_effective_user_research_prompt(),
                 certainty_assessment=assessment,
                 all_papers=all_papers
             )
@@ -4787,7 +5291,7 @@ async def _tier3_long_form_workflow(
         try:
             # Step 1: Organize volume structure
             volume = await self._volume_organizer.organize_volume(
-                user_research_prompt=self._user_research_prompt,
+                user_research_prompt=self._get_effective_user_research_prompt(),
                 certainty_assessment=assessment,
                 all_papers=all_papers
             )
@@ -4871,7 +5375,7 @@ async def _tier3_reference_selection(
 
         # For Tier 3, we browse ALL papers and select those most useful for answering
         selected_ids = await self._reference_selector.select_references(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_prompt="[Tier 3 Final Answer - selecting papers to answer the research question]",
             brainstorm_summary="[No brainstorm - Tier 3 operates on completed papers only]",
             available_papers=all_papers,
@@ -4911,7 +5415,7 @@ async def _tier3_title_selection(
         
         # Use the existing title selector with special context + candidate titles
         title = await self._title_selector.select_title(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_prompt=topic_prompt,
             brainstorm_summary=brainstorm_summary,
             existing_papers_from_brainstorm=[],
@@ -4956,9 +5460,11 @@ async def _compile_tier3_paper(
             
             # Initialize compiler
             await self._paper_compiler.initialize(
-                compiler_prompt=f"Write a mathematical research paper titled: {paper_title}\n\n"
-                               f"IMPORTANT: This paper directly answers the research question.\n"
-                               f"Known Certainties: {assessment.known_certainties_summary}",
+                compiler_prompt=self._apply_proof_context(
+                    f"Write a mathematical research paper titled: {paper_title}\n\n"
+                    f"IMPORTANT: This paper directly answers the research question.\n"
+                    f"Known Certainties: {assessment.known_certainties_summary}"
+                ),
                 validator_model=self._validator_model,
                 high_context_model=self._high_context_model,
                 high_param_model=self._high_param_model,
@@ -5084,7 +5590,7 @@ async def _write_volume_chapter(
         
         # Select chapter title from candidates
         chapter_title = await self._title_selector.select_title(
-            user_research_prompt=self._user_research_prompt,
+            user_research_prompt=self._get_effective_user_research_prompt(),
             topic_prompt=f"[VOLUME CHAPTER: {chapter.chapter_type}] {context}",
             brainstorm_summary=f"Known Certainties:\n{assessment.known_certainties_summary}",
             existing_papers_from_brainstorm=[],
diff --git a/backend/autonomous/core/proof_dependency_extractor.py b/backend/autonomous/core/proof_dependency_extractor.py
new file mode 100644
index 0000000..a7cbf71
--- /dev/null
+++ b/backend/autonomous/core/proof_dependency_extractor.py
@@ -0,0 +1,208 @@
+"""
+Extract proof dependencies from verified Lean 4 code.
+"""
+from __future__ import annotations
+
+import logging
+import re
+from typing import TYPE_CHECKING, Iterable, List
+
+from backend.shared.models import MathlibLemmaHint, ProofDependency
+
+if TYPE_CHECKING:
+    from backend.autonomous.agents.lemma_search_agent import MathlibLemmaSearchAgent
+
+logger = logging.getLogger(__name__)
+
+_DOTTED_NAME_RE = re.compile(r"\b[A-Za-z][A-Za-z0-9_']*(?:\.[A-Za-z][A-Za-z0-9_']*)+\b")
+
+
+class ProofDependencyExtractor:
+    """Best-effort dependency extraction for verified proofs."""
+
+    @staticmethod
+    def _contains_symbol(search_text: str, symbol: str) -> bool:
+        """True if ``symbol`` occurs with no identifier character (or leading ``.``) directly adjoining it."""
+        if not (search_text and symbol):
+            return False
+        return re.search(rf"(?<![A-Za-z0-9_'.]){re.escape(symbol)}(?![A-Za-z0-9_'])", search_text) is not None
+
+    @staticmethod
+    def _dependency_source_ref(file_path: str, line_number: int) -> str:
+        """Format ``path:line`` when both parts are truthy; otherwise the bare path or ""."""
+        located = bool(file_path) and bool(line_number)
+        return f"{file_path}:{line_number}" if located else (file_path or "")
+
+    @staticmethod
+    def _dedupe_dependencies(dependencies: Iterable[ProofDependency]) -> List[ProofDependency]:
+        """Remove repeated dependencies while keeping first-seen order.
+
+        Entries count as repeats when their (kind, name, source_ref) triples are equal.
+        """
+        first_seen: dict = {}
+        for entry in dependencies:
+            # setdefault keeps the earliest entry for each triple and ignores later ones.
+            first_seen.setdefault((entry.kind, entry.name, entry.source_ref), entry)
+        return list(first_seen.values())
+
+    @staticmethod
+    def _extract_dotted_names(lean_code: str) -> List[str]:
+        return sorted({found.group(0) for found in _DOTTED_NAME_RE.finditer(lean_code or "")})  # unique dotted names, sorted
+
+    @staticmethod
+    def _strip_comments_and_strings(lean_code: str) -> str:
+        """Blank out Lean comments and string literals with spaces, one output char per input char."""
+        if not lean_code:
+            return ""
+        result: list[str] = []
+        index = 0
+        length = len(lean_code)
+        block_comment_depth = 0  # nesting level of /- ... -/ comments; 0 means outside any
+        in_string = False
+
+        while index < length:
+            current = lean_code[index]
+            pair = lean_code[index:index + 2]
+            # State 1: inside a (possibly nested) block comment.
+            if block_comment_depth > 0:
+                if pair == "/-":
+                    block_comment_depth += 1
+                    result.extend([" ", " "])
+                    index += 2
+                    continue
+                if pair == "-/":
+                    block_comment_depth -= 1
+                    result.extend([" ", " "])
+                    index += 2
+                    continue
+                result.append("\n" if current == "\n" else " ")  # keep line breaks so line numbers survive
+                index += 1
+                continue
+            # State 2: inside a double-quoted string literal.
+            if in_string:
+                if current == "\\" and index + 1 < length:
+                    result.extend([" ", " "])  # the escaped character (even a newline) is blanked too
+                    index += 2
+                    continue
+                if current == "\"":
+                    in_string = False
+                    result.append(" ")
+                    index += 1
+                    continue
+                result.append("\n" if current == "\n" else " ")
+                index += 1
+                continue
+            # State 3: ordinary code; look for an opener before copying the character through.
+            if pair == "/-":
+                block_comment_depth = 1
+                result.extend([" ", " "])
+                index += 2
+                continue
+            # A line comment is blanked up to, but not including, the terminating newline.
+            if pair == "--":
+                while index < length and lean_code[index] != "\n":
+                    result.append(" ")
+                    index += 1
+                continue
+            # The opening quote itself is blanked as well.
+            if current == "\"":
+                in_string = True
+                result.append(" ")
+                index += 1
+                continue
+            # Anything else is real code and is kept unchanged.
+            result.append(current)
+            index += 1
+
+        return "".join(result)
+
+    @classmethod
+    def _extract_search_text(cls, lean_code: str) -> str:
+        """Return the text following the proof's ``by`` keyword, or the whole cleaned source.
+
+        Comments and string literals are blanked first. ``:= by`` is tried before the
+        looser ``theorem``/``lemma`` ... ``by`` line form.
+        """
+        cleaned = cls._strip_comments_and_strings(lean_code)
+        if not cleaned:
+            return ""
+        body_patterns = (
+            (r":=\s*by\b(?P<body>.*)", re.DOTALL),
+            (r"^\s*(?:protected\s+)?(?:theorem|lemma)\b[^\n]*\bby\b(?P<body>.*)", re.DOTALL | re.MULTILINE),
+        )
+        for regex, regex_flags in body_patterns:
+            found = re.search(regex, cleaned, flags=regex_flags)
+            if found:
+                return found.group("body")
+        return cleaned
+
+    async def extract_dependencies(
+        self,
+        *,
+        lean_code: str,
+        theorem_name: str,
+        proof_database,
+        lemma_search_agent: "MathlibLemmaSearchAgent",
+        relevant_lemmas: Iterable[MathlibLemmaHint] = (),
+        current_proof_id: str = "",
+    ) -> List[ProofDependency]:
+        """Collect de-duplicated "moto" and "mathlib" dependencies referenced by the proof text (best effort)."""
+        dependencies: List[ProofDependency] = []
+        search_text = self._extract_search_text(lean_code)
+        if not search_text:
+            return dependencies
+        # Pass 1: other stored proofs whose theorem name appears as a symbol in the proof text.
+        try:
+            existing_proofs = await proof_database.get_all_proofs()
+            for proof in existing_proofs:
+                if current_proof_id and proof.proof_id == current_proof_id:
+                    continue
+                candidate_name = str(proof.theorem_name or "").strip()
+                if not candidate_name or candidate_name == theorem_name:
+                    continue
+                if not self._contains_symbol(search_text, candidate_name):
+                    continue
+                dependencies.append(
+                    ProofDependency(
+                        kind="moto",
+                        name=candidate_name,
+                        source_ref=proof.proof_id,
+                    )
+                )
+        except Exception as exc:
+            logger.debug("Failed to extract MOTO proof ancestry for %s: %s", theorem_name or "[unnamed theorem]", exc)
+        # The Mathlib passes need the lemma index; a load failure is logged and treated as "not ready".
+        mathlib_index_ready = False
+        try:
+            mathlib_index_ready = await lemma_search_agent.ensure_index_loaded()
+        except Exception as exc:
+            logger.debug("Mathlib dependency extraction skipped: %s", exc)
+        # Without the index, return only what pass 1 found.
+        if not mathlib_index_ready:
+            return self._dedupe_dependencies(dependencies)
+        # Pass 2: supplied lemma hints mentioned by full name or by their last dotted component.
+        for hint in relevant_lemmas or []:
+            short_name = (hint.full_name or hint.requested_name).split(".")[-1]
+            if not (
+                self._contains_symbol(search_text, hint.full_name)
+                or self._contains_symbol(search_text, short_name)
+            ):
+                continue
+            dependencies.append(
+                ProofDependency(
+                    kind="mathlib",
+                    name=hint.full_name or hint.requested_name,
+                    source_ref=self._dependency_source_ref(hint.file_path, hint.line_number),
+                )
+            )
+        # Pass 3: every dotted identifier in the proof text for which the lemma agent returns hits.
+        for dotted_name in self._extract_dotted_names(search_text):
+            for hit in lemma_search_agent.lookup_candidate_name(dotted_name):
+                dependencies.append(
+                    ProofDependency(
+                        kind="mathlib",
+                        name=hit.full_name or hit.requested_name,
+                        source_ref=self._dependency_source_ref(hit.file_path, hit.line_number),
+                    )
+                )
+        return self._dedupe_dependencies(dependencies)
diff --git a/backend/autonomous/core/proof_novelty.py b/backend/autonomous/core/proof_novelty.py
new file mode 100644
index 0000000..c4ee9e9
--- /dev/null
+++ b/backend/autonomous/core/proof_novelty.py
@@ -0,0 +1,99 @@
+"""
+Shared Lean-4 proof novelty assessment.
+
+The autonomous research `ProofVerificationStage` and the compiler's rigor
+submitter both need to classify a freshly verified Lean 4 proof as novel
+(first time this system has produced it) or known (duplicates a result
+already in the proof database). Both call sites share a single helper
+here so the prompt + context-budget behaviour stays identical.
+"""
+from __future__ import annotations
+
+import logging
+from typing import Tuple
+
+from backend.autonomous.prompts.proof_prompts import build_proof_novelty_prompt
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.json_parser import parse_json
+from backend.shared.utils import count_tokens
+
+logger = logging.getLogger(__name__)
+
+
+async def assess_proof_novelty(
+    *,
+    user_prompt: str,
+    theorem_statement: str,
+    lean_code: str,
+    validator_model: str,
+    validator_context: int,
+    validator_max_tokens: int,
+    existing_novel_proofs: str,
+    task_id: str,
+    role_id: str = "autonomous_proof_novelty",
+) -> Tuple[bool, str]:
+    """Classify a Lean-4-verified theorem as novel or known.
+
+    Args:
+        user_prompt: Top-level research prompt for context.
+        theorem_statement: Human-readable statement of the verified theorem.
+        lean_code: Full Lean 4 source that compiled cleanly.
+        validator_model: Model identifier to drive the novelty judgement.
+        validator_context: Validator model's context window.
+        validator_max_tokens: Maximum output tokens reserved for the judgement.
+        existing_novel_proofs: Pre-formatted block listing already-novel proofs;
+            halved repeatedly (never below 2000 chars) while the prompt overflows.
+        task_id: Caller-chosen task id used for workflow tracking.
+        role_id: Role identifier forwarded to the API client manager. Defaults
+            to the autonomous role; the compiler rigor caller passes a
+            compiler-specific role for correct logging.
+
+    Returns:
+        Tuple of (is_novel, reasoning). Falls back to (False, <message>) when the
+        reply is missing, empty, unparsable, or not a JSON object.
+    """
+    def _render(known_proofs: str) -> str:
+        return build_proof_novelty_prompt(
+            user_prompt=user_prompt,
+            theorem_statement=theorem_statement,
+            lean_code=lean_code,
+            existing_novel_proofs=known_proofs,
+        )
+
+    prompt = _render(existing_novel_proofs)
+    max_input_tokens = validator_context - validator_max_tokens
+    # Only the known-proofs block is trimmed; the theorem and Lean code are always sent whole.
+    while count_tokens(prompt) > max_input_tokens and len(existing_novel_proofs) > 2000:
+        existing_novel_proofs = existing_novel_proofs[: max(len(existing_novel_proofs) // 2, 2000)]
+        prompt = _render(existing_novel_proofs)
+
+    response = await api_client_manager.generate_completion(
+        task_id=task_id,
+        role_id=role_id,
+        model=validator_model,
+        messages=[{"role": "user", "content": prompt}],
+        max_tokens=validator_max_tokens,
+        temperature=0.0,
+    )
+    if not response or not response.get("choices"):
+        return False, "Novelty validator returned no response."
+
+    message = response["choices"][0].get("message") or {}  # tolerate an explicit null message
+    content = message.get("content") or message.get("reasoning") or ""
+    if not content:
+        return False, "Novelty validator returned empty content."
+
+    try:
+        data = parse_json(content)
+    except Exception as exc:
+        logger.warning("Novelty validator JSON parse failed: %s", exc)
+        return False, f"Novelty validator JSON parse error: {exc}"
+
+    if isinstance(data, list):
+        data = data[0] if data else {}
+    if not isinstance(data, dict):
+        return False, "Novelty validator returned a non-object JSON payload."
+    verdict = data.get("is_novel", False)
+    if isinstance(verdict, str):  # bool("false") is True, so textual flags are parsed explicitly
+        verdict = verdict.strip().lower() in {"true", "yes", "1"}
+    return bool(verdict), str(data.get("reasoning", "")).strip()
diff --git a/backend/autonomous/core/proof_verification_stage.py b/backend/autonomous/core/proof_verification_stage.py
new file mode 100644
index 0000000..5c9f90c
--- /dev/null
+++ b/backend/autonomous/core/proof_verification_stage.py
@@ -0,0 +1,997 @@
+"""
+Orchestrates proof identification, Lean 4 attempts, retry handling, and novelty checks.
+"""
+from __future__ import annotations
+
+import asyncio
+import logging
+import re
+import time
+from dataclasses import dataclass, field
+from typing import Any, Awaitable, Callable, Optional
+
+from backend.autonomous.agents.lemma_search_agent import MathlibLemmaSearchAgent
+from backend.autonomous.agents.proof_formalization_agent import ProofFormalizationAgent
+from backend.autonomous.agents.proof_identification_agent import ProofIdentificationAgent
+from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
+from backend.autonomous.memory.paper_library import paper_library
+from backend.shared.config import system_config
+from backend.shared.models import ProofAttemptFeedback, ProofAttemptResult, ProofCandidate, ProofRecord, ProofStageResult, SmtHint
+from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.smt_client import get_smt_client
+from .proof_dependency_extractor import ProofDependencyExtractor
+
+logger = logging.getLogger(__name__)
+
+BroadcastFn = Optional[Callable[[str, dict[str, Any]], Awaitable[None]]]
+ShouldStopFn = Optional[Callable[[], bool]]
+
+
+@dataclass
+class _LeanVerificationOutcome:
+    """Outcome of a single candidate's Lean 4 formalization pipeline (Phase A)."""
+    candidate: ProofCandidate  # the candidate this outcome was produced for
+    success: bool  # False when the pipeline was skipped; presumably True only once Lean accepted the proof - confirm
+    theorem_name: str  # "" when the pipeline was skipped because a stop was requested
+    lean_code: str  # "" when the pipeline was skipped because a stop was requested
+    attempts: list[ProofAttemptFeedback] = field(default_factory=list)  # fresh empty list per instance by default
+
+
+class ProofVerificationStage:
+    """Run the full proof-verification checkpoint pipeline."""
+
+    _active_sources: set[str] = set()
+    _active_sources_lock: Optional[asyncio.Lock] = None
+
+    def __init__(self) -> None:
+        self._novelty_task_sequence = 0  # per-instance counter embedded in novelty task ids by _assess_novelty
+        self._dependency_extractor = ProofDependencyExtractor()
+
+    @classmethod
+    def _get_active_sources_lock(cls) -> asyncio.Lock:
+        if cls._active_sources_lock is None:  # created lazily on first use, then reused
+            cls._active_sources_lock = asyncio.Lock()
+        return cls._active_sources_lock  # the lock taken around every access to _active_sources
+
+    @classmethod
+    def _source_key(cls, source_type: str, source_id: str) -> str:
+        return "{}:{}".format(source_type, source_id)  # registry key in "<type>:<id>" form
+
+    @classmethod
+    async def is_source_running(cls, source_type: str, source_id: str) -> bool:
+        async with cls._get_active_sources_lock():  # read the shared registry under the class-wide lock
+            return cls._source_key(source_type, source_id) in cls._active_sources
+
+    @classmethod
+    async def reserve_source(cls, source_type: str, source_id: str) -> None:
+        """Mark a source as in progress ahead of launching its background run."""
+        await cls._acquire_source(source_type=source_type, source_id=source_id)
+
+    @classmethod
+    async def release_source(cls, source_type: str, source_id: str) -> None:
+        """Clear the in-progress mark set by an earlier reservation."""
+        await cls._release_source(source_type=source_type, source_id=source_id)
+
+    @classmethod
+    async def _acquire_source(cls, source_type: str, source_id: str) -> None:
+        """Register a source as active; raise RuntimeError if it is already registered."""
+        async with cls._get_active_sources_lock():
+            if (key := cls._source_key(source_type, source_id)) in cls._active_sources:
+                raise RuntimeError(f"Proof verification already running for {source_type} {source_id}")
+            cls._active_sources.add(key)
+
+    @classmethod
+    async def _release_source(cls, source_type: str, source_id: str) -> None:
+        async with cls._get_active_sources_lock():
+            cls._active_sources.discard(cls._source_key(source_type, source_id))  # discard: no error if the key is absent
+
+    async def _broadcast(self, broadcast_fn: BroadcastFn, event: str, data: dict[str, Any]) -> None:
+        if broadcast_fn:  # BroadcastFn is Optional; a falsy callback means the event is silently dropped
+            await broadcast_fn(event, data)
+
+    @staticmethod
+    def _role_suffix(source_type: str, override: Optional[str] = None) -> str:
+        """Pick the role-id suffix: a truthy override wins, else "brainstorm" or "paper"."""
+        fallback = "brainstorm" if source_type == "brainstorm" else "paper"
+        return override or fallback
+
+    @staticmethod
+    def _summarize_error(error_text: str, limit: int = 500) -> str:
+        """Condense Lean output to ``limit`` characters, appending "..." when text was cut.
+
+        Placeholder-rejection banners (``sorry``/``admit`` style rejections from the
+        Lean 4 client) are only stripped, never whitespace-collapsed, so the model
+        sees the full rejection reason on retries. For everything else, each
+        ``: error:`` line plus the three lines after it is moved in front of the
+        remaining output (e.g. deprecation warnings) before whitespace is collapsed.
+        """
+
+        def _clip(text: str) -> str:
+            return text[:limit] + ("..." if len(text) > limit else "")
+
+        raw = error_text or ""
+        if not raw.strip():
+            return ""
+        if "PROOF REJECTED: PLACEHOLDER USED" in raw:
+            return _clip(raw.strip())
+
+        lines = raw.splitlines()
+        error_marker = re.compile(r":\s*error\s*:", re.IGNORECASE)
+
+        # Insertion-ordered set of line indices to surface first: every error line
+        # followed by its trailing context, each index recorded only once.
+        promoted: dict[int, None] = {}
+        for start, line in enumerate(lines):
+            if not error_marker.search(line):
+                continue
+            for position in range(start, min(len(lines), start + 4)):
+                promoted.setdefault(position)
+
+        if promoted:
+            # Remaining lines keep their original relative order after the promoted ones.
+            leftovers = [position for position in range(len(lines)) if position not in promoted]
+            raw = "\n".join(lines[position] for position in [*promoted, *leftovers])
+
+        cleaned = " ".join(raw.split())
+        return _clip(cleaned)
+
+    @staticmethod
+    def _extract_suggested_lemma_targets(error_text: str) -> list[str]:
+        """Return up to six distinct names Lean reported as unknown or unsynthesizable, without quotes."""
+        ident = r"[A-Za-z][A-Za-z0-9_'.]*"
+        targets: dict[str, None] = {}  # insertion-ordered set of captured names
+        for pattern in (  # quoted alternatives come first so the closing quote is not captured
+            rf"unknown (?:constant|identifier)\s+(?:'({ident})'|`({ident})`|['`]?({ident}))",
+            rf"failed to synthesize\s+({ident})",
+        ):
+            for match in re.finditer(pattern, error_text or "", flags=re.IGNORECASE):
+                targets.setdefault(next(filter(None, match.groups())))
+        return list(targets)[:6]
+
+    @staticmethod
+    def _is_smt_amenable(candidate: ProofCandidate) -> bool:
+        """Heuristic: lower-cased statement+sketch has an arithmetic marker and no blocked marker (substring tests)."""
+        structural_markers = (
+            "forall",
+            "for all",
+            "there exists",
+            "exists",
+            "∃",
+            "∀",
+            "set",
+            "finset",
+            "topological",
+            "continuous",
+            "measure",
+            "category",
+            "functor",
+            "matrix",
+            "module",
+            "vector",
+            "group",
+            "monoid",
+            "ring_hom",
+            "filter",
+        )
+        numeric_markers = (
+            "nat",
+            "int",
+            "real",
+            "integer",
+            "arithmetic",
+            "linear",
+            "inequal",
+            "=",
+            "<",
+            ">",
+            "≤",
+            "≥",
+            "+",
+            "-",
+            "*",
+        )
+        # Both fields are scanned together, case-insensitively.
+        haystack = f"{candidate.statement}\n{candidate.formal_sketch}".lower()
+        if not haystack.strip():
+            return False
+        # A single structural marker vetoes the candidate; otherwise one numeric marker suffices.
+        vetoed = any(marker in haystack for marker in structural_markers)
+        return not vetoed and any(marker in haystack for marker in numeric_markers)
+
+    @staticmethod
+    def _build_smt_tactic_suggestions(candidate: ProofCandidate) -> list[str]:
+        """Suggest Lean 4 tactics matching keywords in the candidate's statement and sketch.
+
+        Matching is a case-insensitive substring test. Suggestions keep a stable
+        order (integer, then linear-arithmetic, then decision tactics) without repeats.
+        """
+        text = f"{candidate.statement}\n{candidate.formal_sketch}".lower()
+        suggestions: list[str] = []
+        if any(token in text for token in ("nat", "int")):
+            suggestions += ["omega", "norm_num"]
+        if any(token in text for token in ("real", "linear", "inequal", "≤", "≥", "<", ">")):
+            suggestions += ["linarith", "polyrith"]
+        if "=" in text or "decidable" in text:
+            # Lean 4 spells the tactic `native_decide`; `nativeDecide` is not valid tactic syntax.
+            suggestions += ["native_decide", "decide"]
+        return list(dict.fromkeys(suggestions))
+
+    @staticmethod
+    def _first_attempt_used_smt_hint(
+        attempts: list[ProofAttemptFeedback],
+        smt_hint: Optional[SmtHint],
+    ) -> bool:
+        """Report whether a successful first attempt mentions any SMT-suggested tactic.
+
+        Only an "unsat" hint with non-empty suggestions can qualify; tactic names are
+        searched case-insensitively in the attempt's Lean code and tactic trace.
+        """
+        hint_usable = bool(smt_hint) and smt_hint.result == "unsat" and bool(smt_hint.suggested_tactics)
+        if not attempts or not hint_usable:
+            return False
+        opener = attempts[0]
+        if opener.attempt != 1 or not opener.success:
+            return False
+        trace_text = "\n".join(opener.tactic_trace or [])
+        searched = f"{opener.lean_code or ''}\n{trace_text}".lower()
+        return any(name.lower() in searched for name in smt_hint.suggested_tactics)
+
+    async def _run_smt_check(
+        self,
+        *,
+        user_prompt: str,
+        source_type: str,
+        source_id: str,
+        base_event: dict[str, Any],
+        candidate: ProofCandidate,
+        source_content: str,
+        identification_agent: ProofIdentificationAgent,
+        broadcast_fn: BroadcastFn,
+    ) -> Optional[SmtHint]:
+        """Run the optional SMT pre-check for one candidate; None means the check was skipped."""
+        if not system_config.smt_enabled or not self._is_smt_amenable(candidate):
+            return None
+        await self._broadcast(
+            broadcast_fn,
+            "smt_check_started",
+            {
+                **base_event,
+                "theorem_id": candidate.theorem_id,
+                "theorem_statement": candidate.statement,
+            },
+        )
+        # result_name is reported by the finally block, so it is seeded before the try.
+        started_at = time.monotonic()
+        result_name = "unknown"
+        try:
+            smtlib = await identification_agent.translate_candidate_to_smt(
+                user_research_prompt=user_prompt,
+                source_type=source_type,
+                theorem_candidate=candidate,
+                source_content=source_content,
+            )
+            if not smtlib:
+                return SmtHint(result="unknown", suggested_tactics=[], smtlib="")
+            # Any solver verdict other than sat/unsat/unknown is normalised to "unknown" below.
+            smt_result = await get_smt_client().check_smt2(
+                smtlib,
+                timeout=system_config.smt_timeout,
+            )
+            result_name = smt_result.result if smt_result.result in {"sat", "unsat", "unknown"} else "unknown"
+            suggestions = self._build_smt_tactic_suggestions(candidate) if result_name == "unsat" else []  # tactics only for unsat
+            return SmtHint(
+                result=result_name,
+                suggested_tactics=suggestions,
+                smtlib=smtlib,
+            )
+        except Exception as exc:  # best effort: a failed check degrades to an "unknown" hint
+            logger.debug("SMT check failed for theorem %s in %s %s: %s", candidate.theorem_id, source_type, source_id, exc)
+            return SmtHint(result="unknown", suggested_tactics=[], smtlib="")
+        finally:  # the completion event is emitted on every path out of the try, including returns
+            elapsed_ms = int((time.monotonic() - started_at) * 1000)
+            await self._broadcast(
+                broadcast_fn,
+                "smt_check_complete",
+                {
+                    **base_event,
+                    "theorem_id": candidate.theorem_id,
+                    "theorem_statement": candidate.statement,
+                    "result": result_name,
+                    "elapsed_ms": elapsed_ms,
+                },
+            )
+
+    async def _assess_novelty(
+        self,
+        *,
+        user_prompt: str,
+        theorem_statement: str,
+        lean_code: str,
+        validator_model: str,
+        validator_context: int,
+        validator_max_tokens: int,
+        existing_novel_proofs: str,
+    ) -> tuple[bool, str]:
+        """Delegate to the shared novelty helper under the next ``proof_novelty_NNN`` task id."""
+        from .proof_novelty import assess_proof_novelty
+
+        sequence_number = self._novelty_task_sequence
+        self._novelty_task_sequence = sequence_number + 1
+        return await assess_proof_novelty(
+            task_id=f"proof_novelty_{sequence_number:03d}",
+            role_id="autonomous_proof_novelty",
+            user_prompt=user_prompt,
+            theorem_statement=theorem_statement,
+            lean_code=lean_code,
+            validator_model=validator_model,
+            validator_context=validator_context,
+            validator_max_tokens=validator_max_tokens,
+            existing_novel_proofs=existing_novel_proofs,
+        )
+
+    async def _resolve_candidates(
+        self,
+        *,
+        theorem_candidates: Optional[list[ProofCandidate]],
+        identification_agent: ProofIdentificationAgent,
+        user_prompt: str,
+        source_type: str,
+        source_id: str,
+        content: str,
+    ) -> list[ProofCandidate]:
+        """Return caller-supplied candidates as-is (even an empty list); otherwise ask the agent."""
+        if theorem_candidates is None:
+            found_any, identified = await identification_agent.identify_candidates(
+                user_research_prompt=user_prompt,
+                source_type=source_type,
+                source_id=source_id,
+                source_content=content,
+            )
+            return identified if found_any else []
+        return theorem_candidates
+
+    async def _prepare_candidate(
+        self,
+        *,
+        user_prompt: str,
+        source_type: str,
+        theorem_candidate: ProofCandidate,
+        source_content: str,
+        lemma_search_agent: MathlibLemmaSearchAgent,
+    ) -> ProofCandidate:
+        """Return a copy of the candidate with a source excerpt and any suggested lemmas attached."""
+        excerpt = theorem_candidate.source_excerpt
+        if not excerpt:
+            excerpt = ProofFormalizationAgent._build_source_excerpt(theorem_candidate.statement, source_content)
+        prepared = theorem_candidate.model_copy(update={"source_excerpt": excerpt})
+        lemma_hints = await lemma_search_agent.suggest_relevant_lemmas(
+            user_research_prompt=user_prompt,
+            source_type=source_type,
+            theorem_candidate=prepared,
+            source_content=source_content,
+        )
+        if not lemma_hints:
+            return prepared
+        return prepared.model_copy(update={"relevant_lemmas": lemma_hints})
+
+    async def run(
+        self,
+        content: str,
+        source_type: str,
+        source_id: str,
+        user_prompt: str,
+        submitter_model: str,
+        submitter_context: int,
+        submitter_max_tokens: int,
+        validator_model: str,
+        validator_context: int,
+        validator_max_tokens: int,
+        broadcast_fn: BroadcastFn,
+        novel_proofs_db,
+        source_title: str = "",
+        theorem_candidates: Optional[list[ProofCandidate]] = None,
+        role_suffix_override: Optional[str] = None,
+        trigger: str = "automatic",
+        source_reserved: bool = False,
+        should_stop: ShouldStopFn = None,
+    ) -> ProofStageResult:
+        """Run proof identification, formalization, Lean 4 checking, and novelty review."""
+        result = ProofStageResult(source_type=source_type, source_id=source_id)
+        def _stop_requested() -> bool:
+            if should_stop is None:
+                return False
+            try:
+                return bool(should_stop())
+            except Exception:
+                return False
+        if not source_reserved:
+            await self._acquire_source(source_type, source_id)
+        try:
+            base_event = {
+                "source_type": source_type,
+                "source_id": source_id,
+                "source_title": source_title,
+                "trigger": trigger,
+            }
+            await self._broadcast(
+                broadcast_fn,
+                "proof_check_started",
+                base_event,
+            )
+
+            if not system_config.lean4_enabled:
+                await self._broadcast(
+                    broadcast_fn,
+                    "proof_check_complete",
+                    {
+                        **base_event,
+                        "novel_count": 0,
+                        "verified_count": 0,
+                        "total_candidates": 0,
+                        "message": "Lean 4 is disabled; proof verification was skipped.",
+                    },
+                )
+                return result
+
+            role_suffix = self._role_suffix(source_type, role_suffix_override)
+            identification_agent = ProofIdentificationAgent(
+                model_id=submitter_model,
+                context_window=submitter_context,
+                max_output_tokens=submitter_max_tokens,
+                role_id=f"autonomous_proof_identification_{role_suffix}",
+            )
+
+            resolved_candidates = await self._resolve_candidates(
+                theorem_candidates=theorem_candidates,
+                identification_agent=identification_agent,
+                user_prompt=user_prompt,
+                source_type=source_type,
+                source_id=source_id,
+                content=content,
+            )
+
+            if not resolved_candidates:
+                await self._broadcast(
+                    broadcast_fn,
+                    "proof_check_no_candidates",
+                    base_event,
+                )
+                await self._broadcast(
+                    broadcast_fn,
+                    "proof_check_complete",
+                    {
+                        **base_event,
+                        "novel_count": 0,
+                        "verified_count": 0,
+                        "total_candidates": 0,
+                    },
+                )
+                return result
+
+            if trigger == "retry":
+                await self._broadcast(
+                    broadcast_fn,
+                    "proof_retry_started",
+                    {
+                        **base_event,
+                        "count": len(resolved_candidates),
+                    },
+                )
+
+            result.total_candidates = len(resolved_candidates)
+            await self._broadcast(
+                broadcast_fn,
+                "proof_check_candidates_found",
+                {
+                    **base_event,
+                    "count": len(resolved_candidates),
+                    "theorems_preview": [candidate.statement[:180] for candidate in resolved_candidates],
+                },
+            )
+
+            max_parallel = max(1, int(getattr(system_config, "proof_max_parallel_candidates", 6) or 1))
+            semaphore = asyncio.Semaphore(max_parallel)
+
+            async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOutcome:
+                async with semaphore:
+                    if _stop_requested():
+                        return _LeanVerificationOutcome(
+                            candidate=theorem_candidate,
+                            success=False,
+                            theorem_name="",
+                            lean_code="",
+                            attempts=[],
+                        )
+                    return await self._run_lean_pipeline_for_candidate(
+                        theorem_candidate=theorem_candidate,
+                        base_event=base_event,
+                        user_prompt=user_prompt,
+                        source_type=source_type,
+                        source_id=source_id,
+                        source_content=content,
+                        submitter_model=submitter_model,
+                        submitter_context=submitter_context,
+                        submitter_max_tokens=submitter_max_tokens,
+                        role_suffix=role_suffix,
+                        trigger=trigger,
+                        novel_proofs_db=novel_proofs_db,
+                        broadcast_fn=broadcast_fn,
+                        should_stop=should_stop,
+                    )
+
+            verification_tasks = [
+                asyncio.create_task(run_phase_a(candidate))
+                for candidate in resolved_candidates
+            ]
+
+            pending_tasks = set(verification_tasks)
+            try:
+                for future in asyncio.as_completed(verification_tasks):
+                    if _stop_requested():
+                        logger.info(
+                            "Proof verification stopping early for %s %s (stop requested before next outcome).",
+                            source_type,
+                            source_id,
+                        )
+                        for task in pending_tasks:
+                            if not task.done():
+                                task.cancel()
+                        await asyncio.gather(*pending_tasks, return_exceptions=True)
+                        break
+                    try:
+                        outcome = await future
+                    except FreeModelExhaustedError:
+                        for task in pending_tasks:
+                            if not task.done():
+                                task.cancel()
+                        await asyncio.gather(*pending_tasks, return_exceptions=True)
+                        raise
+                    except asyncio.CancelledError:
+                        pending_tasks = {task for task in pending_tasks if not task.done()}
+                        continue
+                    except Exception as exc:
+                        # Any other per-candidate exception aborts the whole
+                        # parallel batch; the outer `except Exception` handler
+                        # will broadcast `proof_check_complete` with the error.
+                        logger.error(
+                            "Proof verification candidate task failed for %s %s: %s",
+                            source_type,
+                            source_id,
+                            exc,
+                        )
+                        for task in pending_tasks:
+                            if not task.done():
+                                task.cancel()
+                        await asyncio.gather(*pending_tasks, return_exceptions=True)
+                        raise
+
+                    pending_tasks = {task for task in pending_tasks if not task.done()}
+
+                    # Skip the expensive Phase B post-processing (novelty,
+                    # dependency extraction, DB writes) if the user has asked
+                    # us to stop. The outcome itself is dropped.
+                    if _stop_requested():
+                        logger.info(
+                            "Proof verification skipping phase B for %s %s (stop requested).",
+                            source_type,
+                            source_id,
+                        )
+                        for task in pending_tasks:
+                            if not task.done():
+                                task.cancel()
+                        await asyncio.gather(*pending_tasks, return_exceptions=True)
+                        break
+
+                    candidate = outcome.candidate
+                    attempts = outcome.attempts
+                    lean_code = outcome.lean_code
+
+                    if not outcome.success:
+                        error_summary = self._summarize_error(attempts[-1].error_output if attempts else "")
+                        suggested_targets = self._extract_suggested_lemma_targets(
+                            attempts[-1].error_output if attempts else ""
+                        )
+                        if source_type == "brainstorm" and trigger != "retry":
+                            await novel_proofs_db.record_failed_candidate(
+                                source_id,
+                                candidate,
+                                error_summary,
+                                suggested_lemma_targets=suggested_targets,
+                            )
+                        result.results.append(
+                            ProofAttemptResult(
+                                theorem_id=candidate.theorem_id,
+                                theorem_statement=candidate.statement,
+                                lean_code=lean_code,
+                                success=False,
+                                novel=False,
+                                attempts_used=len(attempts),
+                                error_summary=error_summary,
+                            )
+                        )
+                        continue
+
+                    result.verified_count += 1
+                    existing_novel_proofs = novel_proofs_db.get_novel_proofs_for_injection()
+                    is_novel, novelty_reasoning = await self._assess_novelty(
+                        user_prompt=user_prompt,
+                        theorem_statement=candidate.statement,
+                        lean_code=lean_code,
+                        validator_model=validator_model,
+                        validator_context=validator_context,
+                        validator_max_tokens=validator_max_tokens,
+                        existing_novel_proofs=existing_novel_proofs,
+                    )
+
+                    solver_hints = []
+                    if self._first_attempt_used_smt_hint(attempts, candidate.smt_hint):
+                        solver_hints.append("smt-z3")
+
+                    proof_record = ProofRecord(
+                        proof_id="",
+                        theorem_id=candidate.theorem_id,
+                        theorem_statement=candidate.statement,
+                        theorem_name=outcome.theorem_name,
+                        formal_sketch=candidate.formal_sketch,
+                        source_type=source_type,
+                        source_id=source_id,
+                        source_title=source_title,
+                        solver="Lean 4",
+                        lean_code=lean_code,
+                        novel=is_novel,
+                        novelty_reasoning=novelty_reasoning,
+                        verification_notes="Lean 4 accepted the submitted proof.",
+                        attempt_count=len(attempts),
+                        attempts=attempts,
+                        dependencies=[],
+                        solver_hints=solver_hints,
+                    )
+                    stored_record = await novel_proofs_db.add_proof(proof_record)
+
+                    # Dependency extraction runs in Phase B so later candidates
+                    # in the same paper can see earlier proofs. We instantiate
+                    # a scoped lemma search agent here (the Phase A agents are
+                    # already owned by their candidate tasks).
+                    dep_lemma_agent = MathlibLemmaSearchAgent(
+                        model_id=submitter_model,
+                        context_window=submitter_context,
+                        max_output_tokens=submitter_max_tokens,
+                        role_id=f"autonomous_proof_lemma_search_{role_suffix}_dep",
+                    )
+                    dependencies = []
+                    try:
+                        dependencies = await self._dependency_extractor.extract_dependencies(
+                            lean_code=lean_code,
+                            theorem_name=outcome.theorem_name,
+                            proof_database=novel_proofs_db,
+                            lemma_search_agent=dep_lemma_agent,
+                            relevant_lemmas=candidate.relevant_lemmas,
+                            current_proof_id=stored_record.proof_id,
+                        )
+                        if dependencies:
+                            updated_record = await novel_proofs_db.update_proof_dependencies(
+                                stored_record.proof_id,
+                                dependencies,
+                            )
+                            if updated_record is not None:
+                                stored_record = updated_record
+                            await self._broadcast(
+                                broadcast_fn,
+                                "proof_dependency_added",
+                                {
+                                    **base_event,
+                                    "proof_id": stored_record.proof_id,
+                                    "theorem_name": stored_record.theorem_name,
+                                    "dependencies": [
+                                        dependency.model_dump(mode="json")
+                                        for dependency in dependencies
+                                    ],
+                                },
+                            )
+                    except Exception as exc:
+                        logger.debug(
+                            "Dependency extraction failed for theorem %s: %s",
+                            candidate.theorem_id,
+                            exc,
+                        )
+
+                    if candidate.origin_source_id:
+                        await novel_proofs_db.mark_resolved_retry(
+                            candidate.origin_source_id,
+                            candidate.theorem_id,
+                            stored_record.proof_id,
+                        )
+
+                    if is_novel:
+                        result.novel_count += 1
+                        await self._broadcast(
+                            broadcast_fn,
+                            "novel_proof_discovered",
+                            {
+                                **base_event,
+                                "proof_id": stored_record.proof_id,
+                                "theorem_statement": stored_record.theorem_statement,
+                                "solver": "Lean 4",
+                                "retry_origin_source_id": candidate.origin_source_id,
+                            },
+                        )
+                    else:
+                        if source_type == "brainstorm":
+                            await brainstorm_memory.append_proofs_section(source_id, stored_record)
+                        elif ":" not in source_id:
+                            await paper_library.append_proofs_section(source_id, stored_record)
+
+                        await self._broadcast(
+                            broadcast_fn,
+                            "known_proof_verified",
+                            {
+                                **base_event,
+                                "proof_id": stored_record.proof_id,
+                                "theorem_statement": stored_record.theorem_statement,
+                                "retry_origin_source_id": candidate.origin_source_id,
+                            },
+                        )
+
+                    result.results.append(
+                        ProofAttemptResult(
+                            theorem_id=candidate.theorem_id,
+                            theorem_statement=candidate.statement,
+                            lean_code=lean_code,
+                            success=True,
+                            novel=is_novel,
+                            attempts_used=len(attempts),
+                            proof_id=stored_record.proof_id,
+                            error_summary="",
+                        )
+                    )
+            finally:
+                # Defensive cleanup: make sure we don't leak pending tasks if
+                # the consumer loop exits early for any reason.
+                leftover = [task for task in verification_tasks if not task.done()]
+                for task in leftover:
+                    task.cancel()
+                if leftover:
+                    await asyncio.gather(*leftover, return_exceptions=True)
+
+            await self._broadcast(
+                broadcast_fn,
+                "proof_check_complete",
+                {
+                    **base_event,
+                    "novel_count": result.novel_count,
+                    "verified_count": result.verified_count,
+                    "total_candidates": result.total_candidates,
+                },
+            )
+            return result
+        except FreeModelExhaustedError:
+            raise
+        except Exception as exc:
+            logger.error(
+                "Proof verification stage failed for %s %s: %s",
+                source_type,
+                source_id,
+                exc,
+            )
+            await self._broadcast(
+                broadcast_fn,
+                "proof_check_complete",
+                {
+                    "source_type": source_type,
+                    "source_id": source_id,
+                    "source_title": source_title,
+                    "trigger": trigger,
+                    "novel_count": result.novel_count,
+                    "verified_count": result.verified_count,
+                    "total_candidates": result.total_candidates,
+                    "message": str(exc),
+                },
+            )
+            return result
+        finally:
+            await self._release_source(source_type, source_id)
+
+    async def _run_lean_pipeline_for_candidate(
+        self,
+        *,
+        theorem_candidate: ProofCandidate,
+        base_event: dict[str, Any],
+        user_prompt: str,
+        source_type: str,
+        source_id: str,
+        source_content: str,
+        submitter_model: str,
+        submitter_context: int,
+        submitter_max_tokens: int,
+        role_suffix: str,
+        trigger: str,
+        novel_proofs_db,
+        broadcast_fn: BroadcastFn,
+        should_stop: ShouldStopFn = None,
+    ) -> _LeanVerificationOutcome:
+        """Phase A for one candidate: lemma prep, SMT hint, and Lean 4 attempts.
+
+        Fresh agents are built per call so concurrent candidates do not race on
+        shared ``task_sequence`` counters and all attempts for one candidate
+        keep one ``role_id``. Returns the prepared candidate, success flag,
+        theorem name, Lean code, and attempts as a ``_LeanVerificationOutcome``.
+        """
+        identification_agent = ProofIdentificationAgent(
+            model_id=submitter_model,
+            context_window=submitter_context,
+            max_output_tokens=submitter_max_tokens,
+            role_id=f"autonomous_proof_identification_{role_suffix}",
+        )
+        lemma_search_agent = MathlibLemmaSearchAgent(
+            model_id=submitter_model,
+            context_window=submitter_context,
+            max_output_tokens=submitter_max_tokens,
+            role_id=f"autonomous_proof_lemma_search_{role_suffix}",
+        )
+        formalization_agent = ProofFormalizationAgent(
+            model_id=submitter_model,
+            context_window=submitter_context,
+            max_output_tokens=submitter_max_tokens,
+            role_id=f"autonomous_proof_formalization_{role_suffix}",
+        )
+
+        candidate = await self._prepare_candidate(
+            user_prompt=user_prompt,
+            source_type=source_type,
+            theorem_candidate=theorem_candidate,
+            source_content=source_content,
+            lemma_search_agent=lemma_search_agent,
+        )
+        smt_hint = await self._run_smt_check(
+            user_prompt=user_prompt,
+            source_type=source_type,
+            source_id=source_id,
+            base_event=base_event,
+            candidate=candidate,
+            source_content=source_content,
+            identification_agent=identification_agent,
+            broadcast_fn=broadcast_fn,
+        )
+        if smt_hint:
+            candidate = candidate.model_copy(update={"smt_hint": smt_hint})  # copy with the hint attached
+        if trigger == "retry" and candidate.origin_source_id:
+            await novel_proofs_db.mark_retried(
+                candidate.origin_source_id,
+                candidate.theorem_id,
+                source_id,
+            )
+
+        async def on_attempt_started(
+            attempt_number: int,
+            strategy: str,
+            current_candidate=candidate,  # bound when the callback is defined
+        ) -> None:
+            await self._broadcast(
+                broadcast_fn,
+                "proof_attempt_started",
+                {
+                    **base_event,
+                    "theorem_id": current_candidate.theorem_id,
+                    "theorem_statement": current_candidate.statement,
+                    "attempt": attempt_number,
+                    "strategy": strategy,
+                    "retry_origin_source_id": current_candidate.origin_source_id,
+                },
+            )
+
+        async def on_attempt_feedback(feedback, current_candidate=candidate) -> None:
+            if feedback.success:
+                await self._broadcast(
+                    broadcast_fn,
+                    "proof_verified",
+                    {
+                        **base_event,
+                        "theorem_id": current_candidate.theorem_id,
+                        "theorem_statement": current_candidate.statement,
+                        "strategy": feedback.strategy,
+                        "retry_origin_source_id": current_candidate.origin_source_id,
+                    },
+                )
+            else:
+                await self._broadcast(
+                    broadcast_fn,
+                    "proof_attempt_failed",
+                    {
+                        **base_event,
+                        "theorem_id": current_candidate.theorem_id,
+                        "theorem_statement": current_candidate.statement,
+                        "attempt": feedback.attempt,
+                        "strategy": feedback.strategy,
+                        "error_summary": self._summarize_error(feedback.error_output),
+                        "retry_origin_source_id": current_candidate.origin_source_id,
+                    },
+                )
+
+        success, theorem_name, lean_code, attempts = await formalization_agent.prove_candidate(
+            user_research_prompt=user_prompt,
+            source_type=source_type,
+            theorem_candidate=candidate,
+            source_content=source_content,
+            max_attempts=3,  # first pass
+            attempt_callback=on_attempt_feedback,
+            attempt_start_callback=on_attempt_started,
+            smt_hint=candidate.smt_hint,
+            should_stop=should_stop,
+        )
+        if not success and not (should_stop and should_stop()):  # fall back to the tactic-script prover
+            tactic_success, tactic_theorem_name, lean_code, attempts = await formalization_agent.prove_candidate_tactic_script(
+                user_research_prompt=user_prompt,
+                source_type=source_type,
+                theorem_candidate=candidate,
+                source_content=source_content,
+                max_attempts=2,
+                attempt_callback=on_attempt_feedback,
+                attempt_start_callback=on_attempt_started,
+                prior_attempts=attempts,
+                starting_attempt_number=(attempts[-1].attempt + 1 if attempts else 4),  # continue attempt numbering
+                smt_hint=candidate.smt_hint,
+                should_stop=should_stop,
+            )
+            if tactic_theorem_name:  # keep the earlier name if the fallback returned none
+                theorem_name = tactic_theorem_name
+            success = tactic_success
+
+        if not success and not (should_stop and should_stop()):  # not reported when a stop was requested
+            await self._broadcast(
+                broadcast_fn,
+                "proof_attempts_exhausted",
+                {
+                    **base_event,
+                    "theorem_id": candidate.theorem_id,
+                    "theorem_statement": candidate.statement,
+                    "retry_origin_source_id": candidate.origin_source_id,
+                },
+            )
+
+        return _LeanVerificationOutcome(
+            candidate=candidate,
+            success=success,
+            theorem_name=theorem_name,
+            lean_code=lean_code,
+            attempts=attempts,
+        )
+
+    async def run_manual(
+        self,
+        *,
+        content: str,
+        source_type: str,
+        source_id: str,
+        user_prompt: str,
+        submitter_model: str,
+        submitter_context: int,
+        submitter_max_tokens: int,
+        validator_model: str,
+        validator_context: int,
+        validator_max_tokens: int,
+        broadcast_fn: BroadcastFn,
+        novel_proofs_db,
+        source_title: str = "",
+        source_reserved: bool = False,
+        should_stop: ShouldStopFn = None,
+    ) -> ProofStageResult:
+        """Run a user-triggered proof check: delegate to ``run`` with the manual trigger and role suffix."""
+        return await self.run(
+            content=content,
+            source_type=source_type,
+            source_id=source_id,
+            user_prompt=user_prompt,
+            submitter_model=submitter_model,
+            submitter_context=submitter_context,
+            submitter_max_tokens=submitter_max_tokens,
+            validator_model=validator_model,
+            validator_context=validator_context,
+            validator_max_tokens=validator_max_tokens,
+            broadcast_fn=broadcast_fn,
+            novel_proofs_db=novel_proofs_db,
+            source_title=source_title,
+            role_suffix_override=f"manual_{source_type}",  # manual suffix keyed by source type
+            trigger="manual",  # the only arguments not passed through from the caller are these two
+            source_reserved=source_reserved,
+            should_stop=should_stop,
+        )
diff --git a/backend/autonomous/memory/autonomous_api_logger.py b/backend/autonomous/memory/autonomous_api_logger.py
index 5fddc3a..723857a 100644
--- a/backend/autonomous/memory/autonomous_api_logger.py
+++ b/backend/autonomous/memory/autonomous_api_logger.py
@@ -10,6 +10,8 @@
 from typing import Dict, Any, List, Optional
 from pathlib import Path
 
+from backend.shared.config import system_config
+
 logger = logging.getLogger(__name__)
 
 
@@ -19,7 +21,6 @@ class AutonomousAPILogger:
     Stores logs in data/auto_api_log.txt with JSON entries.
     """
     
-    LOG_FILE = "backend/data/auto_api_log.txt"
     MAX_LOG_ENTRIES = 1000  # Maximum entries to keep in log
     
     _instance = None
@@ -41,11 +42,15 @@ def __init__(self):
     
     def _ensure_log_file(self) -> None:
         """Ensure the log file and directory exist."""
-        log_path = Path(self.LOG_FILE)
+        log_path = self._get_log_path()
         log_path.parent.mkdir(parents=True, exist_ok=True)
         
         if not log_path.exists():
             log_path.write_text("")
+
+    def _get_log_path(self) -> Path:
+        """Return the instance-scoped log path: ``auto_api_log.txt`` under ``system_config.data_dir``."""
+        return Path(system_config.data_dir) / "auto_api_log.txt"  # read from config on every call
     
     async def log_api_call(
         self,
@@ -97,7 +102,7 @@ async def log_api_call(
                 }
                 
                 # Append to log file
-                with open(self.LOG_FILE, "a", encoding="utf-8") as f:
+                with open(self._get_log_path(), "a", encoding="utf-8") as f:
                     f.write(json.dumps(log_entry) + "\n")
                 
                 logger.debug(f"Logged autonomous API call: task={task_id}, model={model}, success={success}, phase={phase}")
@@ -111,13 +116,13 @@ async def log_api_call(
     async def _trim_log_if_needed(self) -> None:
         """Trim log file if it exceeds MAX_LOG_ENTRIES."""
         try:
-            with open(self.LOG_FILE, "r", encoding="utf-8") as f:
+            with open(self._get_log_path(), "r", encoding="utf-8") as f:
                 lines = f.readlines()
             
             if len(lines) > self.MAX_LOG_ENTRIES:
                 # Keep only the most recent entries
                 lines = lines[-self.MAX_LOG_ENTRIES:]
-                with open(self.LOG_FILE, "w", encoding="utf-8") as f:
+                with open(self._get_log_path(), "w", encoding="utf-8") as f:
                     f.writelines(lines)
                 logger.debug(f"Trimmed autonomous API log to {self.MAX_LOG_ENTRIES} entries")
                 
@@ -136,10 +141,11 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
         """
         async with self._lock:
             try:
-                if not os.path.exists(self.LOG_FILE):
+                log_path = self._get_log_path()
+                if not os.path.exists(log_path):
                     return []
                 
-                with open(self.LOG_FILE, "r", encoding="utf-8") as f:
+                with open(log_path, "r", encoding="utf-8") as f:
                     lines = f.readlines()
                 
                 logs = []
@@ -164,7 +170,7 @@ async def clear_logs(self) -> None:
         """Clear all autonomous API logs."""
         async with self._lock:
             try:
-                with open(self.LOG_FILE, "w", encoding="utf-8") as f:
+                with open(self._get_log_path(), "w", encoding="utf-8") as f:
                     f.write("")
                 logger.info("Autonomous API logs cleared")
             except Exception as e:
diff --git a/backend/autonomous/memory/brainstorm_memory.py b/backend/autonomous/memory/brainstorm_memory.py
index 33584bf..0ad3cf1 100644
--- a/backend/autonomous/memory/brainstorm_memory.py
+++ b/backend/autonomous/memory/brainstorm_memory.py
@@ -5,6 +5,7 @@
 import asyncio
 import json
 import logging
+import re
 from pathlib import Path
 from typing import Optional, List, Dict, Any
 from datetime import datetime
@@ -259,6 +260,58 @@ async def get_database_content(self, topic_id: str) -> str:
         except Exception as e:
             logger.error(f"Failed to read brainstorm database {topic_id}: {e}")
             return ""
+
+    async def append_proofs_section(self, topic_id: str, proofs_data: Any) -> bool:
+        """Append verified proofs to the bottom of a brainstorm database.
+
+        ``proofs_data`` is one proof or a list; dicts are read by key and other
+        objects by attribute. Returns False if the file is missing or the append raises.
+        """
+        async with self._lock:
+            db_path = self._get_database_path(topic_id)
+            if not db_path.exists():
+                logger.error(f"Brainstorm database not found for proof append: {topic_id}")
+                return False
+
+            proofs = proofs_data if isinstance(proofs_data, list) else [proofs_data]
+            header = "=== PROOFS GENERATED FROM THIS BRAINSTORM (Lean 4 Verified) ==="
+
+            try:
+                async with aiofiles.open(db_path, "r", encoding="utf-8") as handle:
+                    existing_content = await handle.read()
+                after_header = existing_content.split(header, 1)[1] if header in existing_content else ""
+                next_index = len(re.findall(r"(?m)^Proof \d+:", after_header)) + 1
+
+                lines: List[str] = []
+                if header not in existing_content:
+                    lines.extend(["", "", header, ""])
+                elif not existing_content.endswith("\n"):
+                    lines.append("")
+
+                for proof in proofs:
+                    # An empty attribute must not fall through to ``.get``, which objects lack.
+                    get = proof.get if isinstance(proof, dict) else (lambda name: getattr(proof, name, None))
+                    theorem_statement = str(get("theorem_statement") or "").strip()
+                    proof_id = str(get("proof_id") or "").strip()
+                    lean_code = str(get("lean_code") or "").strip()
+                    status = "Verified (Novel)" if get("novel") else "Verified (Known)"
+                    lines.extend([
+                        f"Proof {next_index}: {theorem_statement}",
+                        f"Status: {status}",
+                        f"Proof ID: {proof_id or 'N/A'}",
+                        "Lean 4 Code:",
+                        lean_code or "[no Lean 4 code saved]",
+                        "---",
+                    ])
+                    next_index += 1
+
+                async with aiofiles.open(db_path, "a", encoding="utf-8") as handle:
+                    await handle.write("\n".join(lines) + "\n")
+                logger.info("Appended %s proof(s) to brainstorm %s", len(proofs), topic_id)
+                return True
+            except Exception as exc:
+                logger.error(f"Failed to append proofs to brainstorm {topic_id}: {exc}")
+                return False
     
     async def get_submissions_list(self, topic_id: str) -> List[Dict[str, Any]]:
         """Get list of submissions from a brainstorm database."""
diff --git a/backend/autonomous/memory/final_answer_memory.py b/backend/autonomous/memory/final_answer_memory.py
index b1ca815..44b827b 100644
--- a/backend/autonomous/memory/final_answer_memory.py
+++ b/backend/autonomous/memory/final_answer_memory.py
@@ -8,6 +8,7 @@
 import asyncio
 import json
 import logging
+import re
 from pathlib import Path
 from typing import Optional, List, Dict, Any
 from datetime import datetime
@@ -86,6 +87,86 @@ def resolve_answer_base_dir(answer_id: str) -> Optional[Path]:
             base_dir = session_dir / "final_answer"
 
         return base_dir if base_dir.exists() else None
+
+    @staticmethod
+    def _normalize_user_prompt(prompt: Any) -> str:
+        """Strip a prompt loaded from metadata; any non-string value becomes an empty string."""
+        return prompt.strip() if isinstance(prompt, str) else ""
+
+    @classmethod
+    def _derive_prompt_from_session_id(cls, session_id: str) -> str:
+        """Build a readable fallback prompt from the session ID slug; never returns an empty string."""
+        if session_id == "legacy":
+            return "Legacy research session"
+
+        prompt_slug = re.sub(r"_\d{4}-\d{2}-\d{2}_\d{2}-\d{2}$", "", session_id or "")  # drop trailing digit stamp (presumably a timestamp)
+        prompt = prompt_slug.replace("_", " ").strip()
+        if not prompt:
+            return "Unknown research question"
+
+        return prompt[0].upper() + prompt[1:]  # upper-case the first character only
+
+    @classmethod
+    def _select_user_prompt(cls, session_id: str, *candidates: Any) -> str:
+        """Return the first usable candidate prompt, else a prompt derived from the session ID."""
+        for candidate in candidates:
+            prompt = cls._normalize_user_prompt(candidate)
+            if prompt and prompt != "Unknown research question":  # skip blanks and the placeholder text
+                return prompt
+
+        return cls._derive_prompt_from_session_id(session_id)
+
+    @classmethod
+    async def _read_session_metadata_prompt(cls, session_id: str, base_dir: Optional[Path] = None) -> str:
+        """Read the prompt from session metadata (legacy or session-scoped), else derive it from the session ID."""
+        if session_id == "legacy":
+            metadata_path = Path(system_config.auto_research_metadata_file)
+        elif base_dir is not None:
+            metadata_path = base_dir.parent / "session_metadata.json"  # sibling of the answer's base dir
+        else:
+            try:
+                session_dir = resolve_path_within_root(
+                    Path(system_config.auto_sessions_base_dir),
+                    validate_single_path_component(session_id, "final answer ID"),
+                )
+            except ValueError:
+                return cls._derive_prompt_from_session_id(session_id)
+
+            metadata_path = session_dir / "session_metadata.json"
+
+        if not metadata_path.exists():
+            return cls._derive_prompt_from_session_id(session_id)
+
+        try:
+            async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
+                metadata = json.loads(await f.read())
+        except Exception as e:
+            logger.warning(f"Failed to read final answer prompt metadata for {session_id}: {e}")
+            return cls._derive_prompt_from_session_id(session_id)
+        if not isinstance(metadata, dict):  # valid JSON but not an object (null, list, ...)
+            return cls._derive_prompt_from_session_id(session_id)
+
+        return cls._select_user_prompt(
+            session_id, metadata.get("user_prompt"), metadata.get("user_research_prompt")
+        )
+
+    @classmethod
+    def _extract_user_prompt_from_state(
+        cls,
+        session_id: str,
+        state_data: Dict[str, Any],
+        session_metadata_prompt: str,
+    ) -> str:
+        """Resolve the display prompt from state data, then the metadata prompt, then the session-ID slug."""
+        model_usage = state_data.get("model_usage", {}) or {}  # "or {}" also covers an explicit null entry
+        cert_assess = state_data.get("certainty_assessment", {}) or {}
+
+        return cls._select_user_prompt(
+            session_id,
+            model_usage.get("user_prompt"),  # checked first
+            cert_assess.get("user_prompt"),
+            session_metadata_prompt,  # last candidate before the slug fallback
+        )
     
     def set_session_manager(self, session_manager) -> None:
         """Set session manager for session-based path resolution."""
@@ -583,7 +664,7 @@ def get_author_attribution_text(self) -> str:
             "=" * 80,
             "AUTONOMOUS AI SOLUTION",
             "",
-            "Disclaimer: This content is provided for informational and experimental purposes only. This paper was autonomously generated with the novelty-seeking MOTO harness without peer review or user oversight beyond the original prompt. It may contain incorrect, incomplete, misleading, or fabricated claims presented with high confidence. Use of this content is at your own risk. You are solely responsible for reviewing and independently verifying any output before relying on it, and the developers, operators, and contributors are not responsible for errors, omissions, decisions made from this content, or any resulting loss, damage, cost, or liability.",
+            "Disclaimer: This content is provided for informational purposes only. This paper was autonomously generated with the novelty-seeking MOTO harness without peer review or user oversight beyond the original prompt. It may contain incorrect, incomplete, misleading, or fabricated claims presented with high confidence. Use of this content is at your own risk. You are solely responsible for reviewing and independently verifying any output before relying on it, and the developers, operators, and contributors are not responsible for errors, omissions, decisions made from this content, or any resulting loss, damage, cost, or liability.",
             "",
             f"User's Research Prompt: {display_prompt}",
             "",
@@ -1355,12 +1436,12 @@ async def list_all_final_answers(self) -> List[Dict[str, Any]]:
                             title = state_data.get("short_form_title", "Untitled Paper")
                             chapter_count = 0
                         
-                        # Get user prompt from model_usage or certainty assessment
-                        model_usage = state_data.get("model_usage", {})
-                        user_prompt = model_usage.get("user_prompt", "")
-                        if not user_prompt:
-                            cert_assess = state_data.get("certainty_assessment", {})
-                            user_prompt = cert_assess.get("user_prompt", "Unknown research question")
+                        session_metadata_prompt = await self._read_session_metadata_prompt("legacy", legacy_dir)
+                        user_prompt = self._extract_user_prompt_from_state(
+                            "legacy",
+                            state_data,
+                            session_metadata_prompt,
+                        )
                         
                         certainty_level = state_data.get("certainty_assessment", {}).get("certainty_level", "unknown")
                         completion_date = state_data.get("timestamp", datetime.now().isoformat())
@@ -1431,12 +1512,15 @@ async def list_all_final_answers(self) -> List[Dict[str, Any]]:
                             title = state_data.get("short_form_title", "Untitled Paper")
                             chapter_count = 0
                         
-                        # Get user prompt
-                        model_usage = state_data.get("model_usage", {})
-                        user_prompt = model_usage.get("user_prompt", "")
-                        if not user_prompt:
-                            cert_assess = state_data.get("certainty_assessment", {})
-                            user_prompt = cert_assess.get("user_prompt", "Unknown research question")
+                        session_metadata_prompt = await self._read_session_metadata_prompt(
+                            session_folder.name,
+                            final_answer_dir,
+                        )
+                        user_prompt = self._extract_user_prompt_from_state(
+                            session_folder.name,
+                            state_data,
+                            session_metadata_prompt,
+                        )
                         
                         certainty_level = state_data.get("certainty_assessment", {}).get("certainty_level", "unknown")
                         completion_date = state_data.get("timestamp", datetime.now().isoformat())
@@ -1518,11 +1602,12 @@ async def get_final_answer_by_id(self, answer_id: str) -> Optional[Dict[str, Any
                 else:
                     full_content = ""
             
-            model_usage = state_data.get("model_usage", {})
-            user_prompt = model_usage.get("user_prompt", "")
-            if not user_prompt:
-                cert_assess = state_data.get("certainty_assessment", {})
-                user_prompt = cert_assess.get("user_prompt", "Unknown research question")
+            session_metadata_prompt = await self._read_session_metadata_prompt(answer_id, base_dir)
+            user_prompt = self._extract_user_prompt_from_state(
+                answer_id,
+                state_data,
+                session_metadata_prompt,
+            )
             
             certainty_level = state_data.get("certainty_assessment", {}).get("certainty_level", "unknown")
             completion_date = state_data.get("timestamp", datetime.now().isoformat())
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index b643b2c..e9a11be 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -117,6 +117,34 @@ def _build_scoped_library(base_dir: Path) -> "PaperLibrary":
         scoped_library._archive_dir = base_dir / "archive"
         return scoped_library
 
+    @staticmethod
+    def _normalize_history_prompt(prompt: Any) -> str:
+        """Return ``prompt`` without surrounding whitespace, or "" for any non-string value."""
+        return "" if not isinstance(prompt, str) else prompt.strip()
+
+    @classmethod
+    def _derive_history_prompt_from_session_id(cls, session_id: str) -> str:
+        """Turn a session folder name into a readable prompt for when no stored prompt is usable."""
+        if session_id == "legacy":
+            return "Legacy research session"
+
+        # Drop a trailing "_YYYY-MM-DD_HH-MM" stamp, then read underscores as word breaks.
+        slug = re.sub(r"_\d{4}-\d{2}-\d{2}_\d{2}-\d{2}$", "", session_id or "")
+        words = slug.replace("_", " ").strip()
+        if words:
+            return words[:1].upper() + words[1:]
+        return "Unknown research question"
+
+    @classmethod
+    def _resolve_history_prompt(cls, session_id: str, *candidates: Any) -> str:
+        """Return the first usable candidate prompt, else a prompt derived from the session id."""
+        normalized = (cls._normalize_history_prompt(value) for value in candidates)
+        # Blank values and the generic placeholder both count as "no prompt".
+        chosen = next((text for text in normalized if text and text != "Unknown research question"), None)
+        if chosen is not None:
+            return chosen
+        return cls._derive_history_prompt_from_session_id(session_id)
+
     def get_history_papers_dir(self, session_id: str) -> Optional[Path]:
         """Resolve the papers directory for a history session."""
         if session_id == "legacy":
@@ -141,29 +169,27 @@ async def _get_history_user_prompt(self, session_id: str) -> str:
         """Read the user prompt associated with a legacy or session-based paper history entry."""
         if session_id == "legacy":
             metadata_path = Path(system_config.auto_research_metadata_file)
-            default_prompt = "Legacy research session"
         else:
             papers_dir = self.get_history_papers_dir(session_id)
             if not papers_dir:
-                return "Unknown research question"
+                return self._derive_history_prompt_from_session_id(session_id)
 
             metadata_path = papers_dir.parent / "session_metadata.json"
-            default_prompt = "Unknown research question"
 
         if not metadata_path.exists():
-            return default_prompt
+            return self._derive_history_prompt_from_session_id(session_id)
 
         try:
             async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
                 metadata = json.loads(await f.read())
-            return (
-                metadata.get("user_prompt")
-                or metadata.get("user_research_prompt")
-                or default_prompt
+            return self._resolve_history_prompt(
+                session_id,
+                metadata.get("user_prompt"),
+                metadata.get("user_research_prompt"),
             )
         except Exception as e:
             logger.warning(f"Failed to read history prompt for session {session_id}: {e}")
-            return default_prompt
+            return self._derive_history_prompt_from_session_id(session_id)
 
     @staticmethod
     def _calculate_critique_average(critique: Any) -> Optional[float]:
@@ -381,6 +407,8 @@ async def _is_paper_complete(self, paper_id: str) -> bool:
                 r"##\s*Abstract",
                 r"#\s*Abstract",
                 r"\*\*Abstract\*\*",
+                r"\\(?:section|chapter)\*?\{Abstract\}",
+                r"\\begin\{abstract\}",
                 r"^Abstract\s*$"  # Abstract on its own line
             ]
             
@@ -399,6 +427,7 @@ async def _is_paper_complete(self, paper_id: str) -> bool:
                 r"##\s*Introduction",
                 r"#\s*Introduction",
                 r"\*\*Introduction\*\*",
+                r"\\(?:section|chapter)\*?\{(?:I\.?\s*)?Introduction\}",
                 r"^I\.\s*Introduction",
                 r"^Introduction\s*$"
             ]
@@ -418,6 +447,7 @@ async def _is_paper_complete(self, paper_id: str) -> bool:
                 r"##\s*Conclusion",
                 r"#\s*Conclusion",
                 r"\*\*Conclusion\*\*",
+                r"\\(?:section|chapter)\*?\{Conclusion\}",
                 r"^\w+\.\s*Conclusion",  # e.g., "V. Conclusion"
                 r"^Conclusion\s*$"
             ]
@@ -549,6 +579,58 @@ async def get_paper_content(self, paper_id: str) -> str:
         except Exception as e:
             logger.error(f"Failed to read paper {paper_id}: {e}")
             return ""
+
+    async def append_proofs_section(self, paper_id: str, proofs_data: Any) -> bool:
+        """Append proofs (one item or a list; dicts or attribute objects, None items skipped) to a saved paper; True on success."""
+        async with self._lock:
+            paper_path = self._get_paper_path(paper_id)
+            if not paper_path.exists():
+                logger.error(f"Paper not found for proof append: {paper_id}")
+                return False
+
+            proofs = [item for item in (proofs_data if isinstance(proofs_data, list) else [proofs_data]) if item is not None]
+            header = "=== PROOFS GENERATED FROM THIS PAPER (Lean 4 Verified) ==="
+
+            try:
+                async with aiofiles.open(paper_path, "r", encoding="utf-8") as handle:
+                    existing_content = await handle.read()
+                # Continue numbering after the "Proof N:" entries already listed under the header.
+                after_header = existing_content.split(header, 1)[1] if header in existing_content else ""
+                next_index = len(re.findall(r"(?m)^Proof \d+:", after_header)) + 1
+
+                lines: List[str] = []
+                if header not in existing_content:
+                    lines.extend(["", "", header, ""])
+                elif not existing_content.endswith("\n"):
+                    lines.append("")
+                # One accessor per item: chaining getattr(...) with proof.get(...) raised AttributeError for objects with an empty field.
+                for proof in proofs:
+                    fetch = proof.get if isinstance(proof, dict) else (lambda name, default: getattr(proof, name, default))
+                    theorem_statement = str(fetch("theorem_statement", "") or "").strip()
+                    proof_id = str(fetch("proof_id", "") or "").strip()
+                    lean_code = str(fetch("lean_code", "") or "").strip()
+                    status = "Verified (Novel)" if fetch("novel", False) else "Verified (Known)"
+
+                    lines.extend(
+                        [
+                            f"Proof {next_index}: {theorem_statement}",
+                            f"Status: {status}",
+                            f"Proof ID: {proof_id or 'N/A'}",
+                            "Lean 4 Code:",
+                            lean_code or "[no Lean 4 code saved]",
+                            "---",
+                        ]
+                    )
+                    next_index += 1
+
+                async with aiofiles.open(paper_path, "a", encoding="utf-8") as handle:
+                    await handle.write("\n".join(lines) + "\n")
+
+                logger.info("Appended %s proof(s) to paper %s", len(proofs), paper_id)
+                return True
+            except Exception as exc:
+                logger.error(f"Failed to append proofs to paper {paper_id}: {exc}")
+                return False
     
     async def get_abstract(self, paper_id: str) -> str:
         """Get paper abstract."""
diff --git a/backend/autonomous/memory/paper_model_tracker.py b/backend/autonomous/memory/paper_model_tracker.py
index bd331d0..d42fab2 100644
--- a/backend/autonomous/memory/paper_model_tracker.py
+++ b/backend/autonomous/memory/paper_model_tracker.py
@@ -177,7 +177,7 @@ def generate_author_attribution(
             "=" * 80,
             "AUTONOMOUS AI SOLUTION",
             "",
-            "Disclaimer: This content is provided for informational and experimental purposes only. "
+            "Disclaimer: This content is provided for informational purposes only. "
             "This paper was autonomously generated with the novelty-seeking MOTO harness without "
             "peer review or user oversight beyond the original prompt. It may contain incorrect, "
             "incomplete, misleading, or fabricated claims presented with high confidence. Use of "
diff --git a/backend/autonomous/memory/proof_database.py b/backend/autonomous/memory/proof_database.py
new file mode 100644
index 0000000..400ec1c
--- /dev/null
+++ b/backend/autonomous/memory/proof_database.py
@@ -0,0 +1,633 @@
+"""
+Proof database for Lean 4 verified results.
+
+Stores both novel and non-novel verified proofs centrally for UI/API access.
+Novel proofs are also formatted for highest-priority direct prompt injection.
+"""
+import asyncio
+import json
+import logging
+import shutil
+from datetime import datetime
+from pathlib import Path
+from typing import Dict, Any, List, Optional
+
+import aiofiles
+
+from backend.shared.config import system_config
+from backend.shared.models import FailedProofCandidate, ProofCandidate, ProofRecord
+from backend.shared.path_safety import validate_single_path_component
+from backend.autonomous.prompts.proof_prompts import format_failure_hints_for_injection
+
+logger = logging.getLogger(__name__)
+
+
+class ProofDatabase:
+    """
+    Session-aware storage for Lean 4 verified proofs.
+
+    Storage layout:
+      - proofs_index.json
+      - proof_<proof_id>.json
+      - proof_<proof_id>_lean.lean
+    """
+
+    def __init__(self) -> None:  # starts on the default "<data_dir>/proofs" location; nothing is read from disk here
+        self._lock = asyncio.Lock()  # held by the async methods that read or write proof files
+        self._base_dir = Path(system_config.data_dir) / "proofs"
+        self._session_manager = None
+        self._index_data: Optional[Dict[str, Any]] = None  # None means the index has not been loaded yet
+        self._mathlib_reverse_index: Dict[str, List[str]] = {}  # full Mathlib name -> proof ids
+        self._mathlib_reverse_short_index: Dict[str, List[str]] = {}  # last dotted name segment -> proof ids
+
+    def set_session_manager(self, session_manager) -> None:
+        """Use the active session's proofs directory, or the default one when no session is active."""
+        self._session_manager = session_manager
+        session_active = bool(session_manager) and session_manager.is_session_active
+        self._base_dir = (
+            session_manager.get_proofs_dir() if session_active else Path(system_config.data_dir) / "proofs"
+        )
+        self._index_data = None  # drop the cached index so it is reloaded from the new location
+        logger.info("Proof database using path: %s", self._base_dir)
+
+    def _safe_proof_id(self, proof_id: str) -> str:  # the id becomes part of a file name, so it goes through the path-component validator
+        return validate_single_path_component(proof_id, "proof ID")
+
+    def _get_index_path(self) -> Path:  # proofs_index.json inside the current base directory
+        return self._base_dir / "proofs_index.json"
+
+    def _get_record_path(self, proof_id: str) -> Path:  # JSON record file for one proof; the id is validated first
+        return self._base_dir / f"proof_{self._safe_proof_id(proof_id)}.json"
+
+    def _get_lean_path(self, proof_id: str) -> Path:  # Lean source file stored in the same directory as the JSON record
+        return self._base_dir / f"proof_{self._safe_proof_id(proof_id)}_lean.lean"
+
+    def _get_failed_dir(self) -> Path:  # "failed" subdirectory that holds the failed-candidate files
+        return self._base_dir / "failed"
+
+    def _get_failed_candidates_path(self, source_brainstorm_id: str) -> Path:  # one JSON file per brainstorm id
+        safe_id = validate_single_path_component(source_brainstorm_id, "brainstorm ID")
+        return self._get_failed_dir() / f"{safe_id}.json"
+
+    def _default_index(self) -> Dict[str, Any]:
+        """Return a new empty index: no proofs stored and the id counter at 1."""
+        # Built on every call so callers never share one "proofs" list.
+        empty_index: Dict[str, Any] = {"next_proof_id": 1, "proofs": []}
+        return empty_index
+
+    def _rebuild_reverse_indexes(self) -> None:
+        """Recompute the Mathlib-name -> proof-id lookups (full and short names) from the loaded index."""
+        by_full_name = self._mathlib_reverse_index = {}
+        by_short_name = self._mathlib_reverse_short_index = {}
+
+        entries = self._index_data.get("proofs", []) if self._index_data else []
+        for entry in entries:
+            # Entries without an id cannot be pointed at, so they are left out.
+            owner_id = str(entry.get("proof_id", "")).strip()
+            if not owner_id:
+                continue
+            for dep in entry.get("dependencies", []) or []:
+                # Only dict-shaped edges of kind "mathlib" are indexed.
+                if not isinstance(dep, dict) or dep.get("kind") != "mathlib":
+                    continue
+                full_name = str(dep.get("name", "")).strip()
+                if not full_name:
+                    continue
+                # The short key is the last dotted segment of the lemma name.
+                short_name = full_name.split(".")[-1]
+                for key, table in ((full_name, by_full_name), (short_name, by_short_name)):
+                    owners = table.setdefault(key, [])
+                    if owner_id not in owners:
+                        owners.append(owner_id)
+
+    async def initialize(self) -> None:
+        """Create the storage directories (re-reading the session path first) and load the index."""
+        manager = self._session_manager
+        if manager and manager.is_session_active:
+            self._base_dir = manager.get_proofs_dir()
+        for directory in (self._base_dir, self._get_failed_dir()):
+            directory.mkdir(parents=True, exist_ok=True)
+        await self._load_index()
+
+    async def _load_index(self) -> None:
+        """Load proofs_index.json into memory; a missing, unreadable or non-object index is replaced by a saved default."""
+        index_path = self._get_index_path()
+        if index_path.exists():
+            try:
+                async with aiofiles.open(index_path, "r", encoding="utf-8") as handle:
+                    self._index_data = json.loads(await handle.read())
+                if not isinstance(self._index_data, dict):  # e.g. a bare list would break the key access below
+                    raise ValueError(f"index must be a JSON object, got {type(self._index_data).__name__}")
+            except Exception as exc:
+                logger.error("Failed to load proofs index: %s", exc)
+                self._index_data = self._default_index()
+                await self._save_index()
+        else:
+            self._index_data = self._default_index()
+            await self._save_index()
+        self._index_data.setdefault("next_proof_id", len(self._index_data.get("proofs", [])) + 1)  # back-fill a missing key
+        self._index_data.setdefault("proofs", [])
+        self._rebuild_reverse_indexes()
+
+    def _ensure_index_loaded_sync(self) -> None:
+        """Blocking index load for synchronous callers; does nothing when the index is already in memory."""
+        if self._index_data is not None:
+            return
+        index_path = self._get_index_path()
+        self._base_dir.mkdir(parents=True, exist_ok=True)
+        self._index_data = self._default_index()  # kept as-is when the file is missing or unusable
+        if index_path.exists():
+            try:
+                loaded = json.loads(index_path.read_text(encoding="utf-8"))
+                if not isinstance(loaded, dict):  # e.g. a bare list has no .setdefault and would crash below
+                    raise ValueError(f"index must be a JSON object, got {type(loaded).__name__}")
+                self._index_data = loaded
+            except Exception as exc:
+                logger.error("Failed to synchronously load proofs index: %s", exc)
+        self._index_data.setdefault("next_proof_id", len(self._index_data.get("proofs", [])) + 1)
+        self._index_data.setdefault("proofs", [])
+        self._rebuild_reverse_indexes()
+
+    async def _save_index(self) -> None:  # overwrites proofs_index.json with the in-memory index
+        self._base_dir.mkdir(parents=True, exist_ok=True)  # the directory may not exist yet
+        async with aiofiles.open(self._get_index_path(), "w", encoding="utf-8") as handle:
+            await handle.write(json.dumps(self._index_data, indent=2))
+
+    @staticmethod
+    def _serialize_record(record: ProofRecord) -> Dict[str, Any]:  # dict form that gets written to the record file and the index
+        return record.model_dump(mode="json")
+
+    @staticmethod
+    def _deserialize_record(data: Dict[str, Any]) -> ProofRecord:  # the stored dict's keys are passed as constructor keywords
+        return ProofRecord(**data)
+
+    @staticmethod
+    def _serialize_failed_candidate(candidate: FailedProofCandidate) -> Dict[str, Any]:  # dict form stored under "items"
+        return candidate.model_dump(mode="json")
+
+    @staticmethod
+    def _deserialize_failed_candidate(data: Dict[str, Any]) -> FailedProofCandidate:  # rebuilds one stored "items" entry
+        return FailedProofCandidate(**data)
+
+    async def _load_failed_candidates(self, source_brainstorm_id: str) -> List[FailedProofCandidate]:
+        """Read the failed-candidate file for a brainstorm; a missing or unreadable file yields []."""
+        failed_path = self._get_failed_candidates_path(source_brainstorm_id)
+        if not failed_path.exists():
+            return []
+
+        try:
+            async with aiofiles.open(failed_path, "r", encoding="utf-8") as handle:
+                raw_text = await handle.read()
+            payload = json.loads(raw_text)
+            # A dict payload keeps its entries under "items"; anything else is iterated directly.
+            raw_items = payload if not isinstance(payload, dict) else payload.get("items", [])
+            loaded = [self._deserialize_failed_candidate(entry) for entry in raw_items if isinstance(entry, dict)]
+        except Exception as exc:
+            logger.error("Failed to load failed proof candidates for %s: %s", source_brainstorm_id, exc)
+            return []
+        return loaded
+
+    async def _save_failed_candidates(
+        self,
+        source_brainstorm_id: str,
+        failed_candidates: List[FailedProofCandidate],
+    ) -> None:
+        """Overwrite the brainstorm's failed-candidate file with the given list."""
+        self._get_failed_dir().mkdir(parents=True, exist_ok=True)
+        destination = self._get_failed_candidates_path(source_brainstorm_id)
+
+        # The brainstorm id is stored inside the file as well as in its name.
+        serialized_items = [
+            self._serialize_failed_candidate(entry) for entry in failed_candidates
+        ]
+        document = {"source_brainstorm_id": source_brainstorm_id, "items": serialized_items}
+        async with aiofiles.open(destination, "w", encoding="utf-8") as handle:
+            await handle.write(json.dumps(document, indent=2))
+
+    async def add_proof(self, record: ProofRecord) -> ProofRecord:
+        """Persist a proof (record JSON, Lean file, index entry) and return the stored copy; an empty proof_id gets the next free proof_NNN."""
+        async with self._lock:
+            if self._index_data is None:
+                await self._load_index()
+
+            known = self._index_data.get("proofs", [])
+            proof_id = record.proof_id
+            number = self._index_data.get("next_proof_id", 1)
+            if not proof_id:
+                # The counter can lag behind what is stored (explicit proof_NNN ids, or a reset index with
+                # old record files still on disk); never hand out an id that would overwrite a proof.
+                taken = {proof.get("proof_id") for proof in known}
+                while f"proof_{number:03d}" in taken or self._get_record_path(f"proof_{number:03d}").exists():
+                    number += 1
+                proof_id, number = f"proof_{number:03d}", number + 1
+            stored_record = record.model_copy(update={"proof_id": proof_id})
+            serialized = self._serialize_record(stored_record)
+
+            async with aiofiles.open(self._get_record_path(proof_id), "w", encoding="utf-8") as handle:
+                await handle.write(json.dumps(serialized, indent=2))
+            async with aiofiles.open(self._get_lean_path(proof_id), "w", encoding="utf-8") as handle:
+                await handle.write(stored_record.lean_code)
+
+            proofs = [proof for proof in known if proof.get("proof_id") != proof_id]  # a caller-supplied id replaces its old entry
+            proofs.append(serialized)
+            proofs.sort(key=lambda proof: proof.get("created_at", ""), reverse=True)
+            self._index_data["proofs"] = proofs
+            self._index_data["next_proof_id"] = max(number, len(proofs) + 1)
+            self._rebuild_reverse_indexes()
+            await self._save_index()
+
+            logger.info(
+                "Stored proof %s (%s, novel=%s) from %s %s",
+                proof_id, stored_record.theorem_statement[:80], stored_record.novel,
+                stored_record.source_type, stored_record.source_id,
+            )
+            return stored_record
+
+    async def record_failed_candidate(
+        self,
+        source_brainstorm_id: str,
+        theorem_candidate: ProofCandidate,
+        error_summary: str,
+        suggested_lemma_targets: Optional[List[str]] = None,
+    ) -> FailedProofCandidate:
+        """Create or refresh the failed-candidate entry for a theorem, save the file, and return the entry."""
+        async with self._lock:
+            failed_candidates = await self._load_failed_candidates(source_brainstorm_id)
+            # Reuse the entry already on file for this theorem, if any.
+            existing = next(
+                (entry for entry in failed_candidates if entry.theorem_id == theorem_candidate.theorem_id),
+                None,
+            )
+
+            now = datetime.now()
+            # Strip each target, drop blanks, and de-duplicate while keeping first-seen order.
+            stripped = (str(target or "").strip() for target in suggested_lemma_targets or [])
+            cleaned_targets = list(dict.fromkeys(text for text in stripped if text))
+
+            if not existing:
+                stored_candidate = FailedProofCandidate(
+                    source_brainstorm_id=source_brainstorm_id,
+                    theorem_id=theorem_candidate.theorem_id,
+                    theorem_statement=theorem_candidate.statement,
+                    formal_sketch=theorem_candidate.formal_sketch,
+                    source_excerpt=theorem_candidate.source_excerpt,
+                    error_summary=error_summary,
+                    suggested_lemma_targets=cleaned_targets,
+                    created_at=now,
+                    updated_at=now,
+                )
+                failed_candidates.append(stored_candidate)
+            else:
+                # Refresh in place; created_at and the retry bookkeeping are not assigned here.
+                existing.theorem_statement = theorem_candidate.statement
+                existing.formal_sketch = theorem_candidate.formal_sketch
+                existing.source_excerpt = theorem_candidate.source_excerpt
+                existing.error_summary = error_summary
+                if cleaned_targets:  # an empty list keeps the previously stored targets
+                    existing.suggested_lemma_targets = cleaned_targets
+                existing.updated_at = now
+                stored_candidate = existing
+
+            await self._save_failed_candidates(source_brainstorm_id, failed_candidates)
+            return stored_candidate
+
+    async def get_pending_retries(
+        self,
+        source_brainstorm_id: str,
+        retry_source_id: str = "",
+    ) -> List[FailedProofCandidate]:
+        """Return the unresolved failed candidates that may still be retried, newest update first."""
+        async with self._lock:
+            pending: List[FailedProofCandidate] = []
+            # Skip resolved entries and, when retry_source_id is given, entries last retried by it.
+            for entry in await self._load_failed_candidates(source_brainstorm_id):
+                already_tried_here = bool(retry_source_id) and entry.last_retry_source_id == retry_source_id
+                if entry.resolved_proof_id or already_tried_here:
+                    continue
+                pending.append(entry)
+            # Most recently updated candidates come first.
+            return sorted(pending, key=lambda entry: entry.updated_at, reverse=True)
+
+    async def mark_retried(
+        self,
+        source_brainstorm_id: str,
+        theorem_id: str,
+        retry_source_id: str,
+    ) -> None:
+        """Count one more retry of a failed candidate and remember which paper/source attempted it."""
+        async with self._lock:
+            failed_candidates = await self._load_failed_candidates(source_brainstorm_id)
+            target = next(
+                (entry for entry in failed_candidates if entry.theorem_id == theorem_id),
+                None,
+            )
+            if target is None:
+                return  # unknown theorem: nothing changed, so nothing is written
+
+            # Only the first entry with this theorem_id is updated.
+            target.retry_count += 1
+            target.last_retry_source_id = retry_source_id
+            target.updated_at = datetime.now()
+            await self._save_failed_candidates(source_brainstorm_id, failed_candidates)
+
+    async def mark_resolved_retry(
+        self,
+        source_brainstorm_id: str,
+        theorem_id: str,
+        proof_id: str,
+    ) -> None:
+        """Record that a failed candidate has since been proven, storing the id of the verified proof."""
+        async with self._lock:
+            failed_candidates = await self._load_failed_candidates(source_brainstorm_id)
+            target = next(
+                (entry for entry in failed_candidates if entry.theorem_id == theorem_id),
+                None,
+            )
+            if target is None:
+                return  # unknown theorem: nothing changed, so nothing is written
+
+            # A non-empty resolved_proof_id is what the retry and hint queries filter on.
+            target.resolved_proof_id = proof_id
+            target.updated_at = datetime.now()
+            await self._save_failed_candidates(source_brainstorm_id, failed_candidates)
+
+    async def get_recent_failure_hints(
+        self,
+        source_brainstorm_id: str,
+        *,
+        limit: int = 5,
+    ) -> List[FailedProofCandidate]:
+        """Return up to ``limit`` unresolved failed candidates, most recently updated first."""
+        async with self._lock:
+            stored = await self._load_failed_candidates(source_brainstorm_id)
+            unresolved = (entry for entry in stored if not entry.resolved_proof_id)
+            newest_first = sorted(unresolved, key=lambda entry: entry.updated_at, reverse=True)
+            return newest_first[:limit]
+
+    async def get_lean_code(self, proof_id: str) -> str:
+        """Return a proof's Lean source from its .lean file, else from the index entry, else ""."""
+        async with self._lock:
+            source_file = self._get_lean_path(proof_id)
+            if source_file.exists():
+                try:
+                    async with aiofiles.open(source_file, "r", encoding="utf-8") as handle:
+                        return await handle.read()
+                except Exception as exc:
+                    logger.error("Failed to read Lean file for %s: %s", proof_id, exc)
+
+            if self._index_data is None:
+                await self._load_index()
+            indexed = self._index_data.get("proofs", []) if self._index_data else []
+            fallback = next((entry for entry in indexed if entry.get("proof_id") == proof_id), None)
+            # Reached when the file is absent or could not be read.
+            return "" if fallback is None else str(fallback.get("lean_code", "") or "")
+
+    async def get_all_proofs(self, novel_only: Optional[bool] = None) -> List[ProofRecord]:
+        """Return every indexed proof; True/False keeps only records whose ``novel`` flag is that value."""
+        async with self._lock:
+            if self._index_data is None:
+                await self._load_index()
+
+            records = [
+                self._deserialize_record(entry) for entry in self._index_data.get("proofs", [])
+            ]
+            if novel_only is not None:
+                # Identity comparison: only a real True/False on the record matches.
+                records = [record for record in records if record.novel is novel_only]
+            return records
+
+    async def update_proof_dependencies(self, proof_id: str, dependencies) -> Optional[ProofRecord]:
+        """Replace a stored proof's dependency list in the index and record file; None if the id is unknown."""
+        async with self._lock:
+            if self._index_data is None:
+                await self._load_index()
+
+            updated_record: Optional[ProofRecord] = None
+            rewritten: List[Dict[str, Any]] = []
+
+            for entry in self._index_data.get("proofs", []):
+                if entry.get("proof_id") == proof_id:
+                    updated_record = self._deserialize_record(entry).model_copy(
+                        update={"dependencies": list(dependencies or [])}
+                    )
+                    entry = self._serialize_record(updated_record)
+                rewritten.append(entry)
+
+            if updated_record is None:
+                return None
+
+            self._index_data["proofs"] = rewritten
+            self._rebuild_reverse_indexes()
+
+            async with aiofiles.open(self._get_record_path(proof_id), "w", encoding="utf-8") as handle:
+                await handle.write(json.dumps(self._serialize_record(updated_record), indent=2))
+            await self._save_index()
+            return updated_record
+
+    async def get_dependencies(self, proof_id: str):
+        """Return a new list of one proof's dependency entries ([] when the proof is unknown)."""
+        record = await self.get_proof(proof_id)
+        if record is not None:
+            return list(record.dependencies or [])
+        return []
+
+    async def get_proofs_using_mathlib(self, name: str) -> List[ProofRecord]:
+        """Find proofs indexed under a Mathlib declaration name.
+
+        The full-name reverse index is consulted first; only when it yields
+        nothing is the last dotted component looked up in the short-name index.
+        Matches are returned in index order; a blank name returns [].
+        """
+        wanted = str(name or "").strip()
+        if not wanted:
+            return []
+
+        async with self._lock:
+            if self._index_data is None:
+                await self._load_index()
+
+            matched_ids = list(self._mathlib_reverse_index.get(wanted, []))
+            if not matched_ids:
+                tail = wanted.split(".")[-1]
+                matched_ids = list(self._mathlib_reverse_short_index.get(tail, []))
+
+            found: List[ProofRecord] = []
+            # Walk the index itself so results keep index order.
+            for entry in self._index_data.get("proofs", []):
+                entry_id = str(entry.get("proof_id", "")).strip()
+                if entry_id and entry_id in matched_ids:
+                    found.append(self._deserialize_record(entry))
+            return found
+
+    async def get_proofs_depending_on(self, proof_id: str) -> List[ProofRecord]:
+        """Return every proof with a direct "moto" dependency on ``proof_id``.
+
+        A proof matches when one of its dependency entries has kind "moto" and
+        a ``source_ref`` equal to ``proof_id``; indirect ancestry is not followed.
+        """
+        async with self._lock:
+            if self._index_data is None:
+                await self._load_index()
+
+            dependents: List[ProofRecord] = []
+            for entry in self._index_data.get("proofs", []):
+                record = self._deserialize_record(entry)
+                for edge in record.dependencies or []:
+                    if edge.kind == "moto" and edge.source_ref == proof_id:
+                        dependents.append(record)
+                        break
+            return dependents
+
+    async def get_graph(self) -> Dict[str, Any]:
+        """Return ``nodes``, ``edges_moto`` and ``edges_mathlib`` lists built from every indexed proof and its dependencies."""
+        async with self._lock:
+            if self._index_data is None:
+                await self._load_index()
+
+            proofs = [
+                self._deserialize_record(proof)
+                for proof in self._index_data.get("proofs", [])
+            ]
+
+        nodes = [  # assembled after the lock is released, from the records read above
+            {
+                "proof_id": proof.proof_id,
+                "theorem_name": proof.theorem_name,
+                "theorem_statement": proof.theorem_statement,
+                "source_type": proof.source_type,
+                "source_id": proof.source_id,
+                "source_title": proof.source_title,
+                "solver": proof.solver,
+                "is_novel": proof.novel,
+                "created_at": proof.created_at.isoformat() if proof.created_at else None,
+            }
+            for proof in proofs
+        ]
+
+        edges_moto: List[Dict[str, str]] = []
+        edges_mathlib: List[Dict[str, str]] = []
+        for proof in proofs:
+            for dependency in proof.dependencies or []:
+                if dependency.kind == "moto" and dependency.source_ref:  # moto edges need a target reference
+                    edges_moto.append(
+                        {
+                            "from": proof.proof_id,
+                            "to": dependency.source_ref,
+                            "name": dependency.name,
+                        }
+                    )
+                elif dependency.kind == "mathlib":  # any other dependency kind produces no edge
+                    edges_mathlib.append(
+                        {
+                            "from": proof.proof_id,
+                            "name": dependency.name,
+                            "source_ref": dependency.source_ref,
+                        }
+                    )
+
+        return {
+            "nodes": nodes,
+            "edges_moto": edges_moto,
+            "edges_mathlib": edges_mathlib,
+        }
+
+    async def get_proof(self, proof_id: str) -> Optional[ProofRecord]:
+        """Return one proof, read from its record file when present, else from the index; None when neither has it."""
+        async with self._lock:
+            record_path = self._get_record_path(proof_id)
+            if record_path.exists():
+                try:
+                    async with aiofiles.open(record_path, "r", encoding="utf-8") as handle:
+                        return self._deserialize_record(json.loads(await handle.read()))
+                except Exception as exc:
+                    logger.error("Failed to read proof %s: %s", proof_id, exc)  # logged, then the index lookup below is tried
+
+            if self._index_data is None:
+                await self._load_index()
+            for proof in self._index_data.get("proofs", []):
+                if proof.get("proof_id") == proof_id:
+                    return self._deserialize_record(proof)
+        return None
+
+    def count_proofs(self) -> Dict[str, int]:
+        """Tally indexed proofs as ``total``, ``novel`` (truthy flag) and ``known`` (the rest)."""
+        self._ensure_index_loaded_sync()
+        entries = self._index_data.get("proofs", []) if self._index_data else []
+        total = len(entries)
+        novel_total = len([entry for entry in entries if entry.get("novel")])
+        counts = {"total": total, "novel": novel_total}
+        # "known" is everything not flagged novel.
+        counts["known"] = total - novel_total
+        return counts
+
+    def get_novel_proofs_for_injection(self) -> str:
+        """Render every proof flagged novel as a text block for prompt injection.
+
+        Returns "" when the index holds no novel proof. A missing or null
+        ``theorem_statement`` / ``lean_code`` renders as "" instead of raising.
+        """
+        self._ensure_index_loaded_sync()
+        proofs = self._index_data.get("proofs", []) if self._index_data else []
+        novel_proofs = [proof for proof in proofs if proof.get("novel")]
+        if not novel_proofs:
+            return ""
+        lines = [
+            "=== VERIFIED NOVEL MATHEMATICAL PROOFS (Lean 4 Verified) ===",
+            "[These proofs have been formally verified. They represent proven mathematical truths.]",
+            "",
+        ]
+        for index, proof in enumerate(novel_proofs, start=1):
+            lines.extend([
+                f"PROOF {index}: {str(proof.get('theorem_statement') or '').strip()}",
+                f"Source: {proof.get('source_type', '')} {proof.get('source_id', '')}".strip(),
+                "Lean 4 Code:",
+                str(proof.get("lean_code") or "").strip(),
+                "---",
+            ])
+        lines.append("=== END VERIFIED PROOFS ===")
+        return "\n".join(lines)
+
+    def inject_into_prompt(self, prompt: str) -> str:
+        """Put the verified-proofs block ahead of ``prompt`` unless the block is empty or already present."""
+        header = "=== VERIFIED NOVEL MATHEMATICAL PROOFS (Lean 4 Verified) ==="
+        block = self.get_novel_proofs_for_injection()
+        if not block or header in prompt:
+            return prompt
+        if prompt:
+            return f"{block}\n\n{prompt}"
+        # Nothing to prepend to: the block alone becomes the prompt.
+        return block
+
+    async def inject_failure_hints_into_prompt(
+        self,
+        prompt: str,
+        source_brainstorm_id: str,
+        *,
+        limit: int = 5,
+    ) -> str:
+        """Prepend recent failed proof targets for ``source_brainstorm_id`` to ``prompt``; ``limit`` is passed to the hint lookup."""
+        if not source_brainstorm_id:
+            return prompt
+        # Checked before the lookup so an already-injected prompt costs no fetch.
+        if prompt and "=== OPEN LEMMA TARGETS LEAN 4 COULD NOT YET CLOSE ===" in prompt:
+            return prompt
+        hints = await self.get_recent_failure_hints(source_brainstorm_id, limit=limit)
+        hints_block = format_failure_hints_for_injection(hints)
+        if not hints_block:
+            return prompt
+        if not prompt:
+            return hints_block
+        return f"{hints_block}\n\n{prompt}"
+
+    async def clear_all(self) -> None:
+        """Delete the proof directory tree, recreate it empty, and save a fresh default index."""
+        async with self._lock:
+            if self._base_dir.exists():
+                shutil.rmtree(self._base_dir, ignore_errors=True)  # deletion errors are ignored, not raised
+            self._base_dir.mkdir(parents=True, exist_ok=True)
+            self._index_data = self._default_index()
+            self._rebuild_reverse_indexes()
+            await self._save_index()
+
+
+proof_database = ProofDatabase()  # module-level instance, created when this module is imported
diff --git a/backend/autonomous/memory/research_metadata.py b/backend/autonomous/memory/research_metadata.py
index c24a450..c3c6732 100644
--- a/backend/autonomous/memory/research_metadata.py
+++ b/backend/autonomous/memory/research_metadata.py
@@ -82,6 +82,11 @@ async def _ensure_initialized(self) -> None:
             if self._data is None:
                 self._data = {
                     "user_research_prompt": "",
+                    "base_user_research_prompt": "",
+                    "proof_framing_active": False,
+                    "proof_framing_context": "",
+                    "proof_framing_reasoning": "",
+                    "proof_runtime_config": {},
                     "brainstorms": [],
                     "papers": [],
                     "next_topic_id": 1,
@@ -114,10 +119,17 @@ async def initialize(self, user_research_prompt: str = "") -> None:
             if user_research_prompt and self._data.get("user_research_prompt") != user_research_prompt:
                 logger.info("User research prompt updated")
                 self._data["user_research_prompt"] = user_research_prompt
+                if not self._data.get("base_user_research_prompt"):
+                    self._data["base_user_research_prompt"] = user_research_prompt
                 await self._save_metadata()
         else:
             self._data = {
                 "user_research_prompt": user_research_prompt,
+                "base_user_research_prompt": user_research_prompt,
+                "proof_framing_active": False,
+                "proof_framing_context": "",
+                "proof_framing_reasoning": "",
+                "proof_runtime_config": {},
                 "brainstorms": [],
                 "papers": [],
                 "next_topic_id": 1,
@@ -149,6 +161,11 @@ async def _load_metadata(self) -> None:
             # This is OUTSIDE the async with block so we can safely save
             defaults = {
                 "user_research_prompt": "",
+                "base_user_research_prompt": "",
+                "proof_framing_active": False,
+                "proof_framing_context": "",
+                "proof_framing_reasoning": "",
+                "proof_runtime_config": {},
                 "brainstorms": [],
                 "papers": [],
                 "next_topic_id": 1,
@@ -165,6 +182,11 @@ async def _load_metadata(self) -> None:
             logger.error(f"Failed to load research metadata: {e}")
             self._data = {
                 "user_research_prompt": "",
+                "base_user_research_prompt": "",
+                "proof_framing_active": False,
+                "proof_framing_context": "",
+                "proof_framing_reasoning": "",
+                "proof_runtime_config": {},
                 "brainstorms": [],
                 "papers": [],
                 "next_topic_id": 1,
@@ -225,6 +247,10 @@ def _get_default_workflow_state(self) -> Dict[str, Any]:
             "current_paper_id": None,
             "current_paper_title": None,
             "paper_phase": None,  # "body", "conclusion", "introduction", "abstract"
+            "base_user_research_prompt": "",
+            "proof_framing_active": False,
+            "proof_framing_context": "",
+            "proof_framing_reasoning": "",
             "acceptance_count": 0,
             "rejection_count": 0,
             "consecutive_rejections": 0,
@@ -326,12 +352,47 @@ async def get_user_prompt(self) -> str:
         """Get the user's research prompt."""
         await self._ensure_initialized()
         return self._data.get("user_research_prompt", "")
+
+    async def get_base_user_prompt(self) -> str:
+        """Return the stored base prompt, falling back to the current research prompt (or "") when it is empty."""
+        await self._ensure_initialized()
+        return self._data.get("base_user_research_prompt") or self._data.get("user_research_prompt", "")
     
     async def set_user_prompt(self, prompt: str) -> None:
         """Set the user's research prompt."""
         async with self._lock:
             self._data["user_research_prompt"] = prompt
             await self._save_metadata()
+
+    async def set_proof_framing_state(
+        self,
+        *,
+        base_user_prompt: str,
+        effective_user_prompt: str,
+        active: bool,
+        context: str,
+        reasoning: str,
+    ) -> None:
+        """Store the base and effective prompts plus the framing flag, context and reasoning, then save metadata."""
+        async with self._lock:  # NOTE(review): writes self._data with no initialization check here — confirm callers initialize first
+            self._data["base_user_research_prompt"] = base_user_prompt
+            self._data["user_research_prompt"] = effective_user_prompt  # the effective prompt replaces the active research prompt
+            self._data["proof_framing_active"] = active
+            self._data["proof_framing_context"] = context
+            self._data["proof_framing_reasoning"] = reasoning
+            await self._save_metadata()
+
+    async def get_proof_runtime_config(self) -> Dict[str, Any]:
+        """Return the stored ``proof_runtime_config`` dict, or {} when the stored value is not a dict."""
+        await self._ensure_initialized()
+        value = self._data.get("proof_runtime_config")
+        return value if isinstance(value, dict) else {}  # the stored dict itself is returned, not a copy
+
+    async def set_proof_runtime_config(self, config: Dict[str, Any]) -> None:
+        """Store ``config`` as ``proof_runtime_config`` ({} when it is not a dict) and save metadata."""
+        async with self._lock:  # NOTE(review): writes self._data with no initialization check here — confirm callers initialize first
+            self._data["proof_runtime_config"] = config if isinstance(config, dict) else {}
+            await self._save_metadata()
     
     # ========================================================================
     # BRAINSTORM REGISTRATION
diff --git a/backend/autonomous/memory/session_manager.py b/backend/autonomous/memory/session_manager.py
index fa9be68..5b334b1 100644
--- a/backend/autonomous/memory/session_manager.py
+++ b/backend/autonomous/memory/session_manager.py
@@ -16,6 +16,7 @@
     resolve_path_within_root,
     validate_single_path_component,
 )
+from backend.shared.config import system_config
 
 logger = logging.getLogger(__name__)
 
@@ -32,6 +33,7 @@ class SessionManager:
         └── {sanitized_prompt}_{timestamp}/
             ├── brainstorms/
             ├── papers/
+            ├── proofs/
             ├── final_answer/
             └── session_metadata.json
     """
@@ -120,7 +122,7 @@ def _generate_session_id(self, prompt: str) -> str:
         timestamp = datetime.now().strftime("%Y-%m-%d_%H-%M")
         return f"{sanitized}_{timestamp}"
     
-    async def initialize(self, user_prompt: str, base_dir: str = "backend/data/auto_sessions") -> Path:
+    async def initialize(self, user_prompt: str, base_dir: Optional[str] = None) -> Path:
         """
         Initialize a new session for the given user prompt.
         
@@ -134,7 +136,7 @@ async def initialize(self, user_prompt: str, base_dir: str = "backend/data/auto_
             Path to the session folder
         """
         async with self._lock:
-            self._base_dir = Path(base_dir)
+            self._base_dir = Path(base_dir or system_config.auto_sessions_base_dir)
             self._user_prompt = user_prompt
             self._session_id = self._generate_session_id(user_prompt)
             self._session_path = self._base_dir / self._session_id
@@ -143,6 +145,7 @@ async def initialize(self, user_prompt: str, base_dir: str = "backend/data/auto_
             self._session_path.mkdir(parents=True, exist_ok=True)
             (self._session_path / "brainstorms").mkdir(exist_ok=True)
             (self._session_path / "papers").mkdir(exist_ok=True)
+            (self._session_path / "proofs").mkdir(exist_ok=True)
             (self._session_path / "final_answer").mkdir(exist_ok=True)
             
             # Save session metadata
@@ -162,7 +165,7 @@ async def initialize(self, user_prompt: str, base_dir: str = "backend/data/auto_
             
             return self._session_path
     
-    async def resume_session(self, session_id: str, base_dir: str = "backend/data/auto_sessions") -> Optional[Path]:
+    async def resume_session(self, session_id: str, base_dir: Optional[str] = None) -> Optional[Path]:
         """
         Resume an existing session by ID.
         
@@ -174,7 +177,7 @@ async def resume_session(self, session_id: str, base_dir: str = "backend/data/au
             Path to the session folder, or None if not found
         """
         async with self._lock:
-            self._base_dir = Path(base_dir)
+            self._base_dir = Path(base_dir or system_config.auto_sessions_base_dir)
             try:
                 safe_session_id = validate_single_path_component(session_id, "session ID")
                 self._session_path = resolve_path_within_root(self._base_dir, safe_session_id)
@@ -223,6 +226,10 @@ async def _update_metadata(self, updates: Dict[str, Any]) -> None:
         # Save
         async with aiofiles.open(metadata_path, 'w', encoding='utf-8') as f:
             await f.write(json.dumps(metadata, indent=2))
+
+    async def update_metadata(self, updates: Dict[str, Any]) -> None:
+        """Public entry point that forwards ``updates`` unchanged to ``_update_metadata``."""
+        await self._update_metadata(updates)
     
     def get_brainstorms_dir(self) -> Path:
         """Get brainstorms subdirectory for current session."""
@@ -235,6 +242,12 @@ def get_papers_dir(self) -> Path:
         if not self._session_path:
             raise RuntimeError("Session not initialized. Call initialize() first.")
         return self._session_path / "papers"
+
+    def get_proofs_dir(self) -> Path:
+        """Return the ``proofs`` subdirectory of the current session; raises RuntimeError when no session path is set."""
+        if not self._session_path:
+            raise RuntimeError("Session not initialized. Call initialize() first.")
+        return self._session_path / "proofs"
     
     def get_final_answer_dir(self) -> Path:
         """Get final_answer subdirectory for current session."""
@@ -264,7 +277,7 @@ async def clear(self) -> None:
             self._session_id = None
             logger.info("Session manager cleared")
     
-    async def find_interrupted_session(self, base_dir: str = "backend/data/auto_sessions") -> Optional[Dict[str, Any]]:
+    async def find_interrupted_session(self, base_dir: Optional[str] = None) -> Optional[Dict[str, Any]]:
         """
         Find the most recent RESUMABLE session in its workflow_state.
         
@@ -283,7 +296,7 @@ async def find_interrupted_session(self, base_dir: str = "backend/data/auto_sess
             Session info dict with session_id, path, user_prompt, workflow_state
             Or None if no resumable session found
         """
-        base_path = Path(base_dir)
+        base_path = Path(base_dir or system_config.auto_sessions_base_dir)
         
         if not base_path.exists():
             return None
@@ -300,7 +313,10 @@ async def find_interrupted_session(self, base_dir: str = "backend/data/auto_sess
                 
             try:
                 async with aiofiles.open(workflow_state_path, 'r', encoding='utf-8') as f:
-                    workflow_state = json.loads(await f.read())
+                    raw = await f.read()
+                if not raw.strip().strip('\x00'):
+                    continue  # Empty or null-padded file — skip silently
+                workflow_state = json.loads(raw)
                 
                 # Check if this session is resumable
                 # Resumable means: has a tier AND (has a topic OR has completed papers)
@@ -326,7 +342,7 @@ async def find_interrupted_session(self, base_dir: str = "backend/data/auto_sess
                         "was_running": workflow_state.get("is_running", False)
                     })
             except Exception as e:
-                logger.warning(f"Failed to read workflow state from {session_dir}: {e}")
+                logger.debug(f"Skipping unreadable workflow state in {session_dir.name}: {e}")
                 continue
         
         if not resumable_sessions:
@@ -341,14 +357,14 @@ async def find_interrupted_session(self, base_dir: str = "backend/data/auto_sess
         
         return most_recent
 
-    async def list_all_sessions(self, base_dir: str = "backend/data/auto_sessions") -> List[Dict[str, Any]]:
+    async def list_all_sessions(self, base_dir: Optional[str] = None) -> List[Dict[str, Any]]:
         """
         List all research sessions.
         
         Returns:
             List of session metadata dictionaries
         """
-        base_path = Path(base_dir)
+        base_path = Path(base_dir or system_config.auto_sessions_base_dir)
         sessions = []
         
         if not base_path.exists():
diff --git a/backend/autonomous/prompts/proof_prompts.py b/backend/autonomous/prompts/proof_prompts.py
new file mode 100644
index 0000000..bc57009
--- /dev/null
+++ b/backend/autonomous/prompts/proof_prompts.py
@@ -0,0 +1,515 @@
+"""
+Prompt builders for Lean 4 proof integration.
+"""
+from __future__ import annotations
+
+from typing import Iterable, Any
+
+from backend.shared.models import MathlibLemmaHint, ProofAttemptFeedback, SmtHint
+
+
+PROOF_FRAMING_CONTEXT = """[PROOF FRAMING CONTEXT -- This research prompt is amenable to formal mathematical proof.
+All submissions should work toward producing formally testable theorems where possible.
+The validator should additionally assess whether submissions contribute toward results
+that can be verified by the Lean 4 proof assistant. This framing does not exclude
+non-proof explorations but provides a directional objective.]"""  # NOTE(review): presumably attached to the user prompt when proof framing is active — confirm at the call site
+
+
+def _json_only_footer(example: str) -> str:
+    """Return the JSON-only response instruction followed by ``example`` as the expected format."""
+    instruction = "Respond with ONLY valid JSON. Do not use markdown fences. "
+    instruction += "Escape backslashes correctly for JSON.\n\n"
+    layout = f"JSON format:\n{example}"
+    return instruction + layout
+
+
+def _format_attempt_history(prior_attempts: Iterable[ProofAttemptFeedback]) -> str:
+    """Render prior proof attempts as a text log for the next prompt.
+
+    Returns "No prior attempts." for an empty/None input. Attempts whose Lean
+    feedback contains the placeholder-rejection marker get an extra warning.
+    """
+    history = list(prior_attempts or [])
+    if not history:
+        return "No prior attempts."
+
+    # Appended after any attempt that was rejected for using a placeholder.
+    placeholder_warning = (
+        "!! PLACEHOLDER REJECTION !! This prior attempt was rejected "
+        "because it used `sorry` / `admit` (or an equivalent placeholder). "
+        "Do NOT submit another placeholder proof. Either prove the goal "
+        "fully, or return a narrower lemma you can actually close."
+    )
+    rendered = []
+    for entry in history:
+        steps = [f"  - {step}" for step in (entry.tactic_trace or [])]
+        feedback = entry.error_output or "[no error output]"
+        rendered += [
+            f"ATTEMPT {entry.attempt}:",
+            f"Strategy: {entry.strategy}",
+            f"Reasoning: {entry.reasoning}",
+            "Lean 4 code:",
+            entry.lean_code or "[none]",
+            "Tactic trace:",
+            "\n".join(steps) or "[none]",
+            "Lean 4 feedback:",
+            feedback,
+            f"Goal states: {entry.goal_states or '[none]'}",
+        ]
+        if "PROOF REJECTED: PLACEHOLDER USED" in feedback:
+            rendered.append(placeholder_warning)
+        rendered.append("---")
+    return "\n".join(rendered)
+
+
+def _format_relevant_lemmas(relevant_lemmas: Iterable[MathlibLemmaHint]) -> str:
+    """Number each Mathlib lemma hint with its declaration and source location."""
+    hints = list(relevant_lemmas or [])
+    if not hints:
+        return "[No confirmed Mathlib lemmas identified.]"
+
+    rendered = []
+    for position, hint in enumerate(hints, start=1):
+        if hint.file_path and hint.line_number:
+            where = f"{hint.file_path}:{hint.line_number}"
+        else:
+            where = hint.file_path or "[path unavailable]"
+        rendered.append(f"{position}. {hint.full_name or hint.requested_name}")
+        rendered.append(f"   Declaration: {hint.declaration or '[declaration unavailable]'}")
+        rendered.append(f"   Source: {where}")
+    return "\n".join(rendered)
+
+
+def _truncate_text(value: str, limit: int) -> str:  # collapse whitespace runs, then cap at `limit` chars plus "..."
+    collapsed = " ".join((value or "").split())
+    return collapsed[:limit] + "..." if len(collapsed) > limit else collapsed[:limit]
+
+
+def _format_smt_hint(smt_hint: SmtHint | None) -> str:
+    """Summarize an SMT hint as two lines: the solver result and the suggested tactics."""
+    if not smt_hint:
+        return "[No SMT guidance available.]"
+
+    tactic_names = smt_hint.suggested_tactics or []
+    tactic_list = ", ".join(tactic_names)
+    if not tactic_list:
+        tactic_list = "[none]"
+    result_line = f"SMT result: {smt_hint.result}"
+    return f"{result_line}\nSuggested Lean tactics: {tactic_list}"
+
+
+LEAN4_COMMON_PITFALLS = """COMMON LEAN 4 PITFALLS TO AVOID:
+- NEVER use `sorry` or `admit` in the proof body. MOTO rejects any proof
+  that contains `sorry` or `admit` anywhere, even though Lean would only
+  emit a warning. A proof with `sorry` is not a proof. If you cannot close
+  every goal, return a narrower lemma that you CAN fully prove.
+- NEVER introduce new `axiom` declarations that exist only to make the
+  target theorem trivial. Axiomatizing the concepts in the statement
+  (e.g. `axiom Protocol : Type`, `axiom IC ... : ℝ`) and then proving the
+  theorem with `sorry` is a vacuous proof and will be rejected. If a notion
+  is not available, model it constructively or use concrete types from
+  Mathlib instead.
+- STOP writing tactics the instant all goals are closed. Appending ANY
+  tactic after the proof is already complete causes Lean to emit
+  `error: No goals to be solved`, which counts as a failed attempt. This
+  includes: an extra `rfl`, `trivial`, `simp`, `exact`, `decide`, `omega`,
+  `norm_num`, or a dangling bullet (`·` / `case _ =>`) after the previous
+  branch already finished. If a prior attempt failed with "no goals to be
+  solved", do NOT add more tactics -- DELETE the tactic at the reported
+  line/column (and any tactics after it) and resubmit.
+- Mathlib name collisions: Mathlib already defines names such as `Distribution`,
+  `Protocol`, `Relation`, `Graph`, `Set`, `Group`, `Module`, `Order`, and many
+  more. Do NOT redeclare these. If you need a local notion, use a unique prefix
+  (e.g., `MOTO_Distribution`, `MyDist`, or open a fresh `namespace`), or
+  introduce the object as a `variable` of abstract type.
+- Missing `Inhabited`/`Nonempty` instances: when you write `∃ x, ...` or use
+  tactics like `choose`, `Classical.choice`, or `Exists.intro` on a type with
+  no default inhabitant, Lean cannot synthesize the instance. Either assume
+  `[Inhabited α]` / `[Nonempty α]` in the theorem header, or construct an
+  explicit witness before closing the goal.
+- Deprecated tactics: do NOT use `push_neg` as a bare tactic in recent Mathlib.
+  Use `push_neg at h` on a hypothesis, or prefer `simp only [not_forall,
+  not_exists, not_and, not_or, not_not]` / `by_contra` with explicit rewrites.
+  Similarly, avoid legacy aliases like `finish`, `tauto!`, `show_term` in proof
+  output.
+- Tactic state hygiene: every branch must actually close its goal. Do not rely
+  on tactics that may leave unsolved goals (`cases`, `rcases`, `induction`)
+  without a closing tactic on each branch.
+- Import surface: `import Mathlib` is acceptable but slow; prefer narrower
+  imports (e.g., `import Mathlib.Data.Real.Basic`) when you know exactly what
+  is needed. When uncertain, fall back to `import Mathlib`."""  # NOTE(review): presumably embedded in proof-generation prompts — its use is outside this view
+
+
+def format_failure_hints_for_injection(failure_hints: Iterable[Any]) -> str:
+    """Render failed proof targets as a prompt block; "" when there are none.
+
+    Each hint may be a dict or an object exposing ``theorem_statement``,
+    ``error_summary`` and ``suggested_lemma_targets``. Statements are cut to
+    180 characters and summaries to 200 (plus an ellipsis) after whitespace
+    is collapsed.
+    """
+    pending = list(failure_hints or [])
+    if not pending:
+        return ""
+
+    def read_field(hint: Any, field: str, fallback: Any) -> Any:
+        # Dicts are read by key, everything else by attribute.
+        if isinstance(hint, dict):
+            return hint.get(field, fallback)
+        return getattr(hint, field, fallback)
+
+    # Extra guidance attached to hints that were rejected for placeholder use.
+    placeholder_note = (
+        "Note: the previous formalization attempt was rejected because "
+        "it used `sorry`/`admit` or axiomatized the theorem's concepts "
+        "to make the goal trivial. Prefer brainstorms that state a "
+        "narrower, concretely provable lemma instead of the full claim."
+    )
+
+    out = [
+        "=== OPEN LEMMA TARGETS LEAN 4 COULD NOT YET CLOSE ===",
+        "[These are recent proof attempts that failed. Prefer brainstorms that generate missing lemmas, stronger assumptions, or cleaner formal theorem statements.]",
+        "",
+    ]
+
+    for position, hint in enumerate(pending, start=1):
+        statement = str(read_field(hint, "theorem_statement", "")).strip()
+        summary = str(read_field(hint, "error_summary", "")).strip()
+        targets = [
+            str(target).strip()
+            for target in (read_field(hint, "suggested_lemma_targets", None) or [])
+            if str(target).strip()
+        ]
+        # Only the first six targets are listed.
+        shown_targets = ", ".join(targets[:6]) if targets else "[none identified]"
+        out.append(f"OPEN TARGET {position}: {_truncate_text(statement or '[unnamed theorem]', 180)}")
+        out.append(f"Lean 4 failure summary: {_truncate_text(summary or '[no summary available]', 200)}")
+        out.append(f"Suggested lemma targets: {shown_targets}")
+        if "PROOF REJECTED: PLACEHOLDER USED" in summary:
+            out.append(placeholder_note)
+        out.append("---")
+    out.append("=== END OPEN LEMMA TARGETS ===")
+    return "\n".join(out)
+
+
+def build_proof_framing_gate_prompt(user_prompt: str) -> str:
+    """Build the gate prompt asking for a JSON verdict on whether ``user_prompt`` should be framed toward formal proof."""
+    return f"""You are deciding whether a research program should be explicitly framed toward formal mathematical proof.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+Return TRUE only if the prompt is meaningfully served by working toward formally provable theorems in a proof assistant such as Lean 4.
+Return FALSE if the prompt is primarily empirical, engineering-focused, descriptive, or only tangentially mathematical.
+
+Consider:
+- Is the core task mathematical rather than experimental?
+- Are theorem statements or proof obligations likely to be central?
+- Would proof-oriented framing materially improve the research direction?
+
+{_json_only_footer('{"is_proof_amenable": true, "reasoning": "brief explanation"}')}
+"""
+
+
+def build_proof_identification_prompt(
+    user_prompt: str,
+    source_type: str,
+    source_id: str,
+    source_content: str,
+) -> str:
+    """Build the prompt asking for every complete, testable theorem candidate in ``source_content``, answered as JSON."""
+    example_json = """{
+  "has_provable_theorems": true,
+  "theorems": [
+    {
+      "theorem_id": "thm_1",
+      "statement": "natural-language theorem statement",
+      "formal_sketch": "optional note about assumptions, notation, or likely Lean formalization strategy"
+    }
+  ]
+}"""
+    return f"""You are a theorem-identification agent for MOTO. Lean 4 is available as an external proof checker.
+
+Your job is NOT to prove anything yet. Your job is only to decide whether the source below contains any COMPLETE, TESTABLE mathematical theorem statements that should be submitted to Lean 4.
+
+Rules:
+- Return FALSE if the content only contains conjectures, loose ideas, heuristics, empirical claims, or incomplete proof sketches.
+- Return TRUE only for theorem candidates that are stated clearly enough to attempt formalization now.
+- Include ALL viable candidate theorems, not just the best one.
+- Prefer exact theorem statements over vague summaries.
+- Use theorem IDs that are stable strings such as "thm_1", "thm_2", etc.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+SOURCE TYPE: {source_type}
+SOURCE ID: {source_id}
+
+SOURCE CONTENT:
+{source_content}
+
+{_json_only_footer(example_json)}
+"""
+
+
+def build_lemma_search_prompt(
+    user_prompt: str,
+    source_type: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    source_excerpt: str,
+) -> str:
+    """Return the prompt asking the model for existing Mathlib declaration names (`lemma_names`) useful for the target theorem; an empty `formal_sketch` renders as "[none]"."""
+    example_json = """{
+  "lemma_names": [
+    "Nat.add_comm",
+    "Nat.add_assoc"
+  ],
+  "reasoning": "brief explanation"
+}"""
+    return f"""You are a Mathlib-lemma suggestion agent for Lean 4 proof generation.
+
+Your job is to suggest EXISTING Mathlib declaration names that are likely useful for proving the target theorem.
+
+Rules:
+- Return 5-10 candidate lemma/theorem names when possible.
+- Prefer concrete declaration names over descriptions.
+- Use familiar Mathlib naming when possible (for example `Nat.add_comm`, `mul_assoc`, `Finset.card_union_add_card_inter`).
+- If the theorem is too vague or no good candidates are evident, return an empty list.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+SOURCE TYPE:
+{source_type}
+
+TARGET THEOREM:
+{theorem_statement}
+
+FORMALIZATION NOTES:
+{formal_sketch or "[none]"}
+
+SOURCE EXCERPT:
+{source_excerpt}
+
+{_json_only_footer(example_json)}
+"""
+
+
+def build_smt_translation_prompt(
+    user_prompt: str,
+    source_type: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    source_excerpt: str,
+) -> str:
+    """Return the prompt asking the model to encode the NEGATED theorem as SMT-LIB v2 for Z3 (`smtlib` field; empty string when no faithful translation exists)."""
+    example_json = """{
+  "smtlib": "(set-logic QF_LIA)\\n(declare-const n Int)\\n(assert (not (= (+ n 0) n)))\\n(check-sat)",
+  "reasoning": "Negate the target theorem so unsat means the theorem is valid."
+}"""
+    return f"""You are translating a mathematical theorem into an SMT-LIB v2 check for Z3.
+
+Your job is ONLY to build a conservative SMT-LIB program for a theorem that appears arithmetic or otherwise SMT-amenable.
+
+Rules:
+- Encode the NEGATION of the target theorem so that `unsat` means the theorem is valid.
+- Prefer quantifier-free arithmetic fragments when possible.
+- If the theorem is underspecified, only encode the part that is clearly justified by the theorem statement and notes.
+- Do not invent new assumptions that are not strongly implied by the theorem.
+- Return an empty `smtlib` string if you cannot produce a faithful SMT translation.
+- Use only SMT-LIB text in the `smtlib` field.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+SOURCE TYPE:
+{source_type}
+
+TARGET THEOREM:
+{theorem_statement}
+
+FORMALIZATION NOTES:
+{formal_sketch or "[none]"}
+
+SOURCE EXCERPT:
+{source_excerpt}
+
+{_json_only_footer(example_json)}
+"""
+
+
+def build_proof_formalization_prompt(
+    user_prompt: str,
+    source_type: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    source_excerpt: str,
+    prior_attempts: Iterable[ProofAttemptFeedback],
+    relevant_lemmas: Iterable[MathlibLemmaHint] = (),
+    smt_hint: SmtHint | None = None,
+) -> str:
+    """Return the full-code Lean 4 formalization prompt for one theorem, embedding formatted lemma hints, the SMT hint, LEAN4_COMMON_PITFALLS, and prior attempt history."""
+    attempt_history = _format_attempt_history(prior_attempts)
+    relevant_lemmas_block = _format_relevant_lemmas(relevant_lemmas)
+    smt_hint_block = _format_smt_hint(smt_hint)
+    example_json = """{
+  "theorem_name": "optional_lean_identifier",
+  "lean_code": "import Mathlib\\n\\n theorem ... := by ...",
+  "reasoning": "brief note about the formalization strategy"
+}"""
+    return f"""You are formalizing a mathematical theorem into Lean 4 code for MOTO.
+
+Lean 4 will immediately compile-check your output. If prior attempts failed, you must use the exact failure history to improve the next attempt.
+
+Requirements:
+- Output COMPLETE Lean 4 code, ready to run.
+- Include needed imports.
+- State assumptions explicitly.
+- Prefer correct, minimal, compilable code over stylistic elegance.
+- Your proof MUST close every goal without `sorry` or `admit`. Vacuous
+  proofs (e.g. axiomatizing the theorem's own concepts and then closing
+  with `sorry`) will be rejected even if Lean compiles them with only a
+  warning.
+- If the theorem seems invalid or underspecified, still make the strongest faithful formalization attempt you can from the provided source. If the full theorem cannot be proved, prove a narrower concrete lemma that is faithful to the source -- do NOT return a `sorry`-closed stub.
+- Do not describe the code; provide the actual Lean 4 code in JSON.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+SOURCE TYPE:
+{source_type}
+
+TARGET THEOREM:
+{theorem_statement}
+
+FORMALIZATION NOTES:
+{formal_sketch or "[none]"}
+
+SOURCE EXCERPT:
+{source_excerpt}
+
+RELEVANT MATHLIB LEMMAS:
+{relevant_lemmas_block}
+
+OPTIONAL SMT GUIDANCE:
+{smt_hint_block}
+
+If SMT guidance is present, treat it as a hint only. Lean 4 must still prove the theorem directly.
+If one of the suggested tactics is genuinely appropriate, you may use it. Do not force it when it does not fit the goal.
+
+{LEAN4_COMMON_PITFALLS}
+
+PRIOR ATTEMPT HISTORY:
+{attempt_history}
+
+{_json_only_footer(example_json)}
+"""
+
+
+def build_proof_tactic_script_prompt(
+    user_prompt: str,
+    source_type: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    source_excerpt: str,
+    prior_attempts: Iterable[ProofAttemptFeedback],
+    relevant_lemmas: Iterable[MathlibLemmaHint] = (),
+    smt_hint: SmtHint | None = None,
+) -> str:
+    """Return the Lean 4 prompt requesting a theorem header plus an ordered tactic list (no proof body) for one theorem, with the same hint/history blocks as the full-code prompt."""
+    attempt_history = _format_attempt_history(prior_attempts)
+    relevant_lemmas_block = _format_relevant_lemmas(relevant_lemmas)
+    smt_hint_block = _format_smt_hint(smt_hint)
+    example_json = """{
+  "theorem_name": "optional_lean_identifier",
+  "theorem_header": "theorem optional_lean_identifier (n : Nat) : n + 0 = n",
+  "tactics": [
+    {
+      "tactic": "simpa using Nat.add_zero n",
+      "reasoning": "Close the goal with the standard right-identity lemma."
+    }
+  ],
+  "reasoning": "brief note about the tactic strategy"
+}"""
+    return f"""You are formalizing a mathematical theorem into Lean 4 using a tactic-by-tactic proof sketch for MOTO.
+
+Lean 4 will immediately compile-check your output. If prior attempts failed, you must use the exact failure history to improve this attempt.
+
+Requirements:
+- Return a theorem header ONLY, without a proof body. Do not include `:= by` unless absolutely necessary.
+- Return a short, ordered list of tactics that can be appended under a `by` block.
+- Each tactic entry must include the Lean tactic string and one short reasoning note.
+- Prefer small, composable tactics over a single opaque script.
+- NEVER include `sorry` or `admit` in the tactic list. A script that uses
+  `sorry`/`admit` will be rejected even if Lean compiles it.
+- Include needed assumptions in the theorem header. Do NOT axiomatize the
+  concepts inside the theorem statement just to make the goal trivial.
+- If the theorem is underspecified, make the strongest faithful formalization attempt you can from the source. If you cannot close every goal, return a narrower concrete lemma instead of a `sorry`-closed stub.
+- Do not describe the code outside the JSON fields.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+SOURCE TYPE:
+{source_type}
+
+TARGET THEOREM:
+{theorem_statement}
+
+FORMALIZATION NOTES:
+{formal_sketch or "[none]"}
+
+SOURCE EXCERPT:
+{source_excerpt}
+
+RELEVANT MATHLIB LEMMAS:
+{relevant_lemmas_block}
+
+OPTIONAL SMT GUIDANCE:
+{smt_hint_block}
+
+If SMT guidance is present, treat it as a hint only. Lean 4 must still verify the theorem directly.
+Suggested tactics are optional and should only be used when they genuinely match the goal.
+
+{LEAN4_COMMON_PITFALLS}
+
+PRIOR ATTEMPT HISTORY:
+{attempt_history}
+
+{_json_only_footer(example_json)}
+"""
+
+
+def build_proof_novelty_prompt(
+    user_prompt: str,
+    theorem_statement: str,
+    lean_code: str,
+    existing_novel_proofs: str,
+) -> str:
+    """Return the novelty-only validator prompt for a Lean-verified theorem; an empty `existing_novel_proofs` is rendered as a fixed placeholder line."""
+    existing_proofs_block = existing_novel_proofs or "[No previously stored novel proofs.]"
+    return f"""This proof has been FORMALLY VERIFIED by Lean 4. It is mathematically valid.
+
+Your ONLY task: decide whether the verified result appears NOVEL in the context of this research program.
+
+Rules:
+- Do NOT re-check validity. Lean 4 already verified it.
+- Focus only on novelty/originality relative to known mathematics and the currently stored novel proofs.
+- If the theorem appears standard, classical, or already well known, mark it as not novel.
+- If you are uncertain, prefer FALSE unless there is a strong reason to believe the result is genuinely new.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+VERIFIED THEOREM:
+{theorem_statement}
+
+LEAN 4 CODE:
+{lean_code}
+
+EXISTING STORED NOVEL PROOFS:
+{existing_proofs_block}
+
+{_json_only_footer('{"is_novel": false, "reasoning": "brief explanation"}')}
+"""
diff --git a/backend/compiler/README.md b/backend/compiler/README.md
index cd34765..dc003b6 100644
--- a/backend/compiler/README.md
+++ b/backend/compiler/README.md
@@ -17,7 +17,7 @@ The compiler tool reads the aggregator's shared training database and systematic
   - **Outline Creation/Update**: High-context model creates and maintains paper structure
   - **Paper Construction**: High-context model writes paper sections following the outline
   - **Review/Cleanup**: High-context model reviews and fixes errors (without aggregator DB context)
-  - **Rigor Enhancement**: High-parameter model adds scientific rigor and precision
+  - **Rigor Mode (Lean 4)**: High-parameter model proposes one theorem per cycle, runs up to 5 Lean 4 formalization attempts with error-feedback chaining, persists the verified proof into the shared `proof_database`, and places it inline (2 placement attempts) or appends it to the Theorems Appendix on double rejection.
 - **Real-time Paper Viewing**: Live updates in the GUI as the paper is constructed
 - **Intelligent Placement Logic**: Automatically inserts content at the correct location based on placement context
 - **Separate GUI Tabs**: Compiler Interface, Settings, Logs, and Live Paper view
@@ -32,7 +32,7 @@ The compiler tool reads the aggregator's shared training database and systematic
 ### Agents
 
 - `high_context_submitter.py` - Low-parameter, high-context model (outline, construction, review)
-- `high_param_submitter.py` - High-parameter, low-context model (rigor enhancement)
+- `high_param_submitter.py` - High-parameter model. Rigor mode: discovery + 5x Lean 4 attempts + novelty classification + 2-attempt placement + Theorems Appendix fallback.
 
 ### Validation
 
@@ -54,11 +54,14 @@ The compiler uses two categories of hard-coded markers:
 - `[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]`
 - `[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS COMPLETE]`
 - `[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]`
+- `[HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]`
+- `[HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]`
 
 **Management:**
 - Added by `paper_memory.py` via `initialize_with_placeholders()`
 - Replaced by `paper_memory.replace_placeholder()` when sections are validated
-- Purpose: Make it crystal clear to AI what sections exist vs. don't exist
+- Theorems appendix bracket pair wraps the Lean-4-verified theorem entries that the rigor loop produces; new entries are appended via `paper_memory.append_to_theorems_appendix(...)`.
+- Purpose: Make it crystal clear to AI what sections exist vs. don't exist, and keep Lean-4-verified theorems in a dedicated, stable location.
 
 ### 2. Anchors (in paper and outline)
 
@@ -101,3 +104,8 @@ Default context window: 131072 tokens (configurable in GUI settings)
 
 The compiler continuously reads from the aggregator's shared training database (`backend/data/rag_shared_training.txt`) and re-RAGs every 10 new aggregator acceptances.
 
+## Tools Available to Submitters
+
+- **Wolfram Alpha (construction mode only)**: When `system_config.wolfram_alpha_enabled=true`, the high-context submitter may invoke the `wolfram_alpha_query` OpenAI-compatible tool up to 20 times per construction submission. See `WOLFRAM_TOOL_SCHEMA` in `high_context_submitter.py`. The audit trail is attached to `CompilerSubmission.metadata["wolfram_calls"]`. The tool is not available in `outline_create`, `outline_update`, `review`, or rigor mode.
+- **Lean 4 (rigor mode only)**: The rigor loop uses `ProofFormalizationAgent.prove_candidate(max_attempts=5)` from `backend/autonomous/agents/proof_formalization_agent.py` backed by the Lean 4 toolchain + Mathlib workspace. Verified proofs are persisted in the shared `proof_database` (same store used by autonomous mode). Novel proofs are automatically injected into the highest-priority direct-injection block on subsequent submitter instantiations.
+
diff --git a/backend/compiler/agents/high_context_submitter.py b/backend/compiler/agents/high_context_submitter.py
index 35ff23d..fa1cb0d 100644
--- a/backend/compiler/agents/high_context_submitter.py
+++ b/backend/compiler/agents/high_context_submitter.py
@@ -15,6 +15,7 @@
 from backend.shared.config import system_config, rag_config
 from backend.shared.utils import count_tokens
 from backend.shared.json_parser import parse_json
+from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.validation.json_validator import json_validator
 from backend.compiler.prompts.outline_prompts import (
     build_outline_create_prompt,
@@ -31,16 +32,80 @@
 from backend.compiler.memory.outline_memory import outline_memory
 from backend.compiler.memory.paper_memory import (
     paper_memory,
-    PAPER_ANCHOR,
     ABSTRACT_PLACEHOLDER,
     INTRO_PLACEHOLDER,
-    CONCLUSION_PLACEHOLDER
+    CONCLUSION_PLACEHOLDER,
 )
 from backend.compiler.core.compiler_rag_manager import compiler_rag_manager
 
 logger = logging.getLogger(__name__)
 
 
+# =============================================================================
+# WOLFRAM ALPHA TOOL (Phase 3)
+# =============================================================================
+# The main writer may invoke Wolfram Alpha as a real OpenAI-style tool during
+# construction mode, at most WOLFRAM_MAX_CALLS_PER_SUBMISSION times per
+# submission; the loop forces finalization once that budget is exhausted.
+# Callers attach the audit trail to `CompilerSubmission.metadata["wolfram_calls"]`.
+
+WOLFRAM_MAX_CALLS_PER_SUBMISSION = 20
+
+WOLFRAM_TOOL_SCHEMA: Dict[str, Any] = {
+    "type": "function",
+    "function": {
+        "name": "wolfram_alpha_query",
+        "description": (
+            "Query Wolfram Alpha to verify a mathematical or computational claim "
+            "before writing it into the paper. Use for: numerical verifications, "
+            "symbolic computations, well-known mathematical facts, unit "
+            "conversions, named-constant values. Do NOT use for open research "
+            "questions or narrative prose. You may call this tool up to "
+            f"{WOLFRAM_MAX_CALLS_PER_SUBMISSION} times per submission."
+        ),
+        "parameters": {
+            "type": "object",
+            "properties": {
+                "query": {
+                    "type": "string",
+                    "description": (
+                        "Natural-language Wolfram Alpha query, e.g. 'Is pi "
+                        "algebraic?', 'integral of x^2 from 0 to 1', "
+                        "'prime factorization of 360'."
+                    ),
+                },
+                "purpose": {
+                    "type": "string",
+                    "description": (
+                        "Brief note on how the result will be used in the paper "
+                        "(for audit trail)."
+                    ),
+                },
+            },
+            "required": ["query", "purpose"],
+        },
+    },
+}
+
+
+def _wolfram_tool_available() -> bool:
+    """Return True iff Wolfram Alpha is configured AND its client is live.
+
+    Registration of the tool with the LLM is gated on this so models never
+    see a callable tool when the backend cannot actually service it. Any
+    import or client-resolution failure is logged at DEBUG and yields False.
+    """
+    if not system_config.wolfram_alpha_enabled:
+        return False
+    try:
+        from backend.shared.wolfram_alpha_client import get_wolfram_client
+        return get_wolfram_client() is not None
+    except Exception:
+        # Missing module or client failure both mean "unavailable"; keep a trace.
+        logger.debug("Wolfram Alpha tool unavailable", exc_info=True)
+        return False
+
+
 def _normalize_string_field(value) -> str:
     """
     Normalize string field from LLM response.
@@ -68,7 +133,7 @@ def _normalize_string_field(value) -> str:
 
 def _strip_paper_markers_for_llm(paper_content: str) -> str:
     """
-    Remove only the end-of-paper anchor from paper before sending to LLM.
+    Prepare paper text before sending it to the LLM.
     
     The section placeholders are KEPT so the LLM can see and use them
     as exact old_string values for replacement operations.
@@ -81,14 +146,15 @@ def _strip_paper_markers_for_llm(paper_content: str) -> str:
     Args:
         paper_content: Full paper content with markers
     
+    The writer must see the same editable paper text that exact-match
+    validation checks. Keep placeholders and theorem appendix bracket markers
+    visible so old_string anchors can be copied verbatim from the real paper.
+
     Returns:
-        Paper content with end-of-paper anchor removed but placeholders intact
+        Paper content with all system markers intact
     """
-    # Remove only the paper anchor marker (end-of-paper boundary)
-    # Keep placeholders intact so LLM can use them as exact old_string values
-    result = paper_content.replace(PAPER_ANCHOR, "").strip()
-    
-    return result
+    # Keep markers intact so LLM can use them as exact old_string values.
+    return paper_content.strip()
 
 
 class HighContextSubmitter:
@@ -104,7 +170,7 @@ class HighContextSubmitter:
     
     def __init__(self, model_name: str, user_prompt: str, websocket_broadcaster: Optional[Callable] = None):
         self.model_name = model_name
-        self.user_prompt = user_prompt
+        self.user_prompt = proof_database.inject_into_prompt(user_prompt)
         self.websocket_broadcaster = websocket_broadcaster
         self._initialized = False
         
@@ -288,9 +354,9 @@ async def submit_outline_update(self) -> Optional[CompilerSubmission]:
             current_paper = await paper_memory.get_paper()
             logger.info(f"State loaded: outline={len(current_outline)} chars, paper={len(current_paper)} chars")
             
-            # Strip structural markers from paper for LLM (prevents anchor text mismatch)
+            # Show the same marker-bearing paper that validation/apply will match.
             paper_for_llm = _strip_paper_markers_for_llm(current_paper)
-            logger.info(f"Paper stripped: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers removed)")
+            logger.info(f"Paper prepared for LLM: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers preserved)")
             
             # Retrieve aggregator database evidence
             # Exclude outline and paper (both direct-injected in outline_update mode)
@@ -456,9 +522,9 @@ async def submit_construction(
             current_paper = await paper_memory.get_paper()
             logger.info(f"State loaded: outline={len(current_outline)} chars, paper={len(current_paper)} chars")
             
-            # Strip structural markers from paper for LLM (prevents anchor text mismatch)
+            # Show the same marker-bearing paper that validation/apply will match.
             paper_for_llm = _strip_paper_markers_for_llm(current_paper)
-            logger.info(f"Paper stripped: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers removed)")
+            logger.info(f"Paper prepared for LLM: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers preserved)")
             
             # Calculate RAG budget accounting for brainstorm content (prevents context overflow)
             max_allowed_tokens = rag_config.get_available_input_tokens(
@@ -580,28 +646,42 @@ async def submit_construction(
             if self.task_tracking_callback:
                 self.task_tracking_callback("started", task_id)
             
-            # Get completion via api_client_manager (handles boost and fallback)
+            # Get completion via api_client_manager with Wolfram tool-loop.
+            # Phase 3: the main writer may invoke Wolfram Alpha up to
+            # WOLFRAM_MAX_CALLS_PER_SUBMISSION times per submission. When
+            # Wolfram is disabled this helper degrades to a single-shot call.
             logger.info(f"Generating LLM completion via api_client_manager (task_id={task_id})...")
-            response = await api_client_manager.generate_completion(
-                task_id=task_id,
-                role_id=self.role_id,
-                model=self.model_name,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=0.0,  # Deterministic generation - evolving context provides diversity
-                max_tokens=system_config.compiler_high_context_max_output_tokens  # User-configurable (outline creation, update, construction, review)
+            try:
+                llm_output, wolfram_calls, _message = await self._generate_completion_with_wolfram_tool(
+                    task_id=task_id,
+                    initial_prompt=prompt,
+                )
+            except Exception as exc:
+                # Any tool-loop failure falls back to the plain single-shot
+                # path so construction still makes forward progress.
+                logger.warning(
+                    "Wolfram tool-loop failed (%s); falling back to single-shot construction call",
+                    exc,
+                )
+                fallback = await api_client_manager.generate_completion(
+                    task_id=f"{task_id}_fallback",
+                    role_id=self.role_id,
+                    model=self.model_name,
+                    messages=[{"role": "user", "content": prompt}],
+                    temperature=0.0,
+                    max_tokens=system_config.compiler_high_context_max_output_tokens,
+                )
+                if not fallback.get("choices") or not fallback["choices"][0].get("message"):
+                    logger.error("construction: LLM returned empty response structure")
+                    raise ValueError("LLM returned empty response")
+                fallback_msg = fallback["choices"][0]["message"]
+                llm_output = fallback_msg.get("content") or fallback_msg.get("reasoning") or ""
+                wolfram_calls = []
+            logger.info(
+                f"LLM completion received: {len(llm_output)} chars "
+                f"({len(wolfram_calls)} Wolfram tool call(s))"
             )
             
-            # Check for empty response
-            if not response.get("choices") or not response["choices"][0].get("message"):
-                logger.error("construction: LLM returned empty response structure")
-                raise ValueError("LLM returned empty response")
-            
-            # Extract content from either 'content' or 'reasoning' field
-            # Some reasoning models (e.g., DeepSeek R1, certain GPT variants) output JSON in 'reasoning' field
-            message = response["choices"][0]["message"]
-            llm_output = message.get("content") or message.get("reasoning") or ""
-            logger.info(f"LLM completion received: {len(llm_output)} chars")
-            
             # Check for empty content
             # Parse response with retry
             logger.info("Parsing JSON response...")
@@ -646,7 +726,12 @@ async def submit_construction(
                         new_string="",
                         reasoning=data.get("reasoning", "Section marked as complete"),
                         section_complete=True,
-                        metadata={"coverage": context_pack.coverage, "is_first": is_first_portion, "phase": section_phase}
+                        metadata={
+                            "coverage": context_pack.coverage,
+                            "is_first": is_first_portion,
+                            "phase": section_phase,
+                            "wolfram_calls": wolfram_calls,
+                        },
                     )
                     # Notify task completed successfully
                     if self.task_tracking_callback:
@@ -678,7 +763,12 @@ async def submit_construction(
                 new_string=new_string_content,  # Already normalized above
                 reasoning=data.get("reasoning", ""),
                 section_complete=section_complete,
-                metadata={"coverage": context_pack.coverage, "is_first": is_first_portion, "phase": section_phase}
+                metadata={
+                    "coverage": context_pack.coverage,
+                    "is_first": is_first_portion,
+                    "phase": section_phase,
+                    "wolfram_calls": wolfram_calls,
+                },
             )
             
             # Parse optional brainstorm retroactive operation
@@ -741,9 +831,9 @@ async def submit_review(self, review_focus: str = "general") -> Optional[Compile
             current_paper = await paper_memory.get_paper()
             logger.info(f"State loaded: outline={len(current_outline)} chars, paper={len(current_paper)} chars")
             
-            # Strip structural markers from paper for LLM (prevents anchor text mismatch)
+            # Show the same marker-bearing paper that validation/apply will match.
             paper_for_llm = _strip_paper_markers_for_llm(current_paper)
-            logger.info(f"Paper stripped: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers removed)")
+            logger.info(f"Paper prepared for LLM: {len(current_paper)} chars → {len(paper_for_llm)} chars (markers preserved)")
             
             # Build prompt (no RAG, just direct outline + paper content)
             # CRITICAL: Outline is ALWAYS fully injected per architectural rules
@@ -878,6 +968,230 @@ async def submit_review(self, review_focus: str = "general") -> Optional[Compile
                 self.task_tracking_callback("completed", task_id)
             return None  # Don't crash workflow on review failure
     
+    async def _generate_completion_with_wolfram_tool(
+        self,
+        *,
+        task_id: str,
+        initial_prompt: str,
+    ) -> tuple[str, List[Dict[str, Any]], Dict[str, Any]]:
+        """Run the construction LLM call with the Wolfram tool attached.
+
+        Returns (final_llm_text, wolfram_calls, raw_message_dict).
+
+        Behavior:
+        - If Wolfram is disabled / unavailable, behaves like a single-shot
+          `generate_completion` (preserves pre-Phase-3 behavior).
+        - Otherwise, registers WOLFRAM_TOOL_SCHEMA on the call and loops: on
+          any `tool_calls` in the assistant response, executes each via
+          `wolfram_client.query(...)`, appends a tool-role turn with the
+          result, and re-prompts the LLM. Up to 20 tool calls per submission.
+        - On budget exhaustion, injects a user-role reminder and re-calls
+          the LLM with tools disabled so it finalizes with whatever data
+          it has gathered.
+        - If the model never emits tool_calls (or the backend returns a
+          plain completion in one shot), this function behaves identically
+          to the single-shot path.
+
+        Websocket events:
+        - `compiler_wolfram_call` broadcast per call with query + preview.
+        """
+        wolfram_enabled = _wolfram_tool_available()
+
+        messages: List[Dict[str, Any]] = [{"role": "user", "content": initial_prompt}]
+        wolfram_calls: List[Dict[str, Any]] = []
+
+        # Get the Wolfram client once per submission so we don't repeatedly
+        # re-resolve the singleton. Only resolved when tool is enabled.
+        wolfram_client = None
+        if wolfram_enabled:
+            try:
+                from backend.shared.wolfram_alpha_client import get_wolfram_client
+                wolfram_client = get_wolfram_client()
+            except Exception as exc:
+                logger.warning(f"Wolfram client init failed; disabling tool for this call: {exc}")
+                wolfram_enabled = False
+
+        # Hard cap on total LLM turns in the loop. Each tool round is 1
+        # assistant turn + 1 user/tool turn; plus one finalization turn on
+        # budget exhaustion. This bound prevents runaway if the model just
+        # keeps calling tools.
+        max_loop_iterations = WOLFRAM_MAX_CALLS_PER_SUBMISSION + 3
+
+        for iteration in range(max_loop_iterations):
+            # Attach tools when the budget is not yet exhausted
+            tools_param = (
+                [WOLFRAM_TOOL_SCHEMA]
+                if wolfram_enabled and len(wolfram_calls) < WOLFRAM_MAX_CALLS_PER_SUBMISSION
+                else None
+            )
+
+            response = await api_client_manager.generate_completion(
+                task_id=task_id,
+                role_id=self.role_id,
+                model=self.model_name,
+                messages=messages,
+                temperature=0.0,
+                max_tokens=system_config.compiler_high_context_max_output_tokens,
+                tools=tools_param,
+            )
+
+            if not response.get("choices") or not response["choices"][0].get("message"):
+                raise ValueError("LLM returned empty response")
+            message = response["choices"][0]["message"]
+            tool_calls = message.get("tool_calls") or []
+
+            if not tool_calls:
+                # Final turn - extract content and return
+                content = message.get("content") or message.get("reasoning") or ""
+                return content, wolfram_calls, message
+
+            # Append assistant turn verbatim so tool-role replies have the
+            # right pairing ids.
+            assistant_turn: Dict[str, Any] = {
+                "role": "assistant",
+                "content": message.get("content") or "",
+                "tool_calls": tool_calls,
+            }
+            messages.append(assistant_turn)
+
+            # Execute each tool call and append tool-role replies.
+            for tool_call in tool_calls:
+                fn = tool_call.get("function") or {}
+                name = fn.get("name", "")
+                arguments_raw = fn.get("arguments") or "{}"
+                if name != "wolfram_alpha_query":
+                    # Unknown tool - return a structured error so the model
+                    # learns not to call it again, but don't hard-fail.
+                    messages.append({
+                        "role": "tool",
+                        "tool_call_id": tool_call.get("id", ""),
+                        "content": f"Tool '{name}' is not available; ignore.",
+                    })
+                    continue
+
+                if not wolfram_enabled or wolfram_client is None:
+                    messages.append({
+                        "role": "tool",
+                        "tool_call_id": tool_call.get("id", ""),
+                        "content": "Wolfram Alpha is not enabled; continue without external verification.",
+                    })
+                    continue
+
+                if len(wolfram_calls) >= WOLFRAM_MAX_CALLS_PER_SUBMISSION:
+                    messages.append({
+                        "role": "tool",
+                        "tool_call_id": tool_call.get("id", ""),
+                        "content": (
+                            f"Wolfram Alpha call budget exhausted "
+                            f"({WOLFRAM_MAX_CALLS_PER_SUBMISSION} calls used). "
+                            "Do not call this tool again; finalize your JSON response."
+                        ),
+                    })
+                    continue
+
+                try:
+                    args = json.loads(arguments_raw) if isinstance(arguments_raw, str) else dict(arguments_raw)
+                except Exception as exc:
+                    messages.append({
+                        "role": "tool",
+                        "tool_call_id": tool_call.get("id", ""),
+                        "content": f"Tool call arguments were not valid JSON ({exc}); re-issue the call with valid JSON.",
+                    })
+                    continue
+
+                query = str(args.get("query", "") or "").strip()
+                purpose = str(args.get("purpose", "") or "").strip()
+                if not query:
+                    messages.append({
+                        "role": "tool",
+                        "tool_call_id": tool_call.get("id", ""),
+                        "content": "Tool call missing 'query'; re-issue with a concrete query.",
+                    })
+                    continue
+
+                try:
+                    result_text = await wolfram_client.query(query)
+                except Exception as exc:
+                    logger.warning(f"Wolfram query raised: {exc}")
+                    result_text = None
+                result_text = result_text or "Wolfram Alpha returned no result."
+                wolfram_calls.append({
+                    "query": query,
+                    "purpose": purpose,
+                    "result": result_text,
+                })
+                logger.info(
+                    "Wolfram Alpha call %d/%d: %s",
+                    len(wolfram_calls),
+                    WOLFRAM_MAX_CALLS_PER_SUBMISSION,
+                    query[:120],
+                )
+                try:
+                    await self._broadcast_wolfram_event(
+                        task_id=task_id,
+                        query=query,
+                        purpose=purpose,
+                        result=result_text,
+                        calls_used=len(wolfram_calls),
+                    )
+                except Exception as exc:
+                    logger.debug(f"Wolfram websocket broadcast failed (non-fatal): {exc}")
+
+                messages.append({
+                    "role": "tool",
+                    "tool_call_id": tool_call.get("id", ""),
+                    "content": result_text,
+                })
+
+            # After exhausting the budget, inject a one-time reminder and
+            # let the next loop iteration run without tools so the model
+            # must finalize its JSON response.
+            if wolfram_enabled and len(wolfram_calls) >= WOLFRAM_MAX_CALLS_PER_SUBMISSION:
+                messages.append({
+                    "role": "user",
+                    "content": (
+                        f"You have used all {WOLFRAM_MAX_CALLS_PER_SUBMISSION} "
+                        "Wolfram Alpha calls for this submission. Finalize "
+                        "your JSON response now using the information you "
+                        "have gathered. Do not attempt further tool calls."
+                    ),
+                })
+
+        # Loop cap reached without a clean finalization - surface whatever
+        # text the last assistant turn produced, or empty string.
+        for turn in reversed(messages):
+            if turn.get("role") == "assistant" and turn.get("content"):
+                return str(turn["content"]), wolfram_calls, turn
+        return "", wolfram_calls, {}
+
+    async def _broadcast_wolfram_event(
+        self,
+        *,
+        task_id: str,
+        query: str,
+        purpose: str,
+        result: str,
+        calls_used: int,
+    ) -> None:
+        """Broadcast one compiler_wolfram_call websocket event."""
+        if not self.websocket_broadcaster:
+            return
+        try:
+            await self.websocket_broadcaster(
+                "compiler_wolfram_call",
+                {
+                    "task_id": task_id,
+                    "query": query,
+                    "purpose": purpose,
+                    "result_preview": (result or "")[:200],
+                    "calls_used": calls_used,
+                    "calls_remaining": max(0, WOLFRAM_MAX_CALLS_PER_SUBMISSION - calls_used),
+                    "max_calls": WOLFRAM_MAX_CALLS_PER_SUBMISSION,
+                },
+            )
+        except Exception as exc:
+            logger.debug(f"Wolfram broadcast failed: {exc}")
+
     async def _parse_json_response_with_retry(
         self, 
         response: str, 
diff --git a/backend/compiler/agents/high_param_submitter.py b/backend/compiler/agents/high_param_submitter.py
index 745cda8..3722798 100644
--- a/backend/compiler/agents/high_param_submitter.py
+++ b/backend/compiler/agents/high_param_submitter.py
@@ -1,44 +1,60 @@
 """
-High-parameter submitter agent for compiler.
-Handles rigor enhancement mode (2-step process).
+High-parameter submitter agent for the compiler's rigor loop.
+
+The rigor loop no longer rewrites paper text. Instead it runs a four-stage
+Lean-4-verified-theorem flow (see RIGOR_LEAN_BUILD_PLAN.md):
+
+    Stage 1 (discovery): pick a theorem worth formalizing using the full
+        writing context.
+    Stage 2 (formalization): hand the candidate to ProofFormalizationAgent
+        for up to 5 Lean 4 attempts with error-feedback chaining.
+    Stage 3 (novelty): classify the verified proof and persist it via
+        proof_database.add_proof.
+    Stage 4 (placement): propose an inline edit that introduces the
+        theorem with a "verified in Lean 4" marker and an appendix
+        reference. The coordinator owns the 2-attempt validator retry loop
+        and the appendix fallback.
+
+The Wolfram sub-mode that used to live here has been removed in Phase 2.
+Wolfram Alpha is now a tool available to HighContextSubmitter.submit_construction
+(see Phase 3 of the build plan).
 """
-import asyncio
+
+from __future__ import annotations
+
 import logging
 import uuid
-from datetime import datetime
-from typing import Optional, Dict, Any, List, Callable
+from dataclasses import dataclass, field
+from typing import Any, Awaitable, Callable, Dict, List, Optional
 
-from backend.shared.lm_studio_client import lm_studio_client
+from backend.autonomous.memory.proof_database import proof_database
+from backend.compiler.core.compiler_rag_manager import compiler_rag_manager
+from backend.compiler.memory.outline_memory import outline_memory
+from backend.compiler.memory.paper_memory import (
+    paper_memory,
+)
+from backend.compiler.prompts.rigor_prompts import (
+    build_rigor_placement_prompt,
+    build_rigor_theorem_discovery_prompt,
+)
 from backend.shared.api_client_manager import api_client_manager
-from backend.shared.models import CompilerSubmission
-from backend.shared.config import system_config, rag_config
+from backend.shared.config import rag_config, system_config
 from backend.shared.json_parser import parse_json
-from backend.aggregator.validation.json_validator import json_validator
-from backend.compiler.prompts.rigor_prompts import (
-    build_rigor_planning_prompt,
-    build_rigor_execution_prompt,
-    build_rigor_wolfram_execution_prompt
+from backend.shared.lm_studio_client import lm_studio_client
+from backend.shared.models import (
+    CompilerSubmission,
+    ProofAttemptFeedback,
+    ProofCandidate,
+    ProofRecord,
 )
-from backend.compiler.memory.outline_memory import outline_memory
-from backend.compiler.memory.paper_memory import paper_memory
-from backend.compiler.core.compiler_rag_manager import compiler_rag_manager
+from backend.shared.utils import count_tokens
 
 logger = logging.getLogger(__name__)
 
 
 def _normalize_string_field(value) -> str:
-    """
-    Normalize string field from LLM response.
-    Some LLMs incorrectly return strings as lists.
-    
-    Args:
-        value: Raw value from JSON (could be str, list, or other)
-    
-    Returns:
-        Normalized string value
-    """
+    """Normalize string field from LLM response (tolerates list-of-strings mistakes)."""
     if isinstance(value, list):
-        # LLM returned list - join into single string
         logger.warning(f"LLM returned field as list (length {len(value)}), converting to string")
         return " ".join(str(item) for item in value if item)
     elif isinstance(value, str):
@@ -46,755 +62,839 @@ def _normalize_string_field(value) -> str:
     elif value is None:
         return ""
     else:
-        # Fallback: convert to string
         logger.warning(f"LLM returned field as {type(value)}, converting to string")
         return str(value)
 
 
-class HighParamSubmitter:
+def _strip_paper_markers_for_llm(paper_content: str) -> str:
+    """Prepare paper text before handing it to the LLM.
+
+    The submitter must see the same editable paper text that exact-match
+    validation checks. Keep placeholders and theorem appendix bracket markers
+    visible so old_string anchors can be copied verbatim from the real paper.
+    """
+    if not paper_content:
+        return ""
+    return paper_content.strip()
+
+
+def format_theorem_appendix_entry(
+    *,
+    proof_id: str,
+    theorem_statement: str,
+    lean_code: str,
+    is_novel: bool,
+    theorem_name: str = "",
+    placement_outcome: str = "appendix_fallback",
+) -> str:
+    """Format a verified-theorem entry for the Theorems Appendix.
+
+    Used both when placement is inline (a short cross-reference stub) and
+    when placement fails and the full entry is the only record (appendix
+    fallback). Caller selects via `placement_outcome`.
+    """
+    header_name = theorem_name.strip() or proof_id
+    novelty_label = "Novel" if is_novel else "Known"
+    status_suffix = {
+        "appendix_fallback": "inline placement rejected; preserved here because Lean 4 verified the math",
+        "inline": "also placed inline in the body",
+    }.get(placement_outcome, placement_outcome)
+
+    lines = [
+        f"Theorem ({proof_id}) [{novelty_label}] - {header_name}",
+        f"Status: verified by Lean 4 ({status_suffix})",
+        f"Statement: {theorem_statement.strip()}",
+        "Lean 4 proof:",
+        lean_code.strip() or "[lean code unavailable]",
+        "---",
+    ]
+    return "\n".join(lines)
+
+
+@dataclass
+class RigorTheoremResult:
+    """Bundle returned from submit_rigor_lean_theorem on a verified proof.
+
+    The coordinator owns the 2-attempt validator loop and the appendix
+    fallback, so the submitter returns everything the coordinator needs to
+    drive retries without re-running discovery / formalization.
     """
-    High-parameter, low-context submitter for compiler.
-    
-    Mode:
-    - rigor: Enhance scientific rigor (2-step process)
-      Step 1: Planning (unvalidated)
-      Step 2: Execution (with self-refusal option)
+    proof_id: str
+    theorem_statement: str
+    theorem_name: str
+    lean_code: str
+    is_novel: bool
+    novelty_reasoning: str
+    attempts: List[ProofAttemptFeedback]
+    source_id: str
+    initial_placement_submission: Optional[CompilerSubmission] = None
+    # Retained for retry-prompt assembly
+    formal_sketch: str = ""
+    source_excerpt: str = ""
+    # Metadata pass-through
+    metadata: Dict[str, Any] = field(default_factory=dict)
+
+
+class HighParamSubmitter:
+    """High-parameter submitter for the compiler's rigor loop.
+
+    Drives the Lean-4-verified-theorem flow end-to-end: discovery -> 5 Lean
+    attempts -> novelty classification -> persist -> initial placement
+    submission. Placement retries are driven by `submit_rigor_placement_retry`
+    (called by the coordinator after a validator rejection).
     """
-    
-    def __init__(self, model_name: str, user_prompt: str, websocket_broadcaster: Optional[Callable] = None):
+
+    def __init__(
+        self,
+        model_name: str,
+        user_prompt: str,
+        websocket_broadcaster: Optional[Callable[[str, Dict[str, Any]], Awaitable[None]]] = None,
+    ):
         self.model_name = model_name
-        self.user_prompt = user_prompt
+        # NOTE: proof_database.inject_into_prompt prepends all novel proofs
+        # so later discovery calls naturally avoid re-proposing them.
+        self.user_prompt = proof_database.inject_into_prompt(user_prompt)
+        self.raw_user_prompt = user_prompt
         self.websocket_broadcaster = websocket_broadcaster
         self._initialized = False
-        
+        self._standalone_session_id = f"standalone_{uuid.uuid4().hex[:12]}"
+
         # Task tracking for workflow panel and boost integration
         self.task_sequence: int = 0
         self.role_id = "compiler_high_param"
-        self.task_tracking_callback: Optional[Callable] = None
-    
-    def set_task_tracking_callback(self, callback: Callable) -> None:
-        """Set callback for task tracking (workflow panel integration)."""
+        self.task_tracking_callback: Optional[Callable[[str, str], None]] = None
+
+        # Seeded from config here; initialize() re-reads the same settings.
+        self.context_window: int = system_config.compiler_high_param_context_window
+        self.max_output_tokens: int = system_config.compiler_high_param_max_output_tokens
+        self.available_input_tokens: int = rag_config.get_available_input_tokens(
+            self.context_window, self.max_output_tokens
+        )
+
+    # ------------------------------------------------------------------ setup
+
+    def set_task_tracking_callback(self, callback: Callable[[str, str], None]) -> None:
         self.task_tracking_callback = callback
-    
+
     def get_current_task_id(self) -> str:
-        """Get the task ID for the current/next API call."""
         return f"comp_hp_{self.task_sequence:03d}"
-    
+
     async def initialize(self) -> None:
-        """Initialize submitter."""
         if self._initialized:
             return
-        
-        # Set context window from system config
+
         self.context_window = system_config.compiler_high_param_context_window
         self.max_output_tokens = system_config.compiler_high_param_max_output_tokens
-        self.available_input_tokens = rag_config.get_available_input_tokens(self.context_window, self.max_output_tokens)
-        
+        self.available_input_tokens = rag_config.get_available_input_tokens(
+            self.context_window, self.max_output_tokens
+        )
+
         self._initialized = True
         logger.info(f"High-param submitter initialized with model: {self.model_name}")
-        logger.info(f"Context budget: {self.available_input_tokens} tokens (window: {self.context_window})")
-    
-    
-    async def submit_rigor_enhancement(self) -> Optional[CompilerSubmission]:
-        """
-        Submit rigor enhancement using 2-step process.
-        
-        Step 1: Planning (unvalidated) - decide if work needed and choose mode
-        Step 2: Execution (with self-refusal) - carry out the work
-        
-        Returns:
-            CompilerSubmission if enhancement made, None otherwise
-        """
-        logger.info("Starting rigor enhancement (Step 1: Planning)...")
-        
+        logger.info(
+            f"Context budget: {self.available_input_tokens} tokens "
+            f"(window: {self.context_window})"
+        )
+
+    # -------------------------------------------------------- broadcast helpers
+
+    async def _broadcast(self, event: str, data: Dict[str, Any]) -> None:
+        if not self.websocket_broadcaster:
+            return
         try:
-            # STEP 1: PLANNING
-            planning_result = await self._step1_planning()
-            
-            if planning_result is None:
-                logger.error("Step 1 planning failed (JSON parse error)")
-                return None
-            
-            if not planning_result.get("needs_rigor_work", False):
-                logger.info("Step 1: No rigor work needed (declined)")
-                return None
-            
-            mode = planning_result.get("mode")
-            target_section = planning_result.get("target_section", "")
-            wolfram_query = planning_result.get("wolfram_query", "")
-            
-            logger.info(f"Step 1 complete: mode={mode}, target_section_len={len(target_section)}")
-            
-            # STEP 2: EXECUTION (mode-specific)
-            if mode == "wolfram_verification":
-                return await self._step2_wolfram_execution(
-                    target_section,
-                    wolfram_query
-                )
-            else:  # standard_enhancement or rewrite_focus
-                return await self._step2_standard_execution(
-                    mode,
-                    target_section
-                )
-                
-        except Exception as e:
-            logger.error(f"Rigor enhancement failed: {e}", exc_info=True)
-            raise
-    
-    async def _step1_planning(self) -> Optional[dict]:
+            await self.websocket_broadcaster(event, data)
+        except Exception as exc:
+            logger.debug("Rigor broadcast failed (%s): %s", event, exc)
+
+    # -------------------------------------------------------- session helpers
+
+    def _resolve_session_id(self) -> str:
+        """Best-effort session id for proof / failure tracking.
+
+        When the autonomous session manager is active, proof_database is
+        already storing in the session directory. Otherwise each manual
+        compiler instance gets its own id so failed theorem candidates do not
+        bleed into later standalone compiler runs.
         """
-        Execute Step 1: Planning (unvalidated).
-        
-        LLM decides:
-        - Does document need rigor work?
-        - Which mode to use?
-        - What section to work on?
-        
-        Returns:
-            Planning JSON dict or None if parse fails
+        sm = getattr(proof_database, "_session_manager", None)
+        if sm is not None and getattr(sm, "is_session_active", False):
+            return str(getattr(sm, "session_id", "") or "autonomous_active")
+        return self._standalone_session_id
+
+    def _compiler_source_id(self) -> str:
+        """Source id used on ProofRecord / failed candidate storage.
+
+        Format: ``compiler_rigor:<session>``. The session suffix lets the
+        failure-hint log cleanly scope retries per session (same as how
+        brainstorm-driven proofs scope by brainstorm id).
         """
-        logger.info("Step 1: Loading document state for planning...")
-        
-        # Get current outline and paper
-        current_outline = await outline_memory.get_outline()
-        current_paper = await paper_memory.get_paper()
-        
-        logger.info(f"Step 1: State loaded - outline={len(current_outline)} chars, paper={len(current_paper)} chars")
-        
-        # Retrieve relevant paper sections via RAG (same as current rigor mode)
-        from backend.shared.utils import count_tokens
-        max_allowed_tokens = rag_config.get_available_input_tokens(
-            system_config.compiler_high_param_context_window,
-            system_config.compiler_high_param_max_output_tokens
+        return f"compiler_rigor:{self._resolve_session_id()}"
+
+    # ---------------------------------------------------- context assembly
+
+    async def _build_rigor_rag_context(
+        self,
+        *,
+        query_seed: str,
+        reserved_tokens: int,
+    ) -> str:
+        """Retrieve RAG evidence for the rigor prompts.
+
+        Mirrors the HighContextSubmitter.submit_construction budget
+        pattern: outline + paper are direct-injected by the caller, so
+        we exclude them from RAG. The remaining budget goes to the
+        RAG offload priority (Shared Training DB -> Local Submitter DB
+        -> Rejection Log -> User Upload Files) handled inside the
+        aggregator RAG manager.
+        """
+        max_allowed = rag_config.get_available_input_tokens(
+            self.context_window, self.max_output_tokens
         )
-        
-        # Try initial RAG retrieval - may overflow if outline + system prompts are large
-        # Exclude outline (always direct-injected in rigor mode)
-        rigor_exclude = ["compiler_outline.txt"]
+        remaining = max(1000, max_allowed - reserved_tokens - 200)
+
         try:
-            logger.info("Step 1: Retrieving relevant paper sections via RAG...")
             context_pack = await compiler_rag_manager.retrieve_for_mode(
-                query=self.user_prompt + " " + current_paper[-1000:],
+                query=query_seed,
                 mode="rigor",
-                exclude_sources=rigor_exclude
-            )
-            logger.info(f"Step 1: RAG retrieval complete - {len(context_pack.text)} chars")
-            
-            # Build planning prompt
-            logger.info("Step 1: Building planning prompt...")
-            prompt = await build_rigor_planning_prompt(
-                user_prompt=self.user_prompt,
-                current_outline=current_outline,
-                current_paper=context_pack.text
-            )
-            
-            # Verify prompt size
-            actual_prompt_tokens = count_tokens(prompt)
-            
-            if actual_prompt_tokens > max_allowed_tokens:
-                raise ValueError(f"Prompt too large: {actual_prompt_tokens} tokens > {max_allowed_tokens} max")
-            
-            logger.debug(f"Step 1: Planning prompt {actual_prompt_tokens} tokens (max: {max_allowed_tokens})")
-            
-        except ValueError as e:
-            if "Prompt too large" not in str(e):
-                raise
-            
-            # Context overflow - reduce RAG budget
-            logger.warning("Step 1: Initial prompt too large, calculating reduced RAG budget...")
-            
-            mandatory_tokens = count_tokens(
-                await build_rigor_planning_prompt(self.user_prompt, current_outline, "")
+                max_tokens=remaining,
+                exclude_sources=["compiler_outline.txt", "compiler_paper.txt"],
             )
-            
-            remaining_budget = max_allowed_tokens - mandatory_tokens - 200
-            
-            if remaining_budget < 500:
-                raise ValueError(
-                    f"Context window too small for rigor mode: outline + system prompts require "
-                    f"{mandatory_tokens} tokens, only {max_allowed_tokens} available. "
-                    f"Increase compiler_high_param_context_window or reduce outline size."
+            return context_pack.text or ""
+        except Exception as exc:
+            logger.warning("Rigor RAG retrieval failed (%s); proceeding without RAG", exc)
+            return ""
+
+    # -------------------------------------------------------- public entrypoint
+
+    async def submit_rigor_lean_theorem(self) -> Optional[RigorTheoremResult]:
+        """Run discovery + 5 Lean 4 attempts + novelty + initial placement.
+
+        Returns a RigorTheoremResult on a verified proof (coordinator then
+        drives the 2-attempt placement validator loop + appendix fallback).
+        Returns None on any decline path: no theorem worth trying, 5 Lean
+        attempts failed, or the placement submitter refused on attempt 1.
+        """
+        # Guard: if Lean 4 is disabled system-wide, there is nothing this
+        # submitter can do - the coordinator also guards on this but we add
+        # a belt-and-suspenders check here so callers can't bypass it.
+        if not system_config.lean4_enabled:
+            logger.info("submit_rigor_lean_theorem: Lean 4 disabled; declining rigor cycle")
+            return None
+
+        logger.info("Rigor cycle: Stage 1 - theorem discovery")
+        discovery = await self._step_discovery()
+        if discovery is None:
+            logger.info("Rigor cycle: discovery declined")
+            return None
+
+        theorem_statement = str(discovery.get("theorem_statement") or "").strip()
+        formal_sketch = str(discovery.get("formal_sketch") or "").strip()
+        source_excerpt = str(discovery.get("source_excerpt") or "").strip()
+        retry_failure_id = str(discovery.get("retry_existing_failure_id") or "").strip()
+
+        if not theorem_statement:
+            logger.info("Rigor cycle: discovery returned empty theorem_statement; declining")
+            return None
+
+        logger.info(
+            "Rigor cycle: Stage 2 - Lean 4 formalization (up to 5 attempts), "
+            f"retry_failure_id={retry_failure_id or 'none'}"
+        )
+
+        candidate = ProofCandidate(
+            theorem_id=retry_failure_id or f"compiler_rigor_{uuid.uuid4().hex[:12]}",
+            statement=theorem_statement,
+            formal_sketch=formal_sketch,
+            source_excerpt=source_excerpt,
+            origin_source_id=self._compiler_source_id() if retry_failure_id else "",
+        )
+
+        formalizer_result = await self._step_formalize(candidate, theorem_statement)
+        if formalizer_result is None:
+            return None
+
+        theorem_name, lean_code, attempts = formalizer_result
+
+        logger.info("Rigor cycle: Stage 3 - novelty classification + persistence")
+        is_novel, novelty_reasoning, stored_record = await self._step_assess_novelty_and_store(
+            theorem_statement=theorem_statement,
+            theorem_name=theorem_name,
+            lean_code=lean_code,
+            formal_sketch=formal_sketch,
+            attempts=attempts,
+        )
+
+        await self._broadcast(
+            "proof_verified",
+            {
+                "source_type": "compiler_rigor",
+                "source_id": self._compiler_source_id(),
+                "theorem_id": candidate.theorem_id,
+                "theorem_statement": theorem_statement,
+                "proof_id": stored_record.proof_id,
+                "is_novel": is_novel,
+            },
+        )
+
+        # If we retried a previously-failed candidate and it succeeded, mark it
+        # resolved so it stops appearing in future failure-hint lists.
+        if retry_failure_id:
+            try:
+                await proof_database.mark_resolved_retry(
+                    source_brainstorm_id=self._compiler_source_id(),
+                    theorem_id=retry_failure_id,
+                    proof_id=stored_record.proof_id,
                 )
-            
-            logger.warning(f"Step 1: Retrying with reduced RAG budget: {remaining_budget} tokens")
-            context_pack = await compiler_rag_manager.retrieve_for_mode(
-                query=self.user_prompt + " " + current_paper[-1000:],
-                mode="rigor",
-                max_tokens=remaining_budget,
-                exclude_sources=rigor_exclude
-            )
-            
-            prompt = await build_rigor_planning_prompt(
-                user_prompt=self.user_prompt,
-                current_outline=current_outline,
-                current_paper=context_pack.text
-            )
-            
-            actual_prompt_tokens = count_tokens(prompt)
-            logger.info(f"Step 1: Adjusted prompt to {actual_prompt_tokens} tokens")
-        
-        # Generate task ID
-        task_id = self.get_current_task_id()
-        self.task_sequence += 1
-        
-        if self.task_tracking_callback:
-            self.task_tracking_callback("started", task_id)
-        
-        # Call LLM
-        logger.info(f"Step 1: Generating LLM completion (task_id={task_id})...")
-        response = await api_client_manager.generate_completion(
-            task_id=task_id,
-            role_id=self.role_id,
-            model=self.model_name,
-            messages=[{"role": "user", "content": prompt}],
-            temperature=0.0,
-            max_tokens=system_config.compiler_high_param_max_output_tokens
+            except Exception as exc:
+                logger.debug("mark_resolved_retry failed (non-fatal): %s", exc)
+
+        logger.info("Rigor cycle: Stage 4 - initial placement proposal")
+        initial_submission = await self._step_initial_placement(
+            proof_id=stored_record.proof_id,
+            theorem_statement=theorem_statement,
+            theorem_name=theorem_name,
+            lean_code=lean_code,
+            is_novel=is_novel,
         )
-        
-        # Extract content
-        if not response.get("choices") or not response["choices"][0].get("message"):
-            logger.error("Step 1: LLM returned empty response structure")
-            raise ValueError("LLM returned empty response")
-        message = response["choices"][0]["message"]
-        llm_output = message.get("content") or message.get("reasoning") or ""
-        logger.info(f"Step 1: LLM completion received - {len(llm_output)} chars")
-        
-        # Parse JSON
+
+        return RigorTheoremResult(
+            proof_id=stored_record.proof_id,
+            theorem_statement=theorem_statement,
+            theorem_name=theorem_name,
+            lean_code=lean_code,
+            is_novel=is_novel,
+            novelty_reasoning=novelty_reasoning,
+            attempts=attempts,
+            source_id=self._compiler_source_id(),
+            initial_placement_submission=initial_submission,
+            formal_sketch=formal_sketch,
+            source_excerpt=source_excerpt,
+            metadata={
+                "retry_failure_id": retry_failure_id,
+                "attempt_count": len(attempts),
+            },
+        )
+
+    # --------------------------------------------------------- stage 1
+
+    async def _step_discovery(self) -> Optional[dict]:
+        """Ask the LLM whether a Lean 4 theorem is worth pursuing right now."""
+        current_outline = await outline_memory.get_outline()
+        current_paper_raw = await paper_memory.get_paper()
+        current_paper = _strip_paper_markers_for_llm(current_paper_raw)
+
+        # Existing verified proofs - compact blob of statements so the model
+        # can recognize duplicates without blowing the token budget.
+        existing_proofs: List[dict] = []
         try:
-            data = parse_json(llm_output)
-            logger.info("Step 1: JSON parsed successfully")
-            
-            # Handle array responses
-            if isinstance(data, list):
-                if len(data) == 0:
-                    logger.warning("Step 1: Empty array returned, treating as no work needed")
-                    if self.task_tracking_callback:
-                        self.task_tracking_callback("completed", task_id)
-                    return None
-                logger.warning(f"Step 1: Array of {len(data)} objects returned, using first")
-                data = data[0]
-            
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
-            
-            return data
-            
-        except RuntimeError as e:
-            if "credits exhausted" in str(e).lower():
-                raise
-            logger.error(f"Step 1: JSON parse failed - {e}")
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
+            for record in await proof_database.get_all_proofs():
+                existing_proofs.append(
+                    {
+                        "proof_id": record.proof_id,
+                        "novel": record.novel,
+                        "theorem_statement": record.theorem_statement,
+                    }
+                )
+        except Exception as exc:
+            logger.debug("proof_database.get_all_proofs failed: %s", exc)
+
+        try:
+            failure_hints = await proof_database.get_recent_failure_hints(
+                self._compiler_source_id(), limit=5
+            )
+        except Exception as exc:
+            logger.debug("proof_database.get_recent_failure_hints failed: %s", exc)
+            failure_hints = []
+
+        # Build with empty RAG first to measure the mandatory footprint,
+        # then allocate the rest to RAG.
+        base_prompt = await build_rigor_theorem_discovery_prompt(
+            user_prompt=self.user_prompt,
+            current_outline=current_outline,
+            current_paper=current_paper,
+            rag_evidence="",
+            existing_verified_proofs=existing_proofs,
+            recent_failure_hints=failure_hints,
+        )
+        mandatory_tokens = count_tokens(base_prompt)
+        query_seed = (self.raw_user_prompt + " " + current_paper[-1500:]).strip()
+        rag_evidence = await self._build_rigor_rag_context(
+            query_seed=query_seed,
+            reserved_tokens=mandatory_tokens,
+        )
+
+        prompt = await build_rigor_theorem_discovery_prompt(
+            user_prompt=self.user_prompt,
+            current_outline=current_outline,
+            current_paper=current_paper,
+            rag_evidence=rag_evidence,
+            existing_verified_proofs=existing_proofs,
+            recent_failure_hints=failure_hints,
+        )
+
+        max_allowed = rag_config.get_available_input_tokens(
+            self.context_window, self.max_output_tokens
+        )
+        if count_tokens(prompt) > max_allowed:
+            logger.warning("Rigor discovery prompt too large; retrying without RAG evidence")
+            prompt = base_prompt
+
+        data = await self._call_llm_and_parse(
+            prompt=prompt,
+            task_label="rigor_discovery",
+        )
+        if data is None:
             return None
-        except Exception as e:
-            logger.error(f"Step 1: JSON parse failed - {e}")
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
+        if isinstance(data, list):
+            data = data[0] if data else {}
+        if not isinstance(data, dict):
+            return None
+        if not data.get("needs_theorem_work", False):
             return None
-    
-    async def _step2_standard_execution(
+        return data
+
+    # --------------------------------------------------------- stage 2
+
+    async def _step_formalize(
         self,
-        mode: str,
-        target_section: str
-    ) -> Optional[CompilerSubmission]:
-        """
-        Execute Step 2: Standard or rewrite enhancement.
-        
-        Args:
-            mode: "standard_enhancement" or "rewrite_focus"
-            target_section: Target section from Step 1 (guidance label)
-        
-        Returns:
-            CompilerSubmission if enhancement made, None otherwise
+        candidate: ProofCandidate,
+        theorem_statement: str,
+    ) -> Optional[tuple]:
+        """Run up to 5 Lean 4 attempts with feedback chaining.
+
+        Returns (theorem_name, lean_code, attempts) on success, None on
+        all-5-fail. On failure, records the candidate in proof_database so
+        future rigor cycles can see it as an open lemma target.
         """
-        logger.info(f"Starting Step 2: {mode} execution...")
-        
+        current_paper_raw = await paper_memory.get_paper()
+        current_paper = _strip_paper_markers_for_llm(current_paper_raw)
+
+        # Imported lazily to avoid a circular-import chain through the
+        # autonomous agents package at module load time.
+        from backend.autonomous.agents.proof_formalization_agent import (
+            ProofFormalizationAgent,
+        )
+
+        formalizer = ProofFormalizationAgent(
+            model_id=self.model_name,
+            context_window=self.context_window,
+            max_output_tokens=self.max_output_tokens,
+            role_id="compiler_rigor_formalization",
+        )
+
+        async def _on_attempt_started(attempt_number: int, strategy: str) -> None:
+            await self._broadcast(
+                "proof_attempt_started",
+                {
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "theorem_id": candidate.theorem_id,
+                    "theorem_statement": theorem_statement,
+                    "attempt": attempt_number,
+                    "strategy": strategy,
+                },
+            )
+
+        async def _on_attempt_feedback(feedback: ProofAttemptFeedback) -> None:
+            event = "proof_verified" if feedback.success else "proof_attempt_failed"
+            await self._broadcast(
+                event,
+                {
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "theorem_id": candidate.theorem_id,
+                    "theorem_statement": theorem_statement,
+                    "attempt": feedback.attempt,
+                    "strategy": feedback.strategy,
+                    "error_output": feedback.error_output[:500] if feedback.error_output else "",
+                },
+            )
+
+        await self._broadcast(
+            "proof_check_started",
+            {
+                "source_type": "compiler_rigor",
+                "source_id": self._compiler_source_id(),
+                "trigger": "rigor_loop",
+            },
+        )
+
         try:
-            # Get current state (same RAG retrieval as Step 1)
-            current_outline = await outline_memory.get_outline()
-            current_paper = await paper_memory.get_paper()
-            
-            # Use same RAG retrieval approach as Step 1
-            from backend.shared.utils import count_tokens
-            max_allowed_tokens = rag_config.get_available_input_tokens(
-                system_config.compiler_high_param_context_window,
-                system_config.compiler_high_param_max_output_tokens
+            success, theorem_name, lean_code, attempts = await formalizer.prove_candidate(
+                user_research_prompt=self.raw_user_prompt,
+                source_type="paper",  # ProofCandidate expects "paper" | "brainstorm"
+                theorem_candidate=candidate,
+                source_content=current_paper,
+                max_attempts=5,
+                attempt_callback=_on_attempt_feedback,
+                attempt_start_callback=_on_attempt_started,
+            )
+        except Exception as exc:
+            logger.error("Rigor formalization raised (%s); declining cycle", exc, exc_info=True)
+            await self._broadcast(
+                "proof_check_complete",
+                {
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "verified_count": 0,
+                    "message": f"formalization error: {exc}",
+                },
             )
-            
-            # Try RAG retrieval
-            # Exclude outline (always direct-injected in rigor mode)
-            rigor_exclude = ["compiler_outline.txt"]
+            return None
+
+        if not success:
+            # Record as an open lemma target so the next rigor cycle's
+            # discovery step can optionally retry it.
             try:
-                logger.info("Step 2: Retrieving paper sections via RAG...")
-                context_pack = await compiler_rag_manager.retrieve_for_mode(
-                    query=self.user_prompt + " " + current_paper[-1000:],
-                    mode="rigor",
-                    exclude_sources=rigor_exclude
-                )
-                
-                # Build execution prompt
-                logger.info("Step 2: Building execution prompt...")
-                prompt = await build_rigor_execution_prompt(
-                    user_prompt=self.user_prompt,
-                    current_outline=current_outline,
-                    current_paper=context_pack.text,  # FULL paper via RAG
-                    target_section=target_section,  # Guidance label
-                    mode=mode
-                )
-                
-                # Verify prompt size
-                actual_prompt_tokens = count_tokens(prompt)
-                
-                if actual_prompt_tokens > max_allowed_tokens:
-                    raise ValueError(f"Prompt too large: {actual_prompt_tokens} tokens > {max_allowed_tokens} max")
-                
-                logger.debug(f"Step 2: Execution prompt {actual_prompt_tokens} tokens (max: {max_allowed_tokens})")
-                
-            except ValueError as e:
-                if "Prompt too large" not in str(e):
-                    raise
-                
-                # Reduce RAG budget
-                logger.warning("Step 2: Prompt too large, reducing RAG budget...")
-                
-                mandatory_tokens = count_tokens(
-                    await build_rigor_execution_prompt(
-                        self.user_prompt, current_outline, "", target_section, mode
-                    )
-                )
-                
-                remaining_budget = max_allowed_tokens - mandatory_tokens - 200
-                
-                if remaining_budget < 500:
-                    raise ValueError(
-                        f"Context window too small for Step 2: {mandatory_tokens} tokens required"
-                    )
-                
-                logger.warning(f"Step 2: Retrying with reduced budget: {remaining_budget} tokens")
-                context_pack = await compiler_rag_manager.retrieve_for_mode(
-                    query=self.user_prompt + " " + current_paper[-1000:],
-                    mode="rigor",
-                    max_tokens=remaining_budget,
-                    exclude_sources=rigor_exclude
-                )
-                
-                prompt = await build_rigor_execution_prompt(
-                    user_prompt=self.user_prompt,
-                    current_outline=current_outline,
-                    current_paper=context_pack.text,
-                    target_section=target_section,
-                    mode=mode
+                error_summary = attempts[-1].error_output if attempts else ""
+                await proof_database.record_failed_candidate(
+                    source_brainstorm_id=self._compiler_source_id(),
+                    theorem_candidate=candidate,
+                    error_summary=error_summary[:2000] if error_summary else "No Lean diagnostics captured.",
                 )
-                
-                actual_prompt_tokens = count_tokens(prompt)
-                logger.info(f"Step 2: Adjusted prompt to {actual_prompt_tokens} tokens")
-            
-            # Generate task ID
-            task_id = self.get_current_task_id()
-            self.task_sequence += 1
-            
-            if self.task_tracking_callback:
-                self.task_tracking_callback("started", task_id)
-            
-            # Call LLM
-            logger.info(f"Step 2: Generating LLM completion (task_id={task_id})...")
-            response = await api_client_manager.generate_completion(
-                task_id=task_id,
-                role_id=self.role_id,
-                model=self.model_name,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=0.0,
-                max_tokens=system_config.compiler_high_param_max_output_tokens
+            except Exception as exc:
+                logger.debug("record_failed_candidate failed: %s", exc)
+
+            await self._broadcast(
+                "proof_check_complete",
+                {
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "verified_count": 0,
+                    "message": "5 Lean 4 attempts failed",
+                },
             )
-            
-            # Extract content
-            if not response.get("choices") or not response["choices"][0].get("message"):
-                logger.error("Step 2: LLM returned empty response structure")
-                raise ValueError("LLM returned empty response")
-            message = response["choices"][0]["message"]
-            llm_output = message.get("content") or message.get("reasoning") or ""
-            logger.info(f"Step 2: LLM completion received - {len(llm_output)} chars")
-            
-            # Parse JSON
-            data = await self._parse_json_response_with_retry(llm_output, prompt, task_id)
-            
-            if not data:
-                logger.error("Step 2: JSON parse failed")
-                return None
-            
-            # Handle array responses
-            if isinstance(data, list):
-                if len(data) == 0:
-                    logger.warning("Step 2: Empty array returned, treating as refusal")
-                    if self.task_tracking_callback:
-                        self.task_tracking_callback("completed", task_id)
-                    return None
-                logger.warning(f"Step 2: Array of {len(data)} objects returned, using first")
-                data = data[0]
-            
-            # Check if LLM refused (self-refusal option)
-            if not data.get("proceed", True):
-                logger.info("Step 2: LLM refused (Step 1 made mistake)")
-                if self.task_tracking_callback:
-                    self.task_tracking_callback("completed", task_id)
-                return None
-            
-            # Check if enhancement needed
-            if not data.get("needs_enhancement", False):
-                logger.info("Step 2: No enhancement needed")
-                if self.task_tracking_callback:
-                    self.task_tracking_callback("completed", task_id)
-                return None
-            
-            # Create submission
-            new_string_content = _normalize_string_field(data.get("new_string", ""))
-            
-            submission = CompilerSubmission(
-                submission_id=str(uuid.uuid4()),
-                mode="rigor",
-                content=new_string_content,
-                operation=data.get("operation", "replace"),
-                old_string=_normalize_string_field(data.get("old_string", "")),
-                new_string=new_string_content,
-                reasoning=data.get("reasoning", ""),
-                metadata={"rigor_mode": mode}  # No Wolfram data for standard mode
+            return None
+
+        return theorem_name, lean_code, attempts
+
+    # --------------------------------------------------------- stage 3
+
+    async def _step_assess_novelty_and_store(
+        self,
+        *,
+        theorem_statement: str,
+        theorem_name: str,
+        lean_code: str,
+        formal_sketch: str,
+        attempts: List[ProofAttemptFeedback],
+    ) -> tuple:
+        """Classify the verified proof and persist it via proof_database.
+
+        Returns (is_novel, novelty_reasoning, stored_record).
+        """
+        # Lazy import to break an early-load circular chain through the
+        # autonomous.core package __init__.
+        from backend.autonomous.core.proof_novelty import assess_proof_novelty
+
+        existing_block = proof_database.get_novel_proofs_for_injection()
+
+        task_id = f"{self.get_current_task_id()}_novelty"
+        self.task_sequence += 1
+
+        try:
+            is_novel, novelty_reasoning = await assess_proof_novelty(
+                user_prompt=self.raw_user_prompt,
+                theorem_statement=theorem_statement,
+                lean_code=lean_code,
+                validator_model=self.model_name,
+                validator_context=self.context_window,
+                validator_max_tokens=self.max_output_tokens,
+                existing_novel_proofs=existing_block,
+                task_id=task_id,
+                role_id="compiler_rigor_novelty",
             )
-            
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
-            
-            logger.info(f"Step 2: Rigor enhancement submission generated - {submission.submission_id}")
-            return submission
-            
-        except Exception as e:
-            logger.error(f"Step 2 execution failed: {e}", exc_info=True)
-            raise
-    
-    async def _step2_wolfram_execution(
+        except Exception as exc:
+            logger.warning("Novelty assessment failed (%s); defaulting to non-novel", exc)
+            is_novel, novelty_reasoning = False, f"Novelty assessment error: {exc}"
+
+        record = ProofRecord(
+            proof_id="",  # proof_database assigns proof_XXX on add_proof
+            theorem_id="",
+            theorem_statement=theorem_statement,
+            theorem_name=theorem_name,
+            formal_sketch=formal_sketch,
+            source_type="paper",  # compiler rigor proofs live under the "paper" channel
+            source_id=self._compiler_source_id(),
+            source_title="Compiler Rigor Theorem",
+            solver="Lean 4",
+            lean_code=lean_code,
+            novel=is_novel,
+            novelty_reasoning=novelty_reasoning,
+            verification_notes="Produced by compiler rigor loop (HighParamSubmitter).",
+            attempt_count=len(attempts),
+            attempts=list(attempts),
+            dependencies=[],
+            solver_hints=[],
+        )
+
+        stored = await proof_database.add_proof(record)
+        return is_novel, novelty_reasoning, stored
+
+    # --------------------------------------------------------- stage 4
+
+    async def _step_initial_placement(
         self,
-        target_section: str,
-        wolfram_query: str
+        *,
+        proof_id: str,
+        theorem_statement: str,
+        theorem_name: str,
+        lean_code: str,
+        is_novel: bool,
     ) -> Optional[CompilerSubmission]:
+        """Produce the attempt-1 placement submission.
+
+        Returns None when the submitter refuses a legal placement on attempt 1.
+        The coordinator treats a None attempt-1 submission the same way it
+        treats a double rejection: appendix fallback + acceptance counter.
         """
-        Execute Step 2: Wolfram Alpha verification.
-        
-        Args:
-            target_section: Target section from Step 1 (guidance label)
-            wolfram_query: Natural language query for Wolfram Alpha
-        
-        Returns:
-            CompilerSubmission if verification added, None otherwise
-        """
-        logger.info("Starting Step 2: Wolfram Alpha verification...")
-        
-        # Check if Wolfram Alpha enabled
-        if not system_config.wolfram_alpha_enabled:
-            logger.warning("Step 2: Wolfram Alpha requested but not enabled in config")
+        return await self._build_placement_submission(
+            proof_id=proof_id,
+            theorem_statement=theorem_statement,
+            theorem_name=theorem_name,
+            lean_code=lean_code,
+            is_novel=is_novel,
+            placement_attempt=1,
+            validator_rejection_feedback="",
+        )
+
+    async def submit_rigor_placement_retry(
+        self,
+        prior: RigorTheoremResult,
+        validator_feedback: str,
+    ) -> Optional[CompilerSubmission]:
+        """Produce the attempt-2 placement submission, with validator feedback."""
+        return await self._build_placement_submission(
+            proof_id=prior.proof_id,
+            theorem_statement=prior.theorem_statement,
+            theorem_name=prior.theorem_name,
+            lean_code=prior.lean_code,
+            is_novel=prior.is_novel,
+            placement_attempt=2,
+            validator_rejection_feedback=validator_feedback or "",
+        )
+
+    async def _build_placement_submission(
+        self,
+        *,
+        proof_id: str,
+        theorem_statement: str,
+        theorem_name: str,
+        lean_code: str,
+        is_novel: bool,
+        placement_attempt: int,
+        validator_rejection_feedback: str,
+    ) -> Optional[CompilerSubmission]:
+        current_outline = await outline_memory.get_outline()
+        current_paper_raw = await paper_memory.get_paper()
+        current_paper = _strip_paper_markers_for_llm(current_paper_raw)
+
+        base_prompt = await build_rigor_placement_prompt(
+            user_prompt=self.user_prompt,
+            current_outline=current_outline,
+            current_paper=current_paper,
+            rag_evidence="",
+            theorem_statement=theorem_statement,
+            lean_code=lean_code,
+            proof_id=proof_id,
+            placement_attempt=placement_attempt,
+            validator_rejection_feedback=validator_rejection_feedback,
+        )
+        mandatory_tokens = count_tokens(base_prompt)
+        query_seed = (theorem_statement + " " + current_paper[-1500:]).strip()
+        rag_evidence = await self._build_rigor_rag_context(
+            query_seed=query_seed,
+            reserved_tokens=mandatory_tokens,
+        )
+
+        prompt = await build_rigor_placement_prompt(
+            user_prompt=self.user_prompt,
+            current_outline=current_outline,
+            current_paper=current_paper,
+            rag_evidence=rag_evidence,
+            theorem_statement=theorem_statement,
+            lean_code=lean_code,
+            proof_id=proof_id,
+            placement_attempt=placement_attempt,
+            validator_rejection_feedback=validator_rejection_feedback,
+        )
+
+        max_allowed = rag_config.get_available_input_tokens(
+            self.context_window, self.max_output_tokens
+        )
+        if count_tokens(prompt) > max_allowed:
+            logger.warning("Rigor placement prompt too large; retrying without RAG evidence")
+            prompt = base_prompt
+
+        data = await self._call_llm_and_parse(
+            prompt=prompt,
+            task_label=f"rigor_placement_{placement_attempt}",
+        )
+        if data is None:
             return None
-        
-        # Get Wolfram Alpha client
-        from backend.shared.wolfram_alpha_client import get_wolfram_client
-        wolfram_client = get_wolfram_client()
-        
-        if not wolfram_client:
-            logger.error("Step 2: Wolfram Alpha client not initialized")
+        if isinstance(data, list):
+            data = data[0] if data else {}
+        if not isinstance(data, dict):
             return None
-        
-        # Make Wolfram Alpha API query
-        logger.info(f"Step 2: Querying Wolfram Alpha - '{wolfram_query}'")
-        wolfram_result = await wolfram_client.query(wolfram_query)
-        
-        if not wolfram_result:
-            logger.warning("Step 2: Wolfram Alpha query failed - treating as decline")
+        if not data.get("proceed", True):
+            logger.info(
+                "Rigor placement attempt %s: submitter refused a legal placement",
+                placement_attempt,
+            )
+            return None
+
+        new_string = _normalize_string_field(data.get("new_string", ""))
+        old_string = _normalize_string_field(data.get("old_string", ""))
+        if not new_string or not old_string:
+            logger.info(
+                "Rigor placement attempt %s: missing old_string or new_string",
+                placement_attempt,
+            )
             return None
-        
-        logger.info(f"Step 2: Wolfram Alpha result - {wolfram_result[:200]}")
-        
-        # Get current state (same RAG retrieval as Step 1)
+
+        operation = data.get("operation", "insert_after")
+        if operation not in ("replace", "insert_after"):
+            operation = "insert_after"
+
+        submission = CompilerSubmission(
+            submission_id=str(uuid.uuid4()),
+            mode="rigor",
+            content=new_string,
+            operation=operation,
+            old_string=old_string,
+            new_string=new_string,
+            reasoning=str(data.get("reasoning", "")),
+            metadata={
+                "rigor_mode": "lean_placement",
+                "lean_proof_id": proof_id,
+                "lean_code": lean_code,
+                "theorem_statement": theorem_statement,
+                "theorem_name": theorem_name,
+                "is_novel": is_novel,
+                "placement_attempt": placement_attempt,
+                "validator_rejection_feedback": validator_rejection_feedback,
+            },
+        )
+        return submission
+
+    # -------------------------------------------------------- llm helper
+
+    async def _call_llm_and_parse(
+        self,
+        *,
+        prompt: str,
+        task_label: str,
+    ) -> Optional[Any]:
+        """Send `prompt` to the high-param model and return parsed JSON.
+
+        On a JSON parse failure, issues a single conversational retry that
+        feeds the failed output back with a JSON-escape-rules reminder.
+        """
+        task_id = self.get_current_task_id()
+        self.task_sequence += 1
+
+        # LM Studio cache warmup (silent no-op for OpenRouter)
         try:
-            current_outline = await outline_memory.get_outline()
-            current_paper = await paper_memory.get_paper()
-            
-            # Use same RAG retrieval approach
-            from backend.shared.utils import count_tokens
-            max_allowed_tokens = rag_config.get_available_input_tokens(
-                system_config.compiler_high_param_context_window,
-                system_config.compiler_high_param_max_output_tokens
+            await lm_studio_client.cache_model_load_config(
+                self.model_name,
+                {"context_length": self.context_window, "model_path": self.model_name},
             )
-            
-            # Try RAG retrieval
-            # Exclude outline (always direct-injected in rigor mode)
-            rigor_exclude = ["compiler_outline.txt"]
-            try:
-                logger.info("Step 2 (Wolfram): Retrieving paper sections via RAG...")
-                context_pack = await compiler_rag_manager.retrieve_for_mode(
-                    query=self.user_prompt + " " + current_paper[-1000:],
-                    mode="rigor",
-                    exclude_sources=rigor_exclude
-                )
-                
-                # Build Wolfram execution prompt
-                logger.info("Step 2 (Wolfram): Building execution prompt...")
-                prompt = await build_rigor_wolfram_execution_prompt(
-                    user_prompt=self.user_prompt,
-                    current_outline=current_outline,
-                    current_paper=context_pack.text,  # FULL paper via RAG
-                    target_section=target_section,  # Guidance label
-                    wolfram_query=wolfram_query,
-                    wolfram_result=wolfram_result
-                )
-                
-                # Verify prompt size
-                actual_prompt_tokens = count_tokens(prompt)
-                
-                if actual_prompt_tokens > max_allowed_tokens:
-                    raise ValueError(f"Prompt too large: {actual_prompt_tokens} tokens > {max_allowed_tokens} max")
-                
-                logger.debug(f"Step 2 (Wolfram): Prompt {actual_prompt_tokens} tokens (max: {max_allowed_tokens})")
-                
-            except ValueError as e:
-                if "Prompt too large" not in str(e):
-                    raise
-                
-                # Reduce RAG budget
-                logger.warning("Step 2 (Wolfram): Prompt too large, reducing RAG budget...")
-                
-                mandatory_tokens = count_tokens(
-                    await build_rigor_wolfram_execution_prompt(
-                        self.user_prompt, current_outline, "", target_section, 
-                        wolfram_query, wolfram_result
-                    )
-                )
-                
-                remaining_budget = max_allowed_tokens - mandatory_tokens - 200
-                
-                if remaining_budget < 500:
-                    raise ValueError(
-                        f"Context window too small for Step 2 (Wolfram): {mandatory_tokens} tokens required"
-                    )
-                
-                logger.warning(f"Step 2 (Wolfram): Retrying with reduced budget: {remaining_budget} tokens")
-                context_pack = await compiler_rag_manager.retrieve_for_mode(
-                    query=self.user_prompt + " " + current_paper[-1000:],
-                    mode="rigor",
-                    max_tokens=remaining_budget,
-                    exclude_sources=rigor_exclude
-                )
-                
-                prompt = await build_rigor_wolfram_execution_prompt(
-                    user_prompt=self.user_prompt,
-                    current_outline=current_outline,
-                    current_paper=context_pack.text,
-                    target_section=target_section,
-                    wolfram_query=wolfram_query,
-                    wolfram_result=wolfram_result
-                )
-                
-                actual_prompt_tokens = count_tokens(prompt)
-                logger.info(f"Step 2 (Wolfram): Adjusted prompt to {actual_prompt_tokens} tokens")
-            
-            # Generate task ID
-            task_id = self.get_current_task_id()
-            self.task_sequence += 1
-            
-            if self.task_tracking_callback:
-                self.task_tracking_callback("started", task_id)
-            
-            # Call LLM
-            logger.info(f"Step 2 (Wolfram): Generating LLM completion (task_id={task_id})...")
+        except Exception:
+            pass
+
+        if self.task_tracking_callback:
+            self.task_tracking_callback("started", task_id)
+
+        try:
             response = await api_client_manager.generate_completion(
                 task_id=task_id,
                 role_id=self.role_id,
                 model=self.model_name,
                 messages=[{"role": "user", "content": prompt}],
                 temperature=0.0,
-                max_tokens=system_config.compiler_high_param_max_output_tokens
-            )
-            
-            # Extract content
-            if not response.get("choices") or not response["choices"][0].get("message"):
-                logger.error("Step 2 (Wolfram): LLM returned empty response structure")
-                raise ValueError("LLM returned empty response")
-            message = response["choices"][0]["message"]
-            llm_output = message.get("content") or message.get("reasoning") or ""
-            logger.info(f"Step 2 (Wolfram): LLM completion received - {len(llm_output)} chars")
-            
-            # Parse JSON
-            data = await self._parse_json_response_with_retry(llm_output, prompt, task_id)
-            
-            if not data:
-                logger.error("Step 2 (Wolfram): JSON parse failed")
-                return None
-            
-            # Handle array responses
-            if isinstance(data, list):
-                if len(data) == 0:
-                    logger.warning("Step 2 (Wolfram): Empty array returned, treating as refusal")
-                    if self.task_tracking_callback:
-                        self.task_tracking_callback("completed", task_id)
-                    return None
-                logger.warning(f"Step 2 (Wolfram): Array of {len(data)} objects returned, using first")
-                data = data[0]
-            
-            # Check if LLM refused
-            if not data.get("proceed", True):
-                logger.info("Step 2 (Wolfram): LLM refused (query inappropriate or Step 1 wrong)")
-                if self.task_tracking_callback:
-                    self.task_tracking_callback("completed", task_id)
-                return None
-            
-            # Check if enhancement needed
-            if not data.get("needs_enhancement", False):
-                logger.info("Step 2 (Wolfram): No enhancement needed")
-                if self.task_tracking_callback:
-                    self.task_tracking_callback("completed", task_id)
-                return None
-            
-            # Create submission
-            new_string_content = _normalize_string_field(data.get("new_string", ""))
-            
-            submission = CompilerSubmission(
-                submission_id=str(uuid.uuid4()),
-                mode="rigor",
-                content=new_string_content,
-                operation=data.get("operation", "insert_after"),
-                old_string=_normalize_string_field(data.get("old_string", "")),
-                new_string=new_string_content,
-                reasoning=data.get("reasoning", ""),
-                metadata={
-                    "rigor_mode": "wolfram_verification",
-                    "wolfram_query": wolfram_query,
-                    "wolfram_result": wolfram_result
-                }
+                max_tokens=self.max_output_tokens,
             )
-            
+        except Exception as exc:
+            logger.error("High-param LLM call failed (%s): %s", task_label, exc)
             if self.task_tracking_callback:
                 self.task_tracking_callback("completed", task_id)
-            
-            logger.info(f"Step 2 (Wolfram): Verification submission generated - {submission.submission_id}")
-            return submission
-            
-        except Exception as e:
-            logger.error(f"Step 2 (Wolfram) execution failed: {e}", exc_info=True)
-            raise
-    
-    async def _parse_json_response_with_retry(
-        self,
-        response: str,
-        original_prompt: str,
-        task_id: str
-    ) -> Optional[dict]:
-        """
-        Parse JSON response with conversational retry on failure.
-        
-        Args:
-            response: LLM response
-            original_prompt: Original prompt sent to LLM (for retry context)
-            task_id: Task ID for tracking retry attempt
-        
-        Returns:
-            Parsed JSON dict or None if validation fails after retries
-        """
-        # Cache model config on first use (only relevant for LM Studio)
-        try:
-            await lm_studio_client.cache_model_load_config(self.model_name, {
-                "context_length": self.context_window,
-                "model_path": self.model_name
-            })
-        except Exception:
-            # Silently ignore - only applies to LM Studio models
-            pass
-        
-        # Parse JSON
+            return None
+
+        if not response or not response.get("choices") or not response["choices"][0].get("message"):
+            logger.error("High-param LLM returned empty response (%s)", task_label)
+            if self.task_tracking_callback:
+                self.task_tracking_callback("completed", task_id)
+            return None
+
+        message = response["choices"][0]["message"]
+        llm_output = message.get("content") or message.get("reasoning") or ""
+        if not llm_output.strip():
+            logger.error("High-param LLM returned empty content (%s)", task_label)
+            if self.task_tracking_callback:
+                self.task_tracking_callback("completed", task_id)
+            return None
+
         try:
-            parsed = parse_json(response)
+            parsed = parse_json(llm_output)
+            if self.task_tracking_callback:
+                self.task_tracking_callback("completed", task_id)
             return parsed
-            
         except Exception as parse_error:
-            # Not corrupted, just invalid JSON - continue with conversational retry
-            valid = False
-            parsed = None
-            error = str(parse_error)
-            
-            # Initial parse failed - attempt conversational retry
-            logger.info("Compiler high-param submitter (rigor): Initial JSON parse failed, attempting retry")
-            logger.debug(f"Parse error: {error}")
-        
-        # Build retry prompt
+            parse_error_text = str(parse_error)  # `parse_error` is unbound once this except clause exits
+            logger.info(
+                "High-param submitter (%s): initial JSON parse failed, attempting one retry: %s",
+                task_label, parse_error_text,
+            )
+
+        # Single conversational retry with a JSON-escape reminder (uses the saved parse error text)
         retry_prompt = (
-            f"Your previous response could not be parsed as valid JSON.\n\n"
-            f"PARSE ERROR: {error}\n\n"
+            "Your previous response could not be parsed as valid JSON.\n\n"
+            f"PARSE ERROR: {parse_error_text}\n\n"
             "JSON ESCAPING RULES FOR LaTeX:\n"
-            "LaTeX notation IS ALLOWED - but you must escape it properly in JSON:\n"
-            "1. Every backslash in your content needs ONE escape in JSON\n"
-            "   - To write \\mathbb{Z} in content, write: \"\\\\mathbb{Z}\" in JSON\n"
-            "   - To write \\( and \\), write: \"\\\\(\" and \"\\\\)\" in JSON\n"
-            "2. Do NOT double-escape: \\\\\\\\mathbb is WRONG, \\\\mathbb is CORRECT\n"
-            "3. For old_string: copy text EXACTLY from the document, just escape backslashes\n"
-            "4. Escape quotes inside strings: use \\\" for literal quotes\n"
-            "5. Avoid malformed unicode escapes (must be exactly \\uXXXX with 4 hex digits)\n\n"
-            "Please provide your response again in valid JSON format.\n\n"
-            "Respond with ONLY the JSON object, no markdown, no explanation."
+            "1. Every backslash in content needs ONE extra escape in JSON "
+            "(write \\\\mathbb{Z} not \\mathbb{Z}).\n"
+            "2. Escape double quotes inside strings as \\\".\n"
+            "3. Newlines: \\n (not \\\\n).\n"
+            "4. Do not include any system-managed bracket markers.\n\n"
+            "Please respond again with ONLY the JSON object, no markdown."
         )
-        
+
         try:
-            # CRITICAL FIX: Truncate failed output to prevent context overflow during retry
-            from backend.shared.utils import count_tokens
-            
-            max_failed_output_chars = 2000  # ~500 tokens - enough for error context
-            if len(response) > max_failed_output_chars:
-                failed_output_preview = response[:max_failed_output_chars] + "\n[...output truncated for retry...]"
-            else:
-                failed_output_preview = response
-            
-            # Calculate if conversation fits in context window
-            prompt_tokens = count_tokens(original_prompt)
-            preview_tokens = count_tokens(failed_output_preview)
-            retry_prompt_tokens = count_tokens(retry_prompt)
-            conversation_tokens = prompt_tokens + preview_tokens + retry_prompt_tokens
-            
-            if conversation_tokens > self.available_input_tokens:
-                # Too large - just retry with original prompt
-                logger.warning(
-                    f"Compiler high-param submitter (rigor): Retry conversation too large "
-                    f"({conversation_tokens} > {self.available_input_tokens}), using simple retry"
-                )
-                retry_response = await api_client_manager.generate_completion(
-                    task_id=f"{task_id}_retry",
-                    role_id=self.role_id,
-                    model=self.model_name,
-                    messages=[{"role": "user", "content": original_prompt}],
-                    temperature=0.0,
-                    max_tokens=self.max_output_tokens
-                )
-            else:
-                # Build conversation with truncated failed output
-                retry_response = await api_client_manager.generate_completion(
-                    task_id=f"{task_id}_retry",
-                    role_id=self.role_id,
-                    model=self.model_name,
-                    messages=[
-                        {"role": "user", "content": original_prompt},
-                        {"role": "assistant", "content": failed_output_preview},
-                        {"role": "user", "content": retry_prompt}
-                    ],
-                    temperature=0.0,
-                    max_tokens=self.max_output_tokens
-                )
-            
-            if retry_response.get("choices"):
-                retry_output = retry_response["choices"][0]["message"]["content"]
-                
-                try:
-                    parsed = parse_json(retry_output)
-                    logger.info("Compiler high-param submitter (rigor): Retry succeeded!")
-                    return parsed
-                except Exception as parse_error:
-                    error = str(parse_error)
-                    logger.warning(f"Compiler high-param submitter (rigor): Retry failed - {error}")
-        except Exception as e:
-            logger.error(f"Compiler high-param submitter (rigor): Retry request failed - {e}")
-        
-        # All retries failed
-        logger.error(f"Compiler high-param submitter (rigor): JSON validation failed after retry: {error}")
+            truncated_preview = llm_output[:2000] + (
+                "\n[...truncated...]" if len(llm_output) > 2000 else ""
+            )
+            retry_response = await api_client_manager.generate_completion(
+                task_id=f"{task_id}_retry",
+                role_id=self.role_id,
+                model=self.model_name,
+                messages=[
+                    {"role": "user", "content": prompt},
+                    {"role": "assistant", "content": truncated_preview},
+                    {"role": "user", "content": retry_prompt},
+                ],
+                temperature=0.0,
+                max_tokens=self.max_output_tokens,
+            )
+            if retry_response and retry_response.get("choices"):
+                retry_msg = retry_response["choices"][0]["message"]
+                retry_output = retry_msg.get("content") or retry_msg.get("reasoning") or ""
+                parsed = parse_json(retry_output)
+                logger.info("High-param submitter (%s): retry succeeded", task_label)
+                if self.task_tracking_callback:
+                    self.task_tracking_callback("completed", task_id)
+                return parsed
+        except Exception as retry_error:
+            logger.warning(
+                "High-param submitter (%s): retry failed: %s", task_label, retry_error
+            )
+
+        if self.task_tracking_callback:
+            self.task_tracking_callback("completed", task_id)
         return None
+
+
+
+
+
+
+
diff --git a/backend/compiler/core/compiler_coordinator.py b/backend/compiler/core/compiler_coordinator.py
index 66e15da..ba2b5ef 100644
--- a/backend/compiler/core/compiler_coordinator.py
+++ b/backend/compiler/core/compiler_coordinator.py
@@ -225,7 +225,7 @@ async def initialize(
         if system_config.wolfram_alpha_enabled and system_config.wolfram_alpha_api_key:
             from backend.shared.wolfram_alpha_client import initialize_wolfram_client
             initialize_wolfram_client(system_config.wolfram_alpha_api_key)
-            logger.info("Wolfram Alpha client initialized for rigor mode")
+            logger.info("Wolfram Alpha client initialized (available as a construction-mode tool)")
         
         # Note: Resume logic is handled in _main_workflow() to properly skip startup loops
         
@@ -1041,6 +1041,7 @@ async def _initial_paper_loop(self) -> None:
                 await paper_memory.initialize_with_placeholders(submission.content)
                 initial_portion_accepted = True
                 self.construction_acceptances += 1
+                self._track_submission_wolfram_calls(submission)
                 
                 await compiler_rejection_log.add_acceptance(
                     submission.submission_id,
@@ -1121,20 +1122,61 @@ async def _construction_loop(self) -> None:
             await self._submit_and_validate_review()
         
         logger.info("Construction loop complete")
+
+    def _track_submission_wolfram_calls(self, submission: CompilerSubmission) -> None:
+        """Record accepted construction-mode Wolfram tool calls in paper credits.
+
+        HighContextSubmitter stores the full Wolfram audit trail on
+        `submission.metadata["wolfram_calls"]`. PaperModelTracker only tracks a
+        count (and accepts the query for logging), so we bridge the two here
+        after the paper operation has been accepted.
+        """
+        wolfram_calls = (submission.metadata or {}).get("wolfram_calls") or []
+        if not wolfram_calls:
+            return
+
+        tracker = (
+            self._current_paper_tracker
+            if self.autonomous_mode
+            else self._paper_model_tracker
+        )
+        if not tracker:
+            logger.debug(
+                "Accepted submission had %s Wolfram call(s), but no paper tracker is active.",
+                len(wolfram_calls),
+            )
+            return
+
+        for call in wolfram_calls:
+            query = ""
+            if isinstance(call, dict):
+                query = str(call.get("query", "") or "").strip()
+            else:
+                query = str(call or "").strip()
+            tracker.track_wolfram_call(query)
+        logger.info("Tracked %s accepted Wolfram Alpha construction call(s)", len(wolfram_calls))
     
     async def _rigor_loop(self) -> None:
-        """LOOP 2: Rigor enhancement (steps 19-21)."""
+        """LOOP 2: Rigor enhancement.
+
+        With the new Lean-4-verified-theorem flow, every verified theorem
+        lands somewhere (inline or appendix). So the rigor loop continues
+        as long as `_submit_and_validate_rigor` returns True (theorem was
+        placed somewhere in this cycle) and ends on the first decline
+        (no theorem worth proposing, 5 Lean attempts failed, or Lean 4 is
+        disabled).
+        """
         logger.info("Starting rigor loop...")
         self.rigor_cycle_active = True
         
-        # Continue until first rejection
+        # Continue until first decline (no theorem found or Lean failed 5x).
         while self.is_running and self.rigor_cycle_active:
-            accepted = await self._submit_and_validate_rigor()
+            continued = await self._submit_and_validate_rigor()
             
-            if not accepted:
-                # First rejection - return to Loop 1
+            if not continued:
+                # Decline - end this rigor loop and return to construction.
                 self.rigor_cycle_active = False
-                logger.info("Rigor cycle ended (first rejection)")
+                logger.info("Rigor cycle ended (decline: no more theorems or Lean failed)")
         
         logger.info("Rigor loop complete")
     
@@ -1418,6 +1460,7 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                 
                 # Phase transitioned successfully - this is a success, not a rejection
                 logger.info(f"Phase transition successful. New phase: {self.autonomous_section_phase}")
+                self._track_submission_wolfram_calls(submission)
                 
                 await self._broadcast("phase_completion_signal", {
                     "previous_phase": submission.metadata.get("phase", "unknown"),
@@ -1449,34 +1492,51 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
         )
         
         if result.decision == "accept":
-            # Update paper - use placeholder replacement for conclusion/intro/abstract
-            # This ensures content replaces the placeholder marker instead of generic insertion
+            # Update paper. For phase-section creation, prefer placeholder replacement
+            # only when the submission actually targets that placeholder. If the
+            # placeholder is already gone (resume/retry) or the model submitted a
+            # validated edit against existing section text, apply the edit normally.
             section_phase = self.autonomous_section_phase if self.autonomous_mode else None
-            
-            if section_phase == "conclusion":
-                # Replace the conclusion placeholder with validated content
-                success = await paper_memory.replace_placeholder(CONCLUSION_PLACEHOLDER, submission.content)
-                if not success:
-                    logger.error("Conclusion placeholder not found - paper is in invalid state. Rejecting.")
-                    updated_paper = None  # Trigger rejection
-                else:
-                    updated_paper = await paper_memory.get_paper()
-            elif section_phase == "introduction":
-                # Replace the introduction placeholder with validated content
-                success = await paper_memory.replace_placeholder(INTRO_PLACEHOLDER, submission.content)
-                if not success:
-                    logger.error("Introduction placeholder not found - paper is in invalid state. Rejecting.")
-                    updated_paper = None  # Trigger rejection
-                else:
-                    updated_paper = await paper_memory.get_paper()
-            elif section_phase == "abstract":
-                # Replace the abstract placeholder with validated content
-                success = await paper_memory.replace_placeholder(ABSTRACT_PLACEHOLDER, submission.content)
-                if not success:
-                    logger.error("Abstract placeholder not found - paper is in invalid state. Rejecting.")
-                    updated_paper = None  # Trigger rejection
+            placeholder_replaced = False
+            phase_placeholder = {
+                "conclusion": CONCLUSION_PLACEHOLDER,
+                "introduction": INTRO_PLACEHOLDER,
+                "abstract": ABSTRACT_PLACEHOLDER,
+            }.get(section_phase)
+
+            if phase_placeholder:
+                old_string = (submission.old_string or "").strip()
+                uses_placeholder_target = (
+                    phase_placeholder in current_paper
+                    and (
+                        submission.operation == "full_content"
+                        or (
+                            submission.operation == "replace"
+                            and (not old_string or old_string == phase_placeholder)
+                        )
+                    )
+                )
+
+                if uses_placeholder_target:
+                    success = await paper_memory.replace_placeholder(phase_placeholder, submission.content)
+                    if not success:
+                        logger.error("%s placeholder was present but replacement failed.", section_phase.capitalize())
+                        updated_paper = None  # Trigger rejection
+                    else:
+                        placeholder_replaced = True
+                        updated_paper = await paper_memory.get_paper()
                 else:
-                    updated_paper = await paper_memory.get_paper()
+                    if phase_placeholder not in current_paper:
+                        logger.info(
+                            "%s placeholder not present; applying validated edit operation instead",
+                            section_phase.capitalize(),
+                        )
+                    else:
+                        logger.info(
+                            "%s phase submission targets existing content; applying validated edit operation",
+                            section_phase.capitalize(),
+                        )
+                    updated_paper = self._apply_edit(current_paper, submission)
             else:
                 # Body section or no phase - use standard _apply_edit
                 updated_paper = self._apply_edit(current_paper, submission)
@@ -1489,8 +1549,8 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                 )
                 self.construction_rejections += 1
                 
-                # Create emergency rejection
-                emergency_result = CompilerValidationResult(
+                # Create rejection result for placement failure
+                rejection_result = CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
                     reasoning=f"Exact string match failed: old_string='{submission.old_string[:100]}...' not found or not unique in document",
@@ -1499,21 +1559,22 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                     validation_stage="pre-validation"  # Exact string match check
                 )
                 
-                await compiler_rejection_log.add_rejection(emergency_result, "construction", submission.content)
+                await compiler_rejection_log.add_rejection(rejection_result, "construction", submission.content)
                 
                 await self._broadcast("compiler_rejection", {
                     "mode": "construction",
                     "submission_id": submission.submission_id,
-                    "reasoning": "Emergency rejection: exact string match failed"
+                    "reasoning": "Exact string match failed"
                 })
                 
-                return False, emergency_result.reasoning
+                return False, rejection_result.reasoning
             
-            # Only call update_paper for _apply_edit cases (placeholder replacement already saved)
-            if section_phase not in ("conclusion", "introduction", "abstract"):
+            # Only skip update_paper when replace_placeholder already saved.
+            if not placeholder_replaced:
                 await paper_memory.update_paper(updated_paper)
             
             self.construction_acceptances += 1
+            self._track_submission_wolfram_calls(submission)
             
             # If rewrite was pending, mark it as completed now (first successful acceptance)
             if self.rewrite_pending:
@@ -1696,8 +1757,8 @@ async def _submit_and_validate_outline_update(self) -> bool:
                 )
                 self.outline_rejections += 1
                 
-                # Create emergency rejection
-                emergency_result = CompilerValidationResult(
+                # Create rejection result for outline placement failure
+                rejection_result = CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
                     reasoning=f"Outline exact string match failed: old_string='{submission.old_string[:100]}...' not found or not unique in outline",
@@ -1706,12 +1767,12 @@ async def _submit_and_validate_outline_update(self) -> bool:
                     validation_stage="pre-validation"  # Exact string match check
                 )
                 
-                await compiler_rejection_log.add_rejection(emergency_result, "outline_update", submission.content)
+                await compiler_rejection_log.add_rejection(rejection_result, "outline_update", submission.content)
                 
                 await self._broadcast("compiler_rejection", {
                     "mode": "outline_update",
                     "submission_id": submission.submission_id,
-                    "reasoning": "Emergency rejection: outline exact string match failed"
+                    "reasoning": "Outline exact string match failed"
                 })
                 
                 return False
@@ -1821,8 +1882,8 @@ async def _submit_and_validate_review(self, review_focus: str = "general") -> bo
                 )
                 self.review_rejections += 1
                 
-                # Create emergency rejection
-                emergency_result = CompilerValidationResult(
+                # Create rejection result for placement failure
+                rejection_result = CompilerValidationResult(
                     submission_id=submission.submission_id,
                     decision="reject",
                     reasoning=f"Exact string match failed: old_string='{submission.old_string[:100]}...' not found or not unique in document",
@@ -1831,13 +1892,13 @@ async def _submit_and_validate_review(self, review_focus: str = "general") -> bo
                     validation_stage="pre-validation"  # Exact string match check
                 )
                 
-                await compiler_rejection_log.add_rejection(emergency_result, "review", submission.content)
+                await compiler_rejection_log.add_rejection(rejection_result, "review", submission.content)
                 
                 await self._broadcast("compiler_rejection", {
                     "mode": "review",
                     "submission_id": submission.submission_id,
                     "review_focus": review_focus,
-                    "reasoning": "Emergency rejection: exact string match failed"
+                    "reasoning": "Exact string match failed"
                 })
                 
                 return False
@@ -1918,134 +1979,288 @@ async def _run_pre_abstract_red_team_review(self) -> None:
         )
     
     async def _submit_and_validate_rigor(self) -> bool:
-        """Submit and validate rigor enhancement. Returns True if accepted."""
+        """Run one rigor cycle and report whether a theorem was placed.
+
+        Flow (Lean-4-verified theorems):
+          1. If system_config.lean4_enabled is false, record a decline and stop.
+          2. Ask the submitter for a Lean result (submit_rigor_lean_theorem).
+             A raised exception or a None result is recorded as a decline.
+          3. Otherwise hand the result to _place_or_appendix_fallback, which
+             runs up to two validator placement attempts.
+          4. When no attempt lands inline (or there was no placement
+             submission to try), that helper falls back to appending the
+             theorem to the Theorems Appendix.
+
+        Returns False on every decline path (Lean 4 disabled, submitter
+        raised, or submitter returned None); each one increments
+        rigor_declines, logs the decline and broadcasts compiler_decline.
+        Otherwise returns the result of _place_or_appendix_fallback.
+        """
         self.current_mode = "rigor"
-        
+
+        # Hard guard: Lean 4 disabled system-wide means rigor mode has no work.
+        if not system_config.lean4_enabled:
+            logger.info("Rigor loop: Lean 4 disabled; declining cycle")
+            self.rigor_declines += 1
+            await compiler_rejection_log.add_decline(
+                "rigor", "Lean 4 is disabled in system configuration"
+            )
+            await self._broadcast(
+                "compiler_decline",
+                {"mode": "rigor", "reasoning": "Lean 4 is disabled"},
+            )
+            return False
+
         try:
-            submission = await self.high_param_submitter.submit_rigor_enhancement()
-        except ValueError as e:
-            logger.error(f"Rigor enhancement error: {e}")
+            lean_result = await self.high_param_submitter.submit_rigor_lean_theorem()
+        except ValueError as exc:
+            logger.error(f"Rigor lean flow error: {exc}")
             self.rigor_declines += 1
-            await compiler_rejection_log.add_decline("rigor", f"LLM error: {e}")
-            await self._broadcast("compiler_decline", {
-                "mode": "rigor",
-                "reasoning": f"LLM error: {e}"
-            })
+            await compiler_rejection_log.add_decline("rigor", f"LLM error: {exc}")
+            await self._broadcast(
+                "compiler_decline", {"mode": "rigor", "reasoning": f"LLM error: {exc}"}
+            )
             return False
-        
-        if submission is None:
-            logger.info("No rigor enhancement needed")
+        except Exception as exc:
+            logger.error(f"Rigor lean flow raised: {exc}", exc_info=True)
             self.rigor_declines += 1
-            await compiler_rejection_log.add_decline("rigor", "Rigor already adequate")
-            
-            await self._broadcast("compiler_decline", {
-                "mode": "rigor",
-                "reasoning": "Rigor already adequate"
-            })
-            
-            # Treat as rejection for loop purposes
+            await compiler_rejection_log.add_decline(
+                "rigor", f"Internal error: {exc}"
+            )
+            await self._broadcast(
+                "compiler_decline",
+                {"mode": "rigor", "reasoning": f"Internal error: {exc}"},
+            )
             return False
-        
-        self.total_submissions += 1
-        
-        await self._broadcast("compiler_submission", {
-            "mode": "rigor",
-            "submission_id": submission.submission_id
-        })
-        
-        current_paper = await paper_memory.get_paper()
-        current_outline = await outline_memory.get_outline()
-        
-        result = await self.validator.validate_submission(
-            submission,
-            current_paper=current_paper,
-            current_outline=current_outline
+
+        if lean_result is None:
+            logger.info("Rigor loop: no theorem attempted this cycle (decline)")
+            self.rigor_declines += 1
+            await compiler_rejection_log.add_decline(
+                "rigor",
+                "No theorem to formalize or 5 Lean 4 attempts failed",
+            )
+            await self._broadcast(
+                "compiler_decline",
+                {
+                    "mode": "rigor",
+                    "reasoning": "No theorem to formalize or 5 Lean 4 attempts failed",
+                },
+            )
+            return False
+
+        # A non-None result presumably carries a Lean-4-verified proof (submitter
+        # contract, not checked here); its initial placement submission may be None.
+        return await self._place_or_appendix_fallback(lean_result)
+
+    async def _place_or_appendix_fallback(self, lean_result) -> bool:
+        """Try up to two inline placements of lean_result, else use the appendix.
+
+        Returns True once the theorem is applied inline or appended to the
+        Theorems Appendix (either counts as a rigor_acceptance). Returns False
+        (recorded as a decline) if the appendix append still fails after repair.
+        """
+        from backend.compiler.agents.high_param_submitter import (
+            format_theorem_appendix_entry,
         )
-        
-        if result.decision == "accept":
-            # Apply enhancement
-            updated_paper = self._apply_edit(current_paper, submission)
-            
-            # Check if exact string match failed
-            if updated_paper is None:
-                logger.error(
-                    f"Placement execution failed despite validator acceptance. "
-                    f"Treating as rejection. Submission: {submission.submission_id}"
-                )
-                self.rigor_rejections += 1
-                
-                # Create emergency rejection
-                emergency_result = CompilerValidationResult(
-                    submission_id=submission.submission_id,
-                    decision="reject",
-                    reasoning=f"Exact string match failed: old_string='{submission.old_string[:100]}...' not found or not unique in document",
-                    summary="Exact string match failed - old_string not found or not unique",
-                    placement_check=False,
-                    validation_stage="pre-validation"  # Exact string match check
+
+        submission = lean_result.initial_placement_submission
+        validator_feedback = ""
+
+        for placement_attempt in (1, 2):
+            if submission is None:
+                logger.info(
+                    "Rigor placement attempt %s: submitter returned no placement submission; "
+                    "routing directly to appendix fallback",
+                    placement_attempt,
                 )
-                
-                await compiler_rejection_log.add_rejection(emergency_result, "rigor", submission.content)
-                
-                await self._broadcast("compiler_rejection", {
+                break
+
+            self.total_submissions += 1
+            await self._broadcast(
+                "compiler_submission",
+                {
                     "mode": "rigor",
                     "submission_id": submission.submission_id,
-                    "reasoning": "Emergency rejection: exact string match failed"
-                })
-                
-                return False
-            
-            await paper_memory.update_paper(updated_paper)
-            
-            self.rigor_acceptances += 1
-            
-            # Track Wolfram Alpha call if applicable (only for accepted submissions)
-            if submission.metadata.get("wolfram_query"):
-                if self.autonomous_mode and self._current_paper_tracker:
-                    # Autonomous mode (Part 3)
-                    self._current_paper_tracker.track_wolfram_call(
-                        submission.metadata["wolfram_query"]
+                    "lean_proof_id": lean_result.proof_id,
+                    "placement_attempt": placement_attempt,
+                },
+            )
+
+            current_paper = await paper_memory.get_paper()
+            current_outline = await outline_memory.get_outline()
+
+            result = await self.validator.validate_submission(
+                submission,
+                current_paper=current_paper,
+                current_outline=current_outline,
+            )
+
+            if result.decision == "accept":
+                updated_paper = self._apply_edit(current_paper, submission)
+                if updated_paper is None:
+                    logger.error(
+                        "Rigor placement attempt %s: exact-string apply failed after "
+                        "validator acceptance for submission %s",
+                        placement_attempt,
+                        submission.submission_id,
                     )
-                    logger.info(f"Tracked Wolfram Alpha call (autonomous): {submission.metadata['wolfram_query']}")
-                elif not self.autonomous_mode and self._paper_model_tracker:
-                    # Manual mode (Part 2)
-                    self._paper_model_tracker.track_wolfram_call(
-                        submission.metadata["wolfram_query"]
+                    # Treat apply failure as a placement rejection for retry
+                    validator_feedback = (
+                        f"Exact-string match failed when applying your edit: "
+                        f"old_string='{(submission.old_string or '')[:120]}...' was not "
+                        "found or not unique in the current paper. Pick a more "
+                        "specific anchor."
                     )
-                    logger.info(f"Tracked Wolfram Alpha call (manual): {submission.metadata['wolfram_query']}")
-            
-            await compiler_rejection_log.add_acceptance(
-                submission.submission_id,
-                "rigor",
-                submission.content[:500]
-            )
-            
-            word_count = await paper_memory.get_word_count()
-            
-            await self._broadcast("compiler_acceptance", {
-                "mode": "rigor",
-                "submission_id": submission.submission_id
-            })
-            
-            await self._broadcast("paper_updated", {
-                "word_count": word_count,
-                "preview": updated_paper[:500]
-            })
-            
-            logger.info(f"Rigor enhancement accepted ({word_count} words)")
-            return True
-        else:
+                    rejection_result = CompilerValidationResult(
+                        submission_id=submission.submission_id,
+                        decision="reject",
+                        reasoning=validator_feedback,
+                        summary=validator_feedback[:750],
+                        placement_check=False,
+                        validation_stage="pre-validation",
+                    )
+                    await compiler_rejection_log.add_rejection(
+                        rejection_result, "rigor", submission.content
+                    )
+                    await self._broadcast(
+                        "compiler_rejection",
+                        {
+                            "mode": "rigor",
+                            "submission_id": submission.submission_id,
+                            "reasoning": validator_feedback,
+                            "placement_attempt": placement_attempt,
+                        },
+                    )
+                    self.rigor_rejections += 1
+                    if placement_attempt == 1:
+                        submission = await self.high_param_submitter.submit_rigor_placement_retry(
+                            lean_result, validator_feedback
+                        )
+                    continue
+
+                # Success: inline placement accepted + applied.
+                await paper_memory.update_paper(updated_paper)
+
+                # Also add an appendix stub so the full Lean proof is preserved and easy to look up.
+                appendix_stub = format_theorem_appendix_entry(
+                    proof_id=lean_result.proof_id,
+                    theorem_statement=lean_result.theorem_statement,
+                    lean_code=lean_result.lean_code,
+                    is_novel=lean_result.is_novel,
+                    theorem_name=lean_result.theorem_name,
+                    placement_outcome="inline",
+                )
+                try:
+                    await paper_memory.append_to_theorems_appendix(appendix_stub)
+                except Exception as exc:
+                    logger.warning(
+                        "Inline-placed theorem appendix stub append failed (non-fatal): %s", exc
+                    )
+
+                self.rigor_acceptances += 1
+                await compiler_rejection_log.add_acceptance(
+                    submission.submission_id,
+                    "rigor",
+                    submission.content[:500],
+                )
+
+                word_count = await paper_memory.get_word_count()
+                await self._broadcast(
+                    "compiler_acceptance",
+                    {
+                        "mode": "rigor",
+                        "submission_id": submission.submission_id,
+                        "placement_outcome": "inline",
+                        "lean_proof_id": lean_result.proof_id,
+                        "is_novel": lean_result.is_novel,
+                        "placement_attempt": placement_attempt,
+                    },
+                )
+                await self._broadcast(
+                    "paper_updated",
+                    {"word_count": word_count, "preview": updated_paper[:500]},
+                )
+                logger.info(
+                    "Rigor theorem %s placed inline on attempt %s (%s words)",
+                    lean_result.proof_id, placement_attempt, word_count,
+                )
+                return True
+
+            # Validator rejected this placement attempt
             self.rigor_rejections += 1
-            
-            await compiler_rejection_log.add_rejection(result, "rigor", submission.content)
-            
-            await self._broadcast("compiler_rejection", {
+            validator_feedback = result.reasoning or "Placement rejected without reason"
+            await compiler_rejection_log.add_rejection(
+                result, "rigor", submission.content
+            )
+            await self._broadcast(
+                "compiler_rejection",
+                {
+                    "mode": "rigor",
+                    "submission_id": submission.submission_id,
+                    "reasoning": result.reasoning,
+                    "placement_attempt": placement_attempt,
+                },
+            )
+            logger.info(
+                "Rigor placement attempt %s rejected: %s",
+                placement_attempt,
+                (result.reasoning or "")[:160],
+            )
+
+            if placement_attempt == 1:
+                submission = await self.high_param_submitter.submit_rigor_placement_retry(
+                    lean_result, validator_feedback
+                )
+
+        # Appendix fallback: no inline placement landed. The math is already
+        # Lean-verified, so a successful append still counts as a rigor_acceptance.
+        appendix_entry = format_theorem_appendix_entry(
+            proof_id=lean_result.proof_id,
+            theorem_statement=lean_result.theorem_statement,
+            lean_code=lean_result.lean_code,
+            is_novel=lean_result.is_novel,
+            theorem_name=lean_result.theorem_name,
+            placement_outcome="appendix_fallback",
+        )
+        appended = await paper_memory.append_to_theorems_appendix(appendix_entry)
+        if not appended:
+            # Paper markers might be missing - try one repair pass then retry.
+            logger.warning("Appendix append returned False; attempting marker repair before retry")
+            await paper_memory.ensure_markers_intact()
+            appended = await paper_memory.append_to_theorems_appendix(appendix_entry)
+        if not appended:
+            # Nothing was written, so report a decline instead of an acceptance.
+            reason = f"Theorems Appendix append failed for proof {lean_result.proof_id}"
+            logger.error("Rigor loop: %s", reason)
+            self.rigor_declines += 1
+            await compiler_rejection_log.add_decline("rigor", reason)
+            await self._broadcast("compiler_decline", {"mode": "rigor", "reasoning": reason})
+            return False
+
+        self.rigor_acceptances += 1
+        word_count = await paper_memory.get_word_count()
+        await self._broadcast(
+            "compiler_acceptance",
+            {
                 "mode": "rigor",
-                "submission_id": submission.submission_id,
-                "reasoning": result.reasoning
-            })
-            
-            logger.info("Rigor enhancement rejected")
-            return False
+                "submission_id": (
+                    lean_result.initial_placement_submission.submission_id
+                    if lean_result.initial_placement_submission
+                    else f"rigor_appendix_{lean_result.proof_id}"
+                ),
+                "placement_outcome": "appendix_fallback",
+                "lean_proof_id": lean_result.proof_id,
+                "is_novel": lean_result.is_novel,
+            },
+        )
+        await self._broadcast("paper_updated", {"word_count": word_count})
+        logger.info(
+            "Rigor theorem %s stored in Theorems Appendix (both placement attempts failed or unavailable)",
+            lean_result.proof_id,
+        )
+        return True
+
     
     def _apply_edit_to_outline(self, current_outline: str, submission: CompilerSubmission) -> Optional[str]:
         """
@@ -3581,7 +3796,7 @@ async def _check_phase_transition(self, section_complete: bool = False) -> bool:
             # VERIFY CONCLUSION ACTUALLY EXISTS BEFORE TRANSITIONING
             current_paper = await paper_memory.get_paper()
             has_conclusion = bool(re.search(
-                r"(?:^|\n)\s*(?:#+\s*)?(?:[IVXLCDM]+\.?\s*)?(?:Conclusion|Summary|Discussion|Final\s*Remarks|Concluding\s*Remarks)",
+                r"(?:^|\n)\s*(?:(?:#+\s*)?(?:[IVXLCDM]+\.?\s*)?(?:Conclusion|Summary|Discussion|Final\s*Remarks|Concluding\s*Remarks)|\\(?:section|chapter)\*?\{(?:Conclusion|Summary|Discussion|Final\s*Remarks|Concluding\s*Remarks)\})",
                 current_paper, re.IGNORECASE | re.MULTILINE
             ))
             
@@ -3603,7 +3818,7 @@ async def _check_phase_transition(self, section_complete: bool = False) -> bool:
             # VERIFY INTRODUCTION ACTUALLY EXISTS BEFORE TRANSITIONING
             current_paper = await paper_memory.get_paper()
             has_introduction = bool(re.search(
-                r"(?:^|\n)\s*(?:#+\s*)?(?:I\.?\s*)?Introduction",
+                r"(?:^|\n)\s*(?:(?:#+\s*)?(?:I\.?\s*)?Introduction|\\(?:section|chapter)\*?\{(?:I\.?\s*)?Introduction\})",
                 current_paper, re.IGNORECASE | re.MULTILINE
             ))
             
@@ -3628,7 +3843,7 @@ async def _check_phase_transition(self, section_complete: bool = False) -> bool:
             # VERIFY ABSTRACT ACTUALLY EXISTS BEFORE MARKING PAPER COMPLETE
             current_paper = await paper_memory.get_paper()
             has_abstract = bool(re.search(
-                r"(?:^|\n)\s*(?:#+\s*)?\*{0,2}Abstract\*{0,2}",
+                r"(?:^|\n)\s*(?:(?:#+\s*)?\*{0,2}Abstract\*{0,2}|\\(?:section|chapter)\*?\{Abstract\}|\\begin\{abstract\})",
                 current_paper, re.IGNORECASE | re.MULTILINE
             ))
             
diff --git a/backend/compiler/memory/paper_memory.py b/backend/compiler/memory/paper_memory.py
index 9444efb..e107b7e 100644
--- a/backend/compiler/memory/paper_memory.py
+++ b/backend/compiler/memory/paper_memory.py
@@ -21,6 +21,13 @@
 INTRO_PLACEHOLDER = "[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS COMPLETE]"
 CONCLUSION_PLACEHOLDER = "[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION - TO BE WRITTEN AFTER THE BODY SECTION IS COMPLETE]"
 
+# Bracket lines that delimit the Theorems Appendix (Lean-4-verified theorems).
+# Text between them is the appendix body: APPENDIX_EMPTY_PLACEHOLDER until the
+# first entry is appended, then the appended theorem entries.
+THEOREMS_APPENDIX_START = "[HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]"
+THEOREMS_APPENDIX_END = "[HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]"
+APPENDIX_EMPTY_PLACEHOLDER = "[Theorems appendix - verified Lean 4 theorems not placed inline will appear here]"
+
 
 class PaperMemory:
     """
@@ -179,12 +186,18 @@ async def initialize_with_placeholders(self, first_body_content: str) -> None:
         Args:
             first_body_content: The first body section content (already validated)
         """
-        # Build paper with placeholders framing the body content
+        # Build paper with placeholders framing the body content.
+        # Appendix block sits between the conclusion placeholder and the paper anchor;
+        # its body starts as the empty-placeholder line and is later replaced /
+        # appended to by append_to_theorems_appendix.
         paper = (
             f"{ABSTRACT_PLACEHOLDER}\n\n"
             f"{INTRO_PLACEHOLDER}\n\n"
             f"{first_body_content}\n\n"
             f"{CONCLUSION_PLACEHOLDER}\n\n"
+            f"{THEOREMS_APPENDIX_START}\n"
+            f"{APPENDIX_EMPTY_PLACEHOLDER}\n"
+            f"{THEOREMS_APPENDIX_END}\n\n"
             f"{PAPER_ANCHOR}"
         )
         
@@ -284,13 +297,17 @@ async def clear_body_section(self) -> None:
                     ABSTRACT_PLACEHOLDER not in line and
                     INTRO_PLACEHOLDER not in line and
                     CONCLUSION_PLACEHOLDER not in line and
+                    THEOREMS_APPENDIX_START not in line and
+                    THEOREMS_APPENDIX_END not in line and
                     PAPER_ANCHOR not in line):
                     body_start_idx = i
                     break
             
-            # Find where body ends (at CONCLUSION_PLACEHOLDER or PAPER_ANCHOR)
+            # Find where body ends (at CONCLUSION_PLACEHOLDER, THEOREMS_APPENDIX_START, or PAPER_ANCHOR)
             for i, line in enumerate(lines):
-                if CONCLUSION_PLACEHOLDER in line or PAPER_ANCHOR in line:
+                if (CONCLUSION_PLACEHOLDER in line
+                        or THEOREMS_APPENDIX_START in line
+                        or PAPER_ANCHOR in line):
                     body_end_idx = i
                     break
             
@@ -371,6 +388,152 @@ async def get_previous_versions(self) -> list:
         async with self._lock:
             return self.previous_versions.copy()
     
+    def _extract_body_and_appendix(self, paper: str) -> tuple[str, str]:
+        """
+        Separate a paper into body text and Theorems Appendix text.
+
+        The paper is scanned line by line. A line containing
+        THEOREMS_APPENDIX_START switches collection to the appendix and a
+        line containing THEOREMS_APPENDIX_END switches it back; neither
+        bracket line is emitted. While inside the brackets every line is
+        kept for the appendix half. Outside them, lines containing
+        ABSTRACT_PLACEHOLDER, INTRO_PLACEHOLDER, CONCLUSION_PLACEHOLDER or
+        PAPER_ANCHOR are dropped and all other lines go to the body half.
+        The START check runs first, so it wins if one line holds both brackets.
+
+        Args:
+            paper: Raw paper content
+
+        Returns:
+            (body_text, appendix_body_text), each joined with newlines and
+            stripped of leading/trailing whitespace. Either may be "".
+        """
+        structural_markers = (
+            ABSTRACT_PLACEHOLDER,
+            INTRO_PLACEHOLDER,
+            CONCLUSION_PLACEHOLDER,
+            PAPER_ANCHOR,
+        )
+        outside: list[str] = []
+        inside: list[str] = []
+        collecting_appendix = False
+
+        for raw_line in paper.split('\n'):
+            if THEOREMS_APPENDIX_START in raw_line:
+                # Opening bracket: start collecting, drop the bracket line.
+                collecting_appendix = True
+            elif THEOREMS_APPENDIX_END in raw_line:
+                # Closing bracket: stop collecting, drop the bracket line.
+                collecting_appendix = False
+            elif collecting_appendix:
+                inside.append(raw_line)
+            elif any(marker in raw_line for marker in structural_markers):
+                # Structural marker outside the appendix: not body content.
+                continue
+            else:
+                outside.append(raw_line)
+
+        return '\n'.join(outside).strip(), '\n'.join(inside).strip()
+    
+    def _build_appendix_block(self, appendix_body: str) -> str:
+        """
+        Render the Theorems Appendix wrapped in its start/end bracket lines.
+
+        A None, empty or whitespace-only appendix_body is rendered as
+        APPENDIX_EMPTY_PLACEHOLDER. No newline follows the end bracket.
+        """
+        inner = (appendix_body or "").strip() or APPENDIX_EMPTY_PLACEHOLDER
+        bracketed_lines = (
+            THEOREMS_APPENDIX_START,
+            inner,
+            THEOREMS_APPENDIX_END,
+        )
+        return "\n".join(bracketed_lines)
+    
+    async def append_to_theorems_appendix(self, theorem_entry: str) -> bool:
+        """
+        Append one verified-theorem entry to the Theorems Appendix.
+
+        The read-modify-write of the paper file runs under self._lock:
+        - The text between the first THEOREMS_APPENDIX_START and the next
+          THEOREMS_APPENDIX_END is taken as the current appendix body, and
+          that same span is what gets rewritten, so the body that is read
+          and the span that is replaced can never disagree.
+        - If that body is empty or is only APPENDIX_EMPTY_PLACEHOLDER, the
+          new entry replaces it (first entry); otherwise the entry is added
+          after the existing body, separated by a blank line.
+        - If the file is missing, or the markers are absent or out of order,
+          the paper is left untouched and False is returned (the caller
+          should run ensure_markers_intact() and retry).
+        - The re-chunking callback runs after the lock is released; a
+          failure there is logged and does not change the return value.
+
+        Args:
+            theorem_entry: Preformatted entry text; surrounding whitespace
+                is stripped. Caller controls formatting.
+
+        Returns:
+            True once the paper file has been rewritten, False when the
+            entry is empty, the file is missing, or the markers are unusable.
+        """
+        entry = (theorem_entry or "").strip()
+        if not entry:
+            logger.warning("append_to_theorems_appendix called with empty entry")
+            return False
+
+        final_content: Optional[str] = None
+
+        async with self._lock:
+            if not self.file_path.exists():
+                logger.warning("Cannot append to appendix: paper file does not exist")
+                return False
+
+            async with aiofiles.open(self.file_path, 'r', encoding='utf-8') as f:
+                paper = await f.read()
+
+            # Locate the bracket span once; END is searched only after START.
+            start_idx = paper.find(THEOREMS_APPENDIX_START)
+            body_start = start_idx + len(THEOREMS_APPENDIX_START)
+            end_idx = paper.find(THEOREMS_APPENDIX_END, body_start) if start_idx >= 0 else -1
+            if start_idx < 0 or end_idx < 0:
+                logger.warning(
+                    "Appendix markers missing or out of order - cannot append theorem entry. "
+                    "Caller should call ensure_markers_intact() first."
+                )
+                return False
+
+            # Read the body from the very span that is replaced below.
+            appendix_body = paper[body_start:end_idx].strip()
+
+            # First real entry replaces the empty placeholder
+            if not appendix_body or appendix_body == APPENDIX_EMPTY_PLACEHOLDER:
+                new_appendix_body = entry
+            else:
+                new_appendix_body = f"{appendix_body}\n\n{entry}"
+
+            new_block = self._build_appendix_block(new_appendix_body)
+            span_end = end_idx + len(THEOREMS_APPENDIX_END)
+            new_paper = paper[:start_idx] + new_block + paper[span_end:]
+
+            async with aiofiles.open(self.file_path, 'w', encoding='utf-8') as f:
+                await f.write(new_paper)
+
+            self.version += 1
+            final_content = new_paper
+            logger.info(
+                f"Appended theorem to appendix (version {self.version}, "
+                f"appendix now {len(new_appendix_body)} chars)"
+            )
+
+        # Trigger re-chunking callback OUTSIDE the lock to avoid deadlock
+        if final_content and self.rechunk_callback:
+            try:
+                await self.rechunk_callback(final_content)
+            except Exception as e:
+                logger.error(f"Re-chunking callback failed after appendix append: {e}")
+
+        return True
+    
     async def ensure_placeholders_exist(self) -> bool:
         """
         Ensure placeholders exist in the paper when resuming from an existing file.
@@ -404,6 +567,8 @@ async def ensure_placeholders_exist(self) -> bool:
             has_intro_placeholder = INTRO_PLACEHOLDER in paper
             has_conclusion_placeholder = CONCLUSION_PLACEHOLDER in paper
             has_anchor = PAPER_ANCHOR in paper
+            has_appendix_start = THEOREMS_APPENDIX_START in paper
+            has_appendix_end = THEOREMS_APPENDIX_END in paper
             
             # Check for actual section content (not placeholders)
             # Use flexible patterns to detect if sections have been written
@@ -442,36 +607,38 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                 else:
                     return len(after_header_sample) > 50  # No keywords, check substance
             
-            has_abstract_content = has_real_section_content(r'^Abstract\s*$', paper)
-            has_intro_content = has_real_section_content(r'^I\.?\s+Introduction|^Introduction\s*$', paper)
-            has_conclusion_content = has_real_section_content(r'^(?:[IVXLCDM]+\.?\s+)?Conclusion\s*$|^\d+\.?\s+Conclusion\s*$', paper)
-            
-            # If all placeholders exist OR corresponding content exists, nothing to do
-            if (has_abstract_placeholder or has_abstract_content) and \
-               (has_intro_placeholder or has_intro_content) and \
-               (has_conclusion_placeholder or has_conclusion_content):
-                logger.info("Placeholders check: All sections either have placeholders or actual content")
+            has_abstract_content = has_real_section_content(
+                r'^(?:Abstract\s*|\\(?:section|chapter)\*?\{Abstract\}|\\begin\{abstract\})\s*$',
+                paper,
+            )
+            has_intro_content = has_real_section_content(
+                r'^(?:(?:I\.?\s+)?Introduction|\\(?:section|chapter)\*?\{(?:I\.?\s*)?Introduction\})\s*$',
+                paper,
+            )
+            has_conclusion_content = has_real_section_content(
+                r'^(?:(?:[IVXLCDM]+\.?\s+|\d+\.?\s+)?Conclusion|\\(?:section|chapter)\*?\{Conclusion\})\s*$',
+                paper,
+            )
+            
+            # Real section content supersedes its placeholder. If both are
+            # present, rebuild below to strip the stale placeholder.
+            if (((has_abstract_placeholder or has_abstract_content) and not (has_abstract_placeholder and has_abstract_content)) and
+                    ((has_intro_placeholder or has_intro_content) and not (has_intro_placeholder and has_intro_content)) and
+                    ((has_conclusion_placeholder or has_conclusion_content) and not (has_conclusion_placeholder and has_conclusion_content)) and
+                    has_appendix_start and has_appendix_end):
+                logger.info("Placeholders check: all sections present and appendix intact")
                 return False
             
-            logger.info(f"Placeholder check - abstract: {has_abstract_placeholder}/{has_abstract_content}, "
-                       f"intro: {has_intro_placeholder}/{has_intro_content}, "
-                       f"conclusion: {has_conclusion_placeholder}/{has_conclusion_content}")
-            
-            # Need to add missing placeholders
-            # Extract current body content (everything that's not a placeholder or anchor)
-            lines = paper.split('\n')
-            body_lines = []
-            
-            for line in lines:
-                # Skip existing placeholders and anchor
-                if ABSTRACT_PLACEHOLDER in line or \
-                   INTRO_PLACEHOLDER in line or \
-                   CONCLUSION_PLACEHOLDER in line or \
-                   PAPER_ANCHOR in line:
-                    continue
-                body_lines.append(line)
+            logger.info(
+                f"Placeholder check - abstract: {has_abstract_placeholder}/{has_abstract_content}, "
+                f"intro: {has_intro_placeholder}/{has_intro_content}, "
+                f"conclusion: {has_conclusion_placeholder}/{has_conclusion_content}, "
+                f"appendix: {has_appendix_start}/{has_appendix_end}"
+            )
             
-            body_content = '\n'.join(body_lines).strip()
+            # Need to add missing placeholders. Preserve any existing appendix
+            # body content while we rebuild the skeleton.
+            body_content, appendix_body = self._extract_body_and_appendix(paper)
             
             if not body_content:
                 logger.warning("No body content found - cannot add placeholders to empty paper")
@@ -501,6 +668,11 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                 new_paper_parts.append(CONCLUSION_PLACEHOLDER)
                 new_paper_parts.append("")
             
+            # Theorems Appendix (preserve existing entries if any, otherwise
+            # insert the empty placeholder line inside the bracket pair)
+            new_paper_parts.append(self._build_appendix_block(appendix_body))
+            new_paper_parts.append("")
+            
             # Anchor at end
             new_paper_parts.append(PAPER_ANCHOR)
             
@@ -544,6 +716,8 @@ async def ensure_markers_intact(self) -> bool:
             has_intro_placeholder = INTRO_PLACEHOLDER in paper
             has_conclusion_placeholder = CONCLUSION_PLACEHOLDER in paper
             has_anchor = PAPER_ANCHOR in paper
+            has_appendix_start = THEOREMS_APPENDIX_START in paper
+            has_appendix_end = THEOREMS_APPENDIX_END in paper
             
             # Check for actual section content (not placeholders)
             # CRITICAL: Must distinguish between real content and fake placeholders inserted by model
@@ -581,31 +755,29 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                 else:
                     return len(after_header_sample) > 50  # No keywords, check substance
             
-            has_abstract_content = has_real_section_content(r'^Abstract\s*$', paper)
-            has_intro_content = has_real_section_content(r'^I\.?\s+Introduction|^Introduction\s*$', paper)
-            has_conclusion_content = has_real_section_content(r'^(?:[IVXLCDM]+\.?\s+)?Conclusion\s*$|^\d+\.?\s+Conclusion\s*$', paper)
-            
-            # If all markers exist OR corresponding content exists, nothing to repair
-            if (has_abstract_placeholder or has_abstract_content) and \
-               (has_intro_placeholder or has_intro_content) and \
-               (has_conclusion_placeholder or has_conclusion_content) and \
-               has_anchor:
+            has_abstract_content = has_real_section_content(
+                r'^(?:Abstract\s*|\\(?:section|chapter)\*?\{Abstract\}|\\begin\{abstract\})\s*$',
+                paper,
+            )
+            has_intro_content = has_real_section_content(
+                r'^(?:(?:I\.?\s+)?Introduction|\\(?:section|chapter)\*?\{(?:I\.?\s*)?Introduction\})\s*$',
+                paper,
+            )
+            has_conclusion_content = has_real_section_content(
+                r'^(?:(?:[IVXLCDM]+\.?\s+|\d+\.?\s+)?Conclusion|\\(?:section|chapter)\*?\{Conclusion\})\s*$',
+                paper,
+            )
+            
+            # Real section content supersedes its placeholder. If both are
+            # present, rebuild below to strip the stale placeholder.
+            if ((has_abstract_placeholder or has_abstract_content) and not (has_abstract_placeholder and has_abstract_content)) and \
+               ((has_intro_placeholder or has_intro_content) and not (has_intro_placeholder and has_intro_content)) and \
+               ((has_conclusion_placeholder or has_conclusion_content) and not (has_conclusion_placeholder and has_conclusion_content)) and \
+               has_anchor and has_appendix_start and has_appendix_end:
                 return False
             
-            # Need to repair - extract body content
-            lines = paper.split('\n')
-            body_lines = []
-            
-            for line in lines:
-                # Skip existing placeholders and anchor
-                if ABSTRACT_PLACEHOLDER in line or \
-                   INTRO_PLACEHOLDER in line or \
-                   CONCLUSION_PLACEHOLDER in line or \
-                   PAPER_ANCHOR in line:
-                    continue
-                body_lines.append(line)
-            
-            body_content = '\n'.join(body_lines).strip()
+            # Need to repair - preserve body + appendix body across the rebuild
+            body_content, appendix_body = self._extract_body_and_appendix(paper)
             
             if not body_content:
                 # Empty paper - just ensure anchor exists
@@ -638,6 +810,10 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
                 new_paper_parts.append(CONCLUSION_PLACEHOLDER)
                 new_paper_parts.append("")
             
+            # Theorems Appendix (preserve existing entries, default otherwise)
+            new_paper_parts.append(self._build_appendix_block(appendix_body))
+            new_paper_parts.append("")
+            
             # Anchor at end
             new_paper_parts.append(PAPER_ANCHOR)
             
diff --git a/backend/compiler/prompts/construction_prompts.py b/backend/compiler/prompts/construction_prompts.py
index e4fdd54..0d255ec 100644
--- a/backend/compiler/prompts/construction_prompts.py
+++ b/backend/compiler/prompts/construction_prompts.py
@@ -11,6 +11,7 @@
 from typing import Optional
 
 from backend.compiler.memory.compiler_rejection_log import compiler_rejection_log
+from backend.shared.config import system_config
 
 
 CONSTRUCTION_EMPIRICAL_PROVENANCE_RULES = """EMPIRICAL PROVENANCE RULES:
@@ -24,6 +25,36 @@
 - NEVER invent citations, experiments, benchmark numbers, hardware measurements, datasets, or code artifacts."""
 
 
+def get_wolfram_tool_guidance() -> str:
+    """Return prompt guidance for the construction-only Wolfram tool.
+
+    Returns "" when ``system_config.wolfram_alpha_enabled`` is falsy, so the
+    section is omitted from the prompt. The OpenAI-compatible tool schema is
+    registered separately (by HighContextSubmitter.submit_construction); this
+    text only tells the model that the tool exists and when to use it.
+    """
+    if not system_config.wolfram_alpha_enabled:
+        return ""
+
+    return """WOLFRAM ALPHA TOOL AVAILABLE (CONSTRUCTION MODE ONLY):
+You may call the `wolfram_alpha_query` tool when it would help verify a mathematical or computational claim BEFORE writing it into the paper.
+
+Use the tool for:
+- concrete symbolic calculations, simplifications, integrals, sums, or equations
+- numerical checks, constants, arithmetic, factorization, or unit conversions
+- established computational facts that can be queried directly
+
+Do NOT use the tool for:
+- open research questions
+- narrative prose
+- claims that require Lean 4 proof verification
+- broad literature claims or source discovery
+
+Tool budget: up to 20 Wolfram Alpha calls for this submission. If you do not need a computational check, skip the tool and produce your JSON normally.
+
+When you use the tool, incorporate only relevant verified results into your final JSON `new_string` and explain in `reasoning` how the Wolfram result informed the content. The system records the full audit trail separately."""
+
+
 # =============================================================================
 # PHASE-SPECIFIC CONSTRUCTION PROMPTS
 # =============================================================================
@@ -79,10 +110,16 @@ def get_body_construction_system_prompt() -> str:
 **PAPER ANCHOR** (marks document boundary):
 - [HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]
 
+**THEOREMS APPENDIX BRACKETS** (wrap verified Lean 4 theorem appendix):
+- [HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]
+- [HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]
+
 CRITICAL DISTINCTIONS:
 1. **Placeholders/anchors in CURRENT DOCUMENT PROGRESS (shown below)**: These are SYSTEM-MANAGED. The code in paper_memory.py adds them automatically. You did NOT create them.
 
-2. **You must NEVER output these markers in YOUR SUBMISSIONS**: If you include any of these markers in your submitted content, your submission will be automatically rejected by pre-validation.
+2. **Use editable prose for old_string anchors**: old_string must match the visible CURRENT DOCUMENT PROGRESS verbatim. Do not include theorem appendix brackets or the paper anchor in insert_after/delete targets. For replace, prefer editable content only; if you accidentally include a protected marker as trailing context, the validator may trim it.
+
+3. **You must NEVER include these markers in new_string / generated paper content**: If markers appear in your generated content, the system will strip or reject them.
 
 HOW PLACEHOLDERS WORK:
 - When you see a placeholder in CURRENT DOCUMENT PROGRESS, that section has NOT been written yet
@@ -256,10 +293,16 @@ def get_conclusion_construction_system_prompt() -> str:
 **PAPER ANCHOR** (marks document boundary):
 - [HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]
 
+**THEOREMS APPENDIX BRACKETS** (wrap verified Lean 4 theorem appendix):
+- [HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]
+- [HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]
+
 CRITICAL DISTINCTIONS:
 1. **Placeholders/anchors in CURRENT DOCUMENT PROGRESS (shown below)**: These are SYSTEM-MANAGED. The code in paper_memory.py adds them automatically. You did NOT create them.
 
-2. **You must NEVER output these markers in YOUR SUBMISSIONS**: If you include any of these markers in your submitted content, your submission will be automatically rejected by pre-validation.
+2. **Use editable prose for old_string anchors**: old_string must match the visible CURRENT DOCUMENT PROGRESS verbatim. Do not include theorem appendix brackets or the paper anchor in insert_after/delete targets. For replace, prefer editable content only; if you accidentally include a protected marker as trailing context, the validator may trim it.
+
+3. **You must NEVER include these markers in new_string / generated paper content**: If markers appear in your generated content, the system will strip or reject them.
 
 HOW PLACEHOLDERS WORK:
 - When you see a placeholder in CURRENT DOCUMENT PROGRESS, that section has NOT been written yet
@@ -407,10 +450,16 @@ def get_introduction_construction_system_prompt() -> str:
 **PAPER ANCHOR** (marks document boundary):
 - [HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]
 
+**THEOREMS APPENDIX BRACKETS** (wrap verified Lean 4 theorem appendix):
+- [HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]
+- [HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]
+
 CRITICAL DISTINCTIONS:
 1. **Placeholders/anchors in CURRENT DOCUMENT PROGRESS (shown below)**: These are SYSTEM-MANAGED. The code in paper_memory.py adds them automatically. You did NOT create them.
 
-2. **You must NEVER output these markers in YOUR SUBMISSIONS**: If you include any of these markers in your submitted content, your submission will be automatically rejected by pre-validation.
+2. **Use editable prose for old_string anchors**: old_string must match the visible CURRENT DOCUMENT PROGRESS verbatim. Do not include theorem appendix brackets or the paper anchor in insert_after/delete targets. For replace, prefer editable content only; if you accidentally include a protected marker as trailing context, the validator may trim it.
+
+3. **You must NEVER include these markers in new_string / generated paper content**: If markers appear in your generated content, the system will strip or reject them.
 
 HOW PLACEHOLDERS WORK:
 - When you see a placeholder in CURRENT DOCUMENT PROGRESS, that section has NOT been written yet
@@ -563,10 +612,16 @@ def get_abstract_construction_system_prompt() -> str:
 **PAPER ANCHOR** (marks document boundary):
 - [HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]
 
+**THEOREMS APPENDIX BRACKETS** (wrap verified Lean 4 theorem appendix):
+- [HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]
+- [HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]
+
 CRITICAL DISTINCTIONS:
 1. **Placeholders/anchors in CURRENT DOCUMENT PROGRESS (shown below)**: These are SYSTEM-MANAGED. The code in paper_memory.py adds them automatically. You did NOT create them.
 
-2. **You must NEVER output these markers in YOUR SUBMISSIONS**: If you include any of these markers in your submitted content, your submission will be automatically rejected by pre-validation.
+2. **Use editable prose for old_string anchors**: old_string must match the visible CURRENT DOCUMENT PROGRESS verbatim. Do not include theorem appendix brackets or the paper anchor in insert_after/delete targets. For replace, prefer editable content only; if you accidentally include a protected marker as trailing context, the validator may trim it.
+
+3. **You must NEVER include these markers in new_string / generated paper content**: If markers appear in your generated content, the system will strip or reject them.
 
 HOW PLACEHOLDERS WORK:
 - When you see a placeholder in CURRENT DOCUMENT PROGRESS, that section has NOT been written yet
@@ -939,6 +994,11 @@ async def build_construction_prompt(
         get_construction_json_schema(),
         "\n---\n"
     ]
+
+    wolfram_guidance = get_wolfram_tool_guidance()
+    if wolfram_guidance:
+        parts.append(wolfram_guidance)
+        parts.append("\n---\n")
     
     # Add rejection history (DIRECT INJECTION - almost always fits)
     rejection_history = await compiler_rejection_log.get_rejections_text()
diff --git a/backend/compiler/prompts/review_prompts.py b/backend/compiler/prompts/review_prompts.py
index 815d6e4..0b700e8 100644
--- a/backend/compiler/prompts/review_prompts.py
+++ b/backend/compiler/prompts/review_prompts.py
@@ -88,12 +88,19 @@ def get_review_system_prompt() -> str:
 **PAPER ANCHOR** (marks document boundary):
 - [HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]
 
+**THEOREMS APPENDIX BRACKETS** (wrap verified Lean 4 theorem appendix):
+- [HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]
+- [HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]
+
 IMPORTANT: These markers are SYSTEM-MANAGED (added by paper_memory.py), NOT AI-generated content. They are NORMAL and EXPECTED during document construction.
 
-**YOU MUST NEVER OUTPUT THESE MARKERS IN YOUR EDITS**
+**MARKER USE IN EDITS**
 
 When making edits:
-- Do NOT include any of these markers in your edit content
+- Use editable prose for old_string anchors
+- Do not include theorem appendix brackets or the paper anchor in insert_after/delete targets
+- For replace, prefer editable content only; if a protected marker is accidentally included as trailing context, validation may trim it
+- Do NOT include any of these markers in new_string / generated edit content
 - Placeholders in the current document are expected - don't try to remove them
 - Your edits should contain only actual mathematical prose
 
diff --git a/backend/compiler/prompts/rigor_prompts.py b/backend/compiler/prompts/rigor_prompts.py
index 56d1c50..5491eb6 100644
--- a/backend/compiler/prompts/rigor_prompts.py
+++ b/backend/compiler/prompts/rigor_prompts.py
@@ -1,19 +1,43 @@
 """
-Rigor prompts for mathematical rigor enhancement (2-step process).
+Rigor prompts for the Lean-4-verified-theorem rigor mode.
 
-Step 1: Planning - LLM decides if rigor work needed and chooses mode
-Step 2: Execution - LLM executes with self-refusal option
+The compiler's rigor loop no longer edits paper text directly. Instead it runs
+a two-stage agent:
+
+    Stage 1 - Theorem discovery (build_rigor_theorem_discovery_prompt):
+        Using the full writing context, the submitter asks itself whether the
+        paper contains a theorem worth formalizing and proving in Lean 4 that
+        has not already been verified. Output is a candidate theorem JSON (or
+        a decline).
+
+    Stage 2 - Placement (build_rigor_placement_prompt):
+        Given a Lean-4-verified theorem, the submitter proposes an inline
+        edit that introduces the theorem to the paper with an explicit
+        "verified in Lean 4" marker and a pointer to the Theorems Appendix.
+        The submitter gets up to two placement attempts; attempt 2 receives
+        the validator's rejection feedback from attempt 1.
+
+Context assembly follows the RAG offload priority documented in
+`.cursor/rules/rag-design-for-overall-program.mdc`:
+
+    Submitter: Shared Training DB -> Local Submitter DB -> Rejection Log -> User Upload Files
+
+The high-param submitter direct-injects the outline and paper when they fit
+inside the budget (mirroring HighContextSubmitter.submit_construction), then
+fills the remaining budget with RAG results that exclude `compiler_outline.txt`
+and `compiler_paper.txt`.
 """
 
+from typing import Iterable, List, Optional
+
 from backend.compiler.memory.compiler_rejection_log import compiler_rejection_log
-from backend.shared.config import system_config
 
 
 # =============================================================================
-# INTERNAL CONTENT WARNING (shared across all prompts)
+# INTERNAL CONTENT WARNING (shared across all rigor prompts)
 # =============================================================================
 
-INTERNAL_CONTENT_WARNING = """⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
+INTERNAL_CONTENT_WARNING = """WARNING - INTERNAL CONTENT WARNING
 
 ALL context provided to you (brainstorm databases, accepted submissions, papers, reference materials, outlines, previous document content) is AI-GENERATED within this research system. This content has NOT been peer-reviewed, published, or verified by external sources.
 
@@ -24,544 +48,368 @@
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
- The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
- 
- WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
+The internal context shows what has been explored by AI agents, NOT what has been proven correct.
 
----"""
+The EXCEPTION is content inside the "LEAN 4 VERIFIED" certificate block provided with a placement request: that Lean 4 proof has been mechanically verified by the Lean 4 toolchain and is the source of truth for the mathematical statement it closes."""
 
 
 # =============================================================================
-# STEP 1: PLANNING PROMPTS
+# STAGE 1: THEOREM DISCOVERY
 # =============================================================================
 
-def get_rigor_planning_system_prompt(wolfram_enabled: bool = False) -> str:
-    """Get system prompt for Step 1: rigor planning."""
-    wolfram_mode_section = ""
-    if wolfram_enabled:
-        wolfram_mode_section = """
-3. **wolfram_verification**: Verify mathematical claim with Wolfram Alpha API
-   - Send specific computable query to Wolfram Alpha
-   - System will make the API call and pass result to Step 2
-   - Examples: "Is pi algebraic?", "Solve x^2 + 2x + 1 = 0", "Is 2^67-1 prime?"
-   - Use for computational verification of claims
-"""
-    else:
-        wolfram_mode_section = """
-3. **wolfram_verification**: NOT AVAILABLE (Wolfram Alpha not enabled)
-"""
-    
-    return f"""You are planning rigor enhancements for a mathematical document.
+_DISCOVERY_SYSTEM_PROMPT = f"""You are the rigor agent for a mathematical-paper compiler. Your job during the rigor loop is to look at the paper-in-progress together with the full research context and decide whether there is a theorem worth formalizing and proving in Lean 4.
 
 {INTERNAL_CONTENT_WARNING}
 
-YOUR TASK - STEP 1: PLANNING
-
-Review the current document and decide:
-1. Does it need rigor work?
-2. If yes, which approach is best?
-3. What section should Step 2 focus on?
-
-THREE MODES AVAILABLE:
-
-1. **standard_enhancement**: Normal rigor improvements
-   - Strengthen proof arguments with additional steps
-   - Clarify assumptions and conditions
-   - Add intermediate lemmas
-   - Improve precision of notation
-   - Address counterexamples or edge cases
-
-2. **rewrite_focus**: Significant rewriting needed for rigor
-   - Identify specific section that needs substantial improvement
-   - You'll specify that section for Step 2 to work on
-   - Use when proofs are fundamentally weak or unclear
-{wolfram_mode_section}
-
-CRITICAL - SYSTEM-MANAGED MARKERS (NOT YOUR OUTPUT):
-
-The CURRENT DOCUMENT may contain system-managed markers:
+YOUR TASK - STAGE 1 (DISCOVERY)
 
-**SECTION PLACEHOLDERS** (show where sections will be written):
-- [HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION...]
-- [HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION...]
-- [HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION...]
+1. Read the current outline and the current paper text.
+2. Read the list of theorems that have ALREADY been verified by Lean 4 (EXISTING VERIFIED PROOFS block).
+3. Read the list of theorems that PREVIOUSLY FAILED Lean 4 verification (OPEN LEMMA TARGETS block, if present).
+4. Decide exactly one of:
+   (A) `needs_theorem_work=false` - no theorem worth trying right now. Good reasons: all interesting claims in the paper are already covered by existing verified proofs; the paper is in too early a state; there is no claim a Lean 4 proof could close usefully.
+   (B) `needs_theorem_work=true` - propose a single candidate theorem to formalize.
 
-**PAPER ANCHOR** (marks document boundary):
-- [HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]
+RULES FOR PROPOSING A THEOREM:
+- The theorem must be provable in Lean 4 with Mathlib.
+- You MUST NOT re-propose a theorem that is already in EXISTING VERIFIED PROOFS. Look for theorems that are DIFFERENT - new results, missed lemmas, or sharper versions that are not yet on the list.
+- You MAY retry a theorem from OPEN LEMMA TARGETS when the paper now gives you a better angle on it. When you do, set `retry_existing_failure_id` to the failed `theorem_id`.
+- Prefer theorems whose statements are tight enough that Lean 4 can actually close them (arithmetic facts, concrete inequalities, specific algebraic identities, small group/ring/field lemmas, concrete combinatorial identities) over large open conjectures.
+- The `theorem_statement` is for a human reader. It should be precise, self-contained, and include the hypotheses.
+- The `formal_sketch` tells the formalization agent what tactics or lemmas look promising in Lean 4 / Mathlib. Keep it concrete.
+- The `source_excerpt` is 2-6 sentences of surrounding paper text that motivates why this theorem is a natural target here. It must be a direct paraphrase or quote from the current paper.
 
-IMPORTANT: These markers are SYSTEM-MANAGED. Do NOT include them in your outputs.
-
-TARGET SECTION:
-Specify `target_section` as a text snippet (200-500 chars) that identifies which section needs work.
-This provides continuity to Step 2 - it's a reminder/label, not a context limitation.
-Step 2 will see the FULL paper (same as you do now).
-
-If the document is already rigorous enough, set needs_rigor_work=false.
-
-STEP 2 WILL HAVE THE OPTION TO REFUSE if your assessment is wrong.
-Don't overthink this - Step 2 can self-correct.
+If Stage 1 guesses wrong, Stage 2 cannot recover - 5 Lean 4 attempts will be spent on the wrong target. Prefer declining over a weak proposal.
 
 Output your response ONLY as JSON in this exact format:
-{{
-  "needs_rigor_work": true or false,
-  "mode": "standard_enhancement | rewrite_focus | wolfram_verification | null",
-  "target_section": "exact text snippet from paper (200-500 chars, empty if needs_rigor_work=false)",
-  "wolfram_query": "natural language query for Wolfram Alpha (only if mode=wolfram_verification)",
-  "preliminary_reasoning": "why this approach and this target section"
-}}"""
-
-
-def get_rigor_planning_json_schema() -> str:
-    """Get JSON schema for Step 1: planning."""
-    return """
-REQUIRED JSON FORMAT - STEP 1 (PLANNING):
-{
-  "needs_rigor_work": true OR false,
-  "mode": "standard_enhancement" | "rewrite_focus" | "wolfram_verification" | null,
-  "target_section": "string - text snippet from paper (200-500 chars, identifies work area)",
-  "wolfram_query": "string - natural language query for Wolfram Alpha (only if mode=wolfram_verification)",
-  "preliminary_reasoning": "string - explanation of chosen approach and target section"
-}
+{{
+  "needs_theorem_work": true or false,
+  "theorem_statement": "precise theorem statement with explicit hypotheses and conclusion (empty if needs_theorem_work=false)",
+  "formal_sketch": "concrete sketch: what tactics / Mathlib lemmas you expect to work (empty if needs_theorem_work=false)",
+  "source_excerpt": "2-6 sentences of surrounding paper text that motivates this theorem (empty if needs_theorem_work=false)",
+  "retry_existing_failure_id": "theorem_id from OPEN LEMMA TARGETS if retrying a prior failure, empty string otherwise",
+  "reasoning": "why this theorem is the best target right now OR why no theorem should be attempted"
+}}"""
+
 
-FIELD REQUIREMENTS:
-- needs_rigor_work: Whether any rigor work should be attempted
-- mode: Required if needs_rigor_work=true, null otherwise
-  * standard_enhancement: Normal rigor improvements
-  * rewrite_focus: Significant rewriting needed
-  * wolfram_verification: Verify claim with Wolfram Alpha (only if enabled)
-- target_section: ALWAYS required if needs_rigor_work=true
-  * Text snippet (200-500 chars) identifying which section to work on
-  * Provides continuity to Step 2 (guidance, not context limitation)
-  * Step 2 will see the FULL paper, not just this section
-- wolfram_query: Required ONLY if mode=wolfram_verification
-  * Natural language query for computational verification
-  * Examples: "Is pi algebraic?", "Solve x^2 + 2x + 1 = 0"
-- preliminary_reasoning: ALWAYS required
-
-Example (Standard Enhancement):
+_DISCOVERY_JSON_SCHEMA = """REQUIRED JSON FORMAT - STAGE 1 (DISCOVERY):
 {
-  "needs_rigor_work": true,
-  "mode": "standard_enhancement",
-  "target_section": "Theorem 3.2: Every constructible number is algebraic.\\nProof: Let alpha be constructible...",
-  "wolfram_query": "",
-  "preliminary_reasoning": "Theorem 3.2's proof needs more precise field-theoretic justification for the algebraicity claim"
+  "needs_theorem_work": true OR false,
+  "theorem_statement": "string",
+  "formal_sketch": "string",
+  "source_excerpt": "string",
+  "retry_existing_failure_id": "string (may be empty)",
+  "reasoning": "string"
 }
 
-Example (Wolfram Verification):
+Example (propose a theorem):
 {
-  "needs_rigor_work": true,
-  "mode": "wolfram_verification",
-  "target_section": "Theorem 4.1: π is transcendental.\\nProof sketch: By Lindemann-Weierstrass...",
-  "wolfram_query": "Is pi algebraic?",
-  "preliminary_reasoning": "Computational verification would strengthen the π transcendence claim"
+  "needs_theorem_work": true,
+  "theorem_statement": "For every natural number n, the sum of the first n positive integers equals n*(n+1)/2.",
+  "formal_sketch": "Induction on n. Base: n=0 both sides are 0. Step: use Finset.sum_range_succ and Nat.succ_mul; close with omega / ring. Mathlib has Finset.sum_range_id which may finish it outright.",
+  "source_excerpt": "In Section 2 we reasoned about partial sums of the form 1 + 2 + ... + n...",
+  "retry_existing_failure_id": "",
+  "reasoning": "Section 2 relies on the closed form but currently presents it without a verified proof. Lean 4 can close this cleanly; it does not duplicate any existing verified proof."
 }
 
-Example (No Work Needed):
+Example (decline):
 {
-  "needs_rigor_work": false,
-  "mode": null,
-  "target_section": "",
-  "wolfram_query": "",
-  "preliminary_reasoning": "Document maintains appropriate rigor for current stage. All proofs complete, definitions precise."
+  "needs_theorem_work": false,
+  "theorem_statement": "",
+  "formal_sketch": "",
+  "source_excerpt": "",
+  "retry_existing_failure_id": "",
+  "reasoning": "The paper currently contains only outline scaffolding and the one verified theorem (proof_002). Attempting another Lean 4 proof right now would either duplicate proof_002 or target claims that are too vague to formalize."
 }
 """
 
 
 # =============================================================================
-# STEP 2: EXECUTION PROMPTS
+# STAGE 2: PLACEMENT
 # =============================================================================
 
-def get_rigor_execution_system_prompt(mode: str) -> str:
-    """Get system prompt for Step 2: rigor execution."""
-    mode_specific_guidance = {
-        "standard_enhancement": """
-YOU ARE EXECUTING: Standard Rigor Enhancement
-Your prior planning indicated normal rigor improvements are needed.""",
-        "rewrite_focus": """
-YOU ARE EXECUTING: Rewrite Focus
-Your prior planning indicated significant rewriting is needed for rigor."""
-    }
-    
-    guidance = mode_specific_guidance.get(mode, "")
-    
-    return f"""You are executing a rigor enhancement based on your prior planning.
+_PLACEMENT_SYSTEM_PROMPT = f"""You are the rigor agent for a mathematical-paper compiler. A theorem you proposed has been formally verified by the Lean 4 toolchain. Your ONLY job now is to decide where in the paper the theorem should be introduced.
 
 {INTERNAL_CONTENT_WARNING}
 
-{guidance}
-
-YOUR PRIOR DECISION (Step 1):
-Mode: {mode}
-Target Section: [shown below in context]
+YOUR TASK - STAGE 2 (PLACEMENT)
 
-STEP 2: EXECUTION - YOU CAN REFUSE
+You are given:
+- The current outline and the current paper.
+- The VERIFIED Lean 4 theorem: statement + proof ID + Lean code.
+- Optionally (on attempt 2 of 2), the validator's rejection feedback from attempt 1.
 
-Review the full document and your target section.
-If you realize your Step 1 assessment was wrong, set proceed=false.
+You must produce exactly one paper edit that introduces the theorem inline. The edit uses exact-string matching: you pick `old_string` (must appear verbatim in the current paper), `operation` ("replace" or "insert_after"), and `new_string` (the replacement / insertion text).
 
-Refusals are NOT validated - you won't be penalized.
-This is your chance to self-correct.
+HARD REQUIREMENTS ON `new_string`:
 
-If you proceed, propose your rigor enhancement using exact string matching:
-1. Find EXACT text in the document (must exist verbatim)
-2. Choose operation: "replace" or "insert_after"
-3. Provide enhanced version
+1. Include a clear inline theorem statement (mirroring the verified statement but formatted for human readers; LaTeX math allowed).
+2. Include an explicit "verified in Lean 4" marker. Preferred wording is "(verified in Lean 4, see Appendix A, <proof_id>)" immediately after the theorem label, e.g. "Theorem 3.2 (verified in Lean 4, see Appendix A, proof_007)."
+3. Include a short informal proof sketch or remark connecting the theorem to the surrounding prose. Keep it 1-4 sentences.
+4. DO NOT paste the Lean 4 source code into `new_string`. The full Lean proof lives in the Theorems Appendix block at the end of the paper; the system inserts it there automatically. Duplicating the Lean code inline is grounds for rejection.
+5. DO NOT emit any of the system-managed markers (ABSTRACT / INTRODUCTION / CONCLUSION placeholders, the paper anchor, or either Theorems Appendix bracket) in `new_string`. Use editable prose for `old_string`; do not include protected markers in insert_after anchors.
 
-CRITICAL - SYSTEM-MANAGED MARKERS (NOT YOUR OUTPUT):
+PLACEMENT GUIDELINES:
+- Put the theorem where it strengthens the local argument. Prefer insertion points inside a relevant body section (near the discussion it closes) over dumping it in a new section.
+- The paper has a Theorems Appendix block already; do NOT try to edit the appendix directly.
+- Keep `old_string` short but unique (3-5 lines of surrounding context is usually enough).
 
-The CURRENT DOCUMENT may contain system-managed markers:
-
-**SECTION PLACEHOLDERS**:
-- [HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION...]
-- [HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION...]
-- [HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION...]
-
-**PAPER ANCHOR**:
-- [HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]
-
-Do NOT include these markers in your enhancement content.
-
-EXACT STRING MATCHING FOR EDITS:
-- old_string must exist verbatim in the document
-- Must be unique (appears only once)
-- Include enough context (3-5 lines) for uniqueness
-- System will pre-validate before validator sees it
-
-OPERATIONS:
-- "replace": Find old_string exactly, replace with new_string
-- "insert_after": Find old_string (anchor), insert new_string after it
+SELF-REFUSAL:
+If, after re-reading the paper, you conclude that the theorem cannot be placed well anywhere inline (even in the appendix-only fallback), you MAY still attempt a placement - the system will route the theorem to the appendix automatically if both placement attempts are rejected, so the mathematical content is never lost. Only refuse (set `proceed=false`) if you cannot produce any legal edit at all (e.g. the paper body is empty).
 
 Output your response ONLY as JSON in this exact format:
-{{
+{{
   "proceed": true or false,
-  "needs_enhancement": true or false,
   "operation": "replace | insert_after",
-  "old_string": "exact text from document (empty if not proceeding or needs_enhancement=false)",
-  "new_string": "enhanced text (empty if not proceeding or needs_enhancement=false)",
-  "content": "full content for logging (typically same as new_string)",
-  "reasoning": "explanation of changes OR refusal reason"
-}}"""
-
-
-def get_rigor_wolfram_execution_system_prompt() -> str:
-    """Get system prompt for Step 2: Wolfram verification execution."""
-    return f"""You are executing Wolfram Alpha verification based on your prior planning.
+  "old_string": "exact text from the current paper (empty if proceed=false)",
+  "new_string": "the inline theorem introduction text (empty if proceed=false)",
+  "reasoning": "why this placement works, or the refusal reason"
+}}"""
 
-{INTERNAL_CONTENT_WARNING}
-
-YOU ARE EXECUTING: Wolfram Alpha Verification
-Your prior planning requested computational verification of a mathematical claim.
-
-YOUR PRIOR DECISION (Step 1):
-Wolfram Alpha Query: [shown below]
-Target Section: [shown below in context]
-
-WOLFRAM ALPHA RESULT:
-[shown below]
-
-STEP 2: EXECUTION - YOU CAN REFUSE
-
-Review the Wolfram Alpha result in context of the full document.
-
-You can REFUSE (proceed=false) if:
-- The query was inappropriate or malformed
-- Result doesn't help strengthen rigor
-- Target section choice was wrong
-- Step 1 made a mistake
 
-If you proceed, create a verification remark that:
-- Interprets the Wolfram Alpha result
-- Relates it to the paper's claims
-- Strengthens mathematical rigor
-- Uses "insert_after" to add the remark
-
-CRITICAL - SYSTEM-MANAGED MARKERS (NOT YOUR OUTPUT):
-
-The CURRENT DOCUMENT may contain system-managed markers. Do NOT include them in your outputs.
-
-EXACT STRING MATCHING:
-- old_string must exist verbatim in the document
-- Must be unique
-- System will pre-validate
-
-VERIFICATION REMARK FORMAT:
-Format your new_string as a mathematical remark:
-
-\\n\\n**Computational Verification (Wolfram Alpha)**\\n
-Query: [the query]\\n
-Result: [Wolfram's answer]\\n
-Interpretation: [Your analysis of what this means for the paper's claims]\\n
-
-Output your response ONLY as JSON in this exact format:
-{{
-  "proceed": true or false,
-  "verification_result_interpretation": "how you interpret the Wolfram result",
-  "needs_enhancement": true or false,
-  "operation": "insert_after",
-  "old_string": "exact text after which to insert remark (empty if not proceeding or needs_enhancement=false)",
-  "new_string": "verification remark incorporating Wolfram result (empty if not proceeding or needs_enhancement=false)",
-  "content": "full content for logging (typically same as new_string)",
-  "reasoning": "explanation OR refusal reason"
-}}"""
-
-
-def get_rigor_execution_json_schema(mode: str) -> str:
-    """Get JSON schema for Step 2: execution."""
-    if mode == "wolfram_verification":
-        return """
-REQUIRED JSON FORMAT - STEP 2 (WOLFRAM VERIFICATION):
+_PLACEMENT_JSON_SCHEMA = """REQUIRED JSON FORMAT - STAGE 2 (PLACEMENT):
 {
   "proceed": true OR false,
-  "verification_result_interpretation": "string - how you interpret the Wolfram Alpha result",
-  "needs_enhancement": true OR false,
-  "operation": "insert_after",
-  "old_string": "string - exact text after which to insert verification remark",
-  "new_string": "string - verification remark incorporating Wolfram result",
-  "content": "string - full content for logging",
-  "reasoning": "string - explanation OR refusal reason"
+  "operation": "replace" OR "insert_after",
+  "old_string": "string - exact text in the current paper (anchor point)",
+  "new_string": "string - inline theorem introduction with Lean 4 marker and appendix reference",
+  "reasoning": "string - why this placement works (or refusal reason)"
 }
 
-SELF-REFUSAL OPTION:
-If you set proceed=false:
-- System logs refusal (not counted as rejection)
-- No validation occurs
-- Workflow continues normally
-- Use when Step 1 made a mistake or query was inappropriate
-
-WOLFRAM VERIFICATION REMARKS:
-Format your new_string as:
-
-\\n\\n**Computational Verification (Wolfram Alpha)**\\n
-Query: [the query]\\n
-Result: [Wolfram's answer]\\n
-Interpretation: [Your analysis]\\n
-
-Example:
-{
-  "proceed": true,
-  "verification_result_interpretation": "Wolfram confirms π is transcendental (not algebraic)",
-  "needs_enhancement": true,
-  "operation": "insert_after",
-  "old_string": "Theorem 4.1: π is transcendental. \\\\square",
-  "new_string": "\\n\\n**Computational Verification (Wolfram Alpha)**\\nQuery: Is pi algebraic?\\nResult: No\\nInterpretation: This computational verification confirms π is transcendental, consistent with the Lindemann-Weierstrass theorem.",
-  "content": "\\n\\n**Computational Verification (Wolfram Alpha)**\\nQuery: Is pi algebraic?\\nResult: No\\nInterpretation: This computational verification confirms π is transcendental, consistent with the Lindemann-Weierstrass theorem.",
-  "reasoning": "Adding computational verification strengthens the claim by providing an independent confirmation"
-}
-"""
-    else:  # standard_enhancement or rewrite_focus
-        return """
-REQUIRED JSON FORMAT - STEP 2 (EXECUTION):
-{
-  "proceed": true OR false,
-  "needs_enhancement": true OR false,
-  "operation": "replace" | "insert_after",
-  "old_string": "string - exact text from document",
-  "new_string": "string - enhanced text",
-  "content": "string - full content for logging",
-  "reasoning": "string - explanation OR refusal reason"
-}
-
-SELF-REFUSAL OPTION:
-If you set proceed=false:
-- System logs refusal (not counted as rejection)
-- No validation occurs
-- Workflow continues normally
-- Use when Step 1 made a mistake
-
-EXACT STRING MATCHING:
-- old_string must exist verbatim in the document
-- Must be unique
-- If not found: pre-validation rejects before LLM sees it
-
 CRITICAL JSON ESCAPE RULES:
-1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
-   - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
-2. Quotes: Escape double quotes inside strings as \\"
-3. Newlines: Use \\n for newlines (NOT \\\\n)
-4. LaTeX notation: Escape backslashes - write "\\\\mathbb{Z}", "\\\\Delta", etc.
+1. Backslashes: ALWAYS double-escape any backslash - write "\\\\mathbb{Z}" not "\\mathbb{Z}".
+2. Quotes inside strings: escape as \\".
+3. Newlines inside strings: \\n (not \\\\n).
+4. Use editable prose for old_string anchors. Do not include protected system markers in insert_after anchors or new_string. For replace, prefer editable content only; if a marker is accidentally included as trailing context, validation may trim it.
 
-Example (Enhancement):
+Example (insert_after):
 {
   "proceed": true,
-  "needs_enhancement": true,
   "operation": "insert_after",
-  "old_string": "Theorem 2.3: A number \\\\alpha is constructible if and only if it lies in a field extension of \\\\mathbb{Q} of degree 2^n.",
-  "new_string": "\\n\\nRemark: This characterization requires the field extension to be normal and separable over \\\\mathbb{Q}. If K/\\\\mathbb{Q} contains constructible \\\\alpha, there exists a tower \\\\mathbb{Q} = K_0 \\\\subset K_1 \\\\subset \\\\ldots \\\\subset K_n = K where each K_{i+1}/K_i has degree exactly 2.",
-  "content": "\\n\\nRemark: This characterization requires the field extension to be normal and separable over \\\\mathbb{Q}. If K/\\\\mathbb{Q} contains constructible \\\\alpha, there exists a tower \\\\mathbb{Q} = K_0 \\\\subset K_1 \\\\subset \\\\ldots \\\\subset K_n = K where each K_{i+1}/K_i has degree exactly 2.",
-  "reasoning": "Adding field-theoretic precision strengthens the theorem statement"
+  "old_string": "In this section we examine partial sums of the form 1 + 2 + ... + n and look for a closed form.",
+  "new_string": "\\n\\nTheorem 2.3 (verified in Lean 4, see Appendix A, proof_007). For every n \\\\in \\\\mathbb{N}, \\\\sum_{k=1}^{n} k = n(n+1)/2.\\n\\nProof sketch. Induction on n, with Finset.sum_range_succ closing the step; the closed form follows by elementary algebra. The full Lean 4 proof appears in the Theorems Appendix under proof_007.",
+  "reasoning": "Section 2 already motivates the closed form but presents it without a proof; inserting the theorem here strengthens the argument at the exact point where the claim first appears. The Lean code itself is kept in the appendix to keep the body readable."
 }
 
-Example (Refusal):
+Example (refusal):
 {
   "proceed": false,
-  "needs_enhancement": false,
-  "operation": "replace",
+  "operation": "insert_after",
   "old_string": "",
   "new_string": "",
-  "content": "",
-  "reasoning": "Upon review, Step 1's assessment was wrong. The target section is already rigorous enough."
+  "reasoning": "The paper body is currently empty; no legal placement anchor exists. Let the system route the theorem directly to the Theorems Appendix."
 }
 """
 
 
 # =============================================================================
-# PROMPT BUILDERS
+# HELPERS
 # =============================================================================
 
-async def build_rigor_planning_prompt(
-    user_prompt: str,
-    current_outline: str,
-    current_paper: str
-) -> str:
-    """
-    Build complete prompt for Step 1: rigor planning.
-    
-    Args:
-        user_prompt: User's compiler-directing prompt
-        current_outline: Current outline (ALWAYS fully injected)
-        current_paper: Current document (RAG-retrieved if large)
-    
-    Returns:
-        Complete prompt string
+def _format_existing_verified_proofs(proofs: Iterable[dict]) -> str:
+    """Compact rendering of already-verified proofs for the discovery prompt.
+
+    Each entry shows just the proof_id, novelty flag, and the theorem
+    statement - enough for the LLM to recognize duplicates without blowing
+    the context budget on full Lean 4 source.
     """
-    # Check if Wolfram Alpha is enabled
-    wolfram_enabled = system_config.wolfram_alpha_enabled
-    
-    parts = [
-        get_rigor_planning_system_prompt(wolfram_enabled),
-        "\n---\n",
-        get_rigor_planning_json_schema(),
-        "\n---\n"
-    ]
-    
-    # Add rejection history (DIRECT INJECTION - almost always fits)
-    rejection_history = await compiler_rejection_log.get_rejections_text()
-    if rejection_history:
-        parts.append(f"""YOUR RECENT REJECTION HISTORY (Last 10 rejections):
-{rejection_history}
+    lines: List[str] = []
+    for index, proof in enumerate(proofs, start=1):
+        proof_id = str(proof.get("proof_id", "") or "").strip() or f"proof_{index}"
+        novel = bool(proof.get("novel", False))
+        statement = str(proof.get("theorem_statement", "") or "").strip()
+        if not statement:
+            continue
+        # One-line compact form; the discovery model only needs uniqueness signals.
+        marker = "novel" if novel else "known"
+        lines.append(f"- [{proof_id}] ({marker}) {statement}")
+    if not lines:
+        return ""
+    return (
+        "EXISTING VERIFIED PROOFS (do NOT re-propose these; pick a DIFFERENT theorem):\n"
+        + "\n".join(lines)
+    )
+
+
+def _format_recent_failure_hints(hints: Iterable) -> str:
+    """Compact rendering of recent failed candidates for the discovery prompt."""
+    entries: List[str] = []
+    for index, hint in enumerate(hints, start=1):
+        theorem_id = getattr(hint, "theorem_id", None) or f"failed_{index}"
+        statement = (getattr(hint, "theorem_statement", "") or "").strip()
+        error_summary = (getattr(hint, "error_summary", "") or "").strip()
+        targets = list(getattr(hint, "suggested_lemma_targets", []) or [])
+        if not statement:
+            continue
+        line = f"- [{theorem_id}] {statement}"
+        if error_summary:
+            line += f"\n  last Lean 4 failure: {error_summary[:240]}"
+        if targets:
+            line += f"\n  suggested targets: {', '.join(targets[:6])}"
+        entries.append(line)
+    if not entries:
+        return ""
+    return (
+        "OPEN LEMMA TARGETS LEAN 4 COULD NOT YET CLOSE (optional retry candidates):\n"
+        + "\n".join(entries)
+    )
 
-LEARN FROM THESE PAST MISTAKES.
----
-""")
-    
-    parts.extend([
-        f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
-        "\n---\n",
-        f"CURRENT OUTLINE:\n{current_outline}",
-        "\n---\n",
-        f"CURRENT DOCUMENT:\n{current_paper}",
-        "\n---\n",
-        "Now decide if rigor work is needed and choose your approach (respond as JSON):"
-    ])
-    
-    return "\n".join(parts)
 
+# =============================================================================
+# PROMPT BUILDERS
+# =============================================================================
 
-async def build_rigor_execution_prompt(
+async def build_rigor_theorem_discovery_prompt(
     user_prompt: str,
     current_outline: str,
     current_paper: str,
-    target_section: str,
-    mode: str
+    rag_evidence: str = "",
+    existing_verified_proofs: Optional[Iterable[dict]] = None,
+    recent_failure_hints: Optional[Iterable] = None,
 ) -> str:
-    """
-    Build complete prompt for Step 2: standard/rewrite execution.
-    
+    """Build the Stage 1 (discovery) prompt.
+
     Args:
-        user_prompt: User's compiler-directing prompt
-        current_outline: Current outline (ALWAYS fully injected)
-        current_paper: Current document (RAG-retrieved, FULL paper)
-        target_section: Target section from Step 1 (guidance label)
-        mode: "standard_enhancement" or "rewrite_focus"
-    
+        user_prompt: User's compiler-directing prompt.
+        current_outline: Full outline (direct-injected).
+        current_paper: Current paper content with system markers preserved
+            for exact old_string matching.
+        rag_evidence: RAG-retrieved context per the offload priority
+            (Shared Training DB -> Local Submitter DB -> Rejection Log ->
+            User Upload Files) with outline + paper sources EXCLUDED.
+        existing_verified_proofs: Iterable of proof records (dicts from
+            `proof_database.get_all_proofs()` serialized) - shown so the
+            model does not re-propose already-verified results.
+        recent_failure_hints: Iterable of `FailedProofCandidate` objects
+            from `proof_database.get_recent_failure_hints(...)` - shown
+            as optional retry targets.
+
     Returns:
-        Complete prompt string
+        Complete prompt string.
     """
-    parts = [
-        get_rigor_execution_system_prompt(mode),
+    parts: List[str] = [
+        _DISCOVERY_SYSTEM_PROMPT,
+        "\n---\n",
+        _DISCOVERY_JSON_SCHEMA,
         "\n---\n",
-        get_rigor_execution_json_schema(mode),
-        "\n---\n"
     ]
-    
-    # Add rejection history (DIRECT INJECTION - almost always fits)
+
     rejection_history = await compiler_rejection_log.get_rejections_text()
     if rejection_history:
-        parts.append(f"""YOUR RECENT REJECTION HISTORY (Last 10 rejections):
-{rejection_history}
+        parts.append(
+            "YOUR RECENT REJECTION HISTORY (Last 10 rejections - learn from these):\n"
+            f"{rejection_history}\n---\n"
+        )
+
+    verified_block = _format_existing_verified_proofs(existing_verified_proofs or [])
+    if verified_block:
+        parts.append(verified_block + "\n---\n")
+
+    failure_block = _format_recent_failure_hints(recent_failure_hints or [])
+    if failure_block:
+        parts.append(failure_block + "\n---\n")
 
-LEARN FROM THESE PAST MISTAKES.
----
-""")
-    
     parts.extend([
         f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
         "\n---\n",
         f"CURRENT OUTLINE:\n{current_outline}",
         "\n---\n",
-        f"TARGET SECTION (from your Step 1 planning - guidance reminder):\n{target_section}",
-        "\n---\n",
-        f"CURRENT DOCUMENT (FULL PAPER - not limited to target section):\n{current_paper}",
+        f"CURRENT PAPER:\n{current_paper}",
         "\n---\n",
-        "Now execute your rigor enhancement or refuse if Step 1 was wrong (respond as JSON):"
     ])
-    
+
+    if rag_evidence and rag_evidence.strip():
+        parts.append(f"SUPPORTING EVIDENCE (RAG):\n{rag_evidence}\n---\n")
+
+    parts.append(
+        "Now decide whether to propose a Lean 4 theorem candidate "
+        "or to decline this rigor cycle (respond as JSON):"
+    )
+
     return "\n".join(parts)
 
 
-async def build_rigor_wolfram_execution_prompt(
+async def build_rigor_placement_prompt(
     user_prompt: str,
     current_outline: str,
     current_paper: str,
-    target_section: str,
-    wolfram_query: str,
-    wolfram_result: str
+    rag_evidence: str = "",
+    *,
+    theorem_statement: str,
+    lean_code: str,
+    proof_id: str,
+    placement_attempt: int = 1,
+    validator_rejection_feedback: str = "",
 ) -> str:
-    """
-    Build complete prompt for Step 2: Wolfram verification execution.
-    
+    """Build the Stage 2 (placement) prompt.
+
     Args:
-        user_prompt: User's compiler-directing prompt
-        current_outline: Current outline (ALWAYS fully injected)
-        current_paper: Current document (RAG-retrieved, FULL paper)
-        target_section: Target section from Step 1 (guidance label)
-        wolfram_query: The query sent to Wolfram Alpha
-        wolfram_result: The result from Wolfram Alpha API
-    
+        user_prompt: User's compiler-directing prompt.
+        current_outline: Full outline (direct-injected).
+        current_paper: Current paper content (direct-injected or RAG'd by the
+            caller per the high-context submitter budget rules).
+        rag_evidence: Optional RAG-retrieved supporting context.
+        theorem_statement: Human-readable statement of the verified theorem.
+        lean_code: Full Lean 4 source that compiled. Included so the model
+            can accurately paraphrase / cite the verified statement.
+        proof_id: Database proof ID used in the appendix reference.
+        placement_attempt: 1 or 2.
+        validator_rejection_feedback: Validator reasoning from attempt 1;
+            only populated for attempt 2.
+
     Returns:
-        Complete prompt string
+        Complete prompt string.
     """
-    parts = [
-        get_rigor_wolfram_execution_system_prompt(),
+    parts: List[str] = [
+        _PLACEMENT_SYSTEM_PROMPT,
+        "\n---\n",
+        _PLACEMENT_JSON_SCHEMA,
         "\n---\n",
-        get_rigor_execution_json_schema("wolfram_verification"),
-        "\n---\n"
     ]
-    
-    # Add rejection history
+
     rejection_history = await compiler_rejection_log.get_rejections_text()
     if rejection_history:
-        parts.append(f"""YOUR RECENT REJECTION HISTORY (Last 10 rejections):
-{rejection_history}
+        parts.append(
+            "YOUR RECENT REJECTION HISTORY (Last 10 rejections - learn from these):\n"
+            f"{rejection_history}\n---\n"
+        )
 
-LEARN FROM THESE PAST MISTAKES.
----
-""")
-    
     parts.extend([
         f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
         "\n---\n",
         f"CURRENT OUTLINE:\n{current_outline}",
         "\n---\n",
-        f"TARGET SECTION (from your Step 1 planning - guidance reminder):\n{target_section}",
-        "\n---\n",
-        f"WOLFRAM ALPHA QUERY (from your Step 1 planning):\n{wolfram_query}",
-        "\n---\n",
-        f"WOLFRAM ALPHA RESULT:\n{wolfram_result}",
-        "\n---\n",
-        f"CURRENT DOCUMENT (FULL PAPER - not limited to target section):\n{current_paper}",
+        f"CURRENT PAPER:\n{current_paper}",
         "\n---\n",
-        "Now interpret the Wolfram Alpha result and decide if you want to add it to the paper, or refuse if inappropriate (respond as JSON):"
     ])
-    
+
+    if rag_evidence and rag_evidence.strip():
+        parts.append(f"SUPPORTING EVIDENCE (RAG):\n{rag_evidence}\n---\n")
+
+    parts.append(
+        "LEAN 4 VERIFIED THEOREM CERTIFICATE:\n"
+        f"Proof ID: {proof_id}\n"
+        f"Theorem statement: {theorem_statement}\n"
+        "Lean 4 source (verified by the Lean 4 toolchain; do NOT paste this "
+        "into your `new_string`, it is stored in the Theorems Appendix "
+        "automatically):\n"
+        f"{lean_code}\n"
+        "\n---\n"
+    )
+
+    parts.append(f"PLACEMENT ATTEMPT: {placement_attempt} of 2\n---\n")
+
+    if placement_attempt > 1 and validator_rejection_feedback.strip():
+        parts.append(
+            "VALIDATOR REJECTION FEEDBACK FROM YOUR PREVIOUS PLACEMENT ATTEMPT:\n"
+            f"{validator_rejection_feedback.strip()}\n"
+            "The math is already verified by Lean 4 - the validator is judging "
+            "PLACEMENT and NARRATIVE only. Adjust accordingly.\n---\n"
+        )
+
+    parts.append(
+        "Now produce an inline placement edit OR refuse if no legal placement exists "
+        "(respond as JSON):"
+    )
+
     return "\n".join(parts)
diff --git a/backend/compiler/validation/compiler_validator.py b/backend/compiler/validation/compiler_validator.py
index e0806d0..0afe2fa 100644
--- a/backend/compiler/validation/compiler_validator.py
+++ b/backend/compiler/validation/compiler_validator.py
@@ -13,8 +13,14 @@
 from backend.shared.models import CompilerSubmission, CompilerValidationResult
 from backend.shared.json_parser import parse_json
 from backend.shared.utils import count_tokens
+from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.validation.json_validator import json_validator
-from backend.compiler.memory.paper_memory import paper_memory
+from backend.compiler.memory.paper_memory import (
+    paper_memory,
+    PAPER_ANCHOR,
+    THEOREMS_APPENDIX_END,
+    THEOREMS_APPENDIX_START,
+)
 from backend.compiler.memory.outline_memory import outline_memory
 
 logger = logging.getLogger(__name__)
@@ -356,7 +362,7 @@ class CompilerValidator:
     
     def __init__(self, model_name: str, user_prompt: str, websocket_broadcaster: Optional[Callable] = None):
         self.model_name = model_name
-        self.user_prompt = user_prompt
+        self.user_prompt = proof_database.inject_into_prompt(user_prompt)
         self.websocket_broadcaster = websocket_broadcaster
         self._initialized = False
         
@@ -549,6 +555,76 @@ async def _parse_json_with_retry(
                 logger.error(f"CompilerValidator: Retry request failed - {retry_error}")
                 return self._fallback_parse(response)
     
+    def _handle_protected_marker_old_string(
+        self,
+        submission: CompilerSubmission,
+        document_to_check: str,
+        document_name: str,
+    ) -> Optional[CompilerValidationResult]:
+        """Prevent edit operations from removing system-managed paper boundaries.
+
+        Returns None when old_string contains no protected marker. For replace,
+        old_string is cut at the first marker and right-stripped; if that text is
+        non-empty and occurs exactly once in the hyphen-normalized document, it is
+        written back to submission.old_string and None is returned. Every other
+        case, including all non-replace operations, returns a reject result.
+        """
+        protected_markers = (
+            THEOREMS_APPENDIX_START,
+            THEOREMS_APPENDIX_END,
+            PAPER_ANCHOR,
+        )
+        marker_positions = [
+            submission.old_string.find(marker)
+            for marker in protected_markers
+            if marker in submission.old_string
+        ]
+        if not marker_positions:
+            return None
+
+        first_marker_pos = min(marker_positions)
+
+        if submission.operation == "replace":
+            trimmed_old = submission.old_string[:first_marker_pos].rstrip()
+            if trimmed_old:
+                normalized_doc = normalize_unicode_hyphens(document_to_check)
+                normalized_trimmed = normalize_unicode_hyphens(trimmed_old)
+                if normalized_doc.count(normalized_trimmed) == 1:
+                    logger.warning(
+                        "Pre-validation adjusted old_string to exclude system marker boundary "
+                        "from replace target in %s",
+                        document_name,
+                    )
+                    submission.old_string = trimmed_old
+                    return None
+
+        logger.warning(
+            "Pre-validation failed: %s operation old_string includes a protected system marker",
+            submission.operation,
+        )
+        return CompilerValidationResult(
+            submission_id=submission.submission_id,
+            decision="reject",
+            reasoning=(
+                "PROTECTED_MARKER_BOUNDARY: The old_string includes a system-managed "
+                "paper boundary marker (the Theorems Appendix bracket or end-of-paper "
+                "anchor). Replacing or deleting across that marker can corrupt the paper "
+                "structure.\n\n"
+                "FIX REQUIRED:\n"
+                f"1. Use old_string from the editable {document_name} content only.\n"
+                "2. Do not include Theorems Appendix bracket markers or the end-of-paper "
+                "anchor in replace/delete targets.\n"
+                "3. If you need marker context for placement, use a shorter unique "
+                "old_string immediately before the marker."
+            ),
+            summary=f"old_string crosses protected system marker boundary in {document_name} (pre-validation)",
+            coherence_check=True,
+            rigor_check=True,
+            placement_check=False,
+            json_valid=True,
+            validation_stage="pre-validation",
+        )
+
     def _pre_validate_exact_string_match(
         self,
         submission: CompilerSubmission,
@@ -643,6 +719,14 @@ def _pre_validate_exact_string_match(
                 json_valid=True,
                 validation_stage="pre-validation"
             )
+
+        protected_marker_result = self._handle_protected_marker_old_string(
+            submission,
+            document_to_check,
+            document_name,
+        )
+        if protected_marker_result is not None:
+            return protected_marker_result
         
         # Check if old_string exists in the document (with Unicode hyphen normalization)
         pos, actual_text = find_with_normalized_hyphens(submission.old_string, document_to_check)
@@ -1044,6 +1128,21 @@ async def validate_submission(
             # So placement_check defaults to True unless LLM finds placement context issue
             placement = validation_data.get("placement_check", True)
             
+            # Lean-4-verified theorem placement submissions: Lean 4 is the source
+            # of truth for mathematical rigor. Force rigor_check=True regardless
+            # of what the LLM emitted so the criterion is never the reason for
+            # a rejection on this kind of submission.
+            if (
+                submission.mode == "rigor"
+                and (submission.metadata or {}).get("rigor_mode") == "lean_placement"
+            ):
+                if not rigor:
+                    logger.info(
+                        "Validator returned rigor_check=False for lean_placement submission; "
+                        "forcing True because Lean 4 verified the math."
+                    )
+                rigor = True
+            
             # Create summary for rejection log (max 750 chars)
             summary = reasoning[:750]
             
@@ -1292,7 +1391,9 @@ def _strip_placeholder_text(self, text: str) -> str:
             ABSTRACT_PLACEHOLDER,
             INTRO_PLACEHOLDER,
             CONCLUSION_PLACEHOLDER,
-            PAPER_ANCHOR
+            PAPER_ANCHOR,
+            THEOREMS_APPENDIX_START,
+            THEOREMS_APPENDIX_END,
         )
         
         # List of exact placeholder strings to strip
@@ -1300,7 +1401,9 @@ def _strip_placeholder_text(self, text: str) -> str:
             ABSTRACT_PLACEHOLDER,
             INTRO_PLACEHOLDER,
             CONCLUSION_PLACEHOLDER,
-            PAPER_ANCHOR
+            PAPER_ANCHOR,
+            THEOREMS_APPENDIX_START,
+            THEOREMS_APPENDIX_END,
         ]
         
         result = text
@@ -1330,7 +1433,16 @@ def _build_validation_prompt(
         if submission.mode in ["outline_create", "outline_update"]:
             system_prompt = self._get_outline_validation_system_prompt(submission.mode)
         else:
-            system_prompt = self._get_paper_validation_system_prompt(submission.mode)
+            # For rigor submissions backed by a Lean 4 verified theorem, swap in
+            # the placement-only criteria. Anything else falls through to the
+            # normal paper-validation prompt for the submission's mode.
+            rigor_mode_hint = (submission.metadata or {}).get("rigor_mode")
+            effective_mode = (
+                "rigor_lean_placement"
+                if submission.mode == "rigor" and rigor_mode_hint == "lean_placement"
+                else submission.mode
+            )
+            system_prompt = self._get_paper_validation_system_prompt(effective_mode)
         
         parts = [
             system_prompt,
@@ -1345,9 +1457,31 @@ def _build_validation_prompt(
             parts.append(f"CURRENT OUTLINE:\n{current_outline}\n---\n")
         
         parts.append(f"CURRENT DOCUMENT:\n{current_paper}\n---\n")
+        
+        # For Lean 4 verified theorem placement, surface the Lean certificate
+        # to the validator so it can reference what was verified.
+        metadata = submission.metadata or {}
+        if submission.mode == "rigor" and metadata.get("rigor_mode") == "lean_placement":
+            parts.append("LEAN 4 VERIFICATION CERTIFICATE (DO NOT RE-EVALUATE MATH):\n")
+            parts.append(f"Proof ID: {metadata.get('lean_proof_id', 'unknown')}\n")
+            parts.append(f"Theorem statement: {metadata.get('theorem_statement', '')}\n")
+            lean_code = str(metadata.get("lean_code", "") or "")
+            if lean_code:
+                parts.append("Lean 4 code (verified by the Lean 4 toolchain):\n")
+                parts.append(lean_code.strip() + "\n")
+            if metadata.get("placement_attempt"):
+                parts.append(f"Placement attempt: {metadata['placement_attempt']} of 2\n")
+            prior_feedback = str(metadata.get("validator_rejection_feedback", "") or "").strip()
+            if prior_feedback:
+                parts.append(
+                    "PRIOR VALIDATOR REJECTION (for this same verified theorem):\n"
+                    f"{prior_feedback}\n"
+                )
+            parts.append("\n---\n")
+        
         parts.append(f"SUBMISSION TO VALIDATE:\n")
-        if submission.metadata.get("review_focus"):
-            parts.append(f"Review Focus: {submission.metadata['review_focus']}\n")
+        if metadata.get("review_focus"):
+            parts.append(f"Review Focus: {metadata['review_focus']}\n")
         parts.append(f"Operation: {submission.operation}\n")
         if submission.old_string:
             parts.append(f"Old String (to find): {submission.old_string}\n")
@@ -1802,7 +1936,38 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 FIX: [What would be acceptable]"
 
 ACCEPT if: All general criteria + mode-specific criteria met
-REJECT if: Enhancement doesn't add rigor, reduces quality, introduces unsound mathematical claims, or placement context inappropriate"""
+REJECT if: Enhancement doesn't add rigor, reduces quality, introduces unsound mathematical claims, or placement context inappropriate""",
+
+            "rigor_lean_placement": """MODE-SPECIFIC CRITERIA (Lean 4 Verified Theorem Placement):
+
+CRITICAL: The theorem in this submission has ALREADY been formally verified by the Lean 4 toolchain. Its mathematical validity is NOT in question and you MUST NOT re-evaluate it.
+
+The LEAN 4 VERIFICATION CERTIFICATE block earlier in this prompt shows the exact theorem statement and Lean 4 proof that compiled successfully. Lean 4 is the source of truth for the mathematical content.
+
+YOUR ONLY JOB on this submission is to judge PLACEMENT and NARRATIVE INTEGRATION:
+
+1. PLACEMENT_FIT: Does the insertion location make sense given the surrounding narrative, outline structure, and mathematical progression of the paper at this point?
+2. INTRODUCTION_FORMAT: Does the inline text correctly present the theorem to the reader, including:
+   - A clear theorem statement matching the verified statement
+   - An explicit "verified in Lean 4" marker in the prose
+   - A reference pointing the reader to the Theorems Appendix (where the full Lean proof is stored)
+3. NARRATIVE_COHERENCE: Does surrounding prose remain coherent after the insertion? No dangling references, no broken sentence flow, no contradiction with established definitions.
+4. NO_DUPLICATION: The inline text must not copy the full Lean proof body into the main paper (the proof lives in the appendix only). A short informal proof sketch is fine; the Lean code itself should NOT be inlined.
+
+RULES:
+- You MUST set rigor_check=true unconditionally: Lean 4 has already verified the math. The `rigor_check` field is forced to true by the system regardless of your response.
+- You MUST NOT reject on mathematical grounds (correctness, soundness, edge cases, assumptions). That decision has been made by Lean 4.
+- You MAY reject on placement, narrative, duplication of the Lean code, or missing "verified in Lean 4" marker / appendix reference.
+- If this is placement attempt 2 of 2 and you reject again, the system will route the theorem to the Theorems Appendix only. Reserve rejection for genuine placement/narrative problems.
+
+REJECTION FEEDBACK FORMAT:
+If rejecting, use this structure:
+"REJECTION REASON: [PLACEMENT_FIT|MISSING_LEAN_MARKER|MISSING_APPENDIX_REFERENCE|NARRATIVE_COHERENCE|LEAN_CODE_DUPLICATED_INLINE|etc.]
+ISSUE: [What's wrong with the placement or prose, not the math]
+FIX: [Concrete adjustment the submitter should make on the next placement attempt]"
+
+ACCEPT if: Placement location is reasonable, introduction prose correctly cites the Lean 4 verification and appendix, narrative remains coherent, and the Lean proof body is NOT duplicated inline.
+REJECT if: Placement is clearly inappropriate, the "verified in Lean 4" / appendix reference is missing, narrative breaks, or the full Lean code is pasted into the main paper text."""
         }
         
         return base_prompt + mode_specific.get(mode, mode_specific["construction"])
diff --git a/backend/data/proofs/.gitkeep b/backend/data/proofs/.gitkeep
new file mode 100644
index 0000000..e69de29
diff --git a/backend/scripts/cache_openrouter_models.py b/backend/scripts/cache_openrouter_models.py
index 8117848..7bfca81 100644
--- a/backend/scripts/cache_openrouter_models.py
+++ b/backend/scripts/cache_openrouter_models.py
@@ -14,7 +14,7 @@
 sys.path.insert(0, str(Path(__file__).parent.parent.parent))
 
 from backend.shared.openrouter_client import OpenRouterClient
-from backend.shared.config import rag_config
+from backend.shared.config import rag_config, system_config
 
 
 async def cache_models():
@@ -58,7 +58,7 @@ async def cache_models():
                 print(f"  {display_name} -> {model_id}")
         
         # Cache to JSON
-        cache_file = Path(__file__).parent.parent / "data" / "model_cache.json"
+        cache_file = Path(system_config.data_dir) / "model_cache.json"
         cache_file.parent.mkdir(parents=True, exist_ok=True)
         
         with open(cache_file, 'w', encoding='utf-8') as f:
diff --git a/backend/shared/api_client_manager.py b/backend/shared/api_client_manager.py
index 47a6a23..5b34592 100644
--- a/backend/shared/api_client_manager.py
+++ b/backend/shared/api_client_manager.py
@@ -23,7 +23,8 @@
 )
 from backend.shared.boost_manager import boost_manager
 from backend.shared.boost_logger import boost_logger
-from backend.shared.config import rag_config
+from backend.shared.config import rag_config, system_config
+from backend.shared.fastembed_provider import FASTEMBED_MODEL_NAME, FastEmbedProvider
 from backend.shared.free_model_manager import free_model_manager
 from backend.shared.models import ModelConfig
 from backend.shared.token_tracker import token_tracker
@@ -41,6 +42,7 @@ class APIClientManager:
     def __init__(self):
         self._openrouter_client: Optional[OpenRouterClient] = None
         self._openrouter_api_key: Optional[str] = None
+        self._fastembed_provider: Optional[FastEmbedProvider] = None
         
         # Track which roles have fallen back to LM Studio
         # Format: {role_id: "openrouter" | "lm_studio"}
@@ -230,6 +232,13 @@ def set_openrouter_api_key(self, api_key: str) -> None:
         else:
             self._openrouter_client = None
             logger.info("OpenRouter client disabled (no API key)")
+
+    def _get_fastembed_provider(self, model_name: Optional[str] = None) -> FastEmbedProvider:
+        """Return the in-process FastEmbed provider for generic mode, reusing the cached one while the model is unchanged."""
+        desired_model = model_name or FASTEMBED_MODEL_NAME  # falsy model_name -> default model
+        if self._fastembed_provider is None or self._fastembed_provider.model_name != desired_model:
+            self._fastembed_provider = FastEmbedProvider(model_name=desired_model)  # replaces any provider held for another model
+        return self._fastembed_provider
     
     def configure_role(self, role_id: str, config: ModelConfig) -> None:
         """
@@ -295,6 +304,8 @@ async def generate_completion(
         temperature: float = 0.0,
         max_tokens: Optional[int] = None,
         response_format: Optional[Dict[str, str]] = None,
+        tools: Optional[List[Dict[str, Any]]] = None,
+        tool_choice: Optional[Any] = None,
         **kwargs
     ) -> Dict[str, Any]:
         """
@@ -361,7 +372,9 @@ async def generate_completion(
                             temperature=temperature,
                             max_tokens=max_tokens or boost_manager.boost_config.boost_max_output_tokens,
                             response_format=response_format,
-                            provider=boost_provider
+                            provider=boost_provider,
+                            tools=tools,
+                            tool_choice=tool_choice,
                         ),
                         role_id=role_id,
                         model=boost_model,
@@ -705,7 +718,9 @@ async def generate_completion(
                             temperature=temperature,
                             max_tokens=max_tokens or role_config.max_output_tokens,
                             response_format=response_format,
-                            provider=openrouter_provider
+                            provider=openrouter_provider,
+                            tools=tools,
+                            tool_choice=tool_choice,
                         ),
                         role_id=role_id,
                         model=openrouter_model,
@@ -1007,6 +1022,8 @@ async def generate_completion(
                     temperature=temperature,
                     max_tokens=max_tokens,
                     response_format=response_format,
+                    tools=tools,
+                    tool_choice=tool_choice,
                     **kwargs
                 ),
                 role_id=role_id,
@@ -1136,6 +1153,8 @@ async def _try_free_model_rotation(
                             temperature=temperature,
                             max_tokens=max_tokens,
                             response_format=response_format,
+                            tools=tools,
+                            tool_choice=tool_choice,
                         ),
                         role_id=role_id,
                         model=alt_model,
@@ -1185,6 +1204,8 @@ async def _try_free_model_rotation(
                         temperature=temperature,
                         max_tokens=max_tokens,
                         response_format=response_format,
+                        tools=tools,
+                        tool_choice=tool_choice,
                     ),
                     role_id=role_id,
                     model=auto_model,
@@ -1281,6 +1302,11 @@ async def get_embeddings(self, texts: List[str], model: str = None) -> List[List
         """
         if not texts:
             return []
+
+        if system_config.generic_mode:
+            provider_model = None if model in (None, rag_config.embedding_model) else model
+            logger.debug("Generic mode enabled - using FastEmbed for embeddings")
+            return await self._get_fastembed_provider(provider_model).embed(texts)
         
         # Try LM Studio first (local, free)
         try:
diff --git a/backend/shared/boost_logger.py b/backend/shared/boost_logger.py
index c7b6bd8..257cb59 100644
--- a/backend/shared/boost_logger.py
+++ b/backend/shared/boost_logger.py
@@ -11,6 +11,8 @@
 from typing import Dict, Any, List, Optional
 from pathlib import Path
 
+from backend.shared.config import system_config
+
 logger = logging.getLogger(__name__)
 
 
@@ -20,7 +22,6 @@ class BoostLogger:
     Stores logs in data/boost_api_log.txt with JSON entries.
     """
     
-    LOG_FILE = "backend/data/boost_api_log.txt"
     MAX_LOG_ENTRIES = 500  # Maximum entries to keep in log
     
     _instance = None
@@ -42,11 +43,15 @@ def __init__(self):
     
     def _ensure_log_file(self) -> None:
         """Ensure the log file and directory exist."""
-        log_path = Path(self.LOG_FILE)
+        log_path = self._get_log_path()
         log_path.parent.mkdir(parents=True, exist_ok=True)
         
         if not log_path.exists():
             log_path.write_text("")
+
+    def _get_log_path(self) -> Path:
+        """Return the instance-scoped boost log path."""
+        return Path(system_config.data_dir) / "boost_api_log.txt"  # read from config on each call, not cached
     
     async def log_boost_call(
         self,
@@ -94,7 +99,7 @@ async def log_boost_call(
                 }
                 
                 # Append to log file
-                with open(self.LOG_FILE, "a", encoding="utf-8") as f:
+                with open(self._get_log_path(), "a", encoding="utf-8") as f:
                     f.write(json.dumps(log_entry) + "\n")
                 
                 logger.debug(f"Logged boost call: task={task_id}, model={model}, success={success}")
@@ -108,13 +113,13 @@ async def log_boost_call(
     async def _trim_log_if_needed(self) -> None:
         """Trim log file if it exceeds MAX_LOG_ENTRIES."""
         try:
-            with open(self.LOG_FILE, "r", encoding="utf-8") as f:
+            with open(self._get_log_path(), "r", encoding="utf-8") as f:
                 lines = f.readlines()
             
             if len(lines) > self.MAX_LOG_ENTRIES:
                 # Keep only the most recent entries
                 lines = lines[-self.MAX_LOG_ENTRIES:]
-                with open(self.LOG_FILE, "w", encoding="utf-8") as f:
+                with open(self._get_log_path(), "w", encoding="utf-8") as f:
                     f.writelines(lines)
                 logger.debug(f"Trimmed boost log to {self.MAX_LOG_ENTRIES} entries")
                 
@@ -133,10 +138,11 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
         """
         async with self._lock:
             try:
-                if not os.path.exists(self.LOG_FILE):
+                log_path = self._get_log_path()
+                if not os.path.exists(log_path):
                     return []
                 
-                with open(self.LOG_FILE, "r", encoding="utf-8") as f:
+                with open(log_path, "r", encoding="utf-8") as f:
                     lines = f.readlines()
                 
                 logs = []
@@ -176,7 +182,7 @@ async def clear_logs(self) -> None:
         """Clear all boost API logs."""
         async with self._lock:
             try:
-                with open(self.LOG_FILE, "w", encoding="utf-8") as f:
+                with open(self._get_log_path(), "w", encoding="utf-8") as f:
                     f.write("")
                 logger.info("Boost logs cleared")
             except Exception as e:
diff --git a/backend/shared/boost_manager.py b/backend/shared/boost_manager.py
index 9fd8164..d26f883 100644
--- a/backend/shared/boost_manager.py
+++ b/backend/shared/boost_manager.py
@@ -22,14 +22,11 @@
 import os
 from typing import Optional, Set, Callable, Any, Dict, List
 
+from backend.shared.config import system_config
 from backend.shared.models import BoostConfig
 
 logger = logging.getLogger(__name__)
 
-# Persistence file path
-BOOST_STATE_FILE = os.path.join(os.path.dirname(os.path.dirname(__file__)), 'data', 'boost_state.json')
-
-
 # Category prefixes for different roles — labels match Settings panel titles exactly.
 # Autonomous Research agents share the same prefixes as their parent roles
 # (see module docstring for full mapping).
@@ -99,12 +96,18 @@ def __init__(self):
         self._load_state()
         
         logger.info("BoostManager initialized")
+
+    @staticmethod
+    def _get_state_file() -> str:
+        """Build the path of boost_state.json inside the configured data directory."""
+        return os.path.join(system_config.data_dir, "boost_state.json")
     
     def _load_state(self) -> None:
         """Load persisted boost state from disk."""
         try:
-            if os.path.exists(BOOST_STATE_FILE):
-                with open(BOOST_STATE_FILE, 'r', encoding='utf-8') as f:
+            state_file = self._get_state_file()
+            if os.path.exists(state_file):
+                with open(state_file, 'r', encoding='utf-8') as f:
                     state = json.load(f)
                 
                 # Restore boost config if it was enabled
@@ -134,7 +137,8 @@ def _save_state(self) -> None:
         """Persist current boost state to disk."""
         try:
             # Ensure data directory exists
-            os.makedirs(os.path.dirname(BOOST_STATE_FILE), exist_ok=True)
+            state_file = self._get_state_file()
+            os.makedirs(os.path.dirname(state_file), exist_ok=True)
             
             state = {
                 'enabled': self.boost_config is not None and self.boost_config.enabled,
@@ -149,7 +153,7 @@ def _save_state(self) -> None:
                 'boosted_task_ids': list(self.boosted_task_ids)
             }
             
-            with open(BOOST_STATE_FILE, 'w', encoding='utf-8') as f:
+            with open(state_file, 'w', encoding='utf-8') as f:
                 json.dump(state, f, indent=2)
             
             logger.debug("Boost state saved to disk")
diff --git a/backend/shared/build_info.py b/backend/shared/build_info.py
new file mode 100644
index 0000000..94ae74c
--- /dev/null
+++ b/backend/shared/build_info.py
@@ -0,0 +1,120 @@
+"""
+Build identity helpers for the shared update contract.
+"""
+from __future__ import annotations
+
+from dataclasses import dataclass
+from functools import lru_cache
+import json
+import logging
+import os
+from pathlib import Path
+from typing import Any
+
+logger = logging.getLogger(__name__)
+
+REPO_ROOT = Path(__file__).resolve().parents[2]
+BUILD_MANIFEST_PATH = REPO_ROOT / "moto-update-manifest.json"
+PACKAGE_JSON_PATH = REPO_ROOT / "package.json"
+
+_DEFAULT_BUILD_INFO = {
+    "manifest_version": 1,
+    "version": "0.0.0-dev",
+    "build_commit": "dev",
+    "update_channel": "main",
+    "api_contract_version": "build5-v1",
+}
+
+_ENV_OVERRIDES = {
+    "MOTO_VERSION": "version",
+    "MOTO_BUILD_COMMIT": "build_commit",
+    "MOTO_UPDATE_CHANNEL": "update_channel",
+    "MOTO_API_CONTRACT_VERSION": "api_contract_version",
+}
+
+
+@dataclass(frozen=True)
+class BuildInfo:
+    """Normalized build identity shared by runtime APIs and updater metadata."""
+
+    version: str
+    build_commit: str
+    update_channel: str
+    api_contract_version: str
+    manifest_version: int = 1  # not emitted by as_features_payload()
+
+    def as_features_payload(self, capability_overrides: dict[str, Any] | None = None) -> dict[str, Any]:
+        """Return the public `/api/features` payload with optional capability flags."""
+        payload: dict[str, Any] = {
+            "version": self.version,
+            "build_commit": self.build_commit,
+            "update_channel": self.update_channel,
+            "api_contract_version": self.api_contract_version,
+        }
+        if capability_overrides:
+            payload.update(capability_overrides)  # overrides win on key collisions, identity keys included
+        return payload
+
+
+def _load_json(path: Path) -> dict[str, Any] | None:
+    """Parse *path* as UTF-8 JSON; return None (warning unless merely missing) on failure."""
+    try:
+        return json.loads(path.read_text(encoding="utf-8"))
+    except FileNotFoundError:
+        pass  # A missing metadata file is an expected case; stay silent.
+    except (json.JSONDecodeError, UnicodeDecodeError) as exc:  # bad JSON or not valid UTF-8
+        logger.warning("Ignoring invalid build metadata file at %s: %s", path, exc)
+    except OSError as exc:
+        logger.warning("Failed to read build metadata file at %s: %s", path, exc)
+    return None
+
+
+def _load_default_version() -> str:
+    """Return the package.json version, else the built-in development default."""
+    package_json = _load_json(PACKAGE_JSON_PATH)
+    raw_version = package_json.get("version") if isinstance(package_json, dict) else None
+    # `or ""` keeps a JSON null from being stringified into the version "None".
+    version = str(raw_version or "").strip()
+    return version or str(_DEFAULT_BUILD_INFO["version"])
+
+
+def _coerce_manifest_version(value: Any) -> int:  # int(value), else the default manifest version
+    try:
+        return int(value)
+    except (TypeError, ValueError, OverflowError):  # OverflowError: int() of a float infinity (e.g. JSON 1e999)
+        return int(_DEFAULT_BUILD_INFO["manifest_version"])
+
+
+@lru_cache(maxsize=1)
+def get_build_info() -> BuildInfo:
+    """Resolve build identity once (cached): defaults < package.json version < manifest < env overrides."""
+    payload: dict[str, Any] = dict(_DEFAULT_BUILD_INFO)
+    payload["version"] = _load_default_version()
+
+    manifest = _load_json(BUILD_MANIFEST_PATH)
+    if isinstance(manifest, dict):
+        for field in ("version", "build_commit", "update_channel", "api_contract_version"):
+            value = str(manifest.get(field) or "").strip()  # `or ""`: a JSON null must not become "None"
+            if value:
+                payload[field] = value
+        payload["manifest_version"] = _coerce_manifest_version(
+            manifest.get("manifest_version", payload["manifest_version"])
+        )
+    else:
+        logger.warning(
+            "Build manifest missing or unusable at %s; falling back to package metadata defaults.",
+            BUILD_MANIFEST_PATH,
+        )
+
+    for env_name, field_name in _ENV_OVERRIDES.items():
+        override = os.environ.get(env_name, "").strip()
+        if override:
+            payload[field_name] = override  # blank env values are ignored; non-blank ones win over the manifest
+
+    return BuildInfo(
+        version=str(payload["version"]),
+        build_commit=str(payload["build_commit"]),
+        update_channel=str(payload["update_channel"]),
+        api_contract_version=str(payload["api_contract_version"]),
+        manifest_version=_coerce_manifest_version(payload["manifest_version"]),
+    )
diff --git a/backend/shared/config.py b/backend/shared/config.py
index d220e49..1f965f5 100644
--- a/backend/shared/config.py
+++ b/backend/shared/config.py
@@ -2,12 +2,21 @@
 Configuration for the ASI Aggregator System.
 Defines RAG parameters, context allocation, and system constants.
 """
+from pathlib import Path
 from typing import List, Optional
-from pydantic_settings import BaseSettings
+
+from pydantic import AliasChoices, Field, model_validator
+from pydantic_settings import BaseSettings, SettingsConfigDict
 
 
 class RAGConfig(BaseSettings):
     """RAG system configuration."""
+
+    model_config = SettingsConfigDict(
+        env_file=".env",
+        env_file_encoding="utf-8",
+        extra="ignore",
+    )
     
     # Chunk size configurations (chars)
     submitter_chunk_intervals: List[int] = [256, 512, 768, 1024]
@@ -54,7 +63,10 @@ class RAGConfig(BaseSettings):
     similarity_threshold: float = 0.85
     
     # LM Studio API
-    lm_studio_base_url: str = "http://127.0.0.1:1234"
+    lm_studio_base_url: str = Field(
+        default="http://127.0.0.1:1234",
+        validation_alias=AliasChoices("MOTO_LM_STUDIO_BASE_URL", "LM_STUDIO_BASE_URL"),
+    )
     embedding_model: str = "text-embedding-nomic-embed-text-v1.5"
     
     # OpenRouter API (Global Configuration)
@@ -110,6 +122,45 @@ def get_chunk_overlap(self, chunk_size: int) -> int:
 
 class SystemConfig(BaseSettings):
     """System-wide configuration."""
+
+    model_config = SettingsConfigDict(
+        env_file=".env",
+        env_file_encoding="utf-8",
+        extra="ignore",
+    )
+
+    # Deployment mode
+    generic_mode: bool = False
+
+    # Instance/runtime identity
+    instance_id: str = Field(
+        default="default",
+        validation_alias=AliasChoices("MOTO_INSTANCE_ID", "INSTANCE_ID"),
+    )
+    backend_host: str = Field(
+        default="0.0.0.0",
+        validation_alias=AliasChoices("MOTO_BACKEND_HOST", "HOST"),
+    )
+    backend_port: int = Field(
+        default=8000,
+        validation_alias=AliasChoices("MOTO_BACKEND_PORT", "PORT"),
+    )
+    frontend_port: int = Field(
+        default=5173,
+        validation_alias=AliasChoices("MOTO_FRONTEND_PORT", "FRONTEND_PORT"),
+    )
+    secret_namespace: Optional[str] = Field(
+        default=None,
+        validation_alias=AliasChoices("MOTO_SECRET_NAMESPACE", "SECRET_NAMESPACE"),
+    )
+    internal_proxy_secret: Optional[str] = Field(
+        default=None,
+        validation_alias=AliasChoices("MOTO_INTERNAL_PROXY_SECRET", "INTERNAL_PROXY_SECRET"),
+    )
+    frontend_storage_prefix: Optional[str] = Field(
+        default=None,
+        validation_alias=AliasChoices("MOTO_FRONTEND_STORAGE_PREFIX", "FRONTEND_STORAGE_PREFIX"),
+    )
     
     # Aggregator submitter settings (configurable 1-10 submitters)
     default_num_submitters: int = 3  # Default number of submitters
@@ -117,6 +168,7 @@ class SystemConfig(BaseSettings):
     min_submitters: int = 1  # Minimum submitters
     consecutive_rejection_reset_threshold: int = 15
     queue_overflow_threshold: int = 10
+    per_submitter_queue_threshold: int = 4  # Pause an individual submitter when it already has more than this many submissions queued (fairness cap)
     
     # Compiler settings (Phase 2)
     # NOTE: Compiler contexts are set by user in GUI, these are just default fallbacks
@@ -157,19 +209,76 @@ class SystemConfig(BaseSettings):
     # Wolfram Alpha integration (optional)
     wolfram_alpha_enabled: bool = False
     wolfram_alpha_api_key: Optional[str] = None
+
+    # Lean 4 proof verification integration (optional)
+    lean4_enabled: bool = Field(
+        default=False,
+        validation_alias=AliasChoices("MOTO_LEAN4_ENABLED", "LEAN4_ENABLED"),
+    )
+    lean4_lsp_enabled: bool = Field(
+        default=False,
+        validation_alias=AliasChoices("MOTO_LEAN4_LSP_ENABLED", "LEAN4_LSP_ENABLED"),
+    )
+    lean4_path: str = Field(
+        default="",
+        validation_alias=AliasChoices("MOTO_LEAN4_PATH", "LEAN4_PATH"),
+    )
+    lean4_workspace_dir: str = Field(
+        default="",
+        validation_alias=AliasChoices("MOTO_LEAN4_WORKSPACE_DIR", "LEAN4_WORKSPACE_DIR"),
+    )
+    lean4_proof_timeout: int = Field(
+        default=120,
+        validation_alias=AliasChoices("MOTO_LEAN4_PROOF_TIMEOUT", "LEAN4_PROOF_TIMEOUT"),
+    )
+    lean4_lsp_idle_timeout: int = Field(
+        default=600,
+        validation_alias=AliasChoices("MOTO_LEAN4_LSP_IDLE_TIMEOUT", "LEAN4_LSP_IDLE_TIMEOUT"),
+    )
+    # Maximum number of theorem candidates whose Lean 4 formalization attempts
+    # may run concurrently within a single proof-verification stage. Novelty
+    # assessment and proof-database persistence remain serialized after each
+    # candidate's Lean pipeline completes.
+    proof_max_parallel_candidates: int = Field(
+        default=6,
+        validation_alias=AliasChoices(
+            "MOTO_PROOF_MAX_PARALLEL_CANDIDATES",
+            "PROOF_MAX_PARALLEL_CANDIDATES",
+        ),
+    )
+
+    # Optional SMT / Z3 integration foundation (Build 4)
+    smt_enabled: bool = Field(
+        default=False,
+        validation_alias=AliasChoices("MOTO_SMT_ENABLED", "SMT_ENABLED"),
+    )
+    z3_path: str = Field(
+        default="",
+        validation_alias=AliasChoices("MOTO_Z3_PATH", "Z3_PATH"),
+    )
+    smt_timeout: int = Field(
+        default=30,
+        validation_alias=AliasChoices("MOTO_SMT_TIMEOUT", "SMT_TIMEOUT"),
+    )
     
     # File paths
-    data_dir: str = "backend/data"
-    logs_dir: str = "backend/logs"
-    user_uploads_dir: str = "backend/data/user_uploads"
-    chroma_db_dir: str = "backend/data/chroma_db"
-    
-    shared_training_file: str = "backend/data/rag_shared_training.txt"
-    compiler_outline_file: str = "backend/data/compiler_outline.txt"
-    compiler_paper_file: str = "backend/data/compiler_paper.txt"
-    compiler_rejections_file: str = "backend/data/compiler_last_10_rejections.txt"
-    compiler_acceptances_file: str = "backend/data/compiler_last_10_acceptances.txt"
-    compiler_declines_file: str = "backend/data/compiler_last_10_declines.txt"
+    data_dir: str = Field(
+        default="backend/data",
+        validation_alias=AliasChoices("MOTO_DATA_ROOT", "DATA_DIR"),
+    )
+    logs_dir: Optional[str] = Field(
+        default="backend/logs",
+        validation_alias=AliasChoices("MOTO_LOG_ROOT", "LOGS_DIR"),
+    )
+    user_uploads_dir: Optional[str] = None
+    chroma_db_dir: Optional[str] = None
+    
+    shared_training_file: Optional[str] = None
+    compiler_outline_file: Optional[str] = None
+    compiler_paper_file: Optional[str] = None
+    compiler_rejections_file: Optional[str] = None
+    compiler_acceptances_file: Optional[str] = None
+    compiler_declines_file: Optional[str] = None
     
     # ========================================================================
     # AUTONOMOUS RESEARCH FILE PATHS (Part 3) - DUAL-PATH ARCHITECTURE
@@ -196,20 +305,79 @@ class SystemConfig(BaseSettings):
     # ========================================================================
     
     # Legacy paths (backward compatibility - do not use for new features)
-    auto_brainstorms_dir: str = "backend/data/auto_brainstorms"
-    auto_papers_dir: str = "backend/data/auto_papers"
-    auto_papers_archive_dir: str = "backend/data/auto_papers/archive"
-    auto_research_metadata_file: str = "backend/data/auto_research_metadata.json"
-    auto_research_stats_file: str = "backend/data/auto_research_stats.json"
-    auto_workflow_state_file: str = "backend/data/auto_workflow_state.json"
-    auto_research_topic_rejections_file: str = "backend/data/auto_research_topic_rejections.txt"
+    auto_brainstorms_dir: Optional[str] = None
+    auto_papers_dir: Optional[str] = None
+    auto_papers_archive_dir: Optional[str] = None
+    auto_research_metadata_file: Optional[str] = None
+    auto_research_stats_file: Optional[str] = None
+    auto_workflow_state_file: Optional[str] = None
+    auto_research_topic_rejections_file: Optional[str] = None
     
     # Session-based organization (preferred for new features)
-    auto_sessions_base_dir: str = "backend/data/auto_sessions"
-    
-    class Config:
-        env_file = ".env"
-        env_file_encoding = "utf-8"
+    auto_sessions_base_dir: Optional[str] = None
+
+    @model_validator(mode="after")
+    def _derive_instance_paths(self) -> "SystemConfig":
+        """Derive all mutable runtime paths from the instance data root."""
+        default_data_dir = Path("backend/data")
+        current_data_dir = Path(self.data_dir)
+        current_logs_dir = Path(self.logs_dir) if self.logs_dir else None
+
+        if current_logs_dir is None:
+            self.logs_dir = "backend/logs" if current_data_dir == default_data_dir else str(current_data_dir / "_logs")
+        elif current_logs_dir == Path("backend/logs") and current_data_dir != default_data_dir:
+            self.logs_dir = str(current_data_dir / "_logs")
+
+        def _join_data_path(*parts: str) -> str:
+            return str(current_data_dir.joinpath(*parts))
+
+        if not self.user_uploads_dir:
+            self.user_uploads_dir = _join_data_path("user_uploads")
+        if not self.chroma_db_dir:
+            self.chroma_db_dir = _join_data_path("chroma_db")
+
+        if not self.shared_training_file:
+            self.shared_training_file = _join_data_path("rag_shared_training.txt")
+        if not self.compiler_outline_file:
+            self.compiler_outline_file = _join_data_path("compiler_outline.txt")
+        if not self.compiler_paper_file:
+            self.compiler_paper_file = _join_data_path("compiler_paper.txt")
+        if not self.compiler_rejections_file:
+            self.compiler_rejections_file = _join_data_path("compiler_last_10_rejections.txt")
+        if not self.compiler_acceptances_file:
+            self.compiler_acceptances_file = _join_data_path("compiler_last_10_acceptances.txt")
+        if not self.compiler_declines_file:
+            self.compiler_declines_file = _join_data_path("compiler_last_10_declines.txt")
+
+        if not self.auto_brainstorms_dir:
+            self.auto_brainstorms_dir = _join_data_path("auto_brainstorms")
+        if not self.auto_papers_dir:
+            self.auto_papers_dir = _join_data_path("auto_papers")
+        if not self.auto_papers_archive_dir:
+            self.auto_papers_archive_dir = _join_data_path("auto_papers", "archive")
+        if not self.auto_research_metadata_file:
+            self.auto_research_metadata_file = _join_data_path("auto_research_metadata.json")
+        if not self.auto_research_stats_file:
+            self.auto_research_stats_file = _join_data_path("auto_research_stats.json")
+        if not self.auto_workflow_state_file:
+            self.auto_workflow_state_file = _join_data_path("auto_workflow_state.json")
+        if not self.auto_research_topic_rejections_file:
+            self.auto_research_topic_rejections_file = _join_data_path("auto_research_topic_rejections.txt")
+        if not self.auto_sessions_base_dir:
+            self.auto_sessions_base_dir = _join_data_path("auto_sessions")
+        if not self.lean4_workspace_dir:
+            self.lean4_workspace_dir = _join_data_path("lean4_workspace")
+
+        if self.secret_namespace is not None:
+            self.secret_namespace = self.secret_namespace.strip() or None
+
+        if self.internal_proxy_secret is not None:
+            self.internal_proxy_secret = self.internal_proxy_secret.strip() or None
+
+        if self.frontend_storage_prefix is not None:
+            self.frontend_storage_prefix = self.frontend_storage_prefix.strip() or None
+
+        return self
 
 
 # Global configuration instances
diff --git a/backend/shared/critique_memory.py b/backend/shared/critique_memory.py
index 637a639..4309285 100644
--- a/backend/shared/critique_memory.py
+++ b/backend/shared/critique_memory.py
@@ -52,7 +52,7 @@
 
 def _get_legacy_data_dir() -> Path:
     """Return the shared legacy data directory for critique storage."""
-    return Path(__file__).resolve().parents[1] / "data"
+    return Path(system_config.data_dir)
 
 
 def _get_legacy_critiques_dir(paper_type: PaperType) -> Path:
diff --git a/backend/shared/fastembed_provider.py b/backend/shared/fastembed_provider.py
new file mode 100644
index 0000000..6472182
--- /dev/null
+++ b/backend/shared/fastembed_provider.py
@@ -0,0 +1,63 @@
+"""
+FastEmbed embedding provider for generic mode.
+"""
+from __future__ import annotations
+
+import asyncio
+import logging
+from typing import List
+
+logger = logging.getLogger(__name__)
+
+FASTEMBED_MODEL_NAME = "nomic-ai/nomic-embed-text-v1.5"
+
+
+class FastEmbedProvider:
+    """Lazy wrapper around the optional FastEmbed dependency."""
+
+    def __init__(self, model_name: str = FASTEMBED_MODEL_NAME):
+        self.model_name = model_name
+        self._model = None
+        self._init_lock = asyncio.Lock()
+
+    def _create_model(self):
+        try:
+            from fastembed import TextEmbedding
+        except ImportError as exc:
+            raise RuntimeError(
+                "Generic mode requires the optional 'fastembed' dependency. "
+                "Install requirements-generic.txt for hosted deployments."
+            ) from exc
+
+        logger.info("Initializing FastEmbed model '%s'", self.model_name)
+        return TextEmbedding(model_name=self.model_name)
+
+    async def _get_model(self):
+        if self._model is None:
+            async with self._init_lock:
+                if self._model is None:
+                    self._model = await asyncio.to_thread(self._create_model)
+        return self._model
+
+    async def embed(self, texts: List[str]) -> List[List[float]]:
+        """Generate embeddings using the hosted in-process model."""
+        if not texts:
+            return []
+
+        model = await self._get_model()
+
+        def _embed_sync() -> List[List[float]]:
+            normalized = []
+            for embedding in model.embed(texts):
+                if hasattr(embedding, "tolist"):
+                    normalized.append(embedding.tolist())
+                else:
+                    normalized.append(list(embedding))
+            return normalized
+
+        try:
+            return await asyncio.to_thread(_embed_sync)
+        except Exception as exc:
+            raise RuntimeError(
+                f"FastEmbed failed to generate embeddings with '{self.model_name}': {exc}"
+            ) from exc
diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
new file mode 100644
index 0000000..ea46270
--- /dev/null
+++ b/backend/shared/lean4_client.py
@@ -0,0 +1,1635 @@
+"""
+Lean 4 clients for formal proof verification.
+"""
+from __future__ import annotations
+
+import asyncio
+import json
+import logging
+import re
+import shutil
+import uuid
+from contextlib import suppress
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Any, Optional
+
+from backend.shared.config import system_config
+
+logger = logging.getLogger(__name__)
+
+
+# Regexes used to reject vacuous proofs. A `sorry` or `admit` anywhere in the
+# theorem body lets Lean 4 compile the file successfully (only emitting a
+# warning), which historically made the verifier report `success=True` for
+# proofs that were not proofs at all. These patterns match the tokens only
+# when they are standalone identifiers so that legitimate substrings (like
+# `sorryFree` or `admittedly`) are not flagged.
+_FORBIDDEN_PROOF_TOKEN_PATTERNS: tuple[tuple[str, re.Pattern[str]], ...] = (
+    ("sorry", re.compile(r"(?<![A-Za-z0-9_'])sorry(?![A-Za-z0-9_'])")),
+    ("admit", re.compile(r"(?<![A-Za-z0-9_'])admit(?![A-Za-z0-9_'])")),
+)
+
+# Lean 4 emits this warning whenever a declaration's body still contains
+# `sorry`. We pick it up in the diagnostics output because it is the
+# authoritative signal from Lean that the proof is incomplete.
+_SORRY_WARNING_MARKERS: tuple[str, ...] = (
+    "declaration uses 'sorry'",
+    "uses 'sorry'",
+    "contains 'sorry'",
+    # Lean 4 also emits a warning about `sorryAx` when the axiom leaks into
+    # the term elaborator. Treat it the same as a sorry warning.
+    "uses sorry",
+    "contains sorry",
+)
+
+
+@dataclass
+class Lean4Result:
+    """Result of one Lean 4 proof check."""
+    success: bool
+    error_output: str = ""
+    goal_states: str = ""
+    raw_stderr: str = ""
+    tactic_error_slice: str = ""
+    failing_tactic_index: int = -1
+
+
+def _strip_lean_comments_and_strings(code: str) -> str:
+    """Best-effort removal of Lean 4 comments and string literals.
+
+    Each comment is replaced by a space and each string literal by ``""`` so
+    the forbidden-token scan does not reject a ``sorry`` that only appears in
+    documentation or inside a string. This is an approximation: nested block
+    comments are not tracked, so text after an inner ``-/`` is treated as
+    code. Returns ``""`` for empty input.
+    """
+    if not code:
+        return ""
+
+    # One left-to-right pass: whichever construct opens first wins, so a `--`
+    # or `/-` inside a string literal can no longer swallow the code after it.
+    token_re = r'"(?:\\.|[^"\\])*"|/-.*?-/|--[^\n]*'
+    return re.sub(token_re, lambda m: ' "" ' if m.group(0)[0] == '"' else " ", code, flags=re.DOTALL)
+
+
+def _detect_forbidden_placeholder(code: str) -> Optional[str]:
+    """Return the forbidden token name if ``code`` contains a placeholder proof.
+
+    Checks for bare ``sorry`` / ``admit`` tokens after stripping comments and
+    string literals. Returns ``None`` when the code is free of known
+    placeholder markers.
+    """
+    stripped = _strip_lean_comments_and_strings(code)
+    for token_name, pattern in _FORBIDDEN_PROOF_TOKEN_PATTERNS:
+        if pattern.search(stripped):
+            return token_name
+    return None
+
+
+def _output_contains_sorry_warning(output: str) -> bool:
+    lowered = (output or "").lower()
+    return any(marker in lowered for marker in _SORRY_WARNING_MARKERS)
+
+
+_PLACEHOLDER_REJECTION_PREFIX = "PROOF REJECTED: PLACEHOLDER USED"
+_MATHLIB_CACHE_ARCHIVE_RE = re.compile(r"\(([^()\r\n]+?\.ltar)\)")
+
+# Markdown fence markers the LLM occasionally emits inside the `lean_code`
+# JSON field even when instructed to return raw code. Strip them defensively so
+# Lean 4 does not fail to parse the generated file on a stray ```lean line.
+_LEAN_FENCE_OPEN_RE = re.compile(r"^\s*```(?:lean4?|lean)?\s*$", re.IGNORECASE)
+_LEAN_FENCE_CLOSE_RE = re.compile(r"^\s*```\s*$")
+
+# Recognizes Lean's "no goals to be solved" family of diagnostics (it does NOT
+# match "unsolved goals"). We treat these specially because they almost always
+# mean the model appended one tactic too many after the proof was closed.
+_NO_GOALS_DIAGNOSTIC_RE = re.compile(
+    r"(no goals to be solved|no goals|goals accomplished already)",
+    re.IGNORECASE,
+)
+_NO_GOALS_HINT = (
+    "HINT: Lean reported 'no goals to be solved'. This almost always means the "
+    "previous tactic already closed the proof and the tactic at the reported "
+    "line/column is extraneous. Remove that tactic (or any tactics after the "
+    "goal-closing step) and resubmit. Do NOT add more tactics to try to fix it."
+)
+
+
+def _strip_markdown_fences(code: str) -> str:
+    """Remove stray ``` / ```lean fences from LLM output.
+
+    Every line that consists solely of a fence marker is dropped; all other
+    lines are kept in order and re-joined with newlines. Input that is empty
+    or contains no ``` sequence is returned unchanged.
+    """
+    if not code or "```" not in code:
+        return code
+
+    # A fence line carries no state worth tracking: it is dropped wherever it
+    # appears, whether it opens or closes a fenced region.
+    return "\n".join(
+        line
+        for line in code.splitlines()
+        if not (_LEAN_FENCE_OPEN_RE.match(line) or _LEAN_FENCE_CLOSE_RE.match(line))
+    )
+
+
+def _deduplicate_leading_import(code: str) -> str:
+    """Drop repeated ``import`` lines from the leading import header.
+
+    Only imports that appear before the first non-blank, non-import line are
+    deduplicated; every later line, including later imports, is kept as-is.
+    """
+    if not code:
+        return code
+    result: list[str] = []
+    header_imports: set[str] = set()
+    in_header = True
+    for raw_line in code.splitlines():
+        text = raw_line.strip()
+        is_import = text.startswith("import ")
+        if is_import and in_header:
+            if text in header_imports:
+                continue  # exact repeat inside the header: drop it
+            header_imports.add(text)
+        elif text and not is_import:
+            # First real (non-blank, non-import) line ends the header.
+            in_header = False
+        result.append(raw_line)
+    return "\n".join(result)
+
+
+def _format_placeholder_rejection(token_name: str, *, from_lean_diagnostic: bool) -> str:
+    """Produce a structured, model-readable error for placeholder proofs."""
+    if from_lean_diagnostic:
+        reason = (
+            "Lean 4 reported 'declaration uses sorry': the theorem body contains "
+            "`sorry` or another placeholder. Lean only emits a warning for this, "
+            "but MOTO rejects it because a proof with `sorry` is not a proof."
+        )
+    else:
+        reason = (
+            f"The submitted Lean 4 code contains a placeholder token `{token_name}`. "
+            "MOTO rejects proofs that use `sorry` or `admit` anywhere in the "
+            "theorem body because they do not actually prove the goal."
+        )
+    return (
+        f"{_PLACEHOLDER_REJECTION_PREFIX}\n"
+        f"{reason}\n"
+        "Required fix: produce a Lean 4 proof that closes every goal without "
+        "using `sorry`, `admit`, unresolved `axiom` stubs introduced solely to "
+        "trivialize the target theorem, or any other placeholder. If the result "
+        "cannot be proved yet, return a narrower lemma that you can fully "
+        "prove instead."
+    )
+
+
+class Lean4Client:
+    """Subprocess wrapper around the Lean 4 toolchain."""
+
+    def __init__(self, lean_path: str, workspace_dir: str) -> None:
+        self.lean_path = str(lean_path or "").strip()
+        self.workspace_dir = Path(workspace_dir).resolve()
+        self._workspace_ready = False
+        self._workspace_lock = asyncio.Lock()
+
+    def _resolve_executable(self, name: str) -> str:
+        if self.lean_path:
+            lean_bin = Path(self.lean_path).resolve()
+            sibling = lean_bin.parent / (f"{name}.exe" if lean_bin.suffix.lower() == ".exe" else name)
+            if sibling.exists():
+                return str(sibling)
+
+        resolved = shutil.which(name)
+        if resolved:
+            return resolved
+        return name
+
+    @property
+    def lake_path(self) -> str:
+        return self._resolve_executable("lake")
+
+    def uses_persistent_server(self) -> bool:
+        """Return True when the client keeps a long-lived Lean process."""
+        return False
+
+    def is_server_active(self) -> bool:
+        """Return True when the persistent server is currently alive."""
+        return False
+
+    async def warm_start(self) -> None:
+        """Perform optional startup work during FastAPI lifespan."""
+        return
+
+    async def close(self) -> None:
+        """Release client resources during backend shutdown."""
+        return
+
+    def get_mathlib_package_dir(self) -> Path:
+        """Return the resolved Mathlib package directory inside the workspace."""
+        return self.workspace_dir / ".lake" / "packages" / "mathlib"
+
+    def get_mathlib_source_roots(self) -> list[Path]:
+        """Return Mathlib source roots that can be indexed for lemma search."""
+        package_dir = self.get_mathlib_package_dir()
+        source_root = package_dir / "Mathlib"
+        return [source_root] if source_root.exists() else []
+
+    def get_mathlib_index_path(self) -> Path:
+        """Return the cache path used for the local Mathlib declaration index."""
+        return self.workspace_dir / ".moto_mathlib_index.json"
+
+    def get_mathlib_commit(self) -> str:
+        """Return the Mathlib revision from lake-manifest.json, else git HEAD, else lean-toolchain text, else ""."""
+        manifest_path = self.workspace_dir / "lake-manifest.json"
+        if manifest_path.exists():
+            try:
+                manifest = json.loads(manifest_path.read_text(encoding="utf-8"))
+                for package in manifest.get("packages", []) or []:
+                    if package.get("name") != "mathlib":
+                        continue
+                    for key in ("rev", "inputRev", "version"):
+                        value = "" if package.get(key) is None else str(package[key]).strip()  # JSON null is not "None"
+                        if value:
+                            return value
+            except Exception as exc:
+                logger.debug("Failed to read lake-manifest.json for Mathlib revision: %s", exc)
+
+        package_dir = self.get_mathlib_package_dir()
+        head_path = package_dir / ".git" / "HEAD"
+        if head_path.exists():
+            try:
+                head_value = head_path.read_text(encoding="utf-8").strip()
+                if head_value.startswith("ref:"):
+                    ref_name = head_value.split(":", 1)[1].strip()
+                    ref_path = package_dir / ".git" / ref_name
+                    if ref_path.exists():
+                        return ref_path.read_text(encoding="utf-8").strip()
+                if head_value:
+                    return head_value
+            except Exception as exc:
+                logger.debug("Failed to read Mathlib git HEAD: %s", exc)
+
+        toolchain_path = package_dir / "lean-toolchain"
+        if toolchain_path.exists():
+            try:
+                return toolchain_path.read_text(encoding="utf-8").strip()
+            except Exception as exc:
+                logger.debug("Failed to read Mathlib lean-toolchain: %s", exc)
+
+        return ""
+
+    async def _run_process(
+        self,
+        args: list[str],
+        *,
+        cwd: Path,
+        timeout: int,
+    ) -> tuple[int, str, str]:
+        """Run ``args`` in ``cwd``; return ``(returncode, stdout, stderr)``, or ``(-1, "", message)`` on timeout."""
+        process = await asyncio.create_subprocess_exec(
+            *args,
+            cwd=str(cwd),
+            stdout=asyncio.subprocess.PIPE,
+            stderr=asyncio.subprocess.PIPE,
+        )
+        try:
+            stdout_bytes, stderr_bytes = await asyncio.wait_for(process.communicate(), timeout=timeout)
+        except asyncio.CancelledError:
+            # kill() raises ProcessLookupError if the child already exited; ignore that race.
+            with suppress(ProcessLookupError):
+                process.kill()
+            await process.communicate()
+            raise
+        except asyncio.TimeoutError:
+            with suppress(ProcessLookupError):
+                process.kill()
+            await process.communicate()
+            return -1, "", f"Lean 4 process timed out after {timeout} seconds."
+
+        stdout = stdout_bytes.decode("utf-8", errors="replace")
+        stderr = stderr_bytes.decode("utf-8", errors="replace")
+        return process.returncode, stdout, stderr
+
+    async def get_version(self) -> str:
+        """Return the Lean 4 version string when available."""
+        lean_cmd = self.lean_path or self._resolve_executable("lean")
+        returncode, stdout, stderr = await self._run_process(
+            [lean_cmd, "--version"],
+            cwd=self.workspace_dir if self.workspace_dir.exists() else Path.cwd(),
+            timeout=15,
+        )
+        if returncode != 0:
+            return (stderr or stdout).strip()
+        return (stdout or stderr).strip()
+
+    async def ensure_workspace(self) -> bool:
+        """Create a reusable Mathlib-enabled workspace if missing."""
+        async with self._workspace_lock:
+            return await self._ensure_workspace_locked()
+
+    async def _ensure_workspace_locked(self) -> bool:
+        """Create a reusable Mathlib-enabled workspace while holding the workspace lock."""
+        self.workspace_dir.mkdir(parents=True, exist_ok=True)
+
+        lean_toolchain_path = self.workspace_dir / "lean-toolchain"
+        lakefile_path = self.workspace_dir / "lakefile.lean"
+        root_file_path = self.workspace_dir / "MOTOProofWorkspace.lean"
+
+        if not lean_toolchain_path.exists():
+            lean_toolchain_path.write_text("leanprover/lean4:stable\n", encoding="utf-8")
+
+        if not lakefile_path.exists():
+            lakefile_path.write_text(
+                "\n".join(
+                    [
+                        "import Lake",
+                        "open Lake DSL",
+                        "",
+                        "package «moto_proof_workspace» where",
+                        "",
+                        "require mathlib from git",
+                        '  "https://github.com/leanprover-community/mathlib4.git"',
+                    ]
+                )
+                + "\n",
+                encoding="utf-8",
+            )
+
+        if not root_file_path.exists():
+            root_file_path.write_text("import Mathlib\n", encoding="utf-8")
+
+        lake_cmd = self.lake_path
+        if not shutil.which(Path(lake_cmd).name) and not Path(lake_cmd).exists():
+            logger.warning("Lean 4 workspace not ready: 'lake' executable was not found.")
+            return False
+
+        mathlib_pkg_dir = self.workspace_dir / ".lake" / "packages" / "mathlib"
+        needs_bootstrap = not mathlib_pkg_dir.exists()
+
+        if needs_bootstrap or not self._workspace_ready:
+            logger.info("Bootstrapping Lean 4 workspace at %s", self.workspace_dir)
+
+            update_rc, update_stdout, update_stderr = await self._run_process(
+                [lake_cmd, "update"],
+                cwd=self.workspace_dir,
+                timeout=max(system_config.lean4_proof_timeout, 120),
+            )
+            if update_rc != 0:
+                logger.warning(
+                    "Lean 4 workspace update failed: %s",
+                    (update_stderr or update_stdout).strip(),
+                )
+                return False
+
+            # The project's lean-toolchain MUST match Mathlib's pinned toolchain,
+            # otherwise `lake exe cache get` refuses to download the prebuilt
+            # `.olean` files. When that happens, every later `import Mathlib`
+            # tries to read object files compiled with a different Lean version
+            # (or missing entirely) and aborts with:
+            #     error: object file '.../Mathlib/....olean' ...
+            # Align the toolchains automatically and re-run `lake update` so the
+            # workspace is actually usable for proof checking.
+            if self._align_toolchain_with_mathlib(lean_toolchain_path, mathlib_pkg_dir):
+                logger.info(
+                    "Aligned workspace lean-toolchain with Mathlib; re-running lake update."
+                )
+                update_rc, update_stdout, update_stderr = await self._run_process(
+                    [lake_cmd, "update"],
+                    cwd=self.workspace_dir,
+                    timeout=max(system_config.lean4_proof_timeout, 120),
+                )
+                if update_rc != 0:
+                    logger.warning(
+                        "Lean 4 workspace update after toolchain alignment failed: %s",
+                        (update_stderr or update_stdout).strip(),
+                    )
+                    return False
+
+            cache_rc, cache_stdout, cache_stderr = await self._fetch_mathlib_cache(
+                lake_cmd=lake_cmd,
+                cwd=self.workspace_dir,
+            )
+            if cache_rc != 0:
+                logger.error(
+                    "Lean 4 Mathlib cache fetch failed; proof checking would hit "
+                    "'object file' errors. Details: %s",
+                    (cache_stderr or cache_stdout).strip(),
+                )
+                return False
+
+        self._workspace_ready = True
+        return True
+
+    async def _fetch_mathlib_cache(
+        self,
+        *,
+        lake_cmd: str,
+        cwd: Path,
+    ) -> tuple[int, str, str]:
+        """Fetch Mathlib's cache, retrying once after pruning corrupt downloads."""
+        timeout = max(system_config.lean4_proof_timeout, 600)
+        cache_args = [lake_cmd, "exe", "cache", "get"]
+        cache_rc, cache_stdout, cache_stderr = await self._run_process(
+            cache_args,
+            cwd=cwd,
+            timeout=timeout,
+        )
+        if cache_rc == 0:
+            return cache_rc, cache_stdout, cache_stderr
+
+        failed_output = "\n".join(part for part in (cache_stdout, cache_stderr) if part).strip()
+        removed_archives = self._remove_failed_mathlib_cache_archives(failed_output)
+        if removed_archives:
+            logger.warning(
+                "Lean 4 Mathlib cache fetch failed after corrupt archive download; "
+                "removed %d failed .ltar archive(s) and retrying once.",
+                removed_archives,
+            )
+        else:
+            logger.warning(
+                "Lean 4 Mathlib cache fetch failed; retrying once in case another "
+                "cache process left transient state behind. Details: %s",
+                failed_output,
+            )
+
+        return await self._run_process(
+            cache_args,
+            cwd=cwd,
+            timeout=timeout,
+        )
+
+    @staticmethod
+    def _remove_failed_mathlib_cache_archives(output: str) -> int:
+        """Delete only the failed `.ltar` archives named by `lake exe cache get`."""
+        removed = 0
+        seen: set[Path] = set()
+        for match in _MATHLIB_CACHE_ARCHIVE_RE.finditer(output or ""):
+            archive_path = Path(match.group(1).strip())
+            if archive_path in seen:
+                continue
+            seen.add(archive_path)
+
+            if archive_path.suffix.lower() != ".ltar":
+                continue
+            if archive_path.parent.name.lower() != "mathlib":
+                continue
+
+            try:
+                if archive_path.exists():
+                    archive_path.unlink()
+                    removed += 1
+            except OSError as exc:
+                logger.debug("Failed to remove corrupt Mathlib cache archive %s: %s", archive_path, exc)
+        return removed
+
+    @staticmethod
+    def _align_toolchain_with_mathlib(
+        workspace_toolchain_path: Path,
+        mathlib_pkg_dir: Path,
+    ) -> bool:
+        """Copy Mathlib's lean-toolchain into the workspace if they differ.
+
+        Returns True when a change was made, False otherwise.
+        """
+        mathlib_toolchain_path = mathlib_pkg_dir / "lean-toolchain"
+        if not mathlib_toolchain_path.exists():
+            return False
+
+        try:
+            mathlib_toolchain = mathlib_toolchain_path.read_text(encoding="utf-8").strip()
+        except OSError as exc:
+            logger.debug("Failed to read Mathlib lean-toolchain: %s", exc)
+            return False
+
+        if not mathlib_toolchain:
+            return False
+
+        try:
+            current_toolchain = (
+                workspace_toolchain_path.read_text(encoding="utf-8").strip()
+                if workspace_toolchain_path.exists()
+                else ""
+            )
+        except OSError as exc:
+            logger.debug("Failed to read workspace lean-toolchain: %s", exc)
+            current_toolchain = ""
+
+        if current_toolchain == mathlib_toolchain:
+            return False
+
+        try:
+            workspace_toolchain_path.write_text(
+                mathlib_toolchain + "\n", encoding="utf-8"
+            )
+        except OSError as exc:
+            logger.warning("Failed to write workspace lean-toolchain: %s", exc)
+            return False
+
+        logger.info(
+            "Updated workspace lean-toolchain: '%s' -> '%s'",
+            current_toolchain or "<missing>",
+            mathlib_toolchain,
+        )
+        return True
+
+    def _prepare_lean_code(self, lean_code: str) -> str:
+        stripped = (lean_code or "").strip()
+        if not stripped:
+            return ""
+
+        stripped = _strip_markdown_fences(stripped).strip()
+        stripped = _deduplicate_leading_import(stripped).strip()
+        if not stripped:
+            return ""
+
+        first_lines = stripped.splitlines()[:5]
+        if not any(line.strip().startswith("import ") for line in first_lines):
+            stripped = f"import Mathlib\n\n{stripped}"
+        return stripped + "\n"
+
+    @staticmethod
+    def _prioritize_errors_in_output(output: str) -> str:
+        """Move Lean 4 ``error:`` diagnostics to the front of ``output``.
+
+        Warnings such as deprecation notices are emitted alongside real
+        errors, and previews that truncate the text can cut off before the
+        actual failure. Each line matching ``: error :`` (case-insensitive,
+        optional spaces) is hoisted together with up to three lines that
+        follow it; all remaining lines come afterwards in their original
+        order, so nothing is dropped. Blank input and output without any
+        error line are returned unchanged.
+        """
+        text = output or ""
+        if not text.strip():
+            return text
+
+        rows = text.splitlines()
+        is_error = re.compile(r":\s*error\s*:", re.IGNORECASE).search
+
+        # Positions promoted to the front, in first-seen order. Every error
+        # line brings along up to three following lines of context.
+        promoted: dict[int, None] = {}
+        for start, row in enumerate(rows):
+            if not is_error(row):
+                continue
+            stop = min(len(rows), start + 4)
+            for pos in range(start, stop):
+                promoted.setdefault(pos)
+        if not promoted:
+            return text
+
+        # Everything that was not promoted follows in its original order.
+        head = [rows[pos] for pos in promoted]
+        tail = [row for pos, row in enumerate(rows) if pos not in promoted]
+        return "\n".join(head + tail)
+
+    @staticmethod
+    def _extract_goal_states(output: str) -> str:
+        """Return the lines of ``output`` containing ``⊢`` or "goals" (any case), newline-joined; "" if none/empty."""
+        return "\n".join(ln for ln in (output or "").splitlines() if "⊢" in ln or "goals" in ln.lower()).strip()
+
+    @staticmethod
+    def _extract_error_line_number(output: str, filename: str) -> int:
+        """Return the line number of the first ``<filename>:L:C: error:`` hit in ``output``, or -1 if absent."""
+        found = re.search(rf"{re.escape(filename)}:(\d+):\d+:\s+error:", output or "")
+        line_text = found.group(1) if found else ""
+        try:
+            return int(line_text)
+        except ValueError:
+            # Covers "no match" (empty text) as well as unconvertible digits.
+            return -1
+
+    @staticmethod
+    def _has_no_goals_diagnostic(output: str) -> bool:
+        """Return True when Lean's output contains a 'no goals to be solved' error."""
+        return bool(_NO_GOALS_DIAGNOSTIC_RE.search(output or ""))
+
+    @staticmethod
+    def _annotate_no_goals_hint(error_output: str) -> str:
+        """Prepend the targeted 'no goals' hint if Lean reported that diagnostic.
+
+        The input is returned unchanged when it is empty, has no such
+        diagnostic, or already contains the hint. The hint exists because the
+        raw diagnostic by itself tends to make models try to *add* more
+        tactics rather than removing the extraneous one.
+        """
+        if not error_output:
+            return error_output
+        if not Lean4Client._has_no_goals_diagnostic(error_output):
+            return error_output
+        if _NO_GOALS_HINT in error_output:
+            return error_output
+        return f"{_NO_GOALS_HINT}\n\n{error_output}"
+
+    @staticmethod
+    def _format_tactic_lines(tactic_list: list[str]) -> list[str]:
+        """Flatten tactics into two-space-indented script lines.
+
+        Each tactic is stringified and right-stripped; blank tactics are
+        dropped. Multi-line tactics contribute one output line per source
+        line, each right-stripped and prefixed with two spaces.
+        """
+        cleaned = (str(tactic or "").rstrip() for tactic in tactic_list)
+        return [
+            f"  {row.rstrip()}"
+            for text in cleaned
+            if text
+            for row in text.splitlines()
+        ]
+
+    def _build_tactic_script(
+        self,
+        theorem_header: str,
+        tactic_list: list[str],
+    ) -> tuple[str, list[tuple[int, int, str]]]:
+        """Assemble a Lean script from a theorem header and its tactics.
+
+        ``:= by`` is appended to the header unless it already contains
+        ``:= by`` or ends with ``by``. Every non-blank tactic is indented by
+        two spaces and appended below the header.
+
+        Returns:
+            ``(code, ranges)``. ``code`` is the script after
+            ``_prepare_lean_code``; ``ranges`` holds one
+            ``(start_line, end_line, tactic_text)`` triple per non-blank
+            tactic, using 1-based line numbers. ``("", [])`` is returned when
+            the header is blank or no tactic produces any line.
+
+        Note:
+            When none of the first five script lines starts with ``import ``
+            the ranges are shifted down by two lines. This presumably mirrors
+            a prelude that ``_prepare_lean_code`` prepends; confirm there.
+        """
+        header_text = (theorem_header or "").strip()
+        if not header_text:
+            return "", []
+
+        already_in_tactic_mode = ":= by" in header_text or header_text.rstrip().endswith("by")
+        if not already_in_tactic_mode:
+            header_text = f"{header_text} := by"
+
+        script_lines = header_text.splitlines()
+        if not self._format_tactic_lines(tactic_list):
+            return "", []
+
+        spans: list[tuple[int, int, str]] = []
+        for raw_tactic in tactic_list:
+            tactic_text = str(raw_tactic or "").rstrip()
+            if not tactic_text:
+                continue
+            # The next free line is where this tactic starts (1-based).
+            first_line = len(script_lines) + 1
+            script_lines.extend(f"  {row.rstrip()}" for row in tactic_text.splitlines())
+            spans.append((first_line, len(script_lines), tactic_text))
+
+        has_import = any(row.strip().startswith("import ") for row in script_lines[:5])
+        shift = 0 if has_import else 2
+        code = self._prepare_lean_code("\n".join(script_lines))
+        return code, [(first + shift, last + shift, text) for first, last, text in spans]
+
+    @staticmethod
+    def _extract_tactic_error_slice(
+        combined_output: str,
+        temp_filename: str,
+        tactic_ranges: list[tuple[int, int, str]],
+    ) -> tuple[str, int]:
+        """Build a short error excerpt and identify the tactic it points at.
+
+        Args:
+            combined_output: Lean diagnostics text; ``None`` is treated as empty.
+            temp_filename: File name that appears in Lean's diagnostic locations.
+            tactic_ranges: ``(start_line, end_line, tactic_text)`` triples.
+
+        Returns:
+            ``(excerpt, index)``. ``excerpt`` is the first line mentioning
+            both the file name and ``error:`` plus the five lines after it,
+            or the whole stripped output when no such line exists. When the
+            reported error line falls inside a tactic range, the excerpt gets
+            a ``Likely failing tactic N: ...`` header and ``index`` is that
+            range's position; otherwise ``index`` is ``-1``.
+        """
+        reported_line = Lean4Client._extract_error_line_number(combined_output, temp_filename)
+        culprit_index, culprit_text = -1, ""
+        if reported_line >= 0:
+            for position, (first, last, text) in enumerate(tactic_ranges):
+                if first <= reported_line <= last:
+                    culprit_index, culprit_text = position, text
+                    break
+
+        diagnostics = (combined_output or "").splitlines()
+        # Default to the full output; narrow it down if an error line is found.
+        excerpt = (combined_output or "").strip()
+        for position, row in enumerate(diagnostics):
+            if temp_filename in row and "error:" in row:
+                excerpt = "\n".join(diagnostics[position : position + 6]).strip()
+                break
+
+        if culprit_text:
+            excerpt = f"Likely failing tactic {culprit_index + 1}: {culprit_text}\n{excerpt}".strip()
+        return excerpt, culprit_index
+
+    async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
+        """Write a temp Lean file, run Lean 4, and return structured feedback.
+
+        Args:
+            lean_code: Lean 4 source to verify; it is passed through
+                ``_prepare_lean_code`` before being written to disk.
+            timeout: Forwarded unchanged to ``_run_process`` (presumably
+                seconds; confirm against ``_run_process``).
+
+        Returns:
+            A ``Lean4Result``. ``success`` is True only when Lean exits with
+            code 0 and the combined output contains neither ``error:`` nor a
+            sorry warning. Every failure path fills ``error_output``.
+        """
+        if not system_config.lean4_enabled:
+            return Lean4Result(success=False, error_output="Lean 4 is disabled in system configuration.")
+
+        prepared_code = self._prepare_lean_code(lean_code)
+        if not prepared_code:
+            return Lean4Result(success=False, error_output="No Lean 4 code was provided.")
+
+        # Fast pre-check: reject placeholder proofs before invoking Lean so
+        # the model learns the rejection reason even when Lean would have
+        # compiled the file with only a warning.
+        placeholder = _detect_forbidden_placeholder(prepared_code)
+        if placeholder:
+            return Lean4Result(
+                success=False,
+                error_output=_format_placeholder_rejection(placeholder, from_lean_diagnostic=False),
+            )
+
+        workspace_ready = await self.ensure_workspace()
+        if not workspace_ready:
+            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+
+        # A random hex suffix keeps concurrent checks from sharing a file name.
+        temp_filename = f"MOTOProofCheck_{uuid.uuid4().hex}.lean"
+        temp_path = self.workspace_dir / temp_filename
+        try:
+            temp_path.write_text(prepared_code, encoding="utf-8")
+            # Runs `lake env lean <file>` with the workspace as working directory.
+            returncode, stdout, stderr = await self._run_process(
+                [self.lake_path, "env", self.lean_path or self._resolve_executable("lean"), temp_filename],
+                cwd=self.workspace_dir,
+                timeout=timeout,
+            )
+
+            # stdout first, then stderr; empty streams are skipped.
+            combined_output = "\n".join(part for part in [stdout.strip(), stderr.strip()] if part).strip()
+            goal_states = self._extract_goal_states(combined_output)
+
+            # Positive pass: Lean must exit cleanly AND the diagnostics must
+            # not contain an `error:` line AND must not contain Lean's own
+            # "declaration uses 'sorry'" warning. We treat the sorry warning
+            # as a proof-level failure so vacuous proofs cannot slip through.
+            lowered = combined_output.lower()
+            has_error_diagnostic = "error:" in lowered
+            has_sorry_warning = _output_contains_sorry_warning(combined_output)
+            lean_exited_cleanly = returncode == 0
+            positive_pass = (
+                lean_exited_cleanly
+                and not has_error_diagnostic
+                and not has_sorry_warning
+            )
+
+            if positive_pass:
+                return Lean4Result(
+                    success=True,
+                    error_output="",
+                    goal_states=goal_states,
+                    raw_stderr=stderr.strip(),
+                )
+
+            # Sorry was the only problem: return the placeholder rejection
+            # followed by Lean's original diagnostics.
+            if has_sorry_warning and not has_error_diagnostic and lean_exited_cleanly:
+                rejection = _format_placeholder_rejection("sorry", from_lean_diagnostic=True)
+                detail = f"{rejection}\n\nOriginal Lean 4 diagnostics:\n{combined_output}".strip()
+                return Lean4Result(
+                    success=False,
+                    error_output=detail,
+                    goal_states=goal_states,
+                    raw_stderr=stderr.strip(),
+                )
+
+            # Generic failure: error lines are moved to the front and the
+            # 'no goals' hint is prepended when it applies.
+            error_output = combined_output or "Lean 4 rejected the proof without additional diagnostics."
+            return Lean4Result(
+                success=False,
+                error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+                goal_states=goal_states,
+                raw_stderr=stderr.strip(),
+            )
+        finally:
+            # Best-effort cleanup: a failed delete is logged at debug level only.
+            try:
+                if temp_path.exists():
+                    temp_path.unlink()
+            except OSError:
+                logger.debug("Could not remove temporary Lean file %s", temp_path)
+
+    async def check_tactic_script(
+        self,
+        theorem_header: str,
+        tactic_list: list[str],
+        timeout: int = 120,
+    ) -> Lean4Result:
+        """Compile-check a theorem header plus tactic list via the Lean subprocess path.
+
+        If Lean answers ``no goals to be solved`` at an identifiable tactic
+        index, one deterministic auto-repair pass is attempted: the
+        extraneous tactic(s) are dropped and the script is re-checked before
+        a result is returned. This spares an LLM retry for a purely
+        mechanical fix.
+
+        Returns a failed ``Lean4Result`` immediately when Lean 4 is disabled
+        in the system configuration.
+        """
+        if system_config.lean4_enabled:
+            # Copy the caller's list (or start empty for a falsy value) and
+            # allow exactly one repair round.
+            tactics = list(tactic_list or [])
+            return await self._check_tactic_script_with_auto_repair(
+                theorem_header=theorem_header,
+                tactic_list=tactics,
+                timeout=timeout,
+                auto_repair_attempts_remaining=1,
+            )
+
+        return Lean4Result(success=False, error_output="Lean 4 is disabled in system configuration.")
+
+    async def _check_tactic_script_with_auto_repair(
+        self,
+        *,
+        theorem_header: str,
+        tactic_list: list[str],
+        timeout: int,
+        auto_repair_attempts_remaining: int,
+    ) -> Lean4Result:
+        """Check a tactic script, retrying once without tactics that hit 'no goals'.
+
+        Args:
+            theorem_header: Theorem statement the tactics belong to.
+            tactic_list: Tactics in order; blank entries are ignored.
+            timeout: Forwarded to ``_run_tactic_script_once``.
+            auto_repair_attempts_remaining: How many trim-and-retry rounds
+                are still allowed.
+
+        Returns:
+            The repaired result when trimming produced a passing script,
+            otherwise the result of the first run.
+        """
+        # `failing_tactic_index` counts only non-blank tactics, because blank
+        # entries never reach the generated script. Dropping them here keeps
+        # that index aligned with the list sliced below; the generated script
+        # itself is unchanged.
+        effective_tactics = [
+            tactic for tactic in tactic_list if str(tactic or "").rstrip()
+        ]
+
+        result = await self._run_tactic_script_once(
+            theorem_header=theorem_header,
+            tactic_list=effective_tactics,
+            timeout=timeout,
+        )
+
+        can_repair = (
+            not result.success
+            and auto_repair_attempts_remaining > 0
+            and 0 <= result.failing_tactic_index < len(effective_tactics)
+            and self._has_no_goals_diagnostic(result.error_output)
+        )
+        if not can_repair:
+            return result
+
+        # Keep everything before the tactic Lean flagged as having no goal left.
+        trimmed = effective_tactics[: result.failing_tactic_index]
+        if not trimmed:
+            return result
+
+        logger.info(
+            "Lean 4 reported 'no goals' at tactic index %s; "
+            "auto-trimming %s trailing tactic(s) and retrying once.",
+            result.failing_tactic_index,
+            len(effective_tactics) - len(trimmed),
+        )
+        repaired = await self._check_tactic_script_with_auto_repair(
+            theorem_header=theorem_header,
+            tactic_list=trimmed,
+            timeout=timeout,
+            auto_repair_attempts_remaining=auto_repair_attempts_remaining - 1,
+        )
+        # A failed repair is discarded so the caller sees the original diagnostics.
+        return repaired if repaired.success else result
+
+    async def _run_tactic_script_once(
+        self,
+        *,
+        theorem_header: str,
+        tactic_list: list[str],
+        timeout: int,
+    ) -> Lean4Result:
+        """Build the tactic script, run Lean on it once, and classify the outcome.
+
+        No auto-repair happens here. On failure the result carries a
+        ``tactic_error_slice`` and the ``failing_tactic_index`` computed by
+        ``_extract_tactic_error_slice`` (``-1`` when no tactic was identified).
+        """
+        prepared_code, tactic_ranges = self._build_tactic_script(theorem_header, tactic_list)
+        if not prepared_code:
+            return Lean4Result(success=False, error_output="No tactic script could be constructed from the provided theorem header and tactics.")
+
+        # Reject placeholder proofs before spending a Lean invocation on them.
+        placeholder = _detect_forbidden_placeholder(prepared_code)
+        if placeholder:
+            return Lean4Result(
+                success=False,
+                error_output=_format_placeholder_rejection(placeholder, from_lean_diagnostic=False),
+            )
+
+        workspace_ready = await self.ensure_workspace()
+        if not workspace_ready:
+            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+
+        # A random hex suffix keeps concurrent checks from sharing a file name.
+        temp_filename = f"MOTOProofTacticCheck_{uuid.uuid4().hex}.lean"
+        temp_path = self.workspace_dir / temp_filename
+        try:
+            temp_path.write_text(prepared_code, encoding="utf-8")
+            # Runs `lake env lean <file>` with the workspace as working directory.
+            returncode, stdout, stderr = await self._run_process(
+                [self.lake_path, "env", self.lean_path or self._resolve_executable("lean"), temp_filename],
+                cwd=self.workspace_dir,
+                timeout=timeout,
+            )
+
+            # stdout first, then stderr; empty streams are skipped.
+            combined_output = "\n".join(part for part in [stdout.strip(), stderr.strip()] if part).strip()
+            goal_states = self._extract_goal_states(combined_output)
+            lowered = combined_output.lower()
+            has_error_diagnostic = "error:" in lowered
+            has_sorry_warning = _output_contains_sorry_warning(combined_output)
+            lean_exited_cleanly = returncode == 0
+            # Success needs a zero exit code, no `error:` text, and no sorry warning.
+            positive_pass = (
+                lean_exited_cleanly
+                and not has_error_diagnostic
+                and not has_sorry_warning
+            )
+            # Computed on every run; the success branch below ignores it.
+            tactic_error_slice, failing_tactic_index = self._extract_tactic_error_slice(
+                combined_output,
+                temp_filename,
+                tactic_ranges,
+            )
+
+            if positive_pass:
+                return Lean4Result(
+                    success=True,
+                    error_output="",
+                    goal_states=goal_states,
+                    raw_stderr=stderr.strip(),
+                    tactic_error_slice="",
+                    failing_tactic_index=-1,
+                )
+
+            # Sorry was the only problem: return the placeholder rejection
+            # followed by Lean's original diagnostics.
+            if has_sorry_warning and not has_error_diagnostic and lean_exited_cleanly:
+                rejection = _format_placeholder_rejection("sorry", from_lean_diagnostic=True)
+                detail = f"{rejection}\n\nOriginal Lean 4 diagnostics:\n{combined_output}".strip()
+                return Lean4Result(
+                    success=False,
+                    error_output=detail,
+                    goal_states=goal_states,
+                    raw_stderr=stderr.strip(),
+                    tactic_error_slice=rejection,
+                    failing_tactic_index=failing_tactic_index,
+                )
+
+            # Generic failure: prefer the focused slice over the full output.
+            error_output = tactic_error_slice or combined_output or "Lean 4 rejected the tactic script without additional diagnostics."
+            return Lean4Result(
+                success=False,
+                error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+                goal_states=goal_states,
+                raw_stderr=stderr.strip(),
+                tactic_error_slice=self._annotate_no_goals_hint(tactic_error_slice),
+                failing_tactic_index=failing_tactic_index,
+            )
+        finally:
+            # Best-effort cleanup: a failed delete is logged at debug level only.
+            try:
+                if temp_path.exists():
+                    temp_path.unlink()
+            except OSError:
+                logger.debug("Could not remove temporary Lean file %s", temp_path)
+
+
+class Lean4LspClient(Lean4Client):
+    """Persistent Lean LSP client with subprocess fallback."""
+
+    def __init__(self, lean_path: str, workspace_dir: str, *, idle_timeout: int = 600) -> None:
+        """Set up bookkeeping for a persistent Lean server; no process is started here.
+
+        Args:
+            lean_path: Forwarded to ``Lean4Client``.
+            workspace_dir: Forwarded to ``Lean4Client``.
+            idle_timeout: Delay passed to the idle-shutdown timer. Falsy or
+                negative values are stored as ``0``, which disables the timer.
+        """
+        super().__init__(lean_path=lean_path, workspace_dir=workspace_dir)
+
+        # Configuration and the plain subprocess client kept as fallback.
+        requested_timeout = int(idle_timeout or 0)
+        self._idle_timeout = requested_timeout if requested_timeout > 0 else 0
+        self._subprocess_fallback = Lean4Client(lean_path=lean_path, workspace_dir=workspace_dir)
+
+        # Server process and its background reader tasks.
+        self._server_process: Optional[asyncio.subprocess.Process] = None
+        self._reader_task: Optional[asyncio.Task[None]] = None
+        self._stderr_task: Optional[asyncio.Task[None]] = None
+        self._idle_handle: Optional[asyncio.TimerHandle] = None
+
+        # Locks: one for startup, one for operations.
+        self._startup_lock = asyncio.Lock()
+        self._operation_lock = asyncio.Lock()
+
+        # Protocol state, keyed by request id or document URI.
+        self._pending_responses: dict[int, asyncio.Future[Any]] = {}
+        self._diagnostics_by_uri: dict[str, dict[str, Any]] = {}
+        self._file_progress_by_uri: dict[str, dict[str, Any]] = {}
+        self._open_document_versions: dict[str, int] = {}
+        self._stderr_buffer: list[str] = []
+
+        # Monotonic counters.
+        self._next_request_id = 0
+        self._next_document_version = 0
+
+        # Lifecycle flags.
+        self._initialized = False
+        self._lsp_healthy = True
+        self._expected_shutdown = False
+
+    def uses_persistent_server(self) -> bool:
+        """Always True: this client is backed by a persistent Lean server."""
+        return True
+
+    def is_server_active(self) -> bool:
+        """Return True when a server process exists, has not exited, and is initialized."""
+        process = self._server_process
+        if not process:
+            return False
+        if process.returncode is not None:
+            return False
+        return bool(self._initialized)
+
+    async def warm_start(self) -> None:
+        """Best-effort startup of the persistent Lean server.
+
+        Does nothing when Lean 4 or its LSP mode is disabled, when the client
+        is already marked unhealthy, or when the workspace is not ready. A
+        startup exception marks the client unhealthy instead of propagating.
+        """
+        lsp_allowed = system_config.lean4_enabled and system_config.lean4_lsp_enabled
+        if not lsp_allowed or not self._lsp_healthy:
+            return
+
+        if not await self.ensure_workspace():
+            logger.warning("Lean 4 LSP warm start skipped because the workspace is not ready.")
+            return
+
+        try:
+            await self._ensure_server_started()
+        except Exception as exc:
+            await self._mark_unhealthy(f"warm start failed: {exc}")
+
+    async def close(self) -> None:
+        """Shut the server down without marking the client unhealthy."""
+        await self._shutdown_server(mark_unhealthy=False)
+
+    def _cancel_idle_shutdown(self) -> None:
+        """Cancel the pending idle-shutdown timer, if any, and forget its handle."""
+        pending, self._idle_handle = self._idle_handle, None
+        if pending is not None:
+            pending.cancel()
+
+    def _schedule_idle_shutdown(self) -> None:
+        """(Re)arm the timer that shuts the server down after inactivity.
+
+        Any timer already pending is cancelled first. No new timer is armed
+        when the idle timeout is zero or negative, or when the server is not
+        active. Must be called while an event loop is running.
+        """
+        self._cancel_idle_shutdown()
+        if self._idle_timeout <= 0 or not self.is_server_active():
+            return
+
+        def _launch_idle_shutdown() -> None:
+            # The event loop keeps only weak references to tasks, so store a
+            # strong one; otherwise the shutdown task could be garbage
+            # collected before it finishes.
+            self._idle_shutdown_task = asyncio.create_task(self._shutdown_if_idle())
+
+        loop = asyncio.get_running_loop()
+        self._idle_handle = loop.call_later(self._idle_timeout, _launch_idle_shutdown)
+
+    async def _shutdown_if_idle(self) -> None:
+        """Shut the server down unless an operation holds the lock; then re-arm the timer."""
+        busy = self._operation_lock.locked()
+        if not busy:
+            await self._shutdown_server(mark_unhealthy=False)
+            return
+        self._schedule_idle_shutdown()
+
+    async def _shutdown_server(self, *, mark_unhealthy: bool) -> None:
+        """Stop the server process and reset all per-session state.
+
+        Args:
+            mark_unhealthy: When True, ``_lsp_healthy`` is cleared as well;
+                ``_ensure_server_started`` then refuses to start a server.
+
+        Steps, in order: cancel the idle timer, detach the process from the
+        instance, fail every pending request future, close stdin and
+        terminate (then kill) the process, cancel the reader tasks, and
+        clear the per-document caches.
+        """
+        self._cancel_idle_shutdown()
+
+        if mark_unhealthy:
+            self._lsp_healthy = False
+
+        # Signal the reader loop that any upcoming EOF is intentional so it
+        # does not log the shutdown as an unexpected failure.
+        self._expected_shutdown = True
+
+        # Detach first so `is_server_active()` reports False from here on.
+        process = self._server_process
+        self._server_process = None
+        self._initialized = False
+
+        # Fail the futures of requests that will never get an answer.
+        pending = list(self._pending_responses.values())
+        self._pending_responses.clear()
+        for future in pending:
+            if not future.done():
+                future.set_exception(RuntimeError("Lean 4 LSP server stopped before replying."))
+
+        if process is not None:
+            if process.stdin is not None and not process.stdin.is_closing():
+                process.stdin.close()
+                with suppress(Exception):
+                    await process.stdin.wait_closed()
+            if process.returncode is None:
+                # Terminate, wait up to 5 seconds, then fall back to kill.
+                process.terminate()
+                try:
+                    await asyncio.wait_for(process.wait(), timeout=5)
+                except asyncio.TimeoutError:
+                    process.kill()
+                    with suppress(Exception):
+                        await process.wait()
+
+        # Cancel both background readers and wait for them to finish.
+        for task_name in ("_reader_task", "_stderr_task"):
+            task = getattr(self, task_name)
+            if task is not None:
+                task.cancel()
+                with suppress(asyncio.CancelledError, Exception):
+                    await task
+                setattr(self, task_name, None)
+
+        self._diagnostics_by_uri.clear()
+        self._file_progress_by_uri.clear()
+        self._open_document_versions.clear()
+
+    def _stderr_tail(self) -> str:
+        """Return up to the last 200 buffered stderr lines as one stripped string."""
+        recent_lines = self._stderr_buffer[-200:]
+        joined = "\n".join(recent_lines)
+        return joined.strip()
+
+    def _next_id(self) -> int:
+        """Advance the request-id counter by one and return the new value."""
+        allocated = self._next_request_id + 1
+        self._next_request_id = allocated
+        return allocated
+
+    def _next_version(self) -> int:
+        """Advance the document-version counter by one and return the new value."""
+        allocated = self._next_document_version + 1
+        self._next_document_version = allocated
+        return allocated
+
+    async def _read_message(self, reader: asyncio.StreamReader) -> dict[str, Any]:
+        """Read one ``Content-Length``-framed JSON message from *reader*.
+
+        Header lines are read up to the blank separator line; lines without
+        a colon are ignored and header names are lower-cased.
+
+        Raises:
+            EOFError: The stream ended while headers were being read.
+            ValueError: No ``Content-Length`` header was present.
+        """
+        parsed_headers: dict[str, str] = {}
+        while True:
+            raw_line = await reader.readline()
+            if not raw_line:
+                raise EOFError("Lean 4 LSP stream closed.")
+            if raw_line == b"\r\n" or raw_line == b"\n":
+                break
+            text = raw_line.decode("utf-8", errors="replace").strip()
+            name, separator, value = text.partition(":")
+            if separator:
+                parsed_headers[name.strip().lower()] = value.strip()
+
+        declared_length = parsed_headers.get("content-length", "")
+        if not declared_length:
+            raise ValueError("Lean 4 LSP message did not include Content-Length.")
+
+        body = await reader.readexactly(int(declared_length))
+        return json.loads(body.decode("utf-8", errors="replace"))
+
+    async def _write_message(self, payload: dict[str, Any]) -> None:
+        """Serialize *payload* as compact JSON and send it with a ``Content-Length`` header.
+
+        Raises:
+            RuntimeError: There is no server process, it has no stdin, or it
+                has already exited.
+        """
+        process = self._server_process
+        stdin = process.stdin if process is not None else None
+        if process is None or stdin is None or process.returncode is not None:
+            raise RuntimeError("Lean 4 LSP server is not running.")
+
+        encoded = json.dumps(payload, separators=(",", ":")).encode("utf-8")
+        prefix = f"Content-Length: {len(encoded)}\r\n\r\n".encode("utf-8")
+        stdin.write(prefix + encoded)
+        await stdin.drain()
+
+    async def _send_request(self, method: str, params: dict[str, Any], *, timeout: int) -> Any:
+        """Send a JSON-RPC request and wait for the matching response.
+
+        Args:
+            method: JSON-RPC method name.
+            params: Value sent as the request's ``params``.
+            timeout: Maximum wait for the response, passed to
+                ``asyncio.wait_for``.
+
+        Returns:
+            Whatever value the response future is resolved with.
+
+        Raises:
+            RuntimeError: The request could not be written, or the future was
+                failed by the reader or by a shutdown.
+            asyncio.TimeoutError: No response arrived within *timeout*.
+        """
+        request_id = self._next_id()
+        future: asyncio.Future[Any] = asyncio.get_running_loop().create_future()
+        self._pending_responses[request_id] = future
+        try:
+            # The write sits inside the `try` so a failed send also removes
+            # the future from the pending table instead of leaking it.
+            await self._write_message(
+                {
+                    "jsonrpc": "2.0",
+                    "id": request_id,
+                    "method": method,
+                    "params": params,
+                }
+            )
+            return await asyncio.wait_for(future, timeout=timeout)
+        finally:
+            self._pending_responses.pop(request_id, None)
+
+    async def _send_notification(self, method: str, params: dict[str, Any]) -> None:
+        """Send a JSON-RPC notification: a message without ``id``, so no reply is awaited."""
+        notification = {"jsonrpc": "2.0", "method": method, "params": params}
+        await self._write_message(notification)
+
+    def _store_diagnostics(self, params: dict[str, Any]) -> None:
+        """Record the latest diagnostics published for a document.
+
+        Entries without a URI are ignored. The stored version is the
+        published one when it is an ``int``; otherwise the version recorded
+        for the open document is used, or ``-1`` when none is recorded.
+        """
+        uri = str(params.get("uri", "") or "").strip()
+        if not uri:
+            return
+
+        published = params.get("version")
+        known_version = self._open_document_versions.get(uri, -1)
+        candidate = known_version if published is None else published
+        resolved = int(candidate) if isinstance(candidate, int) else known_version
+
+        self._diagnostics_by_uri[uri] = {
+            "version": resolved,
+            "diagnostics": list(params.get("diagnostics") or []),
+        }
+
+    def _store_file_progress(self, params: dict[str, Any]) -> None:
+        """Record the version and fatal-error flag from a file-progress notification.
+
+        Notifications without a document URI are ignored. ``fatal_error`` is
+        True when any dict entry in ``processing`` has kind ``fatalError``.
+        """
+        document = params.get("textDocument") or {}
+        uri = str(document.get("uri", "") or "").strip()
+        if not uri:
+            return
+
+        stages = list(params.get("processing") or [])
+        saw_fatal = False
+        for stage in stages:
+            if isinstance(stage, dict) and stage.get("kind") == "fatalError":
+                saw_fatal = True
+                break
+
+        known_version = self._open_document_versions.get(uri, -1)
+        self._file_progress_by_uri[uri] = {
+            "version": document.get("version", known_version),
+            "fatal_error": saw_fatal,
+        }
+
+    async def _reader_loop(self) -> None:
+        """Read server messages until the stream fails, routing each one.
+
+        Responses (messages with ``id`` plus ``result`` or ``error``)
+        resolve or fail the matching pending future. Diagnostics and Lean
+        file-progress notifications are stored per URI. Everything else is
+        ignored. Any non-cancellation error ends the loop and fails all
+        futures still pending.
+        """
+        assert self._server_process is not None and self._server_process.stdout is not None
+        reader = self._server_process.stdout
+
+        try:
+            while True:
+                payload = await self._read_message(reader)
+                # Response to one of our requests.
+                if "id" in payload and ("result" in payload or "error" in payload):
+                    response_id = payload.get("id")
+                    future = self._pending_responses.get(response_id)
+                    # Unknown or already-settled request: drop the response.
+                    if future is None or future.done():
+                        continue
+                    if "error" in payload and payload["error"]:
+                        error = payload["error"]
+                        future.set_exception(RuntimeError(f"Lean 4 LSP error: {error}"))
+                    else:
+                        future.set_result(payload.get("result"))
+                    continue
+
+                # Server-initiated message: only two notification kinds are kept.
+                method = str(payload.get("method", "") or "")
+                params = payload.get("params") or {}
+                if method == "textDocument/publishDiagnostics" and isinstance(params, dict):
+                    self._store_diagnostics(params)
+                elif method == "$/lean/fileProgress" and isinstance(params, dict):
+                    self._store_file_progress(params)
+        except asyncio.CancelledError:
+            # Cancellation must propagate to whoever cancelled the task.
+            raise
+        except Exception as exc:
+            # This also covers the EOFError that `_read_message` raises when
+            # the stream closes.
+            if self._expected_shutdown:
+                logger.info("Lean 4 LSP reader exited after idle shutdown")
+            else:
+                logger.warning("Lean 4 LSP reader stopped: %s", exc)
+            # Nobody will answer outstanding requests any more; fail them.
+            pending = list(self._pending_responses.values())
+            self._pending_responses.clear()
+            for future in pending:
+                if not future.done():
+                    future.set_exception(RuntimeError(f"Lean 4 LSP reader stopped: {exc}"))
+
+    async def _stderr_loop(self) -> None:
+        """Copy the server's stderr into a buffer capped at the last 200 non-empty lines.
+
+        Ends when the stream reaches EOF. Cancellation propagates; any other
+        error is logged at debug level and ends the loop.
+        """
+        assert self._server_process is not None and self._server_process.stderr is not None
+        reader = self._server_process.stderr
+        try:
+            while raw_line := await reader.readline():
+                text = raw_line.decode("utf-8", errors="replace").rstrip()
+                if not text:
+                    continue
+                self._stderr_buffer.append(text)
+                if len(self._stderr_buffer) > 200:
+                    self._stderr_buffer = self._stderr_buffer[-200:]
+        except asyncio.CancelledError:
+            raise
+        except Exception as exc:
+            logger.debug("Lean 4 LSP stderr reader stopped: %s", exc)
+
+    async def _ensure_server_started(self) -> bool:
+        """Start and initialize the `lake serve` process if it is not running.
+
+        Returns:
+            True when an initialized server is available afterwards. False
+            when the client is marked unhealthy or startup fails; a startup
+            failure also marks the client unhealthy.
+        """
+        if not self._lsp_healthy:
+            return False
+
+        # The lock serializes concurrent start attempts.
+        async with self._startup_lock:
+            if self.is_server_active():
+                return True
+
+            # A process that already exited is cleaned up before a new start.
+            if self._server_process is not None and self._server_process.returncode is not None:
+                await self._shutdown_server(mark_unhealthy=False)
+
+            try:
+                process = await asyncio.create_subprocess_exec(
+                    self.lake_path,
+                    "serve",
+                    cwd=str(self.workspace_dir),
+                    stdin=asyncio.subprocess.PIPE,
+                    stdout=asyncio.subprocess.PIPE,
+                    stderr=asyncio.subprocess.PIPE,
+                )
+                self._server_process = process
+                self._expected_shutdown = False
+                # The readers must run before `initialize` is sent, because
+                # the reader loop is what resolves the response future.
+                self._reader_task = asyncio.create_task(self._reader_loop())
+                self._stderr_task = asyncio.create_task(self._stderr_loop())
+
+                root_uri = self.workspace_dir.resolve().as_uri()
+                await self._send_request(
+                    "initialize",
+                    {
+                        "processId": None,
+                        "rootPath": str(self.workspace_dir),
+                        "rootUri": root_uri,
+                        "capabilities": {},
+                        "clientInfo": {"name": "MOTO", "version": "build4"},
+                        "workspaceFolders": [
+                            {
+                                "uri": root_uri,
+                                "name": self.workspace_dir.name or "workspace",
+                            }
+                        ],
+                    },
+                    timeout=30,
+                )
+                await self._send_notification("initialized", {})
+                self._initialized = True
+                self._schedule_idle_shutdown()
+                logger.info("Lean 4 LSP server started for workspace %s", self.workspace_dir)
+                return True
+            except Exception as exc:
+                # Covers spawn errors, write errors, and the initialize timeout.
+                await self._mark_unhealthy(f"startup failed: {exc}")
+                return False
+
+    async def _mark_unhealthy(self, reason: str) -> None:
+        """Log *reason* as a warning, then shut the server down with the unhealthy flag set."""
+        logger.warning("Lean 4 LSP unhealthy; falling back to subprocess mode: %s", reason)
+        await self._shutdown_server(mark_unhealthy=True)
+
+    @staticmethod
+    def _diagnostic_is_error(diagnostic: dict[str, Any]) -> bool:
+        """Decide whether an LSP diagnostic counts as an error.
+
+        A severity of ``1`` is an error and any other numeric severity is
+        not. A diagnostic without severity counts as an error when it has a
+        non-blank message. A severity that cannot be converted to ``int`` is
+        treated as an error, matching ``_severity_label``, which labels such
+        diagnostics ``"error"``; the original code raised on that input.
+        """
+        severity = diagnostic.get("severity")
+        if severity is None:
+            message = str(diagnostic.get("message", "") or "").strip()
+            return bool(message)
+        try:
+            return int(severity) == 1
+        except (TypeError, ValueError):
+            return True
+
+    @staticmethod
+    def _severity_label(diagnostic: dict[str, Any]) -> str:
+        """Map a diagnostic's numeric severity to its label.
+
+        Severities 1 to 4 map to ``error``, ``warning``, ``information`` and
+        ``hint``. A missing, non-numeric, or out-of-range severity yields
+        ``error``.
+        """
+        labels = {
+            1: "error",
+            2: "warning",
+            3: "information",
+            4: "hint",
+        }
+        try:
+            code = int(diagnostic.get("severity"))
+        except (TypeError, ValueError):
+            code = 1
+        return labels.get(code, "error")
+
+    def _format_diagnostic_output(self, temp_filename: str, diagnostics: list[dict[str, Any]]) -> str:
+        """Render LSP diagnostics as ``file:line:col: severity: message`` text.
+
+        The zero-based LSP start position is converted to one-based line and
+        column numbers. The first message line shares a line with the
+        location prefix and any further message lines follow unchanged. A
+        blank message is replaced by a fixed placeholder sentence.
+        """
+        rendered: list[str] = []
+        for entry in diagnostics:
+            position = (entry.get("range") or {}).get("start") or {}
+            row = int(position.get("line", 0) or 0) + 1
+            column = int(position.get("character", 0) or 0) + 1
+            label = self._severity_label(entry)
+            text = str(entry.get("message", "") or "").strip() or "Lean 4 reported a diagnostic without a message."
+            headline, *continuation = text.splitlines() or [text]
+            rendered.append(f"{temp_filename}:{row}:{column}: {label}: {headline}")
+            rendered.extend(continuation)
+        return "\n".join(rendered).strip()
+
+    def _result_from_diagnostics(
+        self,
+        temp_filename: str,
+        diagnostics: list[dict[str, Any]],
+        *,
+        tactic_ranges: Optional[list[tuple[int, int, str]]] = None,
+        fatal_error: bool = False,
+    ) -> Lean4Result:
+        """Turn LSP diagnostics into a ``Lean4Result``.
+
+        Args:
+            temp_filename: Name used as the location prefix when the
+                diagnostics are rendered to text.
+            diagnostics: Diagnostic dicts received from the server.
+            tactic_ranges: Optional ``(start_line, end_line, tactic_text)``
+                triples; when given, the failing tactic is looked up.
+            fatal_error: Forces a failure even without error diagnostics.
+
+        Returns:
+            A successful result when there is no error and no sorry warning;
+            a placeholder rejection when sorry is the only problem; otherwise
+            a failure carrying the prioritized, hint-annotated diagnostics.
+        """
+        combined_output = self._format_diagnostic_output(temp_filename, diagnostics)
+        goal_states = self._extract_goal_states(combined_output)
+        # What is returned as `raw_stderr` here is the buffered stderr tail
+        # of the server process.
+        raw_stderr = self._stderr_tail()
+        has_errors = fatal_error or any(self._diagnostic_is_error(diagnostic) for diagnostic in diagnostics)
+        # Checked on the rendered text and on each raw message.
+        has_sorry_warning = _output_contains_sorry_warning(combined_output) or any(
+            _output_contains_sorry_warning(str(diagnostic.get("message", "") or ""))
+            for diagnostic in diagnostics
+        )
+
+        if not has_errors and not has_sorry_warning:
+            return Lean4Result(
+                success=True,
+                error_output="",
+                goal_states=goal_states,
+                raw_stderr=raw_stderr,
+            )
+
+        # Sorry was the only problem: no tactic is blamed (index stays -1).
+        if has_sorry_warning and not has_errors:
+            rejection = _format_placeholder_rejection("sorry", from_lean_diagnostic=True)
+            detail = f"{rejection}\n\nOriginal Lean 4 diagnostics:\n{combined_output}".strip()
+            return Lean4Result(
+                success=False,
+                error_output=detail,
+                goal_states=goal_states,
+                raw_stderr=raw_stderr,
+                tactic_error_slice=rejection,
+                failing_tactic_index=-1,
+            )
+
+        tactic_error_slice = ""
+        failing_tactic_index = -1
+        if tactic_ranges:
+            tactic_error_slice, failing_tactic_index = self._extract_tactic_error_slice(
+                combined_output,
+                temp_filename,
+                tactic_ranges,
+            )
+
+        # Prefer the focused slice, then the full text, then a fixed message.
+        error_output = tactic_error_slice or combined_output
+        if not error_output and fatal_error:
+            error_output = "Lean 4 LSP reported a fatal error while processing the proof."
+        if not error_output:
+            error_output = "Lean 4 rejected the proof without additional diagnostics."
+
+        return Lean4Result(
+            success=False,
+            error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+            goal_states=goal_states,
+            raw_stderr=raw_stderr,
+            tactic_error_slice=self._annotate_no_goals_hint(tactic_error_slice),
+            failing_tactic_index=failing_tactic_index,
+        )
+
+    async def _check_via_lsp(  # One LSP round trip: open prepared_code as a temp document, wait for diagnostics, build a Lean4Result.
+        self,
+        prepared_code: str,
+        *,
+        temp_filename: str,
+        timeout: int,
+        tactic_ranges: Optional[list[tuple[int, int, str]]] = None,
+    ) -> Lean4Result:
+        if not await self._ensure_server_started():
+            raise RuntimeError("Lean 4 LSP server is unavailable.")  # both callers in this class catch Exception and fall back
+
+        temp_path = self.workspace_dir / temp_filename
+        uri = temp_path.resolve().as_uri()  # this URI is the key for all per-document state below
+        version = self._next_version()
+        self._diagnostics_by_uri.pop(uri, None)  # discard any stale entries for this URI before opening
+        self._file_progress_by_uri.pop(uri, None)
+        self._open_document_versions[uri] = version
+
+        try:
+            temp_path.write_text(prepared_code, encoding="utf-8")  # the same text is also sent inline in didOpen
+            await self._send_notification(
+                "textDocument/didOpen",
+                {
+                    "textDocument": {
+                        "uri": uri,
+                        "languageId": "lean4",
+                        "version": version,
+                        "text": prepared_code,
+                    },
+                    "dependencyBuildMode": "once",
+                },
+            )
+            await self._send_request(  # awaited before the per-URI bundles are read; only this request receives `timeout`
+                "textDocument/waitForDiagnostics",
+                {
+                    "uri": uri,
+                    "version": version,
+                },
+                timeout=timeout,
+            )
+
+            diagnostic_bundle = self._diagnostics_by_uri.get(uri) or {}  # a missing or empty entry becomes {}
+            progress_bundle = self._file_progress_by_uri.get(uri) or {}
+            diagnostics = list(diagnostic_bundle.get("diagnostics") or [])  # copied into a new list
+            fatal_error = bool(progress_bundle.get("fatal_error"))
+            return self._result_from_diagnostics(
+                temp_filename,
+                diagnostics,
+                tactic_ranges=tactic_ranges,
+                fatal_error=fatal_error,
+            )
+        finally:  # cleanup runs on success and on any exception
+            if self.is_server_active():
+                with suppress(Exception):  # best-effort: errors from didClose are suppressed
+                    await self._send_notification(
+                        "textDocument/didClose",
+                        {
+                            "textDocument": {
+                                "uri": uri,
+                            }
+                        },
+                    )
+            self._diagnostics_by_uri.pop(uri, None)
+            self._file_progress_by_uri.pop(uri, None)
+            self._open_document_versions.pop(uri, None)
+            with suppress(OSError):  # temp-file removal is best-effort as well
+                if temp_path.exists():
+                    temp_path.unlink()
+
+    async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
+        """Check a proof through the persistent Lean LSP when healthy, otherwise fall back."""
+        if not system_config.lean4_enabled:  # early exits below return a failed Lean4Result instead of raising
+            return Lean4Result(success=False, error_output="Lean 4 is disabled in system configuration.")
+
+        prepared_code = self._prepare_lean_code(lean_code)
+        if not prepared_code:
+            return Lean4Result(success=False, error_output="No Lean 4 code was provided.")
+
+        placeholder = _detect_forbidden_placeholder(prepared_code)  # checked before the workspace or LSP is touched
+        if placeholder:
+            return Lean4Result(
+                success=False,
+                error_output=_format_placeholder_rejection(placeholder, from_lean_diagnostic=False),
+            )
+
+        workspace_ready = await self.ensure_workspace()
+        if not workspace_ready:
+            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+
+        if not self._lsp_healthy:  # already marked unhealthy: go straight to the subprocess client, without taking the lock
+            return await self._subprocess_fallback.check_proof(lean_code, timeout=timeout)
+
+        async with self._operation_lock:  # the tactic-script LSP path takes this same lock
+            self._cancel_idle_shutdown()
+            try:
+                result = await self._check_via_lsp(
+                    prepared_code,
+                    temp_filename=f"MOTOProofCheck_{uuid.uuid4().hex}.lean",  # fresh random name per check
+                    timeout=timeout,
+                )
+                return result
+            except Exception as exc:  # any LSP failure: mark unhealthy, then retry via subprocess (still inside the lock)
+                await self._mark_unhealthy(str(exc))
+                return await self._subprocess_fallback.check_proof(lean_code, timeout=timeout)  # fallback gets the original lean_code and the full timeout again
+            finally:
+                if self._lsp_healthy:  # idle shutdown is re-armed only while the LSP is still flagged healthy
+                    self._schedule_idle_shutdown()
+
+    async def check_tactic_script(
+        self,
+        theorem_header: str,
+        tactic_list: list[str],
+        timeout: int = 120,
+    ) -> Lean4Result:
+        """Check a tactic script through the persistent Lean LSP when healthy, otherwise fall back.
+
+        Mirrors the subprocess path by performing one deterministic auto-repair
+        attempt when Lean reports ``no goals to be solved`` at a known tactic
+        index.
+        """
+        if not system_config.lean4_enabled:  # returns a failed result rather than raising
+            return Lean4Result(success=False, error_output="Lean 4 is disabled in system configuration.")
+
+        return await self._check_tactic_script_via_lsp_with_auto_repair(
+            theorem_header=theorem_header,
+            tactic_list=list(tactic_list or []),  # copy of the caller's list; None or empty becomes []
+            timeout=timeout,
+            auto_repair_attempts_remaining=1,  # allows exactly one trimmed retry
+        )
+
+    async def _check_tactic_script_via_lsp_with_auto_repair(  # Run the script once; on a "no goals" failure, retry with the failing tactic and everything after it removed.
+        self,
+        *,
+        theorem_header: str,
+        tactic_list: list[str],
+        timeout: int,
+        auto_repair_attempts_remaining: int,
+    ) -> Lean4Result:
+        result = await self._run_tactic_script_via_lsp_once(
+            theorem_header=theorem_header,
+            tactic_list=tactic_list,
+            timeout=timeout,
+        )
+
+        if (  # retry only for a failed run with a known in-range failing index and a "no goals" diagnostic
+            not result.success
+            and auto_repair_attempts_remaining > 0
+            and result.failing_tactic_index >= 0
+            and self._has_no_goals_diagnostic(result.error_output)
+            and result.failing_tactic_index < len(tactic_list)
+        ):
+            trimmed = tactic_list[: result.failing_tactic_index]  # keeps only the tactics before the failing one
+            if trimmed and trimmed != tactic_list:  # an empty trimmed list (failing index 0) is never retried
+                logger.info(
+                    "Lean 4 LSP reported 'no goals' at tactic index %s; "
+                    "auto-trimming %s trailing tactic(s) and retrying once.",
+                    result.failing_tactic_index,
+                    len(tactic_list) - len(trimmed),
+                )
+                repaired = await self._check_tactic_script_via_lsp_with_auto_repair(  # recursion is bounded by the decremented counter
+                    theorem_header=theorem_header,
+                    tactic_list=trimmed,
+                    timeout=timeout,
+                    auto_repair_attempts_remaining=auto_repair_attempts_remaining - 1,
+                )
+                if repaired.success:  # a failed retry is discarded
+                    return repaired
+
+        return result  # the first run's result, unless the trimmed retry succeeded
+
+    async def _run_tactic_script_via_lsp_once(  # Single tactic-script check with no auto-repair: LSP when healthy, subprocess client otherwise.
+        self,
+        *,
+        theorem_header: str,
+        tactic_list: list[str],
+        timeout: int,
+    ) -> Lean4Result:
+        prepared_code, tactic_ranges = self._build_tactic_script(theorem_header, tactic_list)
+        if not prepared_code:  # early exits below return a failed Lean4Result instead of raising
+            return Lean4Result(success=False, error_output="No tactic script could be constructed from the provided theorem header and tactics.")
+
+        placeholder = _detect_forbidden_placeholder(prepared_code)  # checked before the workspace or LSP is touched
+        if placeholder:
+            return Lean4Result(
+                success=False,
+                error_output=_format_placeholder_rejection(placeholder, from_lean_diagnostic=False),
+            )
+
+        workspace_ready = await self.ensure_workspace()
+        if not workspace_ready:
+            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+
+        if not self._lsp_healthy:  # already marked unhealthy: use the subprocess client, without taking the lock
+            return await self._subprocess_fallback._run_tactic_script_once(  # the fallback's private single-run method; presumably chosen so auto-repair is not applied twice (confirm)
+                theorem_header=theorem_header,
+                tactic_list=tactic_list,
+                timeout=timeout,
+            )
+
+        async with self._operation_lock:  # check_proof's LSP path takes this same lock
+            self._cancel_idle_shutdown()
+            try:
+                result = await self._check_via_lsp(
+                    prepared_code,
+                    temp_filename=f"MOTOProofTacticCheck_{uuid.uuid4().hex}.lean",  # fresh random name per check
+                    timeout=timeout,
+                    tactic_ranges=tactic_ranges,  # passed through to _check_via_lsp
+                )
+                return result
+            except Exception as exc:  # any LSP failure: mark unhealthy, then retry via subprocess (still inside the lock)
+                await self._mark_unhealthy(str(exc))
+                return await self._subprocess_fallback._run_tactic_script_once(
+                    theorem_header=theorem_header,
+                    tactic_list=tactic_list,
+                    timeout=timeout,
+                )
+            finally:
+                if self._lsp_healthy:  # idle shutdown is re-armed only while the LSP is still flagged healthy
+                    self._schedule_idle_shutdown()
+
+
+_lean4_client: Optional[Lean4Client] = None  # module-level singleton; None until initialize_lean4_client() or get_lean4_client() builds it
+
+
+def _build_client(lean_path: str, workspace_dir: str) -> Lean4Client:  # Construct a new client; the implementation is chosen by system_config.lean4_lsp_enabled.
+    if system_config.lean4_lsp_enabled:  # read on every call, so a changed setting applies to the next client built
+        return Lean4LspClient(
+            lean_path=lean_path,
+            workspace_dir=workspace_dir,
+            idle_timeout=system_config.lean4_lsp_idle_timeout,
+        )
+    return Lean4Client(  # LSP disabled: plain Lean4Client, no idle_timeout argument
+        lean_path=lean_path,
+        workspace_dir=workspace_dir,
+    )
+
+
+def initialize_lean4_client(lean_path: Optional[str] = None, workspace_dir: Optional[str] = None) -> Lean4Client:
+    """Create or replace the singleton Lean 4 client."""
+    global _lean4_client
+    _lean4_client = _build_client(  # NOTE(review): a previously stored client is overwritten here without close() being called on it
+        lean_path=lean_path or system_config.lean4_path,  # None or "" falls back to the configured value
+        workspace_dir=workspace_dir or system_config.lean4_workspace_dir,
+    )
+    return _lean4_client
+
+
+def get_lean4_client() -> Lean4Client:
+    """Return the singleton Lean 4 client, creating it from config if needed."""
+    global _lean4_client
+    if _lean4_client is None:  # built lazily on first use, from system_config values only
+        _lean4_client = _build_client(
+            lean_path=system_config.lean4_path,
+            workspace_dir=system_config.lean4_workspace_dir,
+        )
+    return _lean4_client
+
+
+async def close_lean4_client() -> None:
+    """Close the singleton Lean 4 client if it owns a persistent server."""
+    client = _lean4_client  # read-only access, so no `global` statement; the singleton reference stays set afterwards
+    if client is not None:  # NOTE(review): close() is awaited on any existing client; no check for a persistent server happens here
+        await client.close()
+
+
+def clear_lean4_client() -> None:
+    """Reset the singleton Lean 4 client."""
+    global _lean4_client
+    _lean4_client = None  # only drops the reference; close() is not called here
diff --git a/backend/shared/lm_studio_client.py b/backend/shared/lm_studio_client.py
index 63603e7..ebc0e1a 100644
--- a/backend/shared/lm_studio_client.py
+++ b/backend/shared/lm_studio_client.py
@@ -15,15 +15,16 @@
 import asyncio
 import time
 import os
+from pathlib import Path
 from datetime import datetime
 from typing import List, Dict, Any, Optional
-from backend.shared.config import rag_config
+from backend.shared.config import rag_config, system_config
 import logging
 
 logger = logging.getLogger(__name__)
 
-# Ensure logs directory exists
-os.makedirs("backend/logs", exist_ok=True)
+# Ensure instance-scoped logs directory exists
+Path(system_config.logs_dir).mkdir(parents=True, exist_ok=True)
 
 
 class LMStudioClient:
@@ -117,27 +118,31 @@ async def get_loaded_models(self) -> List[str]:
                 return []
             
             result_stdout = stdout.decode() if stdout else ""
+            result_stderr = stderr.decode(errors="replace").strip() if stderr else ""
             result_returncode = process.returncode
-            
-            if result_returncode == 0 and result_stdout:
-                # Parse output to extract model IDs
-                models = []
-                lines = result_stdout.strip().split('\n')
-                
-                for line in lines:
-                    # Skip headers, separators, and empty lines
-                    if not line or line.startswith('-') or line.startswith('ID') or line.startswith('Model'):
-                        continue
-                    
-                    # Extract model ID (first column)
-                    parts = line.strip().split()
-                    if parts:
-                        models.append(parts[0])
-                
+
+            if result_returncode == 0:
+                # Exit code 0 means success. Empty stdout simply means no models
+                # are loaded — that is a normal state, not an error.
+                models: List[str] = []
+                if result_stdout:
+                    for line in result_stdout.strip().split('\n'):
+                        # Skip headers, separators, and empty lines
+                        if not line or line.startswith('-') or line.startswith('ID') or line.startswith('Model'):
+                            continue
+                        # Extract model ID (first column)
+                        parts = line.strip().split()
+                        if parts:
+                            models.append(parts[0])
                 logger.debug(f"Loaded models from 'lms ps': {models}")
                 return models
             else:
-                logger.warning(f"'lms ps' returned code {result_returncode}")
+                if result_stderr:
+                    logger.warning(
+                        f"'lms ps' returned non-zero code {result_returncode}: {result_stderr}"
+                    )
+                else:
+                    logger.warning(f"'lms ps' returned non-zero code {result_returncode}")
                 return []
                 
         except FileNotFoundError:
@@ -154,19 +159,24 @@ async def generate_completion(
         temperature: float = 0.0,  # Default to deterministic generation - evolving context provides diversity
         max_tokens: Optional[int] = None,
         response_format: Optional[Dict[str, str]] = None,
-        skip_semaphore: bool = False
+        skip_semaphore: bool = False,
+        tools: Optional[List[Dict[str, Any]]] = None,
+        tool_choice: Optional[Any] = None,
     ) -> Dict[str, Any]:
         """
         Generate a completion using LM Studio API with validation and retry.
         
         Args:
             skip_semaphore: If True, skips model semaphore acquisition (for non-blocking operations)
+            tools: Optional OpenAI-compatible tool schemas (LM Studio 0.3+).
+            tool_choice: Optional tool-choice directive.
         """
         # Get model-specific semaphore (allows different models to run in parallel)
         if skip_semaphore:
             # Direct execution without semaphore
             return await self._execute_completion_request(
-                model, messages, temperature, max_tokens, response_format
+                model, messages, temperature, max_tokens, response_format,
+                tools=tools, tool_choice=tool_choice,
             )
         
         model_semaphore = await self._get_model_semaphore(model)
@@ -174,7 +184,8 @@ async def generate_completion(
         # ACQUIRE THIS MODEL'S SEMAPHORE to prevent concurrent requests to same model
         async with model_semaphore:
             return await self._execute_completion_request(
-                model, messages, temperature, max_tokens, response_format
+                model, messages, temperature, max_tokens, response_format,
+                tools=tools, tool_choice=tool_choice,
             )
     
     async def _execute_completion_request(
@@ -183,7 +194,9 @@ async def _execute_completion_request(
         messages: List[Dict[str, str]],
         temperature: float,
         max_tokens: Optional[int],
-        response_format: Optional[Dict[str, str]]
+        response_format: Optional[Dict[str, str]],
+        tools: Optional[List[Dict[str, Any]]] = None,
+        tool_choice: Optional[Any] = None,
     ) -> Dict[str, Any]:
         """Execute the actual completion request (extracted for semaphore bypass)."""
         # Calculate approximate token count for logging
@@ -207,6 +220,16 @@ async def _execute_completion_request(
         if response_format:
             payload["response_format"] = response_format
         
+        # OpenAI-compatible tool calling (LM Studio 0.3+). We pass the tool
+        # list straight through; LM Studio's OpenAI-compatible server either
+        # surfaces tool_calls on the message or simply returns a normal
+        # completion if the loaded model ignores tool schemas. Callers
+        # detect the latter and fall back to single-shot.
+        if tools:
+            payload["tools"] = tools
+            if tool_choice is not None:
+                payload["tool_choice"] = tool_choice
+        
         # NOTE: Stop sequences were removed because they caused premature truncation
         # with certain models (e.g., Grok 4.1). Models will now generate until max_tokens
         # or natural completion. The json_parser handles any trailing garbage/padding.
@@ -407,11 +430,16 @@ async def _get_embeddings_with_retry(
                 raise
     
     async def test_connection(self) -> bool:
-        """Test connection to LM Studio."""
+        """Test connection to LM Studio (bounded, never blocks startup)."""
         try:
-            models = await self.list_models()
+            # Hard cap the startup probe so a LM Studio process that bound the
+            # port but never responds cannot stall the FastAPI lifespan.
+            models = await asyncio.wait_for(self.list_models(), timeout=5.0)
             logger.info(f"Successfully connected to LM Studio. Found {len(models)} models.")
             return True
+        except asyncio.TimeoutError:
+            logger.warning("LM Studio startup probe timed out after 5s; treating as unavailable.")
+            return False
         except Exception as e:
             logger.error(f"Failed to connect to LM Studio: {e}")
             return False
@@ -440,17 +468,44 @@ async def check_availability(self) -> Dict[str, Any]:
             # First check if server is reachable
             response = await self.client.get(f"{self.base_url}/v1/models", timeout=5.0)
             response.raise_for_status()
-            
+
             # Server is reachable
             result["available"] = True
-            
-            # Get loaded models
-            models = await self.get_loaded_models()
+
+            # Extract models from the /v1/models response as a reliable fallback.
+            # The `lms ps` CLI is preferred (it returns instance IDs), but the CLI
+            # may be missing from PATH or slow/timing out during startup while
+            # nomic is still loading. In either case we must NOT downgrade a
+            # successful /v1/models response to "no models" — that produces a
+            # phantom "LM Studio Offline" state even though embedding calls
+            # are succeeding.
+            http_models: List[str] = []
+            try:
+                data = response.json()
+                for entry in data.get("data", []) or []:
+                    if isinstance(entry, dict):
+                        model_id = entry.get("id")
+                        if isinstance(model_id, str) and model_id:
+                            http_models.append(model_id)
+            except Exception as parse_err:
+                logger.debug(f"Could not parse /v1/models response body: {parse_err}")
+
+            cli_models = await self.get_loaded_models()
+
+            if cli_models:
+                models = cli_models
+                source = "lms ps"
+            else:
+                models = http_models
+                source = "/v1/models"
+
             result["models"] = models
             result["model_count"] = len(models)
             result["has_models"] = len(models) > 0
-            
-            logger.info(f"LM Studio availability check: {len(models)} models loaded")
+
+            logger.debug(
+                f"LM Studio availability check: {len(models)} models loaded (source: {source})"
+            )
             return result
             
         except httpx.ConnectError:
diff --git a/backend/shared/models.py b/backend/shared/models.py
index 556de7f..9c10e22 100644
--- a/backend/shared/models.py
+++ b/backend/shared/models.py
@@ -1,9 +1,11 @@
 """
 Pydantic models for the ASI Aggregator System.
 """
+from dataclasses import dataclass
+from datetime import datetime
 from typing import List, Dict, Optional, Any, Literal
+
 from pydantic import BaseModel, Field
-from datetime import datetime
 
 
 class DocumentChunk(BaseModel):
@@ -464,6 +466,161 @@ class AutonomousResearchStartRequest(BaseModel):
     tier3_enabled: bool = False  # Default OFF — system stops at Tier 2 paper library
 
 
+# ============================================================================
+# LEAN 4 PROOF INTEGRATION MODELS
+# ============================================================================
+
+
+class MathlibLemmaHint(BaseModel):
+    """A locally confirmed Mathlib declaration that may help a proof attempt."""
+    requested_name: str  # the only required field; the others default to "" or 0
+    full_name: str = ""
+    declaration: str = ""
+    file_path: str = ""
+    line_number: int = 0  # NOTE(review): 0 looks like an "unknown" sentinel; confirm whether real values are 1-based
+
+
+class SmtHint(BaseModel):
+    """Optional SMT-derived guidance that can seed Lean proof attempts."""
+    result: Literal["sat", "unsat", "unknown"] = "unknown"  # restricted to these three strings
+    suggested_tactics: List[str] = Field(default_factory=list)  # default_factory gives each instance its own list
+    smtlib: str = ""
+
+
+class ProofCandidate(BaseModel):
+    """A theorem candidate extracted from a brainstorm or paper."""
+    theorem_id: str  # required, together with statement; every other field has a default
+    statement: str
+    formal_sketch: str = ""
+    source_excerpt: str = ""
+    origin_source_id: str = ""
+    relevant_lemmas: List[MathlibLemmaHint] = Field(default_factory=list)  # fresh list per instance
+    smt_hint: Optional[SmtHint] = None  # None when no SMT hint is attached
+
+
+class FailedProofCandidate(BaseModel):
+    """Persisted failed theorem candidate that can be retried later."""
+    source_brainstorm_id: str  # required, together with theorem_id and theorem_statement
+    theorem_id: str
+    theorem_statement: str
+    formal_sketch: str = ""
+    source_excerpt: str = ""
+    error_summary: str = ""
+    suggested_lemma_targets: List[str] = Field(default_factory=list)  # fresh list per instance
+    retry_count: int = 0
+    last_retry_source_id: str = ""
+    resolved_proof_id: Optional[str] = None  # presumably set once a later retry yields a stored proof; confirm against the writer
+    created_at: datetime = Field(default_factory=datetime.now)  # datetime.now() with no tz: naive local time, evaluated per instance
+    updated_at: datetime = Field(default_factory=datetime.now)  # set at construction only; nothing in this model refreshes it
+
+
+class ProofRoleConfigSnapshot(BaseModel):
+    """Persisted model/runtime config for proof-related agents."""
+    provider: Literal["lm_studio", "openrouter"] = "lm_studio"  # restricted to these two strings
+    model_id: str = ""
+    openrouter_provider: Optional[str] = None
+    lm_studio_fallback_id: Optional[str] = None
+    context_window: int = 131072  # 128 * 1024; presumably a token count (confirm)
+    max_output_tokens: int = 25000
+
+
+class ProofRuntimeConfigSnapshot(BaseModel):
+    """Persisted proof runtime config used for manual proof checks."""
+    brainstorm: ProofRoleConfigSnapshot  # all three role configs are required; none has a default
+    paper: ProofRoleConfigSnapshot
+    validator: ProofRoleConfigSnapshot
+
+
+class ProofDependency(BaseModel):
+    """One dependency edge for a verified proof."""
+    kind: Literal["mathlib", "moto"]  # required; restricted to these two strings
+    name: str  # required
+    source_ref: str = ""
+
+
+@dataclass  # a stdlib dataclass, not a Pydantic BaseModel: field values are not validated
+class SmtResult:
+    """Result of one SMT solver check."""
+    success: bool  # the only field without a default
+    result: str = ""  # free-form str here, whereas SmtHint.result is a three-value Literal
+    stdout: str = ""
+    stderr: str = ""
+
+
+class ProofAttemptFeedback(BaseModel):
+    """Lean 4 attempt feedback captured for one theorem attempt."""
+    attempt: int  # required, together with theorem_id; NOTE(review): confirm whether numbering is 0- or 1-based
+    theorem_id: str
+    reasoning: str = ""
+    lean_code: str = ""
+    error_output: str = ""
+    goal_states: str = ""
+    strategy: Literal["full_script", "tactic_script"] = "full_script"  # restricted to these two strings
+    tactic_trace: List[str] = Field(default_factory=list)  # fresh list per instance
+    success: bool = False
+
+
+class ProofRecord(BaseModel):
+    """Stored proof metadata for the proof library and prompt injection."""
+    proof_id: str  # required; so are theorem_statement, source_type, source_id and lean_code
+    theorem_id: str = ""
+    theorem_statement: str
+    theorem_name: str = ""
+    formal_sketch: str = ""
+    source_type: Literal["brainstorm", "paper"]  # restricted to these two strings
+    source_id: str
+    source_title: str = ""
+    solver: str = "Lean 4"
+    lean_code: str
+    novel: bool = False
+    novelty_reasoning: str = ""
+    verification_notes: str = ""
+    attempt_count: int = 0  # NOTE(review): stored separately from len(attempts); nothing in this model keeps the two in sync
+    attempts: List[ProofAttemptFeedback] = Field(default_factory=list)  # fresh list per instance (same for the two lists below)
+    dependencies: List[ProofDependency] = Field(default_factory=list)
+    solver_hints: List[str] = Field(default_factory=list)
+    created_at: datetime = Field(default_factory=datetime.now)  # datetime.now() with no tz: naive local time, evaluated per instance
+
+
+class ProofAttemptResult(BaseModel):
+    """Outcome of one theorem proof-attempt loop."""
+    theorem_id: str  # required, together with theorem_statement
+    theorem_statement: str
+    lean_code: str = ""
+    success: bool = False
+    novel: bool = False
+    attempts_used: int = 0
+    proof_id: Optional[str] = None  # presumably set only when the proof was stored; confirm against the producer
+    error_summary: str = ""
+
+
+class ProofStageResult(BaseModel):
+    """Aggregate outcome of one proof-verification stage run."""
+    source_type: Literal["brainstorm", "paper"]  # required, together with source_id; restricted to these two strings
+    source_id: str
+    total_candidates: int = 0  # the three counters default to 0 and are not derived from `results` by this model
+    verified_count: int = 0
+    novel_count: int = 0
+    results: List[ProofAttemptResult] = Field(default_factory=list)  # fresh list per instance
+
+
+class ProofCheckRequest(BaseModel):
+    """Request body for manually triggering a proof check."""
+    source_type: Literal["brainstorm", "paper"]  # both fields are required; source_type is restricted to these two strings
+    source_id: str
+
+
+class ProofSettingsUpdateRequest(BaseModel):
+    """Request body for updating runtime Lean 4 proof settings."""
+    enabled: bool  # the only required field
+    timeout: int = Field(default=120, ge=10, le=3600)  # validated to 10..3600 inclusive; presumably seconds (confirm)
+    lean4_lsp_enabled: Optional[bool] = None  # Optional fields default to None; presumably None means "leave unchanged" (confirm in the route handler)
+    lean4_lsp_idle_timeout: Optional[int] = Field(default=None, ge=60, le=7200)  # when provided, validated to 60..7200 inclusive
+    smt_enabled: Optional[bool] = None
+    z3_path: Optional[str] = None
+    smt_timeout: Optional[int] = Field(default=None, ge=1, le=600)  # when provided, validated to 1..600 inclusive
+
+
 # ============================================================================
 # TIER 3: FINAL ANSWER MODELS (Part 3 - Final Answer Generation)
 # ============================================================================
diff --git a/backend/shared/openrouter_client.py b/backend/shared/openrouter_client.py
index 3ba64b6..50b9c39 100644
--- a/backend/shared/openrouter_client.py
+++ b/backend/shared/openrouter_client.py
@@ -142,12 +142,16 @@ def _get_headers(self) -> Dict[str, str]:
             "X-Title": self.APP_TITLE
         }
     
-    async def list_models(self, free_only: bool = False) -> List[Dict[str, Any]]:
+    async def list_models(self, free_only: bool = False, raise_on_error: bool = False) -> List[Dict[str, Any]]:
         """
         List available models from OpenRouter.
         
         Args:
             free_only: If True, only return models with $0 pricing (both prompt and completion)
+            raise_on_error: If True, re-raise exceptions instead of swallowing them and
+                returning ``[]``. Callers that need to distinguish an invalid API key from
+                a transient network/OpenRouter hiccup (e.g. the set-api-key validation
+                endpoint) should pass ``True`` so they can surface an accurate error.
         
         Returns:
             List of model objects, each containing:
@@ -191,112 +195,130 @@ async def list_models(self, free_only: bool = False) -> List[Dict[str, Any]]:
             return sorted(models, key=lambda m: m.get("name", m.get("id", "")))
         except Exception as e:
             logger.error(f"Failed to list OpenRouter models: {e}")
+            if raise_on_error:
+                raise
             return []
     
-    async def get_model_providers(self, model_id: str) -> List[str]:
+    async def get_model_endpoints(self, model_id: str) -> List[Dict[str, Any]]:
         """
-        Get available providers/endpoints for a specific model using OpenRouter's
-        dedicated endpoints API.
-        
+        Get available endpoint metadata for a specific OpenRouter model.
+
         Args:
             model_id: The OpenRouter model identifier (e.g., "anthropic/claude-3.5-sonnet")
-            
+
         Returns:
-            List of provider names that offer this model.
-            Returns empty list if model not found or no providers available.
-            
-        Note:
-            Uses OpenRouter's /api/v1/models/:author/:slug/endpoints endpoint
-            to get the actual list of available providers for a model.
+            List of available endpoint dicts for the model. Each endpoint includes
+            provider_name, context_length, max_completion_tokens, and
+            max_prompt_tokens when available.
         """
         try:
             # Model ID format is "author/slug" (e.g., "anthropic/claude-3.5-sonnet")
             if "/" not in model_id:
                 logger.warning(f"Invalid model ID format (expected 'author/slug'): {model_id}")
                 return []
-            
+
             parts = model_id.split("/", 1)
             if len(parts) != 2:
                 logger.warning(f"Could not parse model ID: {model_id}")
                 return []
-            
+
             author, slug = parts
-            
-            # Call the dedicated endpoints API
+
             url = f"{self.BASE_URL}/models/{author}/{slug}/endpoints"
-            logger.debug(f"Fetching providers from: {url}")
-            
+            logger.debug(f"Fetching endpoints from: {url}")
+
             response = await self.client.get(
                 url,
                 headers=self._get_headers()
             )
-            
+
             if response.status_code == 404:
                 logger.warning(f"Model {model_id} not found in OpenRouter")
                 return []
-            
+
             response.raise_for_status()
             data = response.json()
-            
-            # Cache the response but don't spam logs with the full data
+
             logger.debug(f"OpenRouter endpoints API response for {model_id} (cached)")
-            
-            providers = []
-            
-            # The response should contain endpoint data with provider info
-            # Expected structure: {"data": {"endpoints": [{"provider_name": "...", ...}, ...]}}
-            # or similar variations
-            
+
+            cleaned_endpoints: List[Dict[str, Any]] = []
+
             if isinstance(data, dict):
-                # Check for 'data' wrapper
                 endpoints_data = data.get("data", data)
-                
-                # Check for 'endpoints' array
-                endpoints = None
+
+                raw_endpoints = None
                 if isinstance(endpoints_data, dict):
-                    endpoints = endpoints_data.get("endpoints", [])
+                    raw_endpoints = endpoints_data.get("endpoints")
+                    if raw_endpoints is None and any(
+                        key in endpoints_data for key in ("provider_name", "provider", "name", "id")
+                    ):
+                        raw_endpoints = [endpoints_data]
                 elif isinstance(endpoints_data, list):
-                    endpoints = endpoints_data
-                
-                if endpoints and isinstance(endpoints, list):
-                    for endpoint in endpoints:
-                        if isinstance(endpoint, dict):
-                            # Check if provider is available (status == 0 means available)
-                            status = endpoint.get("status", -1)
-                            if status < 0:
-                                # Skip unavailable providers
-                                provider_name = endpoint.get("provider_name", "unknown")
-                                logger.debug(f"Filtering out unavailable provider {provider_name} (status={status})")
-                                continue
-                            
-                            # Try various field names for provider
-                            provider = (
-                                endpoint.get("provider_name") or
-                                endpoint.get("provider") or
-                                endpoint.get("name") or
-                                endpoint.get("id")
+                    raw_endpoints = endpoints_data
+
+                if isinstance(raw_endpoints, list):
+                    for endpoint in raw_endpoints:
+                        if not isinstance(endpoint, dict):
+                            continue
+
+                        status = endpoint.get("status", -1)
+                        if status is None or status < 0:
+                            provider_name = endpoint.get("provider_name", "unknown")
+                            logger.debug(
+                                f"Filtering out unavailable provider {provider_name} (status={status})"
                             )
-                            if provider and isinstance(provider, str):
-                                providers.append(provider)
-                
-                # Also check top-level for provider info
-                if not providers:
-                    if "provider_name" in endpoints_data:
-                        providers.append(endpoints_data["provider_name"])
-                    elif "provider" in endpoints_data:
-                        providers.append(endpoints_data["provider"])
-            
-            # Deduplicate and sort (caching silently works behind the scenes)
-            unique_providers = sorted(list(set(providers)))
-            logger.debug(f"Available providers for {model_id}: {unique_providers}")
-            return unique_providers
-            
+                            continue
+
+                        provider_name = (
+                            endpoint.get("provider_name") or
+                            endpoint.get("provider") or
+                            endpoint.get("name") or
+                            endpoint.get("id")
+                        )
+
+                        cleaned_endpoints.append({
+                            "provider_name": provider_name,
+                            "context_length": endpoint.get("context_length"),
+                            "max_completion_tokens": endpoint.get("max_completion_tokens"),
+                            "max_prompt_tokens": endpoint.get("max_prompt_tokens"),
+                            "supported_parameters": endpoint.get("supported_parameters", []),
+                            "status": status,
+                            "tag": endpoint.get("tag"),
+                            "name": endpoint.get("name"),
+                            "quantization": endpoint.get("quantization"),
+                        })
+
+            logger.debug(f"Available endpoints for {model_id}: {len(cleaned_endpoints)}")
+            return cleaned_endpoints
+
         except httpx.HTTPStatusError as e:
-            logger.error(f"HTTP error fetching providers for {model_id}: {e.response.status_code}")
+            logger.error(f"HTTP error fetching endpoints for {model_id}: {e.response.status_code}")
             return []
         except Exception as e:
-            logger.error(f"Failed to get providers for model {model_id}: {e}")
+            logger.error(f"Failed to get endpoints for model {model_id}: {e}")
             return []
+
+    async def get_model_providers(self, model_id: str) -> List[str]:
+        """
+        List the distinct provider names serving a model on OpenRouter.
+
+        Only endpoints whose ``provider_name`` is a non-empty string are counted.
+
+        Args:
+            model_id: The OpenRouter model identifier (e.g., "anthropic/claude-3.5-sonnet")
+
+        Returns:
+            Sorted, de-duplicated provider names; an empty list when
+            ``get_model_endpoints`` yields no usable endpoints.
+        """
+        names = set()
+        for entry in await self.get_model_endpoints(model_id):
+            candidate = entry.get("provider_name")
+            if candidate and isinstance(candidate, str):
+                names.add(candidate)
+        unique_providers = sorted(names)
+        logger.debug(f"Available providers for {model_id}: {unique_providers}")
+        return unique_providers
     
     async def generate_completion(
         self,
@@ -305,7 +327,9 @@ async def generate_completion(
         temperature: float = 0.0,
         max_tokens: Optional[int] = None,
         response_format: Optional[Dict[str, str]] = None,
-        provider: Optional[str] = None
+        provider: Optional[str] = None,
+        tools: Optional[List[Dict[str, Any]]] = None,
+        tool_choice: Optional[Any] = None,
     ) -> Dict[str, Any]:
         """
         Generate a completion using OpenRouter API with validation and retry.
@@ -317,6 +341,9 @@ async def generate_completion(
             max_tokens: Maximum tokens to generate
             response_format: Optional response format constraints
             provider: Optional specific provider to use (None lets OpenRouter choose)
+            tools: Optional OpenAI-compatible tool schemas the model may call.
+            tool_choice: Optional tool-choice directive (e.g. "auto", "none",
+                or ``{"type": "function", "function": {"name": "..."}}``).
             
         Returns:
             API response dict
@@ -330,7 +357,14 @@ async def generate_completion(
         # ACQUIRE THIS MODEL'S SEMAPHORE to prevent concurrent requests
         async with model_semaphore:
             return await self._execute_completion_request(
-                model, messages, temperature, max_tokens, response_format, provider
+                model,
+                messages,
+                temperature,
+                max_tokens,
+                response_format,
+                provider,
+                tools=tools,
+                tool_choice=tool_choice,
             )
     
     def _is_reasoning_model_without_temperature(self, model: str) -> bool:
@@ -365,7 +399,9 @@ async def _execute_completion_request(
         temperature: float,
         max_tokens: Optional[int],
         response_format: Optional[Dict[str, str]],
-        provider: Optional[str] = None
+        provider: Optional[str] = None,
+        tools: Optional[List[Dict[str, Any]]] = None,
+        tool_choice: Optional[Any] = None,
     ) -> Dict[str, Any]:
         """Execute the actual completion request."""
         # Check if this model is currently rate-limited (for free models)
@@ -406,6 +442,15 @@ async def _execute_completion_request(
         if response_format:
             payload["response_format"] = response_format
         
+        # OpenAI-compatible tool calling: pass tools + tool_choice straight
+        # through to OpenRouter. Providers that do not support tools tend to
+        # ignore the field, in which case the caller will see a response with
+        # no `tool_calls` and the single-shot fallback path applies.
+        if tools:
+            payload["tools"] = tools
+            if tool_choice is not None:
+                payload["tool_choice"] = tool_choice
+        
         # Add provider routing if specified
         if provider:
             payload["provider"] = {"order": [provider]}
diff --git a/backend/shared/secret_store.py b/backend/shared/secret_store.py
index c80181c..ab99722 100644
--- a/backend/shared/secret_store.py
+++ b/backend/shared/secret_store.py
@@ -10,9 +10,11 @@
 import keyring
 from keyring.errors import KeyringError, PasswordDeleteError
 
+from backend.shared.config import system_config
+
 logger = logging.getLogger(__name__)
 
-_SERVICE_NAME = "MOTO-Autonomous-ASI"
+_DEFAULT_SERVICE_NAME = "MOTO-Autonomous-ASI"
 _OPENROUTER_KEY = "openrouter_api_key"
 _WOLFRAM_KEY = "wolfram_alpha_api_key"
 
@@ -21,6 +23,14 @@ class SecretStoreError(RuntimeError):
     """Raised when the secure secret store is unavailable or fails."""
 
 
+def _get_service_name() -> str:
+    """Build the keyring service name, suffixed with the configured namespace if set."""
+    suffix = system_config.secret_namespace
+    if not suffix:
+        return _DEFAULT_SERVICE_NAME
+    return f"{_DEFAULT_SERVICE_NAME}::{suffix}"
+
+
 def _normalize_secret(value: Optional[str]) -> Optional[str]:
     """Trim whitespace and collapse empty values to None."""
     if value is None:
@@ -33,7 +43,7 @@ def _normalize_secret(value: Optional[str]) -> Optional[str]:
 def _get_secret(secret_name: str) -> Optional[str]:
     """Load a secret from the OS-backed keyring."""
     try:
-        return _normalize_secret(keyring.get_password(_SERVICE_NAME, secret_name))
+        return _normalize_secret(keyring.get_password(_get_service_name(), secret_name))
     except KeyringError as exc:
         raise SecretStoreError(
             "Secure credential storage is unavailable. Please ensure the OS keyring is accessible."
@@ -47,7 +57,7 @@ def _set_secret(secret_name: str, secret_value: str) -> None:
         raise ValueError("Secret value is required")
 
     try:
-        keyring.set_password(_SERVICE_NAME, secret_name, normalized)
+        keyring.set_password(_get_service_name(), secret_name, normalized)
     except KeyringError as exc:
         raise SecretStoreError(
             "Failed to persist the credential in the OS keyring."
@@ -57,7 +67,7 @@ def _set_secret(secret_name: str, secret_value: str) -> None:
 def _delete_secret(secret_name: str) -> None:
     """Delete a persisted secret if one exists."""
     try:
-        keyring.delete_password(_SERVICE_NAME, secret_name)
+        keyring.delete_password(_get_service_name(), secret_name)
     except PasswordDeleteError:
         return
     except KeyringError as exc:
@@ -66,6 +76,16 @@ def _delete_secret(secret_name: str) -> None:
         ) from exc
 
 
+def get_active_service_name() -> str:
+    """Return the OS-keyring service name this process is currently using.
+
+    Public wrapper around ``_get_service_name()``. Exposed for startup
+    diagnostics so operators can verify the keyring namespace has not drifted
+    between launches (which would make saved API keys look like they "disappeared").
+    """
+    return _get_service_name()
+
+
 def load_openrouter_api_key() -> Optional[str]:
     """Load the persisted global OpenRouter API key."""
     return _get_secret(_OPENROUTER_KEY)
diff --git a/backend/shared/smt_client.py b/backend/shared/smt_client.py
new file mode 100644
index 0000000..e056829
--- /dev/null
+++ b/backend/shared/smt_client.py
@@ -0,0 +1,133 @@
+"""
+Optional Z3 / SMT client wrappers.
+"""
+from __future__ import annotations
+
+import asyncio
+import logging
+import shutil
+from pathlib import Path
+from typing import Optional
+
+from backend.shared.config import system_config
+from backend.shared.models import SmtResult
+
+logger = logging.getLogger(__name__)
+
+
+class SmtClient:
+    """Thin async wrapper around an external Z3 binary.
+
+    Spawn failures and timeouts are reported as ``(-1, "", message)`` from
+    ``_run_process`` instead of raising, so callers always get a result.
+    """
+
+    def __init__(self, z3_path: str, timeout: int) -> None:
+        # Blank/None paths collapse to ""; the timeout is clamped to >= 1 second.
+        self.z3_path = str(z3_path or "").strip()
+        self.timeout = max(int(timeout or 0), 1)
+
+    def _resolve_executable(self) -> str:
+        """Return the configured path if it exists, else a PATH hit, else the raw name."""
+        if self.z3_path:
+            candidate = Path(self.z3_path).resolve()
+            if candidate.exists():
+                return str(candidate)
+
+        for name in ("z3", "z3.exe"):
+            resolved = shutil.which(name)
+            if resolved:
+                return resolved
+        return self.z3_path or "z3"
+
+    async def _run_process(
+        self, args: list[str], *, stdin_text: str = "", timeout: Optional[int] = None
+    ) -> tuple[int, str, str]:
+        """Run ``args``, feed ``stdin_text`` on stdin, return (returncode, stdout, stderr)."""
+        pipe = asyncio.subprocess.PIPE
+        try:
+            process = await asyncio.create_subprocess_exec(*args, stdin=pipe, stdout=pipe, stderr=pipe)
+        except OSError as exc:
+            # Missing or non-executable binary: report it like any other failure.
+            return (-1, "", f"Failed to start Z3 process: {exc}")
+
+        effective_timeout = max(int(timeout or self.timeout), 1)
+        try:
+            stdout_bytes, stderr_bytes = await asyncio.wait_for(
+                process.communicate((stdin_text or "").encode("utf-8")),
+                timeout=effective_timeout,
+            )
+        except asyncio.TimeoutError:
+            try:
+                process.kill()
+            except ProcessLookupError:
+                pass  # The process exited on its own between the timeout and the kill.
+            await process.communicate()  # Reap the child so it does not linger.
+            return (-1, "", f"Z3 process timed out after {effective_timeout} seconds.")
+
+        return (
+            process.returncode,
+            stdout_bytes.decode("utf-8", errors="replace"),
+            stderr_bytes.decode("utf-8", errors="replace"),
+        )
+
+    async def get_version(self) -> str:
+        """Return the Z3 version string; on a non-zero exit return the error text instead."""
+        returncode, stdout, stderr = await self._run_process(
+            [self._resolve_executable(), "-version"],
+            timeout=15,
+        )
+        if returncode != 0:
+            return (stderr or stdout).strip()
+        return (stdout or stderr).strip()
+
+    async def check_smt2(self, smtlib: str, timeout: Optional[int] = None) -> SmtResult:
+        """Run an SMT-LIB payload through Z3 using stdin.
+
+        ``result`` is the first non-blank stdout line when it is sat/unsat/unknown,
+        otherwise "error"; ``success`` additionally requires a zero exit code.
+        """
+        if not system_config.smt_enabled:
+            return SmtResult(success=False, result="error", stderr="SMT support is disabled in system configuration.")
+
+        payload = (smtlib or "").strip()
+        if not payload:
+            return SmtResult(success=False, result="error", stderr="No SMT-LIB payload was provided.")
+
+        returncode, stdout, stderr = await self._run_process(
+            [self._resolve_executable(), "-smt2", "-in"], stdin_text=payload + "\n", timeout=timeout
+        )
+        first_line = next((line.strip().lower() for line in stdout.splitlines() if line.strip()), "")
+        result = first_line if first_line in {"sat", "unsat", "unknown"} else "error"
+        success = returncode == 0 and result in {"sat", "unsat", "unknown"}
+        return SmtResult(success=success, result=result, stdout=stdout.strip(), stderr=stderr.strip())
+
+
+_smt_client: Optional[SmtClient] = None
+
+
+def initialize_smt_client(z3_path: Optional[str] = None, timeout: Optional[int] = None) -> SmtClient:
+    """Build a fresh SmtClient, install it as the module singleton, and return it.
+
+    Falsy arguments fall back to ``system_config.z3_path`` / ``system_config.smt_timeout``.
+    """
+    global _smt_client
+    _smt_client = SmtClient(z3_path or system_config.z3_path, timeout or system_config.smt_timeout)
+    return _smt_client
+
+
+def get_smt_client() -> SmtClient:
+    """Return the module-level SMT client, lazily built from ``system_config`` on first use."""
+    global _smt_client
+    if _smt_client is not None:
+        return _smt_client
+    # No client cached yet (or it was reset): build one from the configured path and timeout.
+    z3_path, timeout = system_config.z3_path, system_config.smt_timeout
+    _smt_client = SmtClient(z3_path, timeout)
+    return _smt_client
+
+
+def clear_smt_client() -> None:
+    """Reset the singleton SMT client so the next ``get_smt_client()`` call rebuilds it."""
+    global _smt_client
+    _smt_client = None
diff --git a/docker/entrypoint.sh b/docker/entrypoint.sh
new file mode 100644
index 0000000..3816609
--- /dev/null
+++ b/docker/entrypoint.sh
@@ -0,0 +1,20 @@
+#!/bin/sh
+# Container entrypoint: apply default environment values, create the data/log
+# directories, then run the supplied command or fall back to the backend API.
+set -eu
+
+: "${MOTO_GENERIC_MODE:=true}"
+: "${HOST:=0.0.0.0}"
+: "${PORT:=8000}"
+: "${MOTO_DATA_ROOT:=/app/backend/data}"
+export MOTO_GENERIC_MODE HOST PORT MOTO_DATA_ROOT
+
+mkdir -p "$MOTO_DATA_ROOT"
+[ -z "${MOTO_LOG_ROOT:-}" ] || mkdir -p "$MOTO_LOG_ROOT"
+
+# `backend/api/main.py` remains the source of truth for hosted env validation.
+if [ "$#" -eq 0 ]; then
+    exec python -m backend.api.main
+fi
+
+exec "$@"
diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index d914400..4efcf03 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.6",
+  "version": "1.0.7",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "asi-aggregator-frontend",
-      "version": "1.0.6",
+      "version": "1.0.7",
       "license": "MIT",
       "dependencies": {
         "dompurify": "^3.2.4",
diff --git a/frontend/package.json b/frontend/package.json
index 3cdeaf1..90b3c08 100644
--- a/frontend/package.json
+++ b/frontend/package.json
@@ -1,6 +1,6 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.6",
+  "version": "1.0.7",
   "description": "Frontend UI for MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "author": "Intrafere LLC",
   "license": "MIT",
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index 9df0bde..e9a22f6 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -15,7 +15,8 @@ import {
   AutonomousResearchSettings,
   AutonomousResearchLogs,
   FinalAnswerView,
-  FinalAnswerLibrary
+  FinalAnswerLibrary,
+  MathematicalProofs
 } from './components/autonomous';
 import WorkflowPanel from './components/WorkflowPanel';
 import BoostControlModal from './components/BoostControlModal';
@@ -23,6 +24,7 @@ import StartupProviderSetupModal from './components/StartupProviderSetupModal';
 import OpenRouterApiKeyModal from './components/OpenRouterApiKeyModal';
 import OpenRouterPrivacyWarningModal from './components/OpenRouterPrivacyWarningModal';
 import CritiqueNotificationStack from './components/CritiqueNotificationStack';
+import ProofNotificationStack from './components/autonomous/ProofNotificationStack';
 import CreditExhaustionNotificationStack from './components/CreditExhaustionNotificationStack';
 import HungConnectionNotificationStack from './components/HungConnectionNotificationStack';
 import PaperCritiqueModal from './components/PaperCritiqueModal';
@@ -44,6 +46,16 @@ const AUTONOMOUS_TAB_STORAGE_KEY = 'autonomousActiveTab';
 const MANUAL_TAB_STORAGE_KEY = 'manualActiveTab';
 const LEGACY_SINGLE_PAPER_WRITER_STORAGE_KEY = 'singlePaperWriterExpanded';
 const EMBEDDING_MODEL_HINTS = ['embed', 'embedding', 'nomic', 'bge', 'e5', 'gte'];
+const AUTONOMOUS_ROLE_PREFIXES = ['validator', 'high_context', 'high_param', 'critique_submitter']; // key prefixes of the per-role autonomous settings
+const DEFAULT_CAPABILITIES = Object.freeze({ // initial state, and the fallback when the features request fails
+  genericMode: false,
+  lmStudioEnabled: true,
+  pdfDownloadAvailable: true,
+  version: '',
+  buildCommit: '',
+  updateChannel: 'main',
+  apiContractVersion: '',
+});
 
 function normalizeLoadedLmStudioModelId(modelId = '') {
   return String(modelId).replace(/:\d+$/, '');
@@ -66,6 +78,80 @@ function getUsableLoadedLmStudioChatModelId(loadedModels = []) {
   return '';
 }
 
+function normalizeFeaturesPayload(payload = {}) {
+  // `isNotFalse`: these flags stay enabled unless the backend sends an explicit `false`.
+  const isNotFalse = (flag) => flag !== false;
+  const text = (value, fallback = '') => value || fallback;
+  const genericMode = Boolean(payload.generic_mode);
+  const lmStudioEnabled = isNotFalse(payload.lm_studio_enabled);
+  const pdfDownloadAvailable = isNotFalse(payload.pdf_download_available);
+  const [version, buildCommit] = [text(payload.version), text(payload.build_commit)];
+  const [updateChannel, apiContractVersion] = [text(payload.update_channel, 'main'), text(payload.api_contract_version)];
+  return { genericMode, lmStudioEnabled, pdfDownloadAvailable, version, buildCommit, updateChannel, apiContractVersion };
+}
+
+function normalizeRuntimeProvider(provider, lmStudioEnabled) {
+  return !lmStudioEnabled ? 'openrouter' : (provider || 'lm_studio'); // OpenRouter is forced when LM Studio is off
+}
+
+function normalizeRuntimeModelConfig(config = {}, lmStudioEnabled) {
+  const provider = normalizeRuntimeProvider(config.provider, lmStudioEnabled);
+  const lmStudioFallbackId = lmStudioEnabled ? (config.lmStudioFallbackId || null) : null;
+  // With LM Studio off, a slot that was not already on OpenRouter loses its model selection.
+  if (!lmStudioEnabled && config.provider !== 'openrouter') {
+    return { ...config, provider, modelId: '', openrouterProvider: null, lmStudioFallbackId };
+  }
+
+  const modelId = config.modelId || '';
+  const openrouterProvider = config.openrouterProvider || null;
+  return { ...config, provider, modelId, openrouterProvider, lmStudioFallbackId };
+}
+
+function normalizeAggregatorConfigForCapabilities(config, lmStudioEnabled) {
+  const toRuntimeConfig = (entry) => normalizeRuntimeModelConfig(entry, lmStudioEnabled);
+  const next = {
+    ...config,
+    submitterConfigs: (config.submitterConfigs || []).map(toRuntimeConfig),
+    validatorProvider: normalizeRuntimeProvider(config.validatorProvider, lmStudioEnabled),
+    validatorModel: config.validatorModel || '',
+    validatorOpenrouterProvider: config.validatorOpenrouterProvider || null,
+    validatorLmStudioFallback: lmStudioEnabled ? (config.validatorLmStudioFallback || null) : null,
+  };
+  // With LM Studio off, a validator that was not already on OpenRouter loses its selection.
+  if (!lmStudioEnabled && config.validatorProvider !== 'openrouter') {
+    next.validatorModel = '';
+    next.validatorOpenrouterProvider = null;
+  }
+  return next;
+}
+
+function normalizeAutonomousConfigForCapabilities(config, lmStudioEnabled) {
+  // Normalize the submitter slots and each role's provider/model keys for the given LM Studio availability.
+  // NOTE(review): submitter entries are normalized with camelCase keys (modelId, ...);
+  // confirm autonomous submitter configs really use that shape and not snake_case.
+  const toRuntimeConfig = (entry) => normalizeRuntimeModelConfig(entry, lmStudioEnabled);
+  const nextConfig = {
+    ...config,
+    submitter_configs: (config.submitter_configs || []).map(toRuntimeConfig),
+  };
+
+  for (const rolePrefix of AUTONOMOUS_ROLE_PREFIXES) {
+    const providerKey = `${rolePrefix}_provider`;
+    const modelKey = `${rolePrefix}_model`;
+    const openRouterProviderKey = `${rolePrefix}_openrouter_provider`;
+    const fallbackKey = `${rolePrefix}_lm_studio_fallback`;
+    // Decide on the reset before the provider key is overwritten below.
+    const dropSelection = !lmStudioEnabled && nextConfig[providerKey] !== 'openrouter';
+
+    nextConfig[providerKey] = normalizeRuntimeProvider(nextConfig[providerKey], lmStudioEnabled);
+    nextConfig[modelKey] = dropSelection ? '' : (nextConfig[modelKey] || '');
+    nextConfig[openRouterProviderKey] = dropSelection ? null : (nextConfig[openRouterProviderKey] || null);
+    nextConfig[fallbackKey] = lmStudioEnabled ? (nextConfig[fallbackKey] || null) : null;
+  }
+
+  return nextConfig;
+}
+
 function App() {
   const [appMode, setAppMode] = useState(() => {
     const savedMode = localStorage.getItem(APP_MODE_STORAGE_KEY);
@@ -84,12 +170,8 @@ function App() {
       return 'autonomous';
     }
   });
-  const [autonomousActiveTab, setAutonomousActiveTab] = useState(
-    () => localStorage.getItem(AUTONOMOUS_TAB_STORAGE_KEY) || 'auto-interface'
-  );
-  const [manualActiveTab, setManualActiveTab] = useState(
-    () => localStorage.getItem(MANUAL_TAB_STORAGE_KEY) || 'aggregator-interface'
-  );
+  const [autonomousActiveTab, setAutonomousActiveTab] = useState('auto-interface');
+  const [manualActiveTab, setManualActiveTab] = useState('aggregator-interface');
   const activeTab = appMode === 'manual' ? manualActiveTab : autonomousActiveTab;
   const shimmerAccentsEnabled = (() => {
     const saved = localStorage.getItem('banner_shimmer_enabled');
@@ -101,6 +183,7 @@ function App() {
   
   // Boost modal state
   const [showBoostModal, setShowBoostModal] = useState(false);
+  const [showApiBoostTooltip, setShowApiBoostTooltip] = useState(false);
   
   // OpenRouter API Key modal state
   const [showOpenRouterKeyModal, setShowOpenRouterKeyModal] = useState(false);
@@ -117,7 +200,13 @@ function App() {
     usable_chat_model_id: '',
     has_usable_chat_model: false,
   });
-  const [hasOpenRouterKey, setHasOpenRouterKey] = useState(false);
+  // Tri-state: null = unknown (backend unreachable / cold-start in progress),
+  // true = key stored in backend, false = confirmed no key. The UI treats
+  // "unknown" neutrally (does NOT open the startup setup modal, does NOT flash
+  // a red "Set OpenRouter Key" chip) so that a slow-to-boot backend can never
+  // make a stored key look like it "disappeared".
+  const [hasOpenRouterKey, setHasOpenRouterKey] = useState(null);
+  const [capabilities, setCapabilities] = useState(DEFAULT_CAPABILITIES);
   
   // Track if any workflow is running (for WorkflowPanel visibility)
   const [anyWorkflowRunning, setAnyWorkflowRunning] = useState(false);
@@ -128,6 +217,10 @@ function App() {
     return savedState === 'true';
   });
 
+  // Update notice banner state (dismissible per session, re-appears on restart)
+  const [updateNotice, setUpdateNotice] = useState(null);
+  const [updateNoticeDismissed, setUpdateNoticeDismissed] = useState(false);
+
   useEffect(() => {
     localStorage.setItem(APP_MODE_STORAGE_KEY, appMode);
     localStorage.setItem(
@@ -256,6 +349,10 @@ function App() {
   const [critiqueNotifications, setCritiqueNotifications] = useState([]);
   const [selectedCritiquePaper, setSelectedCritiquePaper] = useState(null);
   const [showCritiqueModal, setShowCritiqueModal] = useState(false);
+  const [proofNotifications, setProofNotifications] = useState([]);
+  const [selectedProofId, setSelectedProofId] = useState(null);
+  const [proofRefreshToken, setProofRefreshToken] = useState(0);
+  const [latestProofDependencyEvent, setLatestProofDependencyEvent] = useState(null);
 
   // Credit exhaustion notification state (persistent until dismissed)
   const [creditExhaustionNotifications, setCreditExhaustionNotifications] = useState([]);
@@ -321,49 +418,85 @@ function App() {
   }, [autonomousConfig]);
 
   const syncProviderAvailability = useCallback(async () => {
+    let nextCapabilities = DEFAULT_CAPABILITIES;
+    try {
+      const featuresPayload = await api.getFeatures();
+      nextCapabilities = normalizeFeaturesPayload(featuresPayload);
+    } catch (err) {
+      console.error('Failed to fetch runtime feature flags:', err);
+    }
+
+    setCapabilities(nextCapabilities);
+
     let lmResult = {
       available: false,
       has_models: false,
       model_count: 0,
       models: [],
-      error: null,
+      error: nextCapabilities.lmStudioEnabled
+        ? null
+        : (nextCapabilities.genericMode
+            ? 'LM Studio is intentionally disabled in this hosted deployment.'
+            : null),
+      generic_mode: nextCapabilities.genericMode,
     };
 
-    try {
-      lmResult = await openRouterAPI.checkLMStudioAvailability();
-    } catch (err) {
-      console.error('Failed to check LM Studio availability:', err);
-      lmResult = {
-        available: false,
-        has_models: false,
-        model_count: 0,
-        models: [],
-        error: err.message || 'Failed to check LM Studio availability.',
-      };
+    if (nextCapabilities.lmStudioEnabled) {
+      try {
+        lmResult = await openRouterAPI.checkLMStudioAvailability();
+      } catch (err) {
+        console.error('Failed to check LM Studio availability:', err);
+        lmResult = {
+          available: false,
+          has_models: false,
+          model_count: 0,
+          models: [],
+          error: err.message || 'Failed to check LM Studio availability.',
+          generic_mode: nextCapabilities.genericMode,
+        };
+      }
     }
 
     const usableLmStudioChatModelId = getUsableLoadedLmStudioChatModelId(lmResult.models || []);
     const hasUsableLmStudioChatModel = Boolean(usableLmStudioChatModelId);
-    const lmAvailable = Boolean(lmResult.available && lmResult.has_models);
-    setLmStudioStatus({
+    const nextLmStudioStatus = {
       ...lmResult,
       usable_chat_model_id: usableLmStudioChatModelId,
       has_usable_chat_model: hasUsableLmStudioChatModel,
-    });
+    };
+    const lmAvailable = nextCapabilities.lmStudioEnabled && Boolean(lmResult.available && lmResult.has_models);
+    setLmStudioStatus(nextLmStudioStatus);
     setLmStudioAvailable(lmAvailable);
 
     let keyStatus = { has_key: false };
-    try {
-      keyStatus = await openRouterAPI.getApiKeyStatus();
-    } catch (err) {
-      console.error('Failed to check OpenRouter key status:', err);
+    let keyStatusOk = false;
+    // Retry aggressively (up to ~20s) to cover backend cold-start. The
+    // `/api/openrouter/api-key-status` endpoint is trivial (memory lookup),
+    // so any failure here means the backend literally is not yet accepting
+    // HTTP — we must NOT declare "no key" to the UI on that basis, because
+    // the real state is "unknown" and declaring it false would incorrectly
+    // open the startup provider setup modal over a stored key.
+    const delays = [200, 400, 800, 1200, 1500, 2000, 2000, 2500, 2500, 3000, 3000];
+    for (let attempt = 0; attempt < delays.length; attempt += 1) {
+      try {
+        keyStatus = await openRouterAPI.getApiKeyStatus();
+        keyStatusOk = true;
+        break;
+      } catch (err) {
+        if (attempt === delays.length - 1) {
+          console.warn('OpenRouter key-status probe still unreachable after initial cold-start window; background poller will retry.', err);
+        }
+        await new Promise((resolve) => setTimeout(resolve, delays[attempt]));
+      }
     }
 
     const finalHasOpenRouterKey = Boolean(keyStatus.has_key);
-    setHasOpenRouterKey(finalHasOpenRouterKey);
+    if (keyStatusOk) {
+      setHasOpenRouterKey(finalHasOpenRouterKey);
+    }
 
     let availableModels = [];
-    if (lmAvailable) {
+    if (nextCapabilities.lmStudioEnabled && lmAvailable) {
       try {
         const data = await api.getModels();
         availableModels = data.models || data || [];
@@ -377,14 +510,12 @@ function App() {
     }
 
     return {
+      capabilities: nextCapabilities,
       lmAvailable,
       hasOpenRouterKey: finalHasOpenRouterKey,
+      keyStatusReachable: keyStatusOk,
       hasUsableLmStudioChatModel,
-      lmStudioStatus: {
-        ...lmResult,
-        usable_chat_model_id: usableLmStudioChatModelId,
-        has_usable_chat_model: hasUsableLmStudioChatModel,
-      },
+      lmStudioStatus: nextLmStudioStatus,
       defaultLmStudioModelId: usableLmStudioChatModelId,
     };
   }, []);
@@ -393,20 +524,100 @@ function App() {
     syncProviderAvailability();
   }, [syncProviderAvailability]);
 
-  // Periodically re-check OpenRouter key status to keep indicator in sync
+  // Fetch update notice from the backend on mount
+  useEffect(() => {
+    api.getUpdateNotice()
+      .then((notice) => {
+        if (notice && notice.update_available) {
+          setUpdateNotice(notice);
+        }
+      })
+      .catch(() => {});
+  }, []);
+
+  useEffect(() => {
+    if (capabilities.lmStudioEnabled) {
+      return;
+    }
+
+    setConfig((prev) => {
+      const next = normalizeAggregatorConfigForCapabilities(prev, false);
+      return JSON.stringify(next) === JSON.stringify(prev) ? prev : next;
+    });
+
+    setAutonomousConfig((prev) => {
+      const next = normalizeAutonomousConfigForCapabilities(prev, false);
+      return JSON.stringify(next) === JSON.stringify(prev) ? prev : next;
+    });
+
+    if (localStorage.getItem(STARTUP_PROVIDER_CHOICE_STORAGE_KEY) === LM_STUDIO_STARTUP_CHOICE) {
+      localStorage.removeItem(STARTUP_PROVIDER_CHOICE_STORAGE_KEY);
+    }
+  }, [capabilities.lmStudioEnabled]);
+
+  // Periodically re-check OpenRouter key status to keep indicator in sync.
+  // We poll aggressively (5s) because the state mostly flips from "unknown"
+  // to "known" shortly after backend startup, and users notice any delay as
+  // "my key didn't save."
   useEffect(() => {
     const interval = setInterval(async () => {
       try {
         const keyStatus = await openRouterAPI.getApiKeyStatus();
-        setHasOpenRouterKey(keyStatus.has_key);
+        setHasOpenRouterKey(Boolean(keyStatus.has_key));
       } catch {
         // Backend unreachable, skip this cycle
       }
-    }, 30000);
+    }, 5000);
 
     return () => clearInterval(interval);
   }, []);
 
+  // Periodically re-check LM Studio availability so the header indicator
+  // recovers when LM Studio finishes starting after the initial page load
+  // (e.g. MOTO launches the browser before LM Studio's local server is
+  // ready to serve /v1/models). Without this, the first check returns
+  // unavailable and the "LM Studio Offline" badge sticks for the entire
+  // session even while nomic embedding calls are succeeding.
+  useEffect(() => {
+    if (!capabilities.lmStudioEnabled) {
+      return undefined;
+    }
+
+    const interval = setInterval(() => {
+      if (typeof document !== 'undefined' && document.visibilityState === 'hidden') {
+        return;
+      }
+      syncProviderAvailability().catch(() => {
+        // Backend unreachable or transient failure, skip this cycle
+      });
+    }, 15000);
+
+    return () => clearInterval(interval);
+  }, [capabilities.lmStudioEnabled, syncProviderAvailability]);
+
+  // Re-sync provider availability immediately when the tab becomes visible
+  // again. Users often switch to LM Studio to load a model and then return;
+  // waiting up to 15s for the next interval tick feels broken.
+  useEffect(() => {
+    if (!capabilities.lmStudioEnabled) {
+      return undefined;
+    }
+    if (typeof document === 'undefined') {
+      return undefined;
+    }
+
+    const handleVisibilityChange = () => {
+      if (document.visibilityState === 'visible') {
+        syncProviderAvailability().catch(() => {});
+      }
+    };
+
+    document.addEventListener('visibilitychange', handleVisibilityChange);
+    return () => {
+      document.removeEventListener('visibilitychange', handleVisibilityChange);
+    };
+  }, [capabilities.lmStudioEnabled, syncProviderAvailability]);
+
   // Check autonomous research status on mount (handles page refresh while running)
   // CRITICAL: Always load all data (brainstorms, papers, stats) on startup,
   // even when not running. This ensures users see existing data immediately
@@ -760,6 +971,176 @@ function App() {
         data
       });
     }));
+
+    unsubscribers.push(websocket.on('proof_framing_decided', (data) => {
+      addActivity({
+        event: 'proof_framing_decided',
+        timestamp: getTimestamp(data),
+        message: data.is_proof_amenable
+          ? 'Proof framing enabled for this research run'
+          : 'Proof framing not applied for this research run',
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_check_started', (data) => {
+      const prefix = data.trigger === 'manual'
+        ? 'Manual proof check started'
+        : data.trigger === 'retry'
+          ? 'Paper-stage proof retry started'
+          : 'Proof check started';
+      addActivity({
+        event: 'proof_check_started',
+        timestamp: getTimestamp(data),
+        message: `${prefix} for ${data.source_type} ${data.source_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_retry_scheduled', (data) => {
+      addActivity({
+        event: 'proof_retry_scheduled',
+        timestamp: getTimestamp(data),
+        message: `Scheduled ${data.count || 0} proof retry candidate(s) for paper ${data.source_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_retry_started', (data) => {
+      addActivity({
+        event: 'proof_retry_started',
+        timestamp: getTimestamp(data),
+        message: `Retrying ${data.count || 0} failed proof candidate(s) against paper ${data.source_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_check_no_candidates', (data) => {
+      addActivity({
+        event: 'proof_check_no_candidates',
+        timestamp: getTimestamp(data),
+        message: `No formal proof candidates found in ${data.source_type} ${data.source_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_check_candidates_found', (data) => {
+      addActivity({
+        event: 'proof_check_candidates_found',
+        timestamp: getTimestamp(data),
+        message: `Proof check found ${data.count || 0} theorem candidate(s)`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_attempt_started', (data) => {
+      addActivity({
+        event: 'proof_attempt_started',
+        timestamp: getTimestamp(data),
+        message: `Proof attempt ${data.attempt || 1} started: ${data.theorem_statement || data.theorem_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('smt_check_started', (data) => {
+      addActivity({
+        event: 'smt_check_started',
+        timestamp: getTimestamp(data),
+        message: `SMT check started: ${data.theorem_statement || data.theorem_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('smt_check_complete', (data) => {
+      addActivity({
+        event: 'smt_check_complete',
+        timestamp: getTimestamp(data),
+        message: `SMT check complete (${data.result || 'unknown'}): ${data.theorem_statement || data.theorem_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_attempt_failed', (data) => {
+      addActivity({
+        event: 'proof_attempt_failed',
+        timestamp: getTimestamp(data),
+        message: `Proof attempt ${data.attempt || '?'} failed: ${formatReason(data.error_summary, 960) || data.theorem_statement || data.theorem_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_verified', (data) => {
+      addActivity({
+        event: 'proof_verified',
+        timestamp: getTimestamp(data),
+        message: `Lean 4 verified: ${data.theorem_statement || data.theorem_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_attempts_exhausted', (data) => {
+      addActivity({
+        event: 'proof_attempts_exhausted',
+        timestamp: getTimestamp(data),
+        message: `Proof attempts exhausted: ${data.theorem_statement || data.theorem_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('novel_proof_discovered', (data) => {
+      setProofRefreshToken((prev) => prev + 1);
+      setProofNotifications((prev) => {
+        const next = [
+          ...prev,
+          {
+            id: `proof_${data.proof_id}_${Date.now()}`,
+            proof_id: data.proof_id,
+            theorem_statement: data.theorem_statement,
+            source_type: data.source_type,
+            source_id: data.source_id,
+            timestamp: getTimestamp(data),
+          }
+        ];
+        return next.length > 3 ? next.slice(-3) : next;
+      });
+      addActivity({
+        event: 'novel_proof_discovered',
+        timestamp: getTimestamp(data),
+        message: `Novel proof discovered: ${data.theorem_statement}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('known_proof_verified', (data) => {
+      setProofRefreshToken((prev) => prev + 1);
+      addActivity({
+        event: 'known_proof_verified',
+        timestamp: getTimestamp(data),
+        message: `Verified known proof recorded for ${data.source_type} ${data.source_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_dependency_added', (data) => {
+      setLatestProofDependencyEvent(data);
+      setProofRefreshToken((prev) => prev + 1);
+      addActivity({
+        event: 'proof_dependency_added',
+        timestamp: getTimestamp(data),
+        message: `Dependency graph updated for ${data.theorem_name || data.proof_id}`,
+        data
+      });
+    }));
+
+    unsubscribers.push(websocket.on('proof_check_complete', (data) => {
+      setProofRefreshToken((prev) => prev + 1);
+      addActivity({
+        event: 'proof_check_complete',
+        timestamp: getTimestamp(data),
+        message: `Proof check complete: ${data.verified_count || 0} verified, ${data.novel_count || 0} novel`,
+        data
+      });
+    }));
     
     unsubscribers.push(websocket.on('auto_research_started', () => {
       setAutonomousActivity([]);
@@ -1258,13 +1639,15 @@ function App() {
   // Autonomous handlers
   const handleAutonomousStart = async (researchPrompt) => {
     try {
+      const lmStudioEnabled = capabilities.lmStudioEnabled;
+
       // Convert frontend camelCase to backend snake_case for submitter_configs (includes OpenRouter fields)
       const submitterConfigs = autonomousConfig.submitter_configs?.map(cfg => ({
         submitter_id: cfg.submitterId,
-        provider: cfg.provider || 'lm_studio',
+        provider: normalizeRuntimeProvider(cfg.provider, lmStudioEnabled),
         model_id: cfg.modelId,
         openrouter_provider: cfg.openrouterProvider || null,
-        lm_studio_fallback_id: cfg.lmStudioFallbackId || null,
+        lm_studio_fallback_id: lmStudioEnabled ? (cfg.lmStudioFallbackId || null) : null,
         context_window: cfg.contextWindow,
         max_output_tokens: cfg.maxOutputTokens
       })) || [];
@@ -1273,31 +1656,51 @@ function App() {
         user_research_prompt: researchPrompt,
         submitter_configs: submitterConfigs,
         // Validator config with OpenRouter support
-        validator_provider: autonomousConfig.validator_provider,
+        validator_provider: normalizeRuntimeProvider(
+          autonomousConfig.validator_provider,
+          lmStudioEnabled
+        ),
         validator_model: autonomousConfig.validator_model,
         validator_openrouter_provider: autonomousConfig.validator_openrouter_provider,
-        validator_lm_studio_fallback: autonomousConfig.validator_lm_studio_fallback,
+        validator_lm_studio_fallback: lmStudioEnabled
+          ? autonomousConfig.validator_lm_studio_fallback
+          : null,
         validator_context_window: autonomousConfig.validator_context_window,
         validator_max_tokens: autonomousConfig.validator_max_tokens,
         // High-context submitter config with OpenRouter support
-        high_context_provider: autonomousConfig.high_context_provider,
+        high_context_provider: normalizeRuntimeProvider(
+          autonomousConfig.high_context_provider,
+          lmStudioEnabled
+        ),
         high_context_model: autonomousConfig.high_context_model,
         high_context_openrouter_provider: autonomousConfig.high_context_openrouter_provider,
-        high_context_lm_studio_fallback: autonomousConfig.high_context_lm_studio_fallback,
+        high_context_lm_studio_fallback: lmStudioEnabled
+          ? autonomousConfig.high_context_lm_studio_fallback
+          : null,
         high_context_context_window: autonomousConfig.high_context_context_window,
         high_context_max_tokens: autonomousConfig.high_context_max_tokens,
         // High-param submitter config with OpenRouter support
-        high_param_provider: autonomousConfig.high_param_provider,
+        high_param_provider: normalizeRuntimeProvider(
+          autonomousConfig.high_param_provider,
+          lmStudioEnabled
+        ),
         high_param_model: autonomousConfig.high_param_model,
         high_param_openrouter_provider: autonomousConfig.high_param_openrouter_provider,
-        high_param_lm_studio_fallback: autonomousConfig.high_param_lm_studio_fallback,
+        high_param_lm_studio_fallback: lmStudioEnabled
+          ? autonomousConfig.high_param_lm_studio_fallback
+          : null,
         high_param_context_window: autonomousConfig.high_param_context_window,
         high_param_max_tokens: autonomousConfig.high_param_max_tokens,
         // Critique submitter config with OpenRouter support
-        critique_submitter_provider: autonomousConfig.critique_submitter_provider,
+        critique_submitter_provider: normalizeRuntimeProvider(
+          autonomousConfig.critique_submitter_provider,
+          lmStudioEnabled
+        ),
         critique_submitter_model: autonomousConfig.critique_submitter_model,
         critique_submitter_openrouter_provider: autonomousConfig.critique_submitter_openrouter_provider,
-        critique_submitter_lm_studio_fallback: autonomousConfig.critique_submitter_lm_studio_fallback,
+        critique_submitter_lm_studio_fallback: lmStudioEnabled
+          ? autonomousConfig.critique_submitter_lm_studio_fallback
+          : null,
         critique_submitter_context_window: autonomousConfig.critique_submitter_context_window,
         critique_submitter_max_tokens: autonomousConfig.critique_submitter_max_tokens,
         tier3_enabled: autonomousConfig.tier3_enabled ?? false
@@ -1388,6 +1791,15 @@ function App() {
     setSelectedCritiquePaper(null);
   };
 
+  const handleDismissProofNotification = (notificationId) => {
+    setProofNotifications(prev => prev.filter(n => n.id !== notificationId));
+  };
+
+  const handleClickProofNotification = (proofId) => {
+    setSelectedProofId(proofId);
+    handleAutonomousTabSelect('auto-proofs');
+  };
+
   const handleModeChange = (nextMode) => {
     setAppMode(nextMode);
   };
@@ -1440,15 +1852,37 @@ function App() {
     setStartupSetupMessage('');
 
     const {
+      capabilities: nextCapabilities,
       lmAvailable,
       hasOpenRouterKey: keyPresent,
+      keyStatusReachable,
       hasUsableLmStudioChatModel,
     } = await syncProviderAvailability();
     if (keyPresent) {
       return;
     }
 
+    if (!keyStatusReachable) {
+      // Backend is still booting (e.g. Lean 4 warm start on a cold Mathlib
+      // cache can push this past 20s even though uvicorn itself should be up
+      // within seconds). Avoid opening the startup provider setup modal with
+      // stale "no key" info — the periodic poller re-checks on its next tick and
+      // will surface the real state without forcing the user to re-enter a
+      // key that is already persisted.
+      return;
+    }
+
     const startupChoice = localStorage.getItem(STARTUP_PROVIDER_CHOICE_STORAGE_KEY);
+    if (!nextCapabilities.lmStudioEnabled) {
+      if (startupChoice === LM_STUDIO_STARTUP_CHOICE) {
+        setStartupSetupMessage(
+          'This deployment runs in hosted web mode, so LM Studio is intentionally disabled here. Configure OpenRouter to continue.'
+        );
+      }
+      setShowStartupSetupModal(true);
+      return;
+    }
+
     if (startupChoice === LM_STUDIO_STARTUP_CHOICE && lmAvailable && hasUsableLmStudioChatModel) {
       return;
     }
@@ -1481,6 +1915,13 @@ function App() {
   };
 
   const handleStartupLmStudioChoice = async () => {
+    if (!capabilities.lmStudioEnabled) {
+      setStartupSetupMessage(
+        'LM Studio is intentionally disabled in this deployment. Configure OpenRouter to continue.'
+      );
+      return;
+    }
+
     setCheckingLmStudioStartupChoice(true);
     setStartupSetupMessage('');
 
@@ -1527,14 +1968,15 @@ function App() {
     { id: 'auto-interface', label: 'Start Here: Autonomous Deep Research Controller', group: 'autonomous-main' },
     { id: 'auto-brainstorms', label: 'Autonomous Stage 1: Brainstorms', group: 'autonomous-main' },
     { id: 'auto-papers', label: 'Autonomous Stage 2: Papers', group: 'autonomous-main' },
+    { id: 'auto-proofs', label: 'Mathematical Proofs', group: 'autonomous-main' },
     ...(autonomousConfig.tier3_enabled ? [
-      { id: 'auto-final-answer', label: getFinalAnswerLabel(), subtext: '(Very Experimental and Hallucinatory)', group: 'autonomous-main' },
+      { id: 'auto-final-answer', label: getFinalAnswerLabel(), subtext: '(In Development / Highly Hallucinatory)', group: 'autonomous-main' },
     ] : []),
   ];
 
   const autonomousSettingsTabs = [
     { id: 'auto-stage2-history', label: 'Stage 2 Final Answers History', group: 'autonomous-settings' },
-    { id: 'auto-final-answer-library', label: 'Stage 3 Final Answers History', subtext: '(Very Experimental and Hallucinatory)', group: 'autonomous-settings' },
+    { id: 'auto-final-answer-library', label: 'Stage 3 Final Answers History', subtext: '(In Development / Highly Hallucinatory)', group: 'autonomous-settings' },
     { id: 'auto-logs', label: 'API Call Logs', group: 'autonomous-settings' },
     { id: 'auto-settings', label: 'Autonomous Model Selection & Settings', group: 'autonomous-settings' },
   ];
@@ -1590,7 +2032,7 @@ function App() {
   }, []);
 
   return (
-    <div className="app">
+    <div className={`app ${workflowPanelCollapsed ? 'workflow-panel-collapsed' : 'workflow-panel-expanded'}`}>
       {/* Banner Section */}
       <div className={`app-banner ${shimmerAccentsEnabled ? '' : 'no-shimmer'}`}>
         <div className="banner-content">
@@ -1602,6 +2044,35 @@ function App() {
           <p className="banner-variant">A Prototype Artificial Superintelligence - Novelty Seeking Autonomous S.T.E.M. Researcher For Automated Theorem Generation</p>
         </div>
       </div>
+
+      {/* Update Notice Banner — dismissible per session, reappears on restart */}
+      {updateNotice && !updateNoticeDismissed && (
+        <div className="update-notice-banner">
+          <div className="update-notice-content">
+            <span className="update-notice-icon">&#9432;</span>
+            <span className="update-notice-text">
+              <strong>Update available:</strong>{' '}
+              {updateNotice.installed_version} ({updateNotice.installed_commit})
+              {' '}&rarr;{' '}
+              {updateNotice.available_version} ({updateNotice.available_commit})
+              {' '}&mdash;{' '}
+              <span className="update-notice-detail">
+                {updateNotice.can_auto_apply
+                  ? 'Restart the launcher to apply this update.'
+                  : `Install layout: ${updateNotice.install_layout}. Pull the latest from GitHub main to update.`}
+              </span>
+            </span>
+          </div>
+          <button
+            className="update-notice-dismiss"
+            onClick={() => setUpdateNoticeDismissed(true)}
+            aria-label="Dismiss update notice"
+            title="Dismiss"
+          >
+            &#10005;
+          </button>
+        </div>
+      )}
       
       {/* CRITICAL: Boost buttons are ETERNAL - they NEVER disappear */}
       {/* These buttons are fixed-position, high z-index, and unconditionally rendered */}
@@ -1622,43 +2093,73 @@ function App() {
             <option value="manual">Advanced Manual S.T.E.M. ASI</option>
           </select>
         </div>
-        <button 
-          className="boost-btn"
-          onClick={() => setShowBoostModal(true)}
-          title="Configure API Boost"
-        >
-          ⚡ API Boost
-        </button>
-        <button 
-          className="openrouter-key-btn"
+        <div className="boost-control-row">
+          <div className="help-tooltip-anchor">
+            <button
+              type="button"
+              className="help-tooltip-btn"
+              aria-label="Learn about API Boost"
+              onMouseEnter={() => setShowApiBoostTooltip(true)}
+              onMouseLeave={() => setShowApiBoostTooltip(false)}
+              onFocus={() => setShowApiBoostTooltip(true)}
+              onBlur={() => setShowApiBoostTooltip(false)}
+            >
+              ?
+            </button>
+            {showApiBoostTooltip && (
+              <div className="help-tooltip-popup">
+                Use this mode to change your model selections mid-run. It is a good way to use your free daily OpenRouter credits without interrupting your research run. For the easiest setup, select your free model and enable "Use boost as next API call when available." Some free models may be more rate-limited on OpenRouter than others.
+              </div>
+            )}
+          </div>
+          <button
+            className="boost-btn"
+            onClick={() => setShowBoostModal(true)}
+            title="Configure API Boost"
+          >
+            API Boost
+          </button>
+        </div>
+        <button
+          className={`header-status-chip ${
+            hasOpenRouterKey === true
+              ? 'header-status-chip--ready'
+              : hasOpenRouterKey === false
+                ? 'header-status-chip--inactive'
+                : 'header-status-chip--pending'
+          }`}
           onClick={() => {
             setOpenRouterKeyReason('setup');
             setShowOpenRouterKeyModal(true);
           }}
-          title="Configure OpenRouter API Key"
-          style={{
-            marginLeft: '0.5rem',
-            padding: '0.4rem 0.8rem',
-            backgroundColor: hasOpenRouterKey ? '#2d5a27' : '#153815',
-            border: hasOpenRouterKey ? '1px solid #4CAF50' : '1px solid #1eff1c',
-            borderRadius: '4px',
-            color: '#fff',
-            cursor: 'pointer',
-            fontSize: '0.85rem',
-          }}
+          title={
+            hasOpenRouterKey === true
+              ? 'OpenRouter API key is configured'
+              : hasOpenRouterKey === false
+                ? 'Configure OpenRouter API Key'
+                : 'Checking OpenRouter key status...'
+          }
         >
-          {hasOpenRouterKey ? 'OpenRouter ✓' : 'Set OpenRouter Key'}
+          {hasOpenRouterKey === true
+            ? 'OpenRouter ✓'
+            : hasOpenRouterKey === false
+              ? 'Set OpenRouter Key'
+              : 'OpenRouter…'}
         </button>
-        {!lmStudioAvailable && (
-          <span style={{ 
-            marginLeft: '0.5rem', 
-            color: '#1eff1c', 
-            fontSize: '0.8rem',
-            padding: '0.25rem 0.5rem',
-            backgroundColor: 'rgba(30, 255, 28, 0.1)',
-            borderRadius: '4px',
-          }}>
-            LM Studio Offline
+        {capabilities.lmStudioEnabled ? (
+          <span
+            className={`header-status-chip ${
+              lmStudioAvailable ? 'header-status-chip--ready' : 'header-status-chip--inactive'
+            }`}
+            title={lmStudioAvailable
+              ? `LM Studio is online (${lmStudioStatus.model_count || 0} model${(lmStudioStatus.model_count || 0) === 1 ? '' : 's'} loaded)`
+              : (lmStudioStatus.error || 'LM Studio server is not reachable at 127.0.0.1:1234')}
+          >
+            {lmStudioAvailable ? 'LM Studio ✓' : 'LM Studio Offline'}
+          </span>
+        ) : capabilities.genericMode && (
+          <span className="header-status-chip header-status-chip--hosted">
+            Hosted Web Mode
           </span>
         )}
       </div>
@@ -1798,6 +2299,14 @@ function App() {
               }}
             />
           )}
+          {activeTab === 'auto-proofs' && (
+            <MathematicalProofs
+              api={autonomousAPI}
+              refreshToken={proofRefreshToken}
+              selectedProofId={selectedProofId}
+              latestDependencyEvent={latestProofDependencyEvent}
+            />
+          )}
           {activeTab === 'auto-final-answer' && (
             <FinalAnswerView
               api={autonomousAPI}
@@ -1826,11 +2335,16 @@ function App() {
             <AggregatorInterface
               config={config}
               setConfig={setConfig}
+              capabilities={capabilities}
               anyWorkflowRunning={anyWorkflowRunning}
             />
           )}
           {activeTab === 'aggregator-settings' && (
-            <AggregatorSettings config={config} setConfig={setConfig} />
+            <AggregatorSettings
+              config={config}
+              setConfig={setConfig}
+              capabilities={capabilities}
+            />
           )}
           {activeTab === 'aggregator-logs' && <AggregatorLogs />}
           {activeTab === 'aggregator-results' && <LiveResults />}
@@ -1838,10 +2352,13 @@ function App() {
           {activeTab === 'compiler-interface' && (
             <CompilerInterface
               activeTab={activeTab}
+              capabilities={capabilities}
               anyWorkflowRunning={anyWorkflowRunning}
             />
           )}
-          {activeTab === 'compiler-settings' && <CompilerSettings />}
+          {activeTab === 'compiler-settings' && (
+            <CompilerSettings capabilities={capabilities} />
+          )}
           {activeTab === 'compiler-logs' && <CompilerLogs />}
           {activeTab === 'compiler-live-paper' && <LivePaper />}
         </div>
@@ -1853,6 +2370,7 @@ function App() {
           config={autonomousConfig}
           onConfigChange={setAutonomousConfig}
           models={models}
+          capabilities={capabilities}
           isRunning={autonomousRunning}
         />
       )}
@@ -1872,7 +2390,15 @@ function App() {
                   Disclaimer & Quickstart
               </h2>
               <p style={{ fontSize: '1.1rem', lineHeight: '1.6', marginBottom: '1.5rem', color: '#1eff1c' }}>
-                <strong>QUICKSTART:</strong> In LM Studio, load the embedding model <code>nomic-ai/nomic-embed-text-v1.5</code> by <strong>Nomic AI</strong> (optional but recommended), or use only an OpenRouter API key instead of LM Studio. You must leave your PC on and awake during runtime, the program will often run for days without interruption.
+                {capabilities.lmStudioEnabled ? (
+                  <>
+                    <strong>QUICKSTART:</strong> In LM Studio, load the embedding model <code>nomic-ai/nomic-embed-text-v1.5</code> by <strong>Nomic AI</strong> (optional but recommended), or use only an OpenRouter API key instead of LM Studio. You must leave your PC on and awake during runtime, the program will often run for days without interruption.
+                  </>
+                ) : (
+                  <>
+                    <strong>QUICKSTART:</strong> This hosted deployment uses OpenRouter-only inference. Set your OpenRouter API key, choose a profile or role models, and then begin your research run. LM Studio is intentionally disabled in this environment.
+                  </>
+                )}
               </p>
               <div
                 style={{
@@ -1896,7 +2422,7 @@ function App() {
                   Legal Disclaimer
                 </p>
                 <p style={{ fontSize: '0.95rem', lineHeight: '1.5', margin: 0 }}>
-                  MOTO is an experimental prototype system and remains under active development. It directs selected AI models to generate novel solution attempts in response to your prompt. Outputs may be incorrect, incomplete, misleading, fabricated, poorly reasoned, or otherwise unsuitable for reliance without independent review, especially for high-stakes, academic, financial, legal, medical, engineering, or operational use.
+                  MOTO is a prototype system under active development. It directs selected AI models to generate novel solution attempts in response to your prompt. Outputs may be incorrect, incomplete, misleading, fabricated, poorly reasoned, or otherwise unsuitable for reliance without independent review, especially for high-stakes, academic, financial, legal, medical, engineering, or operational use.
                   <br />
                   <br />
                   This software and all generated content are provided as-is and at your own risk. By using MOTO, you acknowledge that you are solely responsible for reviewing, validating, and deciding how to use any output, and that the developers, operators, and contributors are not responsible or liable for incorrect solutions, hallucinations, omissions, formatting issues, infinite loops, wasted API calls, model or provider failures, data loss, third-party charges, or any direct or indirect loss, damage, cost, or liability resulting from use of the program or its outputs.
@@ -1915,6 +2441,7 @@ function App() {
 
       <StartupProviderSetupModal
         isOpen={showStartupSetupModal}
+        capabilities={capabilities}
         lmStudioAvailable={lmStudioAvailable}
         hasUsableLmStudioChatModel={Boolean(lmStudioStatus.has_usable_chat_model)}
         lmStudioModelCount={lmStudioStatus.model_count || 0}
@@ -1929,6 +2456,7 @@ function App() {
       <BoostControlModal 
         isOpen={showBoostModal}
         onClose={() => setShowBoostModal(false)}
+        capabilities={capabilities}
       />
       
       {/* OpenRouter API Key Modal */}
@@ -1937,6 +2465,7 @@ function App() {
         onClose={handleCloseOpenRouterKeyModal}
         onKeySet={handleOpenRouterKeySet}
         reason={openRouterKeyReason}
+        capabilities={capabilities}
       />
       
       {/* OpenRouter Privacy Warning Modal */}
@@ -1944,6 +2473,13 @@ function App() {
         isOpen={showPrivacyWarning}
         onClose={() => setShowPrivacyWarning(false)}
         errorData={privacyWarningData}
+        capabilities={capabilities}
+      />
+
+      <ProofNotificationStack
+        notifications={proofNotifications}
+        onDismiss={handleDismissProofNotification}
+        onClickNotification={handleClickProofNotification}
       />
       
       {/* Critique Notification Stack - Persists across all screens */}
@@ -1989,32 +2525,15 @@ function App() {
           </div>
           
           <div className="footer-section footer-links">
-            <a 
-              href="https://intrafere.com/moto-autonomous-home-ai/" 
-              target="_blank" 
-              rel="noopener noreferrer"
-              className="footer-link"
-            >
-              <span className="footer-icon">ℹ️</span>
-              Read More About MOTO ASI
-            </a>
             <a
               href="https://intrafere.com/structured-brainstorming-validated-feedback/"
               target="_blank"
               rel="noopener noreferrer"
-              className="footer-link"
+              className="footer-link footer-link-github"
             >
               <span className="footer-icon">ℹ️</span>
               How MOTO's Superintelligence Works
             </a>
-            <a 
-              href="https://intrafere.com/moto-news/" 
-              target="_blank" 
-              rel="noopener noreferrer"
-              className="footer-link footer-link-news"
-            >
-              MOTO News and Updates
-            </a>
             <a
               href="https://intrafere.com/order-a-custom-orchestrator/"
               target="_blank"
diff --git a/frontend/src/components/BoostControlModal.jsx b/frontend/src/components/BoostControlModal.jsx
index 0a63b7c..6d0998b 100644
--- a/frontend/src/components/BoostControlModal.jsx
+++ b/frontend/src/components/BoostControlModal.jsx
@@ -1,17 +1,22 @@
 import React, { useState, useEffect, useRef } from 'react';
 import { boostAPI, openRouterAPI } from '../services/api';
+import {
+  computeOpenRouterAutoSettings,
+  findOpenRouterModel,
+  getProviderNames,
+} from '../utils/openRouterSelection';
 import './BoostControlModal.css';
 
 const BOOST_SETTINGS_STORAGE_KEY = 'boost_modal_settings';
 
-export default function BoostControlModal({ isOpen, onClose }) {
+export default function BoostControlModal({ isOpen, onClose, capabilities }) {
   const [apiKey, setApiKey] = useState('');
   const [boostModel, setBoostModel] = useState('');
   const [selectedProvider, setSelectedProvider] = useState('');
   const [contextWindow, setContextWindow] = useState(131072);
   const [maxOutputTokens, setMaxOutputTokens] = useState(25000);
   const [models, setModels] = useState([]);
-  const [providers, setProviders] = useState([]);
+  const [providerData, setProviderData] = useState(null);
   const [loading, setLoading] = useState(false);
   const [loadingProviders, setLoadingProviders] = useState(false);
   const [testing, setTesting] = useState(false);
@@ -25,6 +30,8 @@ export default function BoostControlModal({ isOpen, onClose }) {
   const mouseDownTargetRef = useRef(null);
 
   const hasAvailableKey = Boolean(apiKey.trim() || hasGlobalKey);
+  const providers = getProviderNames(providerData);
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
   
   // Load saved settings from localStorage on mount
   useEffect(() => {
@@ -64,8 +71,8 @@ export default function BoostControlModal({ isOpen, onClose }) {
 
   const fetchProviders = async (modelId, keyOverride = undefined) => {
     if (!modelId) {
-      setProviders([]);
-      return;
+      setProviderData(null);
+      return null;
     }
 
     const effectiveKey = keyOverride === undefined ? apiKey.trim() : keyOverride;
@@ -73,19 +80,31 @@ export default function BoostControlModal({ isOpen, onClose }) {
     setLoadingProviders(true);
     try {
       const response = await boostAPI.getModelProviders(effectiveKey || null, modelId);
-      if (response.providers) {
-        setProviders(response.providers);
-      } else {
-        setProviders([]);
-      }
+      const nextProviderData = {
+        providers: response.providers || [],
+        endpoints: response.endpoints || [],
+      };
+      setProviderData(nextProviderData);
+      return nextProviderData;
     } catch (error) {
       console.error('Failed to fetch providers:', error);
-      setProviders([]);
+      setProviderData(null);
+      return null;
     } finally {
       setLoadingProviders(false);
     }
   };
 
+  const getAutoSettingsForModel = async (modelId, selectedProvider = null, keyOverride = undefined) => {
+    const model = findOpenRouterModel(models, modelId);
+    if (!model) {
+      return null;
+    }
+
+    const nextProviderData = await fetchProviders(modelId, keyOverride);
+    return computeOpenRouterAutoSettings(model, nextProviderData, selectedProvider);
+  };
+
   const fetchBoostStatus = async (keyOverride = undefined) => {
     const effectiveKey = keyOverride === undefined ? apiKey.trim() : keyOverride;
 
@@ -117,7 +136,7 @@ export default function BoostControlModal({ isOpen, onClose }) {
             console.error('Failed to sync boost settings to localStorage:', e);
           }
         } else {
-          setProviders([]);
+          setProviderData(null);
           // Boost not enabled - localStorage values are already loaded in useEffect
         }
       }
@@ -127,13 +146,17 @@ export default function BoostControlModal({ isOpen, onClose }) {
   };
 
   // Handle model selection change
-  const handleModelChange = (modelId) => {
+  const handleModelChange = async (modelId) => {
     setBoostModel(modelId);
     setSelectedProvider(''); // Reset provider when model changes
     if (modelId) {
-      fetchProviders(modelId);
+      const autoSettings = await getAutoSettingsForModel(modelId, null);
+      if (autoSettings) {
+        setContextWindow(autoSettings.contextWindow);
+        setMaxOutputTokens(autoSettings.maxOutputTokens);
+      }
     } else {
-      setProviders([]);
+      setProviderData(null);
     }
   };
 
@@ -156,6 +179,9 @@ export default function BoostControlModal({ isOpen, onClose }) {
           ? response.models.filter(model => model.pricing && model.pricing.prompt === '0' && model.pricing.completion === '0')
           : response.models;
         setModels(filtered);
+        if (boostModel) {
+          await fetchProviders(boostModel, effectiveKey);
+        }
         if (!silent) {
           setSuccess(`Models loaded successfully (${filtered.length} ${freeFilter ? 'free ' : ''}models)`);
         }
@@ -425,7 +451,15 @@ export default function BoostControlModal({ isOpen, onClose }) {
               <label>Provider</label>
               <select
                 value={selectedProvider}
-                onChange={(e) => setSelectedProvider(e.target.value)}
+                onChange={async (e) => {
+                  const providerName = e.target.value;
+                  setSelectedProvider(providerName);
+                  const autoSettings = await getAutoSettingsForModel(boostModel, providerName || null);
+                  if (autoSettings) {
+                    setContextWindow(autoSettings.contextWindow);
+                    setMaxOutputTokens(autoSettings.maxOutputTokens);
+                  }
+                }}
                 disabled={loading || loadingProviders}
               >
                 <option value="">Default (OpenRouter chooses)</option>
@@ -491,8 +525,12 @@ export default function BoostControlModal({ isOpen, onClose }) {
             <h4>How API Boost Works</h4>
             <ul>
               <li>Click tasks in the MOTO Workflow panel to toggle boost</li>
-              <li>Boosted tasks use your OpenRouter model instead of LM Studio</li>
-              <li>If credits run out, system falls back to LM Studio automatically</li>
+              <li>Boosted tasks use your selected OpenRouter model and optional host provider</li>
+              <li>
+                {lmStudioEnabled
+                  ? 'If boost credits or provider capacity fail, the task falls back to its primary model path for that call'
+                  : 'If boost credits or provider capacity fail, the task falls back to its primary hosted model path for that call'}
+              </li>
               <li>You can toggle which tasks use the boost at any time</li>
             </ul>
           </div>
diff --git a/frontend/src/components/CreditExhaustionNotificationStack.jsx b/frontend/src/components/CreditExhaustionNotificationStack.jsx
index 8c6f78a..bbf5eeb 100644
--- a/frontend/src/components/CreditExhaustionNotificationStack.jsx
+++ b/frontend/src/components/CreditExhaustionNotificationStack.jsx
@@ -94,8 +94,8 @@ export default function CreditExhaustionNotificationStack({ notifications, onDis
           style={{
             width: '320px',
             padding: '10px 16px',
-            backgroundColor: resetting ? '#333' : 'rgba(108, 92, 231, 0.9)',
-            border: '1px solid rgba(108, 92, 231, 0.6)',
+            backgroundColor: resetting ? '#333' : 'rgba(24, 204, 23, 0.9)',
+            border: '1px solid rgba(24, 204, 23, 0.6)',
             borderRadius: '10px',
             color: '#fff',
             fontSize: '13px',
@@ -104,8 +104,8 @@ export default function CreditExhaustionNotificationStack({ notifications, onDis
             opacity: resetting ? 0.6 : 1,
             transition: 'all 0.2s',
           }}
-          onMouseEnter={(e) => { if (!resetting) e.currentTarget.style.backgroundColor = 'rgba(108, 92, 231, 1)'; }}
-          onMouseLeave={(e) => { if (!resetting) e.currentTarget.style.backgroundColor = 'rgba(108, 92, 231, 0.9)'; }}
+          onMouseEnter={(e) => { if (!resetting) e.currentTarget.style.backgroundColor = 'rgba(24, 204, 23, 1)'; }}
+          onMouseLeave={(e) => { if (!resetting) e.currentTarget.style.backgroundColor = 'rgba(24, 204, 23, 0.9)'; }}
         >
           {resetting ? 'Resetting...' : 'Retry OpenRouter (Credits Added)'}
         </button>
diff --git a/frontend/src/components/CritiqueNotificationStack.jsx b/frontend/src/components/CritiqueNotificationStack.jsx
index 01e5f31..4b9d74f 100644
--- a/frontend/src/components/CritiqueNotificationStack.jsx
+++ b/frontend/src/components/CritiqueNotificationStack.jsx
@@ -1,15 +1,25 @@
 import React from 'react';
 
+const ALERT_SCALE = 1.4;
+
+function scalePx(value) {
+  return `${Math.round(value * ALERT_SCALE)}px`;
+}
+
+function scaleNumber(value) {
+  return Math.round(value * ALERT_SCALE);
+}
+
 // Simple inline icon components
-const IconX = ({ className }) => (
-  <svg className={className} width="16" height="16" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
+const IconX = ({ className, size = 16 }) => (
+  <svg className={className} width={size} height={size} viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
     <line x1="18" y1="6" x2="6" y2="18"></line>
     <line x1="6" y1="6" x2="18" y2="18"></line>
   </svg>
 );
 
-const IconStar = ({ className }) => (
-  <svg className={className} width="16" height="16" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
+const IconStar = ({ className, size = 16 }) => (
+  <svg className={className} width={size} height={size} viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2">
     <polygon points="12 2 15.09 8.26 22 9.27 17 14.14 18.18 21.02 12 17.77 5.82 21.02 7 14.14 2 9.27 8.91 8.26 12 2"></polygon>
   </svg>
 );
@@ -19,7 +29,7 @@ const IconStar = ({ className }) => (
  */
 function getRatingColor(rating) {
   if (rating >= 8) return { text: '#34d399', bg: '#10b981' };
-  if (rating >= 6.25) return { text: '#60a5fa', bg: '#3b82f6' };
+  if (rating >= 6.25) return { text: '#18cc17', bg: '#18cc17' };
   return { text: '#9ca3af', bg: '#6b7280' };
 }
 
@@ -52,7 +62,7 @@ export default function CritiqueNotificationStack({ notifications, onDismiss, on
         zIndex: 999999,
         display: 'flex',
         flexDirection: 'column',
-        gap: '8px',
+        gap: scalePx(8),
         pointerEvents: 'none', // Allow clicks through container
       }}
     >
@@ -96,12 +106,12 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
       onMouseEnter={() => setIsHovered(true)}
       onMouseLeave={() => setIsHovered(false)}
       style={{
-        width: '280px',
-        minHeight: '80px',
+        width: scalePx(280),
+        minHeight: scalePx(80),
         background: `linear-gradient(135deg, ${isHovered ? 'rgba(20, 83, 45, 0.95)' : 'rgba(26, 26, 46, 0.95)'}, ${isHovered ? 'rgba(15, 60, 15, 0.95)' : 'rgba(17, 24, 39, 0.95)'})`,
         backdropFilter: 'blur(8px)',
-        borderRadius: '12px',
-        padding: '12px',
+        borderRadius: scalePx(12),
+        padding: scalePx(12),
         boxShadow: isHovered 
           ? '0 20px 40px -12px rgba(30, 255, 28, 0.5), 0 0 0 1px rgba(30, 255, 28, 0.5)'
           : '0 10px 30px -12px rgba(0, 0, 0, 0.8), 0 0 0 1px rgba(30, 255, 28, 0.3)',
@@ -109,7 +119,7 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
         cursor: 'pointer',
         transition: 'all 0.3s cubic-bezier(0.4, 0, 0.2, 1)',
         transform: isExiting 
-          ? 'translateX(320px) scale(0.8)' 
+          ? `translateX(${scalePx(320)}) scale(0.8)` 
           : `translateY(${index * 0}px) scale(${isHovered ? 1.02 : 1})`,
         opacity: isExiting ? 0 : 1,
         pointerEvents: 'auto', // Re-enable clicks for notification
@@ -117,25 +127,27 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
       }}
     >
       {/* Header with star icon and rating */}
-      <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between', marginBottom: '8px' }}>
-        <div style={{ display: 'flex', alignItems: 'center', gap: '8px' }}>
+      <div style={{ display: 'flex', alignItems: 'center', justifyContent: 'space-between', marginBottom: scalePx(8) }}>
+        <div style={{ display: 'flex', alignItems: 'center', gap: scalePx(8) }}>
           <div
             style={{
-              padding: '6px',
+              padding: scalePx(6),
               backgroundColor: 'rgba(30, 255, 28, 0.2)',
-              borderRadius: '8px',
+              borderRadius: scalePx(8),
               display: 'flex',
               alignItems: 'center',
               justifyContent: 'center',
             }}
           >
-            <IconStar style={{ color: colors.text }} />
+            <div style={{ color: colors.text, display: 'flex', alignItems: 'center', justifyContent: 'center' }}>
+              <IconStar size={scaleNumber(16)} />
+            </div>
           </div>
           <div>
-            <div style={{ fontSize: '10px', color: '#9ca3af', textTransform: 'uppercase', letterSpacing: '0.05em' }}>
+            <div style={{ fontSize: scalePx(10), color: '#9ca3af', textTransform: 'uppercase', letterSpacing: '0.05em' }}>
               High Score
             </div>
-            <div style={{ color: colors.text, fontSize: '18px', fontWeight: '700', lineHeight: '1' }}>
+            <div style={{ color: colors.text, fontSize: scalePx(18), fontWeight: '700', lineHeight: '1' }}>
               {notification.average_rating.toFixed(1)}/10
             </div>
           </div>
@@ -145,10 +157,10 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
         <button
           onClick={handleDismiss}
           style={{
-            padding: '4px',
+            padding: scalePx(4),
             backgroundColor: 'transparent',
             border: 'none',
-            borderRadius: '6px',
+            borderRadius: scalePx(6),
             cursor: 'pointer',
             color: '#9ca3af',
             transition: 'all 0.2s',
@@ -165,14 +177,14 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
             e.target.style.color = '#9ca3af';
           }}
         >
-          <IconX />
+          <IconX size={scaleNumber(16)} />
         </button>
       </div>
 
       {/* Paper title */}
       <div
         style={{
-          fontSize: '13px',
+          fontSize: scalePx(13),
           fontWeight: '500',
           color: '#f3f4f6',
           lineHeight: '1.4',
@@ -190,9 +202,9 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
       {/* Click hint */}
       <div
         style={{
-          fontSize: '10px',
+          fontSize: scalePx(10),
           color: '#1eff1c',
-          marginTop: '6px',
+          marginTop: scalePx(6),
           opacity: isHovered ? 1 : 0.7,
           transition: 'opacity 0.2s',
         }}
@@ -204,7 +216,7 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
       <style>{`
         @keyframes slideIn {
           from {
-            transform: translateX(320px) scale(0.8);
+            transform: translateX(${scalePx(320)}) scale(0.8);
             opacity: 0;
           }
           to {
diff --git a/frontend/src/components/HelpTooltip.jsx b/frontend/src/components/HelpTooltip.jsx
new file mode 100644
index 0000000..7a0eac1
--- /dev/null
+++ b/frontend/src/components/HelpTooltip.jsx
@@ -0,0 +1,129 @@
+import React, { useCallback, useEffect, useLayoutEffect, useRef, useState } from 'react';
+import { createPortal } from 'react-dom';
+
+export default function HelpTooltip({
+  label,
+  children,
+  anchorClassName = '',
+  popupClassName = '',
+  buttonClassName = '',
+  popupStyle,
+  buttonContent = '?',
+  useFixedPosition = false,
+}) {
+  const [isOpen, setIsOpen] = useState(false);
+  const [fixedPopupStyle, setFixedPopupStyle] = useState(null);
+  const buttonRef = useRef(null);
+  const popupRef = useRef(null);
+
+  const anchorClasses = ['help-tooltip-anchor', anchorClassName].filter(Boolean).join(' ');
+  const buttonClasses = ['help-tooltip-btn', buttonClassName].filter(Boolean).join(' ');
+  const popupClasses = ['help-tooltip-popup', popupClassName].filter(Boolean).join(' ');
+
+  const updateFixedPosition = useCallback(() => {
+    if (!useFixedPosition || !buttonRef.current || !popupRef.current || typeof window === 'undefined') {
+      return;
+    }
+
+    const buttonRect = buttonRef.current.getBoundingClientRect();
+    const popupRect = popupRef.current.getBoundingClientRect();
+    const gap = 10;
+    const viewportPadding = 16;
+
+    let left = buttonRect.right + gap;
+    if (left + popupRect.width > window.innerWidth - viewportPadding) {
+      left = Math.max(viewportPadding, window.innerWidth - popupRect.width - viewportPadding);
+    }
+
+    const top = Math.max(viewportPadding, buttonRect.top - popupRect.height - gap);
+
+    setFixedPopupStyle({
+      position: 'fixed',
+      top: `${top}px`,
+      left: `${left}px`,
+      right: 'auto',
+      bottom: 'auto',
+      zIndex: 100000,
+    });
+  }, [useFixedPosition]);
+
+  const showTooltip = () => {
+    setIsOpen(true);
+  };
+
+  const hideTooltip = () => {
+    setIsOpen(false);
+    setFixedPopupStyle(null);
+  };
+
+  useLayoutEffect(() => {
+    if (isOpen) {
+      updateFixedPosition();
+    }
+  }, [isOpen, updateFixedPosition]);
+
+  useEffect(() => {
+    if (!isOpen || !useFixedPosition || typeof window === 'undefined') {
+      return undefined;
+    }
+
+    const handleViewportChange = () => updateFixedPosition();
+    window.addEventListener('resize', handleViewportChange);
+    window.addEventListener('scroll', handleViewportChange, true);
+
+    return () => {
+      window.removeEventListener('resize', handleViewportChange);
+      window.removeEventListener('scroll', handleViewportChange, true);
+    };
+  }, [isOpen, updateFixedPosition, useFixedPosition]);
+
+  const handleClick = (event) => {
+    // Prevent nested labels from toggling their checkbox when the help icon is clicked.
+    event.preventDefault();
+    event.stopPropagation();
+  };
+
+  const tooltipPopup = isOpen ? (
+    <span
+      ref={popupRef}
+      className={popupClasses}
+      style={
+        useFixedPosition
+          ? {
+              position: 'fixed',
+              top: 0,
+              left: 0,
+              visibility: fixedPopupStyle ? 'visible' : 'hidden',
+              zIndex: 100000,
+              ...fixedPopupStyle,
+              ...popupStyle,
+            }
+          : popupStyle
+      }
+    >
+      {children}
+    </span>
+  ) : null;
+
+  return (
+    <span className={anchorClasses}>
+      <button
+        ref={buttonRef}
+        type="button"
+        className={buttonClasses}
+        aria-label={label}
+        onMouseEnter={showTooltip}
+        onMouseLeave={hideTooltip}
+        onFocus={showTooltip}
+        onBlur={hideTooltip}
+        onClick={handleClick}
+      >
+        {buttonContent}
+      </button>
+      {!useFixedPosition && tooltipPopup}
+      {useFixedPosition && tooltipPopup && typeof document !== 'undefined'
+        ? createPortal(tooltipPopup, document.body)
+        : null}
+    </span>
+  );
+}
diff --git a/frontend/src/components/OpenRouterApiKeyModal.jsx b/frontend/src/components/OpenRouterApiKeyModal.jsx
index 45f4ab3..7aefaf3 100644
--- a/frontend/src/components/OpenRouterApiKeyModal.jsx
+++ b/frontend/src/components/OpenRouterApiKeyModal.jsx
@@ -11,13 +11,21 @@ import './settings-common.css';
  * 2. LM Studio is unavailable and user needs OpenRouter as primary provider
  * 3. User explicitly wants to manage their API key
  */
-export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reason = 'setup' }) {
+export default function OpenRouterApiKeyModal({
+  isOpen,
+  onClose,
+  onKeySet,
+  reason = 'setup',
+  capabilities,
+}) {
   const [apiKey, setApiKey] = useState('');
   const [testing, setTesting] = useState(false);
   const [saving, setSaving] = useState(false);
   const [testResult, setTestResult] = useState(null);
   const [error, setError] = useState('');
   const [hasStoredKey, setHasStoredKey] = useState(false);
+  const genericMode = Boolean(capabilities?.genericMode);
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
 
   // Reset state when modal opens
   useEffect(() => {
@@ -118,9 +126,17 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
   const reasonMessages = {
     setup: 'Configure your OpenRouter API key to use OpenRouter models for any role.',
     startup_setup: 'Save your OpenRouter API key to unlock cloud models. MOTO will apply the recommended default profile immediately, and you can switch to your team profile or another default profile later in Settings.',
-    lm_studio_unavailable: 'LM Studio is not available. Configure OpenRouter to continue.',
+    lm_studio_unavailable: lmStudioEnabled
+      ? 'LM Studio is not available. Configure OpenRouter to continue.'
+      : 'This deployment disables LM Studio. Configure OpenRouter to continue.',
     no_key: 'An OpenRouter API key is required to use OpenRouter models.',
   };
+  const storedKeyCopy = genericMode
+    ? 'An OpenRouter API key is already loaded in this running backend instance. Enter a new key below to replace it for this session.'
+    : 'An OpenRouter API key is already stored securely on the backend for this machine. Enter a new key below to replace it.';
+  const keyStorageFooter = genericMode
+    ? 'This API key is held in backend memory for the active hosted/runtime instance and sent to the backend for OpenRouter API calls. API Boost can reuse this key automatically, or you can override it inside the boost modal.'
+    : 'This API key is stored securely through the backend keyring integration and sent to the backend for OpenRouter API calls. API Boost can reuse this key automatically, or you can override it inside the boost modal.';
 
   return (
     <div 
@@ -183,7 +199,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
               href="https://openrouter.ai/keys" 
               target="_blank" 
               rel="noopener noreferrer"
-              style={{ color: '#6c5ce7' }}
+              style={{ color: '#18cc17' }}
             >
               openrouter.ai/keys
             </a>
@@ -212,8 +228,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
           <div className="test-result-banner test-result-banner--success" style={{
             marginBottom: '1rem',
           }}>
-            An OpenRouter API key is already stored securely on the backend for this machine.
-            Enter a new key below to replace it.
+            {storedKeyCopy}
           </div>
         )}
 
@@ -243,7 +258,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
             style={{
               flex: 1,
               padding: '0.75rem 1rem',
-              backgroundColor: '#6c5ce7',
+              backgroundColor: '#18cc17',
               border: 'none',
               borderRadius: '6px',
               color: '#fff',
@@ -281,8 +296,7 @@ export default function OpenRouterApiKeyModal({ isOpen, onClose, onKeySet, reaso
           backgroundColor: '#0d0d1a',
           borderRadius: '6px',
         }}>
-          This API key is stored securely through the backend keyring integration and sent to the backend for OpenRouter API calls.
-          API Boost can reuse this key automatically, or you can override it inside the boost modal.
+          {keyStorageFooter}
         </p>
       </div>
     </div>
diff --git a/frontend/src/components/OpenRouterPrivacyWarningModal.jsx b/frontend/src/components/OpenRouterPrivacyWarningModal.jsx
index a610ff0..3985132 100644
--- a/frontend/src/components/OpenRouterPrivacyWarningModal.jsx
+++ b/frontend/src/components/OpenRouterPrivacyWarningModal.jsx
@@ -7,9 +7,11 @@ import './settings-common.css';
  * Shows when user's OpenRouter privacy settings block access to free models.
  * Provides clear instructions on how to fix the issue.
  */
-function OpenRouterPrivacyWarningModal({ isOpen, onClose, errorData }) {
+function OpenRouterPrivacyWarningModal({ isOpen, onClose, errorData, capabilities }) {
   if (!isOpen) return null;
 
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
+
   const handleOverlayClick = (e) => {
     if (e.target === e.currentTarget) {
       onClose();
@@ -168,9 +170,15 @@ function OpenRouterPrivacyWarningModal({ isOpen, onClose, errorData }) {
             <li style={{ marginBottom: '8px' }}>
               Use a paid OpenRouter model instead of a free model
             </li>
-            <li>
-              Configure an LM Studio fallback model in Settings
-            </li>
+            {lmStudioEnabled ? (
+              <li>
+                Configure an LM Studio fallback model in Settings
+              </li>
+            ) : (
+              <li>
+                Choose a different OpenRouter model or host provider for this role
+              </li>
+            )}
           </ul>
         </div>
 
@@ -217,7 +225,7 @@ function OpenRouterPrivacyWarningModal({ isOpen, onClose, errorData }) {
           lineHeight: '1.5'
         }}>
           <strong>Note:</strong> This is an OpenRouter account setting, not a MOTO setting. 
-          You only need to configure this once on OpenRouter's website.
+          You only need to configure this once on OpenRouter&apos;s website.
         </div>
       </div>
     </div>
diff --git a/frontend/src/components/StartupProviderSetupModal.jsx b/frontend/src/components/StartupProviderSetupModal.jsx
index 259c5ec..73276a6 100644
--- a/frontend/src/components/StartupProviderSetupModal.jsx
+++ b/frontend/src/components/StartupProviderSetupModal.jsx
@@ -3,6 +3,7 @@ import './settings-common.css';
 
 export default function StartupProviderSetupModal({
   isOpen,
+  capabilities,
   lmStudioAvailable,
   hasUsableLmStudioChatModel = false,
   lmStudioModelCount = 0,
@@ -14,6 +15,8 @@ export default function StartupProviderSetupModal({
 }) {
   if (!isOpen) return null;
 
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
+
   return (
     <div
       className="inline-modal-overlay"
@@ -36,8 +39,17 @@ export default function StartupProviderSetupModal({
         </div>
 
         <p style={{ color: '#ddd', lineHeight: '1.6', marginBottom: '0.9rem' }}>
-          MOTO needs <strong>an OpenRouter API key or a running LM Studio server</strong> before you start.
-          The best experience is to use both: OpenRouter for cloud models and LM Studio for free, faster local RAG and embeddings.
+          {lmStudioEnabled ? (
+            <>
+              MOTO needs <strong>an OpenRouter API key or a running LM Studio server</strong> before you start.
+              The best experience is to use both: OpenRouter for cloud models and LM Studio for free, faster local RAG and embeddings.
+            </>
+          ) : (
+            <>
+              This hosted deployment needs <strong>an OpenRouter API key</strong> before you start.
+              LM Studio is intentionally disabled here, so all model selection and inference routes through OpenRouter.
+            </>
+          )}
         </p>
 
         <div
@@ -51,8 +63,17 @@ export default function StartupProviderSetupModal({
             lineHeight: '1.55',
           }}
         >
-          <strong>Highly recommended:</strong> install LM Studio even if you plan to use OpenRouter. LM Studio
-          gives MOTO free local embedding/RAG calls and noticeably faster retrieval than OpenRouter embeddings.
+          {lmStudioEnabled ? (
+            <>
+              <strong>Highly recommended:</strong> install LM Studio even if you plan to use OpenRouter. LM Studio
+              gives MOTO free local embedding/RAG calls and noticeably faster retrieval than OpenRouter embeddings.
+            </>
+          ) : (
+            <>
+              <strong>Hosted mode:</strong> after you save your OpenRouter key, MOTO will apply the recommended
+              OpenRouter profile immediately. You can fine-tune role models later in the settings screens.
+            </>
+          )}
         </div>
 
         <div style={{ display: 'grid', gap: '1rem', gridTemplateColumns: 'repeat(auto-fit, minmax(280px, 1fr))' }}>
@@ -61,10 +82,10 @@ export default function StartupProviderSetupModal({
               padding: '1rem',
               borderRadius: '10px',
               backgroundColor: '#1c1c33',
-              border: '1px solid #34345c',
+              border: '1px solid #18cc17',
             }}
           >
-            <h3 style={{ marginTop: 0, color: '#a29bfe' }}>OpenRouter Setup</h3>
+            <h3 style={{ marginTop: 0, color: '#18cc17' }}>OpenRouter Setup</h3>
             <ol style={{ margin: '0 0 1rem 1.1rem', padding: 0, color: '#d7d7e8', lineHeight: '1.55' }}>
               <li>Create or sign in to your account at <a href="https://openrouter.ai/" target="_blank" rel="noopener noreferrer" style={{ color: '#8ab4ff' }}>openrouter.ai</a>.</li>
               <li>Generate an API key at <a href="https://openrouter.ai/keys" target="_blank" rel="noopener noreferrer" style={{ color: '#8ab4ff' }}>openrouter.ai/keys</a>.</li>
@@ -76,7 +97,7 @@ export default function StartupProviderSetupModal({
               style={{
                 width: '100%',
                 padding: '0.8rem 1rem',
-                backgroundColor: '#6c5ce7',
+                backgroundColor: '#18cc17',
                 border: 'none',
                 borderRadius: '8px',
                 color: '#fff',
@@ -89,41 +110,43 @@ export default function StartupProviderSetupModal({
             </button>
           </div>
 
-          <div
-            style={{
-              padding: '1rem',
-              borderRadius: '10px',
-              backgroundColor: '#1c1c33',
-              border: '1px solid #2f5c36',
-            }}
-          >
-            <h3 style={{ marginTop: 0, color: '#7CFC90' }}>LM Studio Setup</h3>
-            <ol style={{ margin: '0 0 1rem 1.1rem', padding: 0, color: '#d7d7e8', lineHeight: '1.55' }}>
-              <li>Install LM Studio from <a href="https://lmstudio.ai/" target="_blank" rel="noopener noreferrer" style={{ color: '#8ab4ff' }}>lmstudio.ai</a>.</li>
-              <li>Enable Developer or Power User mode if needed, then open the server tab.</li>
-              <li>Load the embedding model <code>nomic-ai/nomic-embed-text-v1.5</code>.</li>
-              <li>Optionally load one or more local chat models, then start the local server on <code>http://127.0.0.1:1234</code>.</li>
-            </ol>
-            <button
-              type="button"
-              onClick={onConfirmLmStudio}
-              disabled={isCheckingLmStudio}
+          {lmStudioEnabled && (
+            <div
               style={{
-                width: '100%',
-                padding: '0.8rem 1rem',
-                backgroundColor: lmStudioAvailable && hasUsableLmStudioChatModel ? '#1f7a33' : '#21492a',
-                border: '1px solid #2f8f45',
-                borderRadius: '8px',
-                color: '#fff',
-                fontSize: '0.95rem',
-                fontWeight: '600',
-                cursor: isCheckingLmStudio ? 'not-allowed' : 'pointer',
-                opacity: isCheckingLmStudio ? 0.7 : 1,
+                padding: '1rem',
+                borderRadius: '10px',
+                backgroundColor: '#1c1c33',
+                border: '1px solid #2f5c36',
               }}
             >
-              {isCheckingLmStudio ? 'Checking LM Studio...' : "I'm Running LM Studio"}
-            </button>
-          </div>
+              <h3 style={{ marginTop: 0, color: '#7CFC90' }}>LM Studio Setup</h3>
+              <ol style={{ margin: '0 0 1rem 1.1rem', padding: 0, color: '#d7d7e8', lineHeight: '1.55' }}>
+                <li>Install LM Studio from <a href="https://lmstudio.ai/" target="_blank" rel="noopener noreferrer" style={{ color: '#8ab4ff' }}>lmstudio.ai</a>.</li>
+                <li>Enable Developer or Power User mode if needed, then open the server tab.</li>
+                <li>Load the embedding model <code>nomic-ai/nomic-embed-text-v1.5</code>.</li>
+                <li>Optionally load one or more local chat models, then start the local server on <code>http://127.0.0.1:1234</code>.</li>
+              </ol>
+              <button
+                type="button"
+                onClick={onConfirmLmStudio}
+                disabled={isCheckingLmStudio}
+                style={{
+                  width: '100%',
+                  padding: '0.8rem 1rem',
+                  backgroundColor: lmStudioAvailable && hasUsableLmStudioChatModel ? '#1f7a33' : '#21492a',
+                  border: '1px solid #2f8f45',
+                  borderRadius: '8px',
+                  color: '#fff',
+                  fontSize: '0.95rem',
+                  fontWeight: '600',
+                  cursor: isCheckingLmStudio ? 'not-allowed' : 'pointer',
+                  opacity: isCheckingLmStudio ? 0.7 : 1,
+                }}
+              >
+                {isCheckingLmStudio ? 'Checking LM Studio...' : "I'm Running LM Studio"}
+              </button>
+            </div>
+          )}
         </div>
 
         <div
@@ -131,17 +154,25 @@ export default function StartupProviderSetupModal({
             marginTop: '1rem',
             padding: '0.9rem 1rem',
             borderRadius: '8px',
-            backgroundColor: lmStudioAvailable ? 'rgba(30, 255, 28, 0.08)' : 'rgba(255, 184, 77, 0.08)',
-            border: lmStudioAvailable ? '1px solid rgba(30, 255, 28, 0.25)' : '1px solid rgba(255, 184, 77, 0.28)',
-            color: lmStudioAvailable ? '#dbffdd' : '#ffe1ad',
+            backgroundColor: lmStudioEnabled
+              ? (lmStudioAvailable ? 'rgba(30, 255, 28, 0.08)' : 'rgba(255, 184, 77, 0.08)')
+              : 'rgba(24, 204, 23, 0.12)',
+            border: lmStudioEnabled
+              ? (lmStudioAvailable ? '1px solid rgba(30, 255, 28, 0.25)' : '1px solid rgba(255, 184, 77, 0.28)')
+              : '1px solid rgba(24, 204, 23, 0.3)',
+            color: lmStudioEnabled ? (lmStudioAvailable ? '#dbffdd' : '#ffe1ad') : '#dbffdd',
             lineHeight: '1.5',
           }}
         >
-          {lmStudioAvailable && hasUsableLmStudioChatModel
-            ? `LM Studio is currently detected with ${lmStudioModelCount} loaded model${lmStudioModelCount === 1 ? '' : 's'}, including a usable chat model.`
-            : lmStudioAvailable
-              ? 'LM Studio is running, but you still need at least one loaded chat model in addition to embeddings.'
-              : `LM Studio is not detected yet${lmStudioError ? `: ${lmStudioError}` : '.'}`}
+          {lmStudioEnabled
+            ? (
+              lmStudioAvailable && hasUsableLmStudioChatModel
+                ? `LM Studio is currently detected with ${lmStudioModelCount} loaded model${lmStudioModelCount === 1 ? '' : 's'}, including a usable chat model.`
+                : lmStudioAvailable
+                  ? 'LM Studio is running, but you still need at least one loaded chat model in addition to embeddings.'
+                  : `LM Studio is not detected yet${lmStudioError ? `: ${lmStudioError}` : '.'}`
+            )
+            : 'Hosted web mode is active. LM Studio is disabled in this deployment, so OpenRouter is the required provider path.'}
         </div>
 
         {statusMessage && (
diff --git a/frontend/src/components/WorkflowPanel.jsx b/frontend/src/components/WorkflowPanel.jsx
index fd868e7..b8fad9b 100644
--- a/frontend/src/components/WorkflowPanel.jsx
+++ b/frontend/src/components/WorkflowPanel.jsx
@@ -3,7 +3,14 @@ import { websocket } from '../services/websocket';
 import { boostAPI, workflowAPI } from '../services/api';
 import './WorkflowPanel.css';
 
+const HOURLY_AUTO_OPEN_INTERVAL_SECONDS = 3600;
+const WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY = 'workflow_panel_last_auto_open_hour';
+
 const formatNumber = (n) => n.toLocaleString();
+const getStoredAutoOpenHour = () => { // Persisted elapsed-hour mark of the last auto-open; 0 if unset/invalid.
+  const savedHour = Number.parseInt(localStorage.getItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY) || '0', 10);
+  return Number.isFinite(savedHour) && savedHour > 0 ? savedHour : 0;
+};
 
 const formatTime = (totalSeconds) => {
   const h = Math.floor(totalSeconds / 3600);
@@ -30,6 +37,8 @@ export default function WorkflowPanel({ isRunning }) {
   const [showPerModel, setShowPerModel] = useState(false);
   const [localElapsed, setLocalElapsed] = useState(0);
   const lastSyncRef = useRef(Date.now());
+  const hasElapsedSyncRef = useRef(false);
+  const lastAutoOpenedHourRef = useRef(getStoredAutoOpenHour());
 
   const expandPanel = useCallback(() => {
     setCollapsed(false);
@@ -73,6 +82,35 @@ export default function WorkflowPanel({ isRunning }) {
     }
   }, [boostEnabled, expandPanel]);
 
+  useEffect(() => {
+    if (!hasElapsedSyncRef.current) {
+      return;
+    }
+    // Elapsed hours below the stored mark means a newer run (timer restarted): clear the mark.
+    if (Math.floor(localElapsed / HOURLY_AUTO_OPEN_INTERVAL_SECONDS) < lastAutoOpenedHourRef.current) {
+      lastAutoOpenedHourRef.current = 0;
+      localStorage.setItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY, '0');
+    }
+  }, [localElapsed]);
+
+  useEffect(() => {
+    if (!isRunning || !hasElapsedSyncRef.current) {
+      return;
+    }
+    // Expand the panel at most once per full elapsed hour of the run (hour 1, 2, ...).
+    const elapsedHours = Math.floor(localElapsed / HOURLY_AUTO_OPEN_INTERVAL_SECONDS);
+    if (elapsedHours < 1 || elapsedHours <= lastAutoOpenedHourRef.current) {
+      return;
+    }
+
+    if (collapsed) {
+      expandPanel();
+    }
+    // Record the hour in the ref and in localStorage even if the panel was already open.
+    lastAutoOpenedHourRef.current = elapsedHours;
+    localStorage.setItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY, elapsedHours.toString());
+  }, [collapsed, expandPanel, isRunning, localElapsed]);
+
   useEffect(() => {
     if (!isEditingBoostNext) {
       setBoostNextInput(boostNextCount > 0 ? boostNextCount.toString() : '');
@@ -120,10 +158,13 @@ export default function WorkflowPanel({ isRunning }) {
 
   // Token stats: initial fetch on mount and when isRunning changes
   useEffect(() => {
+    hasElapsedSyncRef.current = false;
+
     const fetchTokenStats = async () => {
       try {
         const resp = await workflowAPI.getTokenStats();
         if (resp.success) {
+          hasElapsedSyncRef.current = true;
           setTokenStats(resp);
           setLocalElapsed(resp.elapsed_seconds || 0);
           lastSyncRef.current = Date.now();
@@ -136,6 +177,7 @@ export default function WorkflowPanel({ isRunning }) {
   // Token stats: listen for real-time WebSocket updates
   useEffect(() => {
     const handleTokenUpdate = (data) => {
+      hasElapsedSyncRef.current = true;
       setTokenStats(data);
       setLocalElapsed(data.elapsed_seconds || 0);
       lastSyncRef.current = Date.now();
diff --git a/frontend/src/components/aggregator/AggregatorInterface.jsx b/frontend/src/components/aggregator/AggregatorInterface.jsx
index 343790d..7be6406 100644
--- a/frontend/src/components/aggregator/AggregatorInterface.jsx
+++ b/frontend/src/components/aggregator/AggregatorInterface.jsx
@@ -3,10 +3,16 @@ import { api } from '../../services/api';
 import TextFileUploader from '../TextFileUploader';
 import '../settings-common.css';
 
-export default function AggregatorInterface({ config, setConfig, anyWorkflowRunning = false }) {
+export default function AggregatorInterface({
+  config,
+  setConfig,
+  capabilities,
+  anyWorkflowRunning = false,
+}) {
   const [isRunning, setIsRunning] = useState(false);
   const [status, setStatus] = useState(null);
   const [uploadedFiles, setUploadedFiles] = useState([]);
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
 
   useEffect(() => {
     fetchStatus();
@@ -80,10 +86,10 @@ export default function AggregatorInterface({ config, setConfig, anyWorkflowRunn
       // Format submitter configs for backend (includes OpenRouter provider fields)
       const formattedConfigs = submitterConfigs.map(s => ({
         submitter_id: s.submitterId,
-        provider: s.provider || 'lm_studio',
+        provider: lmStudioEnabled ? (s.provider || 'lm_studio') : 'openrouter',
         model_id: s.modelId,
         openrouter_provider: s.openrouterProvider || null,
-        lm_studio_fallback_id: s.lmStudioFallbackId || null,
+        lm_studio_fallback_id: lmStudioEnabled ? (s.lmStudioFallbackId || null) : null,
         context_window: s.contextWindow,
         max_output_tokens: s.maxOutputTokens
       }));
@@ -92,10 +98,10 @@ export default function AggregatorInterface({ config, setConfig, anyWorkflowRunn
         user_prompt: config.userPrompt,
         submitter_configs: formattedConfigs,
         // Validator config with OpenRouter support
-        validator_provider: config.validatorProvider || 'lm_studio',
+        validator_provider: lmStudioEnabled ? (config.validatorProvider || 'lm_studio') : 'openrouter',
         validator_model: config.validatorModel,
         validator_openrouter_provider: config.validatorOpenrouterProvider || null,
-        validator_lm_studio_fallback: config.validatorLmStudioFallback || null,
+        validator_lm_studio_fallback: lmStudioEnabled ? (config.validatorLmStudioFallback || null) : null,
         validator_context_size: config.validatorContextSize,
         validator_max_output_tokens: config.validatorMaxOutput || 25000,
         uploaded_files: config.uploadedFiles,
diff --git a/frontend/src/components/aggregator/AggregatorLogs.jsx b/frontend/src/components/aggregator/AggregatorLogs.jsx
index c1eebec..e837430 100644
--- a/frontend/src/components/aggregator/AggregatorLogs.jsx
+++ b/frontend/src/components/aggregator/AggregatorLogs.jsx
@@ -49,7 +49,7 @@ export default function AggregatorLogs() {
 
   const fetchRecoveryStatus = async () => {
     try {
-      const response = await fetch('http://localhost:8000/api/aggregator/status/recovery');
+      const response = await fetch('/api/aggregator/status/recovery');
       if (response.ok) {
         const data = await response.json();
         setRecoveryStatus(data);
@@ -61,7 +61,7 @@ export default function AggregatorLogs() {
 
   const fetchPersistedEvents = async () => {
     try {
-      const response = await fetch('http://localhost:8000/api/aggregator/events');
+      const response = await fetch('/api/aggregator/events');
       if (response.ok) {
         const data = await response.json();
         if (data.events && data.events.length > 0) {
@@ -253,7 +253,7 @@ export default function AggregatorLogs() {
                         Failures: {count}/{recoveryStatus.corruption_threshold}
                       </div>
                       {recoveryStatus.recovery_attempts && recoveryStatus.recovery_attempts[model] > 0 && (
-                        <div style={{ color: '#2196F3' }}>
+                        <div style={{ color: '#18cc17' }}>
                           Recoveries: {recoveryStatus.recovery_attempts[model]}
                         </div>
                       )}
diff --git a/frontend/src/components/aggregator/AggregatorSettings.jsx b/frontend/src/components/aggregator/AggregatorSettings.jsx
index a7baffb..46d0cf9 100644
--- a/frontend/src/components/aggregator/AggregatorSettings.jsx
+++ b/frontend/src/components/aggregator/AggregatorSettings.jsx
@@ -1,5 +1,12 @@
 import React, { useState, useEffect } from 'react';
 import { api, openRouterAPI } from '../../services/api';
+import {
+  computeOpenRouterAutoSettings,
+  findOpenRouterModel,
+  getProviderNames,
+  hasEndpointMetadata,
+} from '../../utils/openRouterSelection';
+import HelpTooltip from '../HelpTooltip';
 import '../settings-common.css';
 
 const DEFAULT_SUBMITTER_CONFIG = {
@@ -12,10 +19,10 @@ const DEFAULT_SUBMITTER_CONFIG = {
   maxOutputTokens: 25000
 };
 
-export default function AggregatorSettings({ config, setConfig }) {
+export default function AggregatorSettings({ config, setConfig, capabilities }) {
   const [lmStudioModels, setLmStudioModels] = useState([]);
   const [openRouterModels, setOpenRouterModels] = useState([]);
-  const [modelProviders, setModelProviders] = useState({}); // { modelId: [providers] }
+  const [modelProviders, setModelProviders] = useState({}); // { modelId: { providers: [], endpoints: [] } }
   const [loading, setLoading] = useState(true);
   const [saveMessage, setSaveMessage] = useState('');
   const [numSubmitters, setNumSubmitters] = useState(
@@ -42,6 +49,7 @@ export default function AggregatorSettings({ config, setConfig }) {
   const [freeModelLooping, setFreeModelLooping] = useState(true);
   const [freeModelAutoSelector, setFreeModelAutoSelector] = useState(true);
   const [isLoaded, setIsLoaded] = useState(false);
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
 
   // Load settings from localStorage on mount
   useEffect(() => {
@@ -107,9 +115,66 @@ export default function AggregatorSettings({ config, setConfig }) {
   }, [isLoaded, numSubmitters, submitterConfigs, validatorProvider, validatorOpenrouterProvider, validatorLmStudioFallback, validatorMaxOutput, freeOnly, freeModelLooping, freeModelAutoSelector, modelProviders]);
 
   useEffect(() => {
-    fetchModels();
+    if (lmStudioEnabled) {
+      fetchModels();
+    } else {
+      setLmStudioModels([]);
+      setLoading(false);
+    }
     checkOpenRouterKey();
-  }, []);
+  }, [lmStudioEnabled]);
+
+  useEffect(() => {
+    if (lmStudioEnabled) {
+      return;
+    }
+    // LM Studio is disabled: coerce every submitter to OpenRouter, keeping model/host only if it already was one.
+    const normalizedSubmitters = submitterConfigs.map((submitterConfig) => {
+      const keepOpenRouterState = submitterConfig.provider === 'openrouter';
+      return {
+        ...submitterConfig,
+        provider: 'openrouter',
+        modelId: keepOpenRouterState ? (submitterConfig.modelId || '') : '',
+        openrouterProvider: keepOpenRouterState ? (submitterConfig.openrouterProvider || null) : null,
+        lmStudioFallbackId: null,
+      };
+    });
+    const keepValidatorOpenRouterState = validatorProvider === 'openrouter';
+
+    if (JSON.stringify(normalizedSubmitters) !== JSON.stringify(submitterConfigs)) {
+      setSubmitterConfigs(normalizedSubmitters);
+    }
+    if (validatorProvider !== 'openrouter') {
+      setValidatorProvider('openrouter');
+    }
+    if (validatorOpenrouterProvider !== (keepValidatorOpenRouterState ? (validatorOpenrouterProvider || null) : null)) {
+      setValidatorOpenrouterProvider(keepValidatorOpenRouterState ? (validatorOpenrouterProvider || null) : null);
+    }
+    if (validatorLmStudioFallback !== null) {
+      setValidatorLmStudioFallback(null);
+    }
+    // Mirror the normalized values into the shared config, returning `prev` itself when nothing changed.
+    setConfig((prev) => {
+      const next = {
+        ...prev,
+        submitterConfigs: normalizedSubmitters,
+        validatorProvider: 'openrouter',
+        validatorModel: keepValidatorOpenRouterState ? (prev.validatorModel || '') : '',
+        validatorOpenrouterProvider: keepValidatorOpenRouterState
+          ? (prev.validatorOpenrouterProvider || null)
+          : null,
+        validatorLmStudioFallback: null,
+      };
+      return JSON.stringify(next) === JSON.stringify(prev) ? prev : next;
+    });
+  }, [
+    lmStudioEnabled,
+    submitterConfigs,
+    validatorProvider,
+    validatorOpenrouterProvider,
+    validatorLmStudioFallback,
+    setConfig,
+  ]);
 
   const checkOpenRouterKey = async () => {
     try {
@@ -143,13 +208,151 @@ export default function AggregatorSettings({ config, setConfig }) {
   }, [freeOnly]);
 
   const fetchProvidersForModel = async (modelId) => {
-    if (!modelId || modelProviders[modelId]) return;
+    if (!modelId) return null;
+
+    const cachedProviderData = modelProviders[modelId];
+    if (hasEndpointMetadata(cachedProviderData)) {
+      return cachedProviderData;
+    }
+
     try {
       const result = await openRouterAPI.getProviders(modelId);
-      setModelProviders(prev => ({ ...prev, [modelId]: result.providers || [] }));
+      const providerData = {
+        providers: result.providers || [],
+        endpoints: result.endpoints || [],
+      };
+      setModelProviders(prev => ({ ...prev, [modelId]: providerData }));
+      return providerData;
     } catch (err) {
       console.error(`Failed to fetch providers for ${modelId}:`, err);
+      return cachedProviderData || null;
+    }
+  };
+
+  const getAutoSettingsForModel = async (modelId, selectedProvider = null) => {
+    const model = findOpenRouterModel(openRouterModels, modelId);
+    if (!model) {
+      return null;
+    }
+    // Provider data comes from fetchProvidersForModel and may be null if it could not be fetched.
+    const providerData = await fetchProvidersForModel(modelId);
+    return computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+  };
+
+  const handleSubmitterModelChange = async (submitterId, modelId) => {
+    // Apply the selection right away; the host provider is model-specific, so clear it.
+    const baseConfigs = submitterConfigs.map(c =>
+      c.submitterId === submitterId ? { ...c, modelId, openrouterProvider: null } : c
+    );
+    setSubmitterConfigs(baseConfigs);
+    setConfig(prev => ({ ...prev, submitterConfigs: baseConfigs }));
+
+    const targetConfig = baseConfigs.find(c => c.submitterId === submitterId);
+    if (targetConfig?.provider !== 'openrouter' || !modelId) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(modelId, null);
+    if (!autoSettings) {
+      return;
+    }
+
+    // The lookup is async: patch the *current* state (not the pre-await snapshot) and only while
+    // this submitter still has the same selection, so edits made meanwhile are not reverted.
+    const isStillCurrent = (c) =>
+      c.submitterId === submitterId && c.provider === 'openrouter'
+      && c.modelId === modelId && !c.openrouterProvider;
+    const applyAutoSettings = (configs) => configs.map(c =>
+      isStillCurrent(c)
+        ? { ...c, contextWindow: autoSettings.contextWindow, maxOutputTokens: autoSettings.maxOutputTokens }
+        : c
+    );
+    setSubmitterConfigs(applyAutoSettings);
+    setConfig(prev => ({ ...prev, submitterConfigs: applyAutoSettings(prev.submitterConfigs || baseConfigs) }));
+  };
+
+  const handleSubmitterOpenRouterProviderChange = async (submitterId, providerName) => {
+    // Store the chosen host provider right away.
+    const baseConfigs = submitterConfigs.map(c =>
+      c.submitterId === submitterId ? { ...c, openrouterProvider: providerName } : c
+    );
+    setSubmitterConfigs(baseConfigs);
+    setConfig(prev => ({ ...prev, submitterConfigs: baseConfigs }));
+
+    const targetConfig = baseConfigs.find(c => c.submitterId === submitterId);
+    if (!targetConfig?.modelId) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(targetConfig.modelId, providerName);
+    if (!autoSettings) {
+      return;
+    }
+
+    // The lookup is async: patch the *current* state (not the pre-await snapshot) and only while
+    // this submitter still has the same model and host, so edits made meanwhile are not reverted.
+    const isStillCurrent = (c) =>
+      c.submitterId === submitterId
+      && c.modelId === targetConfig.modelId && c.openrouterProvider === providerName;
+    const applyAutoSettings = (configs) => configs.map(c =>
+      isStillCurrent(c)
+        ? { ...c, contextWindow: autoSettings.contextWindow, maxOutputTokens: autoSettings.maxOutputTokens }
+        : c
+    );
+    setSubmitterConfigs(applyAutoSettings);
+    setConfig(prev => ({ ...prev, submitterConfigs: applyAutoSettings(prev.submitterConfigs || baseConfigs) }));
+  };
+
+  const handleValidatorModelChange = async (modelId) => {
+    setConfig(prev => ({
+      ...prev,
+      validatorModel: modelId,
+      validatorOpenrouterProvider: null,
+    }));
+    setValidatorOpenrouterProvider(null);
+
+    if (validatorProvider !== 'openrouter' || !modelId) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(modelId, null);
+    if (!autoSettings) {
+      return;
+    }
+    // NOTE(review): runs after the await and re-writes validatorModel/provider; a newer selection made meanwhile would be overwritten - confirm.
+    setValidatorMaxOutput(autoSettings.maxOutputTokens);
+    setConfig(prev => ({
+      ...prev,
+      validatorModel: modelId,
+      validatorOpenrouterProvider: null,
+      validatorContextSize: autoSettings.contextWindow,
+      validatorMaxOutput: autoSettings.maxOutputTokens,
+    }));
+  };
+
+  const handleValidatorOpenRouterProviderChange = async (providerName) => {
+    setValidatorOpenrouterProvider(providerName);
+    setConfig(prev => ({
+      ...prev,
+      validatorOpenrouterProvider: providerName,
+    }));
+
+    if (!config.validatorModel) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(config.validatorModel, providerName);
+    if (!autoSettings) {
+      return;
     }
+    // NOTE(review): runs after the await and re-writes providerName plus limits; a newer model/host choice made meanwhile would be overwritten - confirm.
+    setValidatorMaxOutput(autoSettings.maxOutputTokens);
+    setConfig(prev => ({
+      ...prev,
+      validatorOpenrouterProvider: providerName,
+      validatorContextSize: autoSettings.contextWindow,
+      validatorMaxOutput: autoSettings.maxOutputTokens,
+    }));
   };
 
   // Handle number of submitters change - expand/contract configs
@@ -182,13 +385,20 @@ export default function AggregatorSettings({ config, setConfig }) {
   };
 
   const fetchModels = async () => {
+    if (!lmStudioEnabled) {
+      setLmStudioModels([]);
+      setLoading(false);
+      return;
+    }
+
     try {
       const data = await api.getModels();
-      setLmStudioModels(data);
+      const nextModels = data.models || data || [];
+      setLmStudioModels(nextModels);
       
       // Auto-select first model if none selected (only for LM Studio provider)
-      if (data.length > 0) {
-        const firstModelId = data[0].id;
+      if (nextModels.length > 0) {
+        const firstModelId = nextModels[0].id;
         
         // Update submitter configs with first model if needed
         const updatedConfigs = submitterConfigs.map(s => ({
@@ -230,12 +440,7 @@ export default function AggregatorSettings({ config, setConfig }) {
         updated.openrouterProvider = null;
         updated.lmStudioFallbackId = null;
       }
-      
-      // If selecting OpenRouter model, fetch providers
-      if (field === 'modelId' && c.provider === 'openrouter' && safeValue) {
-        fetchProvidersForModel(safeValue);
-      }
-      
+
       return updated;
     });
     
@@ -289,32 +494,41 @@ export default function AggregatorSettings({ config, setConfig }) {
     onFallbackChange,
     label = 'Model'
   }) => {
-    const models = provider === 'openrouter' ? openRouterModels : lmStudioModels;
-    const providers = modelId && provider === 'openrouter' ? (modelProviders[modelId] || []) : [];
+    const effectiveProvider = lmStudioEnabled ? provider : 'openrouter';
+    const models = effectiveProvider === 'openrouter' ? openRouterModels : lmStudioModels;
+    const providers = modelId && effectiveProvider === 'openrouter'
+      ? getProviderNames(modelProviders[modelId])
+      : [];
     
     return (
       <>
         {/* Provider Toggle */}
         <div className="form-group form-group--compact">
           <label className="label--sm">Provider</label>
-          <div className="provider-toggle-group">
-            <button
-              type="button"
-              onClick={() => onProviderChange('lm_studio')}
-              className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
-            >
-              LM Studio
-            </button>
-            <button
-              type="button"
-              onClick={() => hasOpenRouterKey && onProviderChange('openrouter')}
-              disabled={!hasOpenRouterKey}
-              className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
-              title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
-            >
-              OpenRouter
-            </button>
-          </div>
+          {lmStudioEnabled ? (
+            <div className="provider-toggle-group">
+              <button
+                type="button"
+                onClick={() => onProviderChange('lm_studio')}
+                className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
+              >
+                LM Studio
+              </button>
+              <button
+                type="button"
+                onClick={() => hasOpenRouterKey && onProviderChange('openrouter')}
+                disabled={!hasOpenRouterKey}
+                className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
+                title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
+              >
+                OpenRouter
+              </button>
+            </div>
+          ) : (
+            <small className="hint-text hint-text--dim">
+              OpenRouter is required in this deployment.
+            </small>
+          )}
         </div>
 
         {/* Model Selection */}
@@ -327,7 +541,7 @@ export default function AggregatorSettings({ config, setConfig }) {
           >
             <option value="">Select model...</option>
             {models.map(model => {
-              const isFree = provider === 'openrouter' && 
+              const isFree = effectiveProvider === 'openrouter' && 
                             model.pricing?.prompt === "0" && 
                             model.pricing?.completion === "0";
               const displayName = model.name || model.id;
@@ -343,7 +557,7 @@ export default function AggregatorSettings({ config, setConfig }) {
         </div>
 
         {/* OpenRouter Provider Selection (only for OpenRouter) */}
-        {provider === 'openrouter' && modelId && (
+        {effectiveProvider === 'openrouter' && modelId && (
           <div className="form-group form-group--compact">
             <label className="label--sm">Host Provider (optional)</label>
             <select
@@ -360,7 +574,7 @@ export default function AggregatorSettings({ config, setConfig }) {
         )}
 
         {/* LM Studio Fallback (only for OpenRouter) */}
-        {provider === 'openrouter' && (
+        {effectiveProvider === 'openrouter' && lmStudioEnabled && (
           <div className="form-group form-group--compact">
             <label className="label--sm label--muted">
               LM Studio Fallback (optional)
@@ -406,11 +620,15 @@ export default function AggregatorSettings({ config, setConfig }) {
 
       {loading ? (
         <div>Loading models...</div>
-      ) : lmStudioModels.length === 0 && !hasOpenRouterKey ? (
+      ) : lmStudioEnabled && lmStudioModels.length === 0 && !hasOpenRouterKey ? (
         <div className="error-text">
           <p>No models found. Make sure LM Studio is running on http://127.0.0.1:1234 or configure OpenRouter.</p>
           <button onClick={fetchModels} className="secondary">Retry</button>
         </div>
+      ) : !lmStudioEnabled && !hasOpenRouterKey ? (
+        <div className="error-text">
+          <p>This deployment disables LM Studio. Set an OpenRouter API key in the header to configure models.</p>
+        </div>
       ) : (
         <>
           {/* Number of Submitters Slider */}
@@ -451,7 +669,7 @@ export default function AggregatorSettings({ config, setConfig }) {
                   <h4 style={{ margin: 0 }} className={cfg.provider === 'openrouter' ? 'card-title--purple' : (cfg.submitterId === 1 ? 'card-title--green' : '')}>
                     Submitter {cfg.submitterId} 
                     {cfg.submitterId === 1 && <span className="provider-badge-inline"> (Main Submitter)</span>}
-                    {cfg.provider === 'openrouter' && <span className="provider-badge-inline" style={{ color: '#6c5ce7' }}> [OpenRouter]</span>}
+                    {cfg.provider === 'openrouter' && <span className="provider-badge-inline" style={{ color: '#18cc17' }}> [OpenRouter]</span>}
                   </h4>
                   {cfg.submitterId === 1 && numSubmitters > 1 && (
                     <button 
@@ -470,8 +688,8 @@ export default function AggregatorSettings({ config, setConfig }) {
                     openrouterProvider={cfg.openrouterProvider}
                     lmStudioFallbackId={cfg.lmStudioFallbackId}
                     onProviderChange={(p) => updateSubmitterConfig(cfg.submitterId, 'provider', p)}
-                    onModelChange={(m) => updateSubmitterConfig(cfg.submitterId, 'modelId', m)}
-                    onOpenrouterProviderChange={(p) => updateSubmitterConfig(cfg.submitterId, 'openrouterProvider', p)}
+                    onModelChange={(m) => handleSubmitterModelChange(cfg.submitterId, m)}
+                    onOpenrouterProviderChange={(p) => handleSubmitterOpenRouterProviderChange(cfg.submitterId, p)}
                     onFallbackChange={(f) => updateSubmitterConfig(cfg.submitterId, 'lmStudioFallbackId', f)}
                   />
 
@@ -522,16 +740,8 @@ export default function AggregatorSettings({ config, setConfig }) {
                 openrouterProvider={validatorOpenrouterProvider}
                 lmStudioFallbackId={validatorLmStudioFallback}
                 onProviderChange={updateValidatorProvider}
-                onModelChange={(m) => {
-                  setConfig({ ...config, validatorModel: m });
-                  if (validatorProvider === 'openrouter' && m) {
-                    fetchProvidersForModel(m);
-                  }
-                }}
-                onOpenrouterProviderChange={(p) => {
-                  setValidatorOpenrouterProvider(p);
-                  setConfig({ ...config, validatorOpenrouterProvider: p });
-                }}
+                onModelChange={handleValidatorModelChange}
+                onOpenrouterProviderChange={handleValidatorOpenRouterProviderChange}
                 onFallbackChange={(f) => {
                   setValidatorLmStudioFallback(f);
                   setConfig({ ...config, validatorLmStudioFallback: f });
@@ -554,7 +764,7 @@ export default function AggregatorSettings({ config, setConfig }) {
                 step="1024"
               />
               <small className="hint-text">
-                {validatorProvider === 'lm_studio' 
+                {validatorProvider === 'lm_studio' && lmStudioEnabled
                   ? 'Must match the context length you set in LM Studio for this model.'
                   : 'Set based on the OpenRouter model\'s context window.'
                 }
@@ -564,9 +774,13 @@ export default function AggregatorSettings({ config, setConfig }) {
             <div className="form-group">
               <label>
                 Validator Max Output Tokens{' '}
-                <span className="help-hint" title="Default: 25000">
-                  ℹ️
-                </span>
+                <HelpTooltip
+                  label="Learn about validator max output tokens"
+                  anchorClassName="help-tooltip-anchor--inline"
+                  buttonContent="?"
+                >
+                  Default: 25000
+                </HelpTooltip>
               </label>
               <input
                 type="number"
@@ -584,9 +798,11 @@ export default function AggregatorSettings({ config, setConfig }) {
             </div>
           </div>
 
-          <button onClick={fetchModels} className="secondary mr-05">
-            Refresh LM Studio Models
-          </button>
+          {lmStudioEnabled && (
+            <button onClick={fetchModels} className="secondary mr-05">
+              Refresh LM Studio Models
+            </button>
+          )}
           {hasOpenRouterKey && (
             <>
               <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary mr-05" disabled={loadingOpenRouter}>
@@ -611,7 +827,12 @@ export default function AggregatorSettings({ config, setConfig }) {
                     }}
                   />
                   Enable Free Model Looping
-                  <span className="help-hint" title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.">(?)</span>
+                  <HelpTooltip
+                    label="Learn about free model looping"
+                    anchorClassName="help-tooltip-anchor--inline"
+                  >
+                    When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.
+                  </HelpTooltip>
                 </label>
                 <label className="settings-checkbox-label">
                   <input
@@ -623,7 +844,12 @@ export default function AggregatorSettings({ config, setConfig }) {
                     }}
                   />
                   Use OpenRouter Free Models Auto-Selector as Backup
-                  <span className="help-hint" title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping.">(?)</span>
+                  <HelpTooltip
+                    label="Learn about the free models auto-selector backup"
+                    anchorClassName="help-tooltip-anchor--inline"
+                  >
+                    When all selected free models are rate-limited, use OpenRouter&apos;s Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping.
+                  </HelpTooltip>
                 </label>
               </div>
             </>
diff --git a/frontend/src/components/autonomous/ArchiveViewerModal.css b/frontend/src/components/autonomous/ArchiveViewerModal.css
index 86ba3c2..7dd8c6b 100644
--- a/frontend/src/components/autonomous/ArchiveViewerModal.css
+++ b/frontend/src/components/autonomous/ArchiveViewerModal.css
@@ -78,8 +78,8 @@
 }
 
 .archive-tab--active {
-  color: #60a5fa;
-  border-bottom-color: #60a5fa;
+  color: #18cc17;
+  border-bottom-color: #18cc17;
 }
 
 .archive-tab-icon {
@@ -163,7 +163,7 @@
 
 /* Detail view */
 .archive-back-btn {
-  color: #60a5fa;
+  color: #18cc17;
   background: transparent;
   border: none;
   cursor: pointer;
@@ -177,7 +177,7 @@
 }
 
 .archive-back-btn:hover {
-  color: #93c5fd;
+  color: #1eff1c; /* brighter than the resting #18cc17 so hover stays visible */
 }
 
 .archive-detail {
@@ -255,7 +255,7 @@
 .archive-icon-header {
   width: 20px;
   height: 20px;
-  color: #60a5fa;
+  color: #18cc17;
 }
 
 .archive-icon-close {
diff --git a/frontend/src/components/autonomous/AutonomousResearch.css b/frontend/src/components/autonomous/AutonomousResearch.css
index f05d2d4..061002a 100644
--- a/frontend/src/components/autonomous/AutonomousResearch.css
+++ b/frontend/src/components/autonomous/AutonomousResearch.css
@@ -84,7 +84,7 @@
 }
 
 .log-phase-badge {
-  background: #2563eb;
+  background: #18cc17;
   color: #fff;
   padding: 0.15rem 0.4rem;
   border-radius: var(--radius-sm);
@@ -223,6 +223,66 @@
   box-shadow: 0 4px 12px rgba(231, 76, 60, 0.4);
 }
 
+/* Runtime indicator: shown alongside the Stop Research button while a
+   research run is active so the user has an unmistakable "live" signal. */
+.runtime-indicator {
+  display: inline-flex;
+  align-items: center;
+  gap: 0.5rem;
+  padding: 0.45rem 0.85rem;
+  border-radius: 999px;
+  background: rgba(46, 204, 113, 0.12);
+  border: 1px solid rgba(46, 204, 113, 0.5);
+  color: #2ecc71;
+  font-weight: 600;
+  font-size: 0.85rem;
+  letter-spacing: 0.02em;
+  text-transform: uppercase;
+  user-select: none;
+  box-shadow: 0 0 0 0 rgba(46, 204, 113, 0.45);
+  animation: runtime-indicator-glow 2s ease-in-out infinite;
+}
+
+.runtime-indicator-dot {
+  width: 10px;
+  height: 10px;
+  border-radius: 50%;
+  background: #2ecc71;
+  box-shadow: 0 0 8px rgba(46, 204, 113, 0.9);
+  animation: runtime-indicator-pulse 1.2s ease-in-out infinite;
+}
+
+.runtime-indicator-label {
+  line-height: 1;
+}
+
+@keyframes runtime-indicator-pulse {
+  0%, 100% {
+    transform: scale(1);
+    opacity: 1;
+  }
+  50% {
+    transform: scale(1.35);
+    opacity: 0.6;
+  }
+}
+
+@keyframes runtime-indicator-glow {
+  0%, 100% {
+    box-shadow: 0 0 0 0 rgba(46, 204, 113, 0.35);
+  }
+  50% {
+    box-shadow: 0 0 0 6px rgba(46, 204, 113, 0);
+  }
+}
+
+@media (prefers-reduced-motion: reduce) {
+  .runtime-indicator,
+  .runtime-indicator-dot {
+    animation: none;
+  }
+}
+
 .btn-clear {
   background: var(--bg-secondary, #2a2a2a);
   color: var(--text-secondary, #888);
@@ -283,8 +343,8 @@
 
 .research-prompt-section textarea:focus {
   outline: none;
-  border-color: #3498db;
-  box-shadow: 0 0 0 2px rgba(52, 152, 219, 0.2);
+  border-color: #18cc17;
+  box-shadow: 0 0 0 2px rgba(24, 204, 23, 0.2);
 }
 
 .research-prompt-section textarea:disabled {
@@ -354,7 +414,7 @@
   padding: 0.2rem 0.5rem;
   border-radius: 4px;
   font-size: 0.85rem;
-  color: #3498db;
+  color: #18cc17;
   margin-left: 0.5rem;
 }
 
@@ -392,9 +452,9 @@
 }
 
 .brainstorm-stats .submission-count.pruned {
-  background: rgba(155, 89, 182, 0.15);
-  color: #9b59b6;
-  border: 1px solid rgba(155, 89, 182, 0.3);
+  background: rgba(24, 204, 23, 0.15);
+  color: #18cc17;
+  border: 1px solid rgba(24, 204, 23, 0.3);
 }
 
 .brainstorm-stats .submission-count.queue {
@@ -422,7 +482,7 @@
   display: block;
   font-size: 1.75rem;
   font-weight: 700;
-  color: #3498db;
+  color: #18cc17;
   margin-bottom: 0.25rem;
 }
 
@@ -506,8 +566,8 @@
 }
 
 .activity-info {
-  background: rgba(52, 152, 219, 0.1);
-  color: #3498db;
+  background: rgba(24, 204, 23, 0.1);
+  color: #18cc17;
 }
 
 .activity-neutral {
@@ -552,12 +612,12 @@
 }
 
 .brainstorm-card:hover {
-  border-color: #3498db;
+  border-color: #18cc17;
   transform: translateY(-2px);
 }
 
 .brainstorm-card.expanded {
-  border-color: #3498db;
+  border-color: #18cc17;
 }
 
 .brainstorm-card-header {
@@ -569,7 +629,7 @@
 
 .brainstorm-card-id {
   font-family: 'Fira Code', monospace;
-  color: #3498db;
+  color: #18cc17;
   font-size: 0.9rem;
 }
 
@@ -643,71 +703,6 @@
   margin: 0.25rem 0 0.5rem 0;
 }
 
-/* Help icon tooltip */
-.paper-library-help-icon {
-  display: inline-flex;
-  align-items: center;
-  justify-content: center;
-  width: 17px;
-  height: 17px;
-  border-radius: 50%;
-  background: rgba(255, 255, 255, 0.15);
-  border: 1px solid rgba(255, 255, 255, 0.3);
-  color: #ccc;
-  font-size: 0.7rem;
-  font-weight: 700;
-  cursor: pointer;
-  margin-left: 8px;
-  position: relative;
-  vertical-align: middle;
-  user-select: none;
-  flex-shrink: 0;
-}
-
-.paper-library-help-icon:hover,
-.paper-library-help-icon:focus {
-  background: rgba(255, 255, 255, 0.25);
-  color: #fff;
-  outline: none;
-}
-
-.paper-library-tooltip {
-  display: none;
-  position: absolute;
-  top: calc(100% + 8px);
-  left: 50%;
-  transform: translateX(-50%);
-  width: 380px;
-  background: #1e1e2e;
-  border: 1px solid rgba(255, 255, 255, 0.18);
-  border-radius: 8px;
-  padding: 14px 16px;
-  font-size: 0.78rem;
-  font-weight: 400;
-  color: #ccc;
-  line-height: 1.55;
-  z-index: 9999;
-  box-shadow: 0 8px 32px rgba(0, 0, 0, 0.55);
-  text-align: left;
-  white-space: normal;
-  pointer-events: none;
-}
-
-.paper-library-tooltip code {
-  background: rgba(255, 255, 255, 0.07);
-  border: 1px solid rgba(255, 255, 255, 0.12);
-  border-radius: 3px;
-  padding: 0.1em 0.3em;
-  font-size: 0.85em;
-  color: #c5c5c5;
-  font-family: 'Consolas', 'Monaco', monospace;
-}
-
-.paper-library-help-icon:hover .paper-library-tooltip,
-.paper-library-help-icon:focus .paper-library-tooltip {
-  display: block;
-}
-
 .paper-library-file-location {
   color: #aaa;
   font-size: 0.75rem;
@@ -748,7 +743,7 @@
 }
 
 .paper-card:hover {
-  border-color: #9b59b6;
+  border-color: #18cc17;
   transform: translateY(-2px);
 }
 
@@ -761,7 +756,7 @@
   z-index: 999;
   overflow-y: auto;
   box-shadow: 0 0 50px rgba(0, 0, 0, 0.8);
-  border-color: #9b59b6;
+  border-color: #18cc17;
   transform: none;
 }
 
@@ -774,7 +769,7 @@
 
 .paper-card-id {
   font-family: 'Fira Code', monospace;
-  color: #9b59b6;
+  color: #18cc17;
   font-size: 0.85rem;
 }
 
@@ -828,7 +823,7 @@
 .btn-download,
 .btn-download-raw,
 .btn-download-pdf {
-  background: linear-gradient(135deg, #3498db, #2980b9);
+  background: linear-gradient(135deg, #18cc17, #0f9110);
   color: white;
   border: none;
   padding: 0.35rem 0.7rem;
@@ -839,11 +834,28 @@
   font-size: 0.75rem;
 }
 
+.btn-download-small {
+  background: linear-gradient(135deg, #18cc17, #0f9110);
+  color: white;
+  border: none;
+  padding: 0.65rem 1.35rem;
+  border-radius: var(--radius-sm, 4px);
+  cursor: pointer;
+  font-size: 0.95rem;
+  font-weight: 600;
+  transition: all 0.2s ease;
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  text-align: center;
+}
+
 .btn-download:hover,
 .btn-download-raw:hover,
-.btn-download-pdf:hover {
+.btn-download-pdf:hover,
+.btn-download-small:hover {
   transform: translateY(-1px);
-  box-shadow: 0 4px 12px rgba(52, 152, 219, 0.4);
+  box-shadow: 0 4px 12px rgba(24, 204, 23, 0.4);
 }
 
 .paper-full-content {
@@ -878,6 +890,8 @@
   box-shadow: inset -1px 0 0 rgba(170, 245, 181, 0.04);
   flex-shrink: 0;
   padding: 1.5rem 0;
+  position: relative;
+  z-index: 2;
 }
 
 .known-models-sidebar {
@@ -1008,16 +1022,31 @@
   gap: 1.5rem;
   overflow-y: auto;
   width: 100%;
+  /* Default: accounts for left sidebar (322px) + horizontal padding (3rem). */
   max-width: calc(100vw - 322px - 3rem);
   box-sizing: border-box;
+  position: relative;
+  z-index: 1;
+}
+
+/* When the WorkflowPanel sidebar is expanded (320px) or collapsed (50px),
+   slide settings content leftward so dropdowns/arrows don't get clipped
+   by the fixed-position panel overlay. */
+.app.workflow-panel-expanded .autonomous-settings {
+  max-width: calc(100vw - 322px - 3rem - 320px);
+  padding-right: 1.5rem;
+}
+
+.app.workflow-panel-collapsed .autonomous-settings {
+  max-width: calc(100vw - 322px - 3rem - 50px);
+  padding-right: 1.5rem;
 }
 
 .settings-group {
   background: var(--bg-secondary, #1e1e1e);
-  border: 1px solid var(--border-color, #333);
+  border: 1px solid #18cc17;
   border-radius: 8px;
   padding: 1rem;
-  border-right: 3px solid #3498db;
   width: 100%;
   max-width: 100%;
   box-sizing: border-box;
@@ -1026,8 +1055,8 @@
 
 /* Known Models Display - OLD (to be removed) */
 .known-models-display {
-  background: linear-gradient(135deg, rgba(52, 152, 219, 0.08), rgba(52, 152, 219, 0.05));
-  border: 1px solid rgba(52, 152, 219, 0.2);
+  background: linear-gradient(135deg, rgba(24, 204, 23, 0.08), rgba(24, 204, 23, 0.05));
+  border: 1px solid rgba(24, 204, 23, 0.2);
 }
 
 .models-grid {
@@ -1038,15 +1067,15 @@
 
 .model-card {
   background: var(--bg-tertiary, #252525);
-  border: 1px solid rgba(52, 152, 219, 0.2);
+  border: 1px solid rgba(24, 204, 23, 0.2);
   border-radius: 6px;
   padding: 0.75rem;
   transition: all 0.2s ease;
 }
 
 .model-card:hover {
-  border-color: #3498db;
-  background: rgba(52, 152, 219, 0.1);
+  border-color: #18cc17;
+  background: rgba(24, 204, 23, 0.1);
   transform: translateY(-2px);
 }
 
@@ -1059,8 +1088,8 @@
 }
 
 .model-badge {
-  background: rgba(52, 152, 219, 0.15);
-  color: #3498db;
+  background: rgba(24, 204, 23, 0.15);
+  color: #18cc17;
   padding: 0.3rem 0.6rem;
   border-radius: 4px;
   font-size: 0.75rem;
@@ -1097,7 +1126,7 @@
 .settings-row select,
 .settings-row input {
   background: var(--bg-tertiary, #252525);
-  border: 1px solid var(--border-color, #333);
+  border: 1px solid var(--border-default, var(--border-color, #333)); /* fall back to the previous token/color so the border survives if --border-default is undefined */
   border-radius: 6px;
   padding: 0.5rem 0.75rem;
   color: var(--text-primary, #e0e0e0);
@@ -1110,7 +1139,7 @@
 .settings-row select:focus,
 .settings-row input:focus {
   outline: none;
-  border-color: #3498db;
+  border-color: #18cc17;
 }
 
 .settings-row select:disabled,
@@ -1136,11 +1165,10 @@
 /* Per-submitter config section */
 .submitter-config-section {
   background: var(--bg-tertiary, #252525);
-  border: 1px solid var(--border-color, #333);
+  border: 1px solid #18cc17;
   border-radius: 6px;
   padding: 1rem;
   margin-bottom: 1rem;
-  border-right: 3px solid #3498db;
   width: 100%;
   max-width: 100%;
   box-sizing: border-box;
@@ -1161,8 +1189,8 @@
 /* Copy button for submitter configs */
 .copy-btn {
   background: var(--bg-secondary, #2a2a2a);
-  color: #3498db;
-  border: 1px solid #3498db;
+  color: #18cc17;
+  border: 1px solid #18cc17;
   padding: 0.35rem 0.75rem;
   border-radius: 4px;
   cursor: pointer;
@@ -1172,7 +1200,7 @@
 }
 
 .copy-btn:hover:not(:disabled) {
-  background: rgba(52, 152, 219, 0.2);
+  background: rgba(24, 204, 23, 0.2);
 }
 
 .copy-btn:disabled {
@@ -1216,7 +1244,7 @@
   display: block;
   font-size: 1.5rem;
   font-weight: 700;
-  color: #3498db;
+  color: #18cc17;
 }
 
 .metric-label {
@@ -1245,7 +1273,7 @@
 }
 
 .submitter-stat-card:hover {
-  border-color: #3498db;
+  border-color: #18cc17;
 }
 
 .submitter-header {
@@ -1260,7 +1288,7 @@
 }
 
 .submitter-header:hover {
-  background: rgba(52, 152, 219, 0.1);
+  background: rgba(24, 204, 23, 0.1);
 }
 
 .submitter-title {
@@ -1271,7 +1299,7 @@
 
 .submitter-model {
   font-family: 'Fira Code', monospace;
-  color: #3498db;
+  color: #18cc17;
   font-size: 0.85rem;
 }
 
@@ -1279,7 +1307,7 @@
   display: flex;
   gap: 1rem;
   padding: 0.5rem 1rem;
-  background: rgba(52, 152, 219, 0.05);
+  background: rgba(24, 204, 23, 0.05);
   border-top: 1px solid var(--border-color, #333);
   flex-wrap: wrap;
 }
@@ -1302,8 +1330,8 @@
 }
 
 .submitter-stats-line .stat-item.info {
-  color: #3498db;
-  background: rgba(52, 152, 219, 0.1);
+  color: #18cc17;
+  background: rgba(24, 204, 23, 0.1);
 }
 
 .submitter-expanded {
@@ -1384,13 +1412,13 @@
 
 .event-topic {
   font-family: 'Fira Code', monospace;
-  color: #3498db;
+  color: #18cc17;
   flex: 1;
 }
 
 .event-count {
   font-family: 'Fira Code', monospace;
-  color: #9b59b6;
+  color: #18cc17;
   font-weight: 600;
   font-size: 0.8rem;
 }
@@ -1435,8 +1463,8 @@
 }
 
 .auto-log-entry.log-info {
-  border-left-color: #3498db;
-  background: rgba(52, 152, 219, 0.08);
+  border-left-color: #18cc17;
+  background: rgba(24, 204, 23, 0.08);
 }
 
 .log-time {
@@ -1447,7 +1475,7 @@
 }
 
 .log-event {
-  color: #3498db;
+  color: #18cc17;
   flex-shrink: 0;
   min-width: 150px;
   font-weight: 600;
@@ -1507,11 +1535,11 @@
 }
 
 .submission-item:hover {
-  border-color: #3498db;
+  border-color: #18cc17;
 }
 
 .submission-item.expanded {
-  border-color: #3498db;
+  border-color: #18cc17;
 }
 
 .submission-header {
@@ -1530,7 +1558,7 @@
 
 .submission-number {
   font-family: 'Fira Code', monospace;
-  color: #3498db;
+  color: #18cc17;
   font-weight: 600;
   font-size: 0.9rem;
 }
@@ -1542,7 +1570,7 @@
 }
 
 .submission-toggle {
-  color: #3498db;
+  color: #18cc17;
   font-size: 0.8rem;
   flex-shrink: 0;
 }
@@ -1590,7 +1618,7 @@
 
 .btn-refresh:hover {
   background: var(--bg-tertiary, #333);
-  border-color: #3498db;
+  border-color: #18cc17;
 }
 
 .brainstorm-list-header {
@@ -1635,7 +1663,7 @@
 .toggle-icon {
   font-size: 0.8rem;
   margin-left: 0.5rem;
-  color: #3498db;
+  color: #18cc17;
 }
 
 .paper-meta {
@@ -1650,7 +1678,7 @@
   padding: 0.3rem 0.6rem;
   border-radius: 4px;
   font-size: 0.85rem;
-  color: #9b59b6;
+  color: #18cc17;
 }
 
 .paper-meta .word-count {
@@ -1743,13 +1771,13 @@
 }
 
 .outline-section .outline-content {
-  background: rgba(52, 152, 219, 0.05);
-  border-color: rgba(52, 152, 219, 0.2);
+  background: rgba(24, 204, 23, 0.05);
+  border-color: rgba(24, 204, 23, 0.2);
 }
 
 .paper-section .paper-content {
-  background: rgba(155, 89, 182, 0.05);
-  border-color: rgba(155, 89, 182, 0.2);
+  background: rgba(24, 204, 23, 0.05);
+  border-color: rgba(24, 204, 23, 0.2);
 }
 
 /* Manual Controls */
@@ -1808,12 +1836,25 @@
   background: linear-gradient(135deg, #e74c3c, #c0392b);
   color: white;
   border: none;
-  padding: 0.35rem 0.7rem;
   border-radius: 4px;
   cursor: pointer;
+  transition: all 0.2s ease;
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  text-align: center;
+}
+
+.btn-delete-brainstorm {
+  padding: 0.65rem 1.35rem;
+  font-size: 0.95rem;
+  font-weight: 600;
+}
+
+.btn-delete-paper {
+  padding: 0.35rem 0.7rem;
   font-size: 0.75rem;
   font-weight: 500;
-  transition: all 0.2s ease;
 }
 
 .btn-delete-brainstorm:hover,
@@ -1916,13 +1957,13 @@
 }
 
 .final-answer-view.status-active {
-  border-color: #3498db;
+  border-color: #18cc17;
   animation: tier3-pulse 2s infinite;
 }
 
 @keyframes tier3-pulse {
-  0%, 100% { box-shadow: 0 0 10px rgba(52, 152, 219, 0.3); }
-  50% { box-shadow: 0 0 25px rgba(52, 152, 219, 0.5); }
+  0%, 100% { box-shadow: 0 0 10px rgba(24, 204, 23, 0.3); }
+  50% { box-shadow: 0 0 25px rgba(24, 204, 23, 0.5); }
 }
 
 .final-answer-header {
@@ -1975,7 +2016,7 @@
 }
 
 .final-status-badge.status-active {
-  background: linear-gradient(135deg, #3498db, #2980b9);
+  background: linear-gradient(135deg, #18cc17, #0f9110);
   color: white;
 }
 
@@ -2047,9 +2088,9 @@
 }
 
 .section-tab.active {
-  background: #3498db;
+  background: #18cc17;
   color: white;
-  border-color: #3498db;
+  border-color: #18cc17;
 }
 
 .content-controls {
@@ -2167,9 +2208,9 @@
 }
 
 .format-badge.short_form {
-  background: linear-gradient(135deg, rgba(155, 89, 182, 0.2), rgba(142, 68, 173, 0.2));
-  border: 1px solid rgba(155, 89, 182, 0.4);
-  color: #9b59b6;
+  background: linear-gradient(135deg, rgba(24, 204, 23, 0.2), rgba(15, 145, 16, 0.2));
+  border: 1px solid rgba(24, 204, 23, 0.4);
+  color: #18cc17;
 }
 
 .format-badge.long_form {
@@ -2219,7 +2260,7 @@
 }
 
 .chapter-item.writing {
-  border-left: 3px solid #3498db;
+  border-left: 3px solid #18cc17;
   animation: writing-pulse 1.5s infinite;
 }
 
@@ -2230,7 +2271,7 @@
 
 @keyframes writing-pulse {
   0%, 100% { background: var(--bg-secondary, #1e1e1e); }
-  50% { background: rgba(52, 152, 219, 0.1); }
+  50% { background: rgba(24, 204, 23, 0.1); }
 }
 
 .chapter-item.pending {
@@ -2247,7 +2288,7 @@
 
 .chapter-number {
   font-family: 'Fira Code', monospace;
-  color: #3498db;
+  color: #18cc17;
   font-weight: 600;
   font-size: 0.85rem;
 }
@@ -2274,8 +2315,8 @@
 }
 
 .chapter-status.chapter-writing {
-  background: rgba(52, 152, 219, 0.2);
-  color: #3498db;
+  background: rgba(24, 204, 23, 0.2);
+  color: #18cc17;
 }
 
 .chapter-status.chapter-pending {
@@ -2360,7 +2401,7 @@
 }
 
 .no-content-stats {
-  color: #3498db;
+  color: #18cc17;
   font-size: 1.1rem;
   font-weight: 600;
   margin-bottom: 0.5rem;
@@ -2473,7 +2514,7 @@
 }
 
 .tier3-papers-count {
-  color: #3498db;
+  color: #18cc17;
   font-size: 0.9rem;
   margin-bottom: 1.5rem;
   font-weight: 500;
diff --git a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
index 5478c1d..6f52ffd 100644
--- a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
@@ -34,18 +34,21 @@ const AutonomousResearchInterface = ({
   const [skipQueued, setSkipQueued] = useState(false);  // Skip has been queued pre-emptively
   const [explorationProgress, setExplorationProgress] = useState(null);  // Topic exploration phase tracking
   const [titleExplorationProgress, setTitleExplorationProgress] = useState(null);  // Paper title exploration tracking
-  const activityEndRef = useRef(null);
+  const activityFeedRef = useRef(null);
+  const prevActivityLengthRef = useRef(activity ? activity.length : 0);  // Seed with the current length so mounting with existing items does not trigger a scroll
 
   // Save research prompt to localStorage
   useEffect(() => {
     localStorage.setItem('autonomous_research_prompt', researchPrompt);
   }, [researchPrompt]);
 
-  // Auto-scroll activity feed
+  // Auto-scroll activity feed only when new items are added (not on mount/tab switch)
   useEffect(() => {
-    if (activityEndRef.current) {
-      activityEndRef.current.scrollIntoView({ behavior: 'smooth' });
+    const currentLength = activity ? activity.length : 0;
+    if (currentLength > prevActivityLengthRef.current && activityFeedRef.current) {
+      activityFeedRef.current.scrollTop = activityFeedRef.current.scrollHeight;
     }
+    prevActivityLengthRef.current = currentLength;
   }, [activity]);
 
   // Listen for critique phase events in activity feed
@@ -307,6 +310,35 @@ const AutonomousResearchInterface = ({
         return '✓';
       case 'final_answer_complete':
         return '◆';
+      case 'proof_framing_decided':
+        return 'P';
+      case 'proof_check_started':
+        return '◌';
+      case 'proof_retry_scheduled':
+        return '↺';
+      case 'proof_retry_started':
+        return '↻';
+      case 'proof_check_candidates_found':
+        return '#';
+      case 'proof_check_no_candidates':
+        return '-';
+      case 'smt_check_started':
+        return 'S';
+      case 'smt_check_complete':
+        return 'Z';
+      case 'proof_attempt_started':
+        return '>';
+      case 'proof_attempt_failed':
+      case 'proof_attempts_exhausted':
+        return '⚠';
+      case 'proof_verified':
+      case 'known_proof_verified':
+      case 'proof_check_complete':
+        return '✓';
+      case 'novel_proof_discovered':
+        return '◆';
+      case 'proof_dependency_added':
+        return '↗';
       default:
         return '•';
     }
@@ -328,11 +360,23 @@ const AutonomousResearchInterface = ({
         event === 'tier3_chapter_complete' ||
         event === 'tier3_short_form_complete' ||
         event === 'tier3_long_form_complete' ||
-        event === 'reference_selection_complete') {
+        event === 'reference_selection_complete' ||
+        event === 'proof_verified' ||
+        event === 'novel_proof_discovered' ||
+        event === 'known_proof_verified' ||
+        event === 'proof_check_complete' ||
+        event === 'proof_dependency_added' ||
+        event === 'smt_check_complete') {
       return 'activity-success';
     }
     // Rejection events
-    if (event.includes('rejected') || event === 'compiler_rejection' || event === 'tier3_rejection') {
+    if (
+        event.includes('rejected') ||
+        event === 'compiler_rejection' ||
+        event === 'tier3_rejection' ||
+        event === 'proof_attempt_failed' ||
+        event === 'proof_attempts_exhausted'
+    ) {
       return 'activity-reject';
     }
     // Info events (reviews, starts, tier3 progress, etc.)
@@ -354,7 +398,14 @@ const AutonomousResearchInterface = ({
         event === 'critique_phase_ended' ||
         event === 'critique_phase_skipped' ||
         event === 'brainstorm_continuation_decided' ||
-        event === 'brainstorm_paper_limit_reached') {
+        event === 'brainstorm_paper_limit_reached' ||
+        event === 'proof_framing_decided' ||
+        event === 'proof_retry_scheduled' ||
+        event === 'proof_retry_started' ||
+        event === 'proof_check_candidates_found' ||
+        event === 'proof_check_no_candidates' ||
+        event === 'proof_attempt_started' ||
+        event === 'smt_check_started') {
       return 'activity-info';
     }
     return 'activity-neutral';
@@ -378,9 +429,20 @@ const AutonomousResearchInterface = ({
               Start Research
             </button>
           ) : (
-            <button className="btn-stop" onClick={onStop}>
-              Stop Research
-            </button>
+            <>
+              <span
+                className="runtime-indicator"
+                role="status"
+                aria-live="polite"
+                title="Autonomous research is currently running"
+              >
+                <span className="runtime-indicator-dot" aria-hidden="true"></span>
+                <span className="runtime-indicator-label">Running</span>
+              </span>
+              <button className="btn-stop" onClick={onStop}>
+                Stop Research
+              </button>
+            </>
           )}
           <button 
             className={`btn-clear ${showClearConfirm ? 'btn-confirm' : ''}`}
@@ -431,7 +493,7 @@ const AutonomousResearchInterface = ({
         </div>
 
         {explorationProgress && (
-          <div className="current-brainstorm" style={{ borderLeft: '3px solid #a855f7' }}>
+          <div className="current-brainstorm" style={{ borderLeft: '3px solid #18cc17' }}>
             <span className="status-label">Topic Exploration:</span>
             <p className="brainstorm-prompt" style={{ color: '#c4b5fd' }}>
               Brainstorming candidate directions ({explorationProgress.accepted}/{explorationProgress.target} accepted)
@@ -665,10 +727,10 @@ const AutonomousResearchInterface = ({
       {/* Activity Feed */}
       <div className="activity-section">
         <h3>Live Activity</h3>
-        <div className="activity-feed">
+        <div className="activity-feed" ref={activityFeedRef}>
           {activity.length === 0 ? (
             <div className="activity-empty">
-              No activity yet. Start autonomous research to see updates.
+              No activity yet. If you have not started, press the Start Research button under your prompt entry. After starting, allow about 20 to 30 minutes for the first updates to appear.
             </div>
           ) : (
             activity.map((item, index) => (
@@ -684,7 +746,6 @@ const AutonomousResearchInterface = ({
               </div>
             ))
           )}
-          <div ref={activityEndRef} />
         </div>
       </div>
     </div>
diff --git a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
index e5a37bb..b7a1aff 100644
--- a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
@@ -21,7 +21,8 @@ const EMPTY_API_STATS = Object.freeze({
 });
 
 const AutonomousResearchLogs = ({ stats, events }) => {
-  const eventsEndRef = useRef(null);
+  const eventsContainerRef = useRef(null);
+  const prevEventsLengthRef = useRef(events ? events.length : 0);  // Seed with the current length so mounting with existing events does not trigger a scroll
   const [expandedSubmitters, setExpandedSubmitters] = useState({});
   
   // API Logs state
@@ -32,10 +33,13 @@ const AutonomousResearchLogs = ({ stats, events }) => {
   const [apiAutoRefresh, setApiAutoRefresh] = useState(true);
   const abortControllerRef = useRef(null);
 
+  // Auto-scroll event log only when new events are added (not on mount/tab switch)
   useEffect(() => {
-    if (eventsEndRef.current) {
-      eventsEndRef.current.scrollIntoView({ behavior: 'smooth' });
+    const currentLength = events ? events.length : 0;
+    if (currentLength > prevEventsLengthRef.current && eventsContainerRef.current) {
+      eventsContainerRef.current.scrollTop = eventsContainerRef.current.scrollHeight;
     }
+    prevEventsLengthRef.current = currentLength;
   }, [events]);
 
   // Fetch API logs
@@ -294,6 +298,40 @@ const AutonomousResearchLogs = ({ stats, events }) => {
         return data.should_remove 
           ? `Redundancy: Removed ${data.paper_id}` 
           : 'Redundancy: No removal needed';
+      case 'proof_framing_decided':
+        return data.is_proof_amenable
+          ? 'Proof framing enabled for this run'
+          : 'Proof framing not applied for this run';
+      case 'proof_check_started':
+        if (data.trigger === 'manual') {
+          return `Manual proof check started for ${data.source_type} ${data.source_id}`;
+        }
+        if (data.trigger === 'retry') {
+          return `Paper-stage proof retry started for ${data.source_type} ${data.source_id}`;
+        }
+        return `Proof check started for ${data.source_type} ${data.source_id}`;
+      case 'proof_retry_scheduled':
+        return `Scheduled ${data.count || 0} proof retry candidate(s) for paper ${data.source_id}`;
+      case 'proof_retry_started':
+        return `Retrying ${data.count || 0} failed proof candidate(s) against paper ${data.source_id}`;
+      case 'proof_check_no_candidates':
+        return `No formal theorem candidates found in ${data.source_type} ${data.source_id}`;
+      case 'proof_check_candidates_found':
+        return `Proof candidates found: ${data.count || 0}`;
+      case 'proof_attempt_started':
+        return `Proof attempt ${data.attempt || 1}: ${data.theorem_statement || data.theorem_id}`;
+      case 'proof_attempt_failed':
+        return `Proof attempt ${data.attempt || '?'} failed: ${data.error_summary || data.theorem_statement || data.theorem_id}`;
+      case 'proof_verified':
+        return `Lean 4 verified: ${data.theorem_statement || data.theorem_id}`;
+      case 'proof_attempts_exhausted':
+        return `Proof attempts exhausted: ${data.theorem_statement || data.theorem_id}`;
+      case 'novel_proof_discovered':
+        return `Novel proof discovered: ${data.theorem_statement}`;
+      case 'known_proof_verified':
+        return `Known proof verified for ${data.source_type} ${data.source_id}`;
+      case 'proof_check_complete':
+        return `Proof check complete: ${data.verified_count || 0} verified, ${data.novel_count || 0} novel`;
       default:
         return event.event;
     }
@@ -301,6 +339,28 @@ const AutonomousResearchLogs = ({ stats, events }) => {
 
   const getEventClass = (event) => {
     const eventName = event.event || '';
+    if (eventName === 'proof_attempt_failed' || eventName === 'proof_attempts_exhausted') {
+      return 'log-reject';
+    }
+    if (
+      eventName === 'proof_verified' ||
+      eventName === 'novel_proof_discovered' ||
+      eventName === 'known_proof_verified' ||
+      eventName === 'proof_check_complete'
+    ) {
+      return 'log-success';
+    }
+    if (
+      eventName === 'proof_framing_decided' ||
+      eventName === 'proof_check_started' ||
+      eventName === 'proof_retry_scheduled' ||
+      eventName === 'proof_retry_started' ||
+      eventName === 'proof_check_no_candidates' ||
+      eventName === 'proof_check_candidates_found' ||
+      eventName === 'proof_attempt_started'
+    ) {
+      return 'log-info';
+    }
     if (eventName.includes('completed') || eventName.includes('accepted') || eventName === 'submission_accepted' || eventName === 'topic_exploration_complete' || eventName === 'paper_title_exploration_complete') {
       return 'log-success';
     }
@@ -663,7 +723,7 @@ const AutonomousResearchLogs = ({ stats, events }) => {
 
       {/* Event Log */}
       <h4 style={{ marginTop: '20px' }}>Event Log</h4>
-      <div className="logs-events">
+      <div className="logs-events" ref={eventsContainerRef}>
         {(!events || events.length === 0) ? (
           <div className="auto-empty-state">
             No events recorded yet.
@@ -686,7 +746,6 @@ const AutonomousResearchLogs = ({ stats, events }) => {
             </div>
           ))
         )}
-        <div ref={eventsEndRef} />
       </div>
     </div>
   );
diff --git a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
index 5bf898e..81b72ed 100644
--- a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
@@ -6,6 +6,12 @@
  */
 import React, { useState, useEffect } from 'react';
 import { openRouterAPI, api, autonomousAPI } from '../../services/api';
+import {
+  computeOpenRouterAutoSettings,
+  findOpenRouterModel,
+  getProviderNames,
+  hasEndpointMetadata,
+} from '../../utils/openRouterSelection';
 import {
   AUTONOMOUS_SETTINGS_STORAGE_KEY,
   AUTONOMOUS_PROFILES_STORAGE_KEY,
@@ -14,6 +20,7 @@ import {
   applyAutonomousProfileSelection,
   getStoredAutonomousSettings,
 } from '../../utils/autonomousProfiles';
+import HelpTooltip from '../HelpTooltip';
 import './AutonomousResearch.css';
 import '../settings-common.css';
 
@@ -28,35 +35,57 @@ const DEFAULT_SUBMITTER_CONFIG = {
 };
 
 // ModelSelector component - extracted outside to prevent recreation on every render
-const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProviderChange, onModelChange, onOpenrouterProviderChange, onFallbackChange, lmStudioModels, openRouterModels, modelProviders, hasOpenRouterKey, isRunning }) => {
-  const currentModels = provider === 'openrouter' ? openRouterModels : lmStudioModels;
-  const providers = modelId && provider === 'openrouter' ? (modelProviders[modelId] || []) : [];
+const ModelSelector = ({
+  provider,
+  modelId,
+  openrouterProv,
+  fallback,
+  onProviderChange,
+  onModelChange,
+  onOpenrouterProviderChange,
+  onFallbackChange,
+  lmStudioModels,
+  openRouterModels,
+  modelProviders,
+  hasOpenRouterKey,
+  isRunning,
+  lmStudioEnabled,
+}) => {
+  const effectiveProvider = lmStudioEnabled ? provider : 'openrouter';
+  const currentModels = effectiveProvider === 'openrouter' ? openRouterModels : lmStudioModels;
+  const providers = modelId && effectiveProvider === 'openrouter'
+    ? getProviderNames(modelProviders[modelId])
+    : [];
 
   return (
     <>
       {/* Provider Toggle */}
       <div className="settings-row">
         <label>Provider</label>
-        <div className="provider-toggle-group">
-          <button
-            type="button"
-            className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
-            onClick={() => onProviderChange('lm_studio')}
-            disabled={isRunning}
-          >
-            LM Studio
-          </button>
-          <button
-            type="button"
-            className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or-orange' : ''}`}
-            onClick={() => hasOpenRouterKey && onProviderChange('openrouter')}
-            disabled={isRunning || !hasOpenRouterKey}
-            style={!hasOpenRouterKey ? { color: '#666' } : undefined}
-            title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
-          >
-            OpenRouter
-          </button>
-        </div>
+        {lmStudioEnabled ? (
+          <div className="provider-toggle-group">
+            <button
+              type="button"
+              className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
+              onClick={() => onProviderChange('lm_studio')}
+              disabled={isRunning}
+            >
+              LM Studio
+            </button>
+            <button
+              type="button"
+              className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or-orange' : ''}`}
+              onClick={() => hasOpenRouterKey && onProviderChange('openrouter')}
+              disabled={isRunning || !hasOpenRouterKey}
+              style={!hasOpenRouterKey ? { color: '#666' } : undefined}
+              title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
+            >
+              OpenRouter
+            </button>
+          </div>
+        ) : (
+          <small className="settings-hint">OpenRouter is required in this deployment.</small>
+        )}
       </div>
 
       {/* Model Selection */}
@@ -69,7 +98,7 @@ const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProvider
         >
           <option value="">Select model...</option>
           {currentModels.map(m => {
-            const isFree = provider === 'openrouter' && 
+            const isFree = effectiveProvider === 'openrouter' && 
                           m.pricing?.prompt === "0" && 
                           m.pricing?.completion === "0";
             const displayName = m.name || m.id;
@@ -85,7 +114,7 @@ const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProvider
       </div>
 
       {/* OpenRouter Provider (if OpenRouter) */}
-      {provider === 'openrouter' && modelId && (
+      {effectiveProvider === 'openrouter' && modelId && (
         <div className="settings-row">
           <label>Host Provider (optional)</label>
           <select
@@ -102,7 +131,7 @@ const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProvider
       )}
 
       {/* LM Studio Fallback (if OpenRouter) */}
-      {provider === 'openrouter' && (
+      {effectiveProvider === 'openrouter' && lmStudioEnabled && (
         <div className="settings-row">
           <label className="label--muted">LM Studio Fallback (optional)</label>
           <select
@@ -123,8 +152,26 @@ const ModelSelector = ({ provider, modelId, openrouterProv, fallback, onProvider
 };
 
 // RoleConfig component - extracted outside to prevent recreation on every render
-const RoleConfig = ({ title, hint, rolePrefix, borderColor = '#333', localConfig, handleProviderChange, handleModelChange, handleChange, handleNumericBlur, isRunning, lmStudioModels, openRouterModels, modelProviders, hasOpenRouterKey }) => {
-  const provider = localConfig[`${rolePrefix}_provider`] || 'lm_studio';
+const RoleConfig = ({
+  title,
+  hint,
+  rolePrefix,
+  borderColor = '#333',
+  localConfig,
+  handleProviderChange,
+  handleModelChange,
+  handleOpenRouterProviderChange,
+  handleChange,
+  handleNumericBlur,
+  isRunning,
+  lmStudioModels,
+  openRouterModels,
+  modelProviders,
+  hasOpenRouterKey,
+  lmStudioEnabled,
+}) => {
+  const storedProvider = localConfig[`${rolePrefix}_provider`] || 'lm_studio';
+  const provider = lmStudioEnabled ? storedProvider : 'openrouter';
   const modelId = localConfig[`${rolePrefix}_model`] || '';
   const openrouterProv = localConfig[`${rolePrefix}_openrouter_provider`];
   const fallback = localConfig[`${rolePrefix}_lm_studio_fallback`];
@@ -148,13 +195,14 @@ const RoleConfig = ({ title, hint, rolePrefix, borderColor = '#333', localConfig
         fallback={fallback}
         onProviderChange={(p) => handleProviderChange(rolePrefix, p)}
         onModelChange={(m) => handleModelChange(rolePrefix, m)}
-        onOpenrouterProviderChange={(p) => handleChange(`${rolePrefix}_openrouter_provider`, p)}
+        onOpenrouterProviderChange={(p) => handleOpenRouterProviderChange(rolePrefix, p)}
         onFallbackChange={(f) => handleChange(`${rolePrefix}_lm_studio_fallback`, f)}
         lmStudioModels={lmStudioModels}
         openRouterModels={openRouterModels}
         modelProviders={modelProviders}
         hasOpenRouterKey={hasOpenRouterKey}
         isRunning={isRunning}
+        lmStudioEnabled={lmStudioEnabled}
       />
 
       <div className="settings-row">
@@ -188,7 +236,7 @@ const RoleConfig = ({ title, hint, rolePrefix, borderColor = '#333', localConfig
   );
 };
 
-const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning }) => {
+const AutonomousResearchSettings = ({ config, onConfigChange, models, capabilities, isRunning }) => {
   // Models and OpenRouter state
   const [lmStudioModels, setLmStudioModels] = useState(models || []);
   const [openRouterModels, setOpenRouterModels] = useState([]);
@@ -215,6 +263,16 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
   const [hasStoredWolframKey, setHasStoredWolframKey] = useState(false);
   const [wolframTestResult, setWolframTestResult] = useState('');
   const [testingWolfram, setTestingWolfram] = useState(false);
+  const [proofStatus, setProofStatus] = useState(null);
+  const [proofSettingsEnabled, setProofSettingsEnabled] = useState(false);
+  const [proofSettingsTimeout, setProofSettingsTimeout] = useState('120');
+  const [proofSettingsLspEnabled, setProofSettingsLspEnabled] = useState(false);
+  const [proofSettingsLspIdleTimeout, setProofSettingsLspIdleTimeout] = useState('600');
+  const [proofSettingsSmtEnabled, setProofSettingsSmtEnabled] = useState(false);
+  const [proofSettingsZ3Path, setProofSettingsZ3Path] = useState('');
+  const [proofSettingsSmtTimeout, setProofSettingsSmtTimeout] = useState('30');
+  const [savingProofSettings, setSavingProofSettings] = useState(false);
+  const [proofSettingsMessage, setProofSettingsMessage] = useState('');
   
   // Critique prompt editor state
   const [advancedSettingsExpanded, setAdvancedSettingsExpanded] = useState(false);
@@ -222,6 +280,9 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
   const [customCritiquePrompt, setCustomCritiquePrompt] = useState('');
   const [critiquePromptSaved, setCritiquePromptSaved] = useState(false);
   const [defaultCritiquePrompt, setDefaultCritiquePrompt] = useState('');
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
+  const genericMode = Boolean(capabilities?.genericMode);
+  const showLean4Settings = Boolean(lmStudioEnabled && proofStatus?.lean4_path && !genericMode);
 
   const handleCollapsibleKeyDown = (event, toggleFn) => {
     if (event.key === 'Enter' || event.key === ' ') {
@@ -387,17 +448,46 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
       }
 
       // Try to fetch fresh LM Studio models
-      try {
-        const freshModels = await api.getModels();
-        setLmStudioModels(freshModels);
-      } catch (err) {
-        console.error('Failed to fetch LM Studio models:', err);
+      if (lmStudioEnabled) {
+        try {
+          const freshModels = await api.getModels();
+          setLmStudioModels(freshModels.models || freshModels || []);
+        } catch (err) {
+          console.error('Failed to fetch LM Studio models:', err);
+        }
+      } else {
+        setLmStudioModels([]);
       }
       
       setIsLoadedFromStorage(true);
     };
     init();
-  }, []);
+  }, [lmStudioEnabled]);
+
+  useEffect(() => {
+    if (genericMode) {
+      setProofStatus(null);
+      return;
+    }
+
+    const loadProofStatus = async () => {
+      try {
+        const status = await autonomousAPI.getProofStatus();
+        setProofStatus(status);
+        setProofSettingsEnabled(Boolean(status.lean4_enabled));
+        setProofSettingsTimeout(String(status.lean4_proof_timeout ?? 120));
+        setProofSettingsLspEnabled(Boolean(status.lean4_lsp_enabled));
+        setProofSettingsLspIdleTimeout(String(status.lean4_lsp_idle_timeout ?? 600));
+        setProofSettingsSmtEnabled(Boolean(status.smt_enabled));
+        setProofSettingsZ3Path(status.z3_path || '');
+        setProofSettingsSmtTimeout(String(status.smt_timeout ?? 30));
+      } catch (err) {
+        console.error('Failed to load Lean 4 proof status:', err);
+      }
+    };
+
+    loadProofStatus();
+  }, [genericMode]);
 
   // Fetch providers for any OpenRouter models after settings are loaded
   useEffect(() => {
@@ -449,12 +539,81 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, isRunning
     localStorage.setItem(AUTONOMOUS_SETTINGS_STORAGE_KEY, JSON.stringify(settings));
   }, [isLoadedFromStorage, numSubmitters, submitterConfigs, localConfig, freeOnly, freeModelLooping, freeModelAutoSelector, tier3Enabled, modelProviders, selectedProfile]);
 
+  useEffect(() => {
+    if (!isLoadedFromStorage || lmStudioEnabled) {
+      return;
+    }
+
+    setLmStudioModels([]);
+
+    const normalizedSubmitters = submitterConfigs.map((submitterConfig) => {
+      const keepOpenRouterState = submitterConfig.provider === 'openrouter';
+      return {
+        ...submitterConfig,
+        provider: 'openrouter',
+        modelId: keepOpenRouterState ? (submitterConfig.modelId || '') : '',
+        openrouterProvider: keepOpenRouterState ? (submitterConfig.openrouterProvider || null) : null,
+        lmStudioFallbackId: null,
+      };
+    });
+
+    const normalizedLocalConfig = { ...localConfig };
+    ['validator', 'high_context', 'high_param', 'critique_submitter'].forEach((rolePrefix) => {
+      const providerKey = `${rolePrefix}_provider`;
+      const modelKey = `${rolePrefix}_model`;
+      const openRouterProviderKey = `${rolePrefix}_openrouter_provider`;
+      const fallbackKey = `${rolePrefix}_lm_studio_fallback`;
+      const keepOpenRouterState = normalizedLocalConfig[providerKey] === 'openrouter';
+
+      normalizedLocalConfig[providerKey] = 'openrouter';
+      normalizedLocalConfig[modelKey] = keepOpenRouterState ? (normalizedLocalConfig[modelKey] || '') : '';
+      normalizedLocalConfig[openRouterProviderKey] = keepOpenRouterState
+        ? (normalizedLocalConfig[openRouterProviderKey] || null)
+        : null;
+      normalizedLocalConfig[fallbackKey] = null;
+    });
+
+    if (JSON.stringify(normalizedSubmitters) !== JSON.stringify(submitterConfigs)) {
+      setSubmitterConfigs(normalizedSubmitters);
+    }
+    if (JSON.stringify(normalizedLocalConfig) !== JSON.stringify(localConfig)) {
+      setLocalConfig(normalizedLocalConfig);
+    }
+
+    const currentConfig = {
+      ...localConfig,
+      submitter_configs: submitterConfigs.slice(0, numSubmitters),
+      tier3_enabled: tier3Enabled,
+    };
+    const nextConfig = {
+      ...normalizedLocalConfig,
+      submitter_configs: normalizedSubmitters.slice(0, numSubmitters),
+      tier3_enabled: tier3Enabled,
+    };
+    if (JSON.stringify(nextConfig) !== JSON.stringify(currentConfig)) {
+      onConfigChange(nextConfig);
+    }
+  }, [
+    isLoadedFromStorage,
+    lmStudioEnabled,
+    submitterConfigs,
+    localConfig,
+    numSubmitters,
+    tier3Enabled,
+    onConfigChange,
+  ]);
+
   // Update LM Studio models when prop changes
   useEffect(() => {
+    if (!lmStudioEnabled) {
+      setLmStudioModels([]);
+      return;
+    }
+
     if (models && models.length > 0) {
       setLmStudioModels(models);
     }
-  }, [models]);
+  }, [models, lmStudioEnabled]);
 
   // Propagate tier3Enabled to parent config whenever it changes
   useEffect(() => {
@@ -536,13 +695,35 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   }, []);
 
   const fetchProvidersForModel = async (modelId) => {
-    if (!modelId || modelProviders[modelId]) return;
+    if (!modelId) return null;
+
+    const cachedProviderData = modelProviders[modelId];
+    if (hasEndpointMetadata(cachedProviderData)) {
+      return cachedProviderData;
+    }
+
     try {
       const result = await openRouterAPI.getProviders(modelId);
-      setModelProviders(prev => ({ ...prev, [modelId]: result.providers || [] }));
+      const providerData = {
+        providers: result.providers || [],
+        endpoints: result.endpoints || [],
+      };
+      setModelProviders(prev => ({ ...prev, [modelId]: providerData }));
+      return providerData;
     } catch (err) {
       console.error(`Failed to fetch providers for ${modelId}:`, err);
+      return cachedProviderData || null;
+    }
+  };
+
+  const getAutoSettingsForModel = async (modelId, selectedProvider = null) => {
+    const model = findOpenRouterModel(openRouterModels, modelId);
+    if (!model) {
+      return null;
     }
+
+    const providerData = await fetchProvidersForModel(modelId);
+    return computeOpenRouterAutoSettings(model, providerData, selectedProvider);
   };
 
   const markProfileAsCustom = () => {
@@ -611,11 +792,60 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   };
 
   // Handle model change with provider fetching for OpenRouter
-  const handleModelChange = (rolePrefix, modelId) => {
-    handleChange(`${rolePrefix}_model`, modelId);
-    if (localConfig[`${rolePrefix}_provider`] === 'openrouter' && modelId) {
-      fetchProvidersForModel(modelId);
+  const handleModelChange = async (rolePrefix, modelId) => {
+    const newConfig = {
+      ...localConfig,
+      [`${rolePrefix}_model`]: modelId,
+      [`${rolePrefix}_openrouter_provider`]: null,
+    };
+    markProfileAsCustom();
+    setLocalConfig(newConfig);
+    onConfigChange({ ...newConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
+
+    if (localConfig[`${rolePrefix}_provider`] !== 'openrouter' || !modelId) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(modelId, null);
+    if (!autoSettings) {
+      return;
     }
+
+    const autofilledConfig = {
+      ...newConfig,
+      [`${rolePrefix}_context_window`]: autoSettings.contextWindow,
+      [`${rolePrefix}_max_tokens`]: autoSettings.maxOutputTokens,
+    };
+    setLocalConfig(autofilledConfig);
+    onConfigChange({ ...autofilledConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
+  };
+
+  const handleOpenRouterProviderChange = async (rolePrefix, providerName) => {
+    const newConfig = {
+      ...localConfig,
+      [`${rolePrefix}_openrouter_provider`]: providerName,
+    };
+    markProfileAsCustom();
+    setLocalConfig(newConfig);
+    onConfigChange({ ...newConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
+
+    const modelId = newConfig[`${rolePrefix}_model`];
+    if (newConfig[`${rolePrefix}_provider`] !== 'openrouter' || !modelId) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(modelId, providerName);
+    if (!autoSettings) {
+      return;
+    }
+
+    const autofilledConfig = {
+      ...newConfig,
+      [`${rolePrefix}_context_window`]: autoSettings.contextWindow,
+      [`${rolePrefix}_max_tokens`]: autoSettings.maxOutputTokens,
+    };
+    setLocalConfig(autofilledConfig);
+    onConfigChange({ ...autofilledConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
   };
 
   // Handle number of submitters change
@@ -685,12 +915,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         [field]: newValue
       };
     }
-    
-    // Fetch providers if selecting OpenRouter model
-    if (field === 'modelId' && newConfigs[index].provider === 'openrouter' && newValue) {
-      fetchProvidersForModel(newValue);
-    }
-    
+
     markProfileAsCustom();
     setSubmitterConfigs(newConfigs);
     
@@ -700,6 +925,70 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     }
   };
 
+  const handleSubmitterModelChange = async (index, modelId) => {
+    const newConfigs = [...submitterConfigs];
+    newConfigs[index] = {
+      ...newConfigs[index],
+      modelId,
+      openrouterProvider: null,
+    };
+
+    markProfileAsCustom();
+    setSubmitterConfigs(newConfigs);
+    onConfigChange({ ...localConfig, submitter_configs: newConfigs.slice(0, numSubmitters) });
+
+    if (newConfigs[index].provider !== 'openrouter' || !modelId) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(modelId, null);
+    if (!autoSettings) {
+      return;
+    }
+
+    const autofilledConfigs = [...newConfigs];
+    autofilledConfigs[index] = {
+      ...autofilledConfigs[index],
+      contextWindow: autoSettings.contextWindow,
+      maxOutputTokens: autoSettings.maxOutputTokens,
+    };
+
+    setSubmitterConfigs(autofilledConfigs);
+    onConfigChange({ ...localConfig, submitter_configs: autofilledConfigs.slice(0, numSubmitters) });
+  };
+
+  const handleSubmitterOpenRouterProviderChange = async (index, providerName) => {
+    const newConfigs = [...submitterConfigs];
+    newConfigs[index] = {
+      ...newConfigs[index],
+      openrouterProvider: providerName,
+    };
+
+    markProfileAsCustom();
+    setSubmitterConfigs(newConfigs);
+    onConfigChange({ ...localConfig, submitter_configs: newConfigs.slice(0, numSubmitters) });
+
+    const modelId = newConfigs[index].modelId;
+    if (newConfigs[index].provider !== 'openrouter' || !modelId) {
+      return;
+    }
+
+    const autoSettings = await getAutoSettingsForModel(modelId, providerName);
+    if (!autoSettings) {
+      return;
+    }
+
+    const autofilledConfigs = [...newConfigs];
+    autofilledConfigs[index] = {
+      ...autofilledConfigs[index],
+      contextWindow: autoSettings.contextWindow,
+      maxOutputTokens: autoSettings.maxOutputTokens,
+    };
+
+    setSubmitterConfigs(autofilledConfigs);
+    onConfigChange({ ...localConfig, submitter_configs: autofilledConfigs.slice(0, numSubmitters) });
+  };
+
   // Handler for when user finishes editing a submitter numeric field
   const handleSubmitterNumericBlur = (index, field, value) => {
     const numericFields = ['contextWindow', 'maxOutputTokens'];
@@ -791,6 +1080,42 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     }
   };
 
+  const handleSaveProofSettings = async () => {
+    const parsedTimeout = parseInt(proofSettingsTimeout, 10);
+    const timeout = Number.isFinite(parsedTimeout) ? parsedTimeout : 120;
+    const parsedLspIdleTimeout = parseInt(proofSettingsLspIdleTimeout, 10);
+    const lspIdleTimeout = Number.isFinite(parsedLspIdleTimeout) ? parsedLspIdleTimeout : 600;
+    const parsedSmtTimeout = parseInt(proofSettingsSmtTimeout, 10);
+    const smtTimeout = Number.isFinite(parsedSmtTimeout) ? parsedSmtTimeout : 30;
+
+    try {
+      setSavingProofSettings(true);
+      setProofSettingsMessage('');
+      const status = await autonomousAPI.updateProofSettings({
+        enabled: proofSettingsEnabled,
+        timeout,
+        lean4_lsp_enabled: proofSettingsLspEnabled,
+        lean4_lsp_idle_timeout: lspIdleTimeout,
+        smt_enabled: proofSettingsSmtEnabled,
+        z3_path: proofSettingsZ3Path,
+        smt_timeout: smtTimeout,
+      });
+      setProofStatus(status);
+      setProofSettingsEnabled(Boolean(status.lean4_enabled));
+      setProofSettingsTimeout(String(status.lean4_proof_timeout ?? timeout));
+      setProofSettingsLspEnabled(Boolean(status.lean4_lsp_enabled));
+      setProofSettingsLspIdleTimeout(String(status.lean4_lsp_idle_timeout ?? lspIdleTimeout));
+      setProofSettingsSmtEnabled(Boolean(status.smt_enabled));
+      setProofSettingsZ3Path(status.z3_path || '');
+      setProofSettingsSmtTimeout(String(status.smt_timeout ?? smtTimeout));
+      setProofSettingsMessage('Lean 4 / SMT proof settings saved.');
+    } catch (err) {
+      setProofSettingsMessage(`Failed to save Lean 4 / SMT proof settings: ${err.message}`);
+    } finally {
+      setSavingProofSettings(false);
+    }
+  };
+
   const handleRestoreCritiquePrompt = () => {
     localStorage.removeItem('autonomous_critique_custom_prompt');
     setCustomCritiquePrompt(defaultCritiquePrompt);
@@ -918,18 +1243,22 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         <div className="known-models-sidebar">
           <h3 className="flex-row-center">
             <span>Highlighted Models</span>
-            <div className="tooltip-anchor">
+            <div className="help-tooltip-anchor">
               <button
-                className="info-tooltip-btn info-tooltip-btn--orange"
+                type="button"
+                className="help-tooltip-btn"
+                aria-label="Learn about highlighted models"
                 onMouseEnter={() => setShowTestedModelsTooltip(true)}
                 onMouseLeave={() => setShowTestedModelsTooltip(false)}
+                onFocus={() => setShowTestedModelsTooltip(true)}
+                onBlur={() => setShowTestedModelsTooltip(false)}
               >
                 ?
               </button>
               {showTestedModelsTooltip && (
                 /* sidebar-escape: fixed positioning so the tooltip breaks out of the
-                   322px sidebar and renders freely. See settings-common.css for coords. */
-                <div className="tooltip-popup tooltip-popup--sidebar-escape">
+                   322px sidebar and renders freely. See index.css for coords. */
+                <div className="help-tooltip-popup help-tooltip-popup--sidebar-escape">
                   The models and hosts listed here are not affiliated with MOTO or Intrafere LLC. This chart reflects developer-tested configurations intended to help guide model selection. All statements regarding pricing, performance, roles, rankings, or capabilities are speculative and based on individual testing experience. Intrafere LLC and the MOTO development team make no guarantees about the accuracy of this chart. MOTO is compatible with the majority of models, including many not listed here.
                 </div>
               )}
@@ -944,18 +1273,25 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="models-podium-label">Leaderboard</div>
               <div className="model-item model-item--ranked model-item--gold">
                 <div className="flex-row-center">
-                  <div className="model-item-name">Kimi K2.5</div>
+                  <div className="model-item-name">Kimi K2.6</div>
                   <div className="ranking-badge ranking-badge--gold">👑 KING OF THE HILL</div>
-                  <div className="tooltip-anchor" style={{ zIndex: 100 }}>
+                  <div className="help-tooltip-anchor" style={{ zIndex: 100 }}>
                     <button
-                      className="info-tooltip-btn info-tooltip-btn--gold"
+                      type="button"
+                      className="help-tooltip-btn"
+                      aria-label="Learn about the King of the Hill ranking"
                       onMouseEnter={() => setShowKothTooltip(true)}
                       onMouseLeave={() => setShowKothTooltip(false)}
+                      onFocus={() => setShowKothTooltip(true)}
+                      onBlur={() => setShowKothTooltip(false)}
                     >
                       ?
                     </button>
                     {showKothTooltip && (
-                      <div className="tooltip-popup tooltip-popup--fixed" style={{ top: '50px', right: '20px' }}>
+                      <div
+                        className="help-tooltip-popup"
+                        style={{ top: 'auto', bottom: 'calc(100% + 10px)', left: 'calc(100% + 10px)', right: 'auto' }}
+                      >
                         This model was chosen by the Intrafere developers as the best overall performer in the MOTO harness, optimized for cost, speed, and knowledge.
                       </div>
                     )}
@@ -978,11 +1314,15 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                   <div className="ranking-badge ranking-badge--bronze">🥉 BRONZE</div>
                 </div>
                 <div className="model-item-badge">Balanced knowledge and speed at low cost</div>
-                <div className="model-item-note">(outputs may corrupt over time depending on host)</div>
               </div>
             </div>
 
             {/* Alphabetical list (rest of models) */}
+
+            <div className="model-item">
+              <div className="model-item-name">Arcee AI's Trinity Large</div>
+              <div className="model-item-badge">Highly knowledgeable</div>
+            </div>
             
             <div className="model-item">
               <div className="model-item-name">Amazon Nova Pro/Premier</div>
@@ -1030,9 +1370,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             </div>
             
             <div className="model-item">
-              <div className="model-item-name">GPT OSS</div>
+              <div className="model-item-name">OpenAI's GPT OSS</div>
               <div className="model-item-badge">Balanced knowledge and speed</div>
-              <div className="model-item-note">(outputs may corrupt over time depending on host)</div>
             </div>
             
             <div className="model-item">
@@ -1094,11 +1433,27 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       <div className="settings-group" style={{ marginBottom: '1.5rem' }}>
         <h4>Profile Selection</h4>
         <p className="settings-info">
-          Load a recommended profile or create your own custom profile. (These models and hosts are not affiliated with MOTO/Intrafere)
+          Load one of the preselected example profiles as a starting point, or create your own custom profile. (These models and hosts are not affiliated with MOTO/Intrafere)
         </p>
         
         <div className="settings-row">
-          <label>Select Profile</label>
+          <label>
+            Select Profile
+            <HelpTooltip
+              label="Learn how profile selection works"
+              anchorClassName="help-tooltip-anchor--inline"
+              buttonClassName="help-tooltip-btn--green"
+              useFixedPosition
+            >
+              <strong>Profile menu guide</strong>
+              <br /><br />
+              <code>-- Custom Settings --</code> means no saved profile is currently loaded, so you are editing the settings manually.
+              <br /><br />
+              <code>Recommended Profiles</code> are preselected example profiles you can load as starting points.
+              <br /><br />
+              <code>My Profiles</code> contains any custom profiles you save from your current settings.
+            </HelpTooltip>
+          </label>
           <select
             value={selectedProfile}
             onChange={(e) => {
@@ -1219,20 +1574,22 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
       {/* Show only free models + model refresh controls — grouped at top */}
       <div className="model-refresh-controls">
-        <button 
-          className="secondary"
-          onClick={async () => {
-            try {
-              const freshModels = await api.getModels();
-              setLmStudioModels(freshModels);
-            } catch (err) {
-              console.error('Failed to refresh LM Studio models:', err);
-            }
-          }}
-          disabled={isRunning}
-        >
-          Refresh LM Studio Models
-        </button>
+        {lmStudioEnabled && (
+          <button 
+            className="secondary"
+            onClick={async () => {
+              try {
+                const freshModels = await api.getModels();
+                setLmStudioModels(freshModels.models || freshModels || []);
+              } catch (err) {
+                console.error('Failed to refresh LM Studio models:', err);
+              }
+            }}
+            disabled={isRunning}
+          >
+            Refresh LM Studio Models
+          </button>
+        )}
         {hasOpenRouterKey && (
           <>
             <button 
@@ -1301,13 +1658,16 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
         {/* Per-submitter configuration */}
         {submitterConfigs.slice(0, numSubmitters).map((cfg, idx) => (
+          (() => {
+            const effectiveProvider = lmStudioEnabled ? cfg.provider : 'openrouter';
+            return (
           <div 
             key={idx} 
-            className={`submitter-config-section${cfg.provider === 'openrouter' ? ' role-config-card--openrouter-orange' : (idx === 0 ? ' role-config-card--main' : '')}`}
+            className={`submitter-config-section${effectiveProvider === 'openrouter' ? ' role-config-card--openrouter-orange' : (idx === 0 ? ' role-config-card--main' : '')}`}
           >
-            <h5 className={cfg.provider === 'openrouter' ? 'card-title--orange' : (idx === 0 ? 'card-title--green' : '')}>
+            <h5 className={effectiveProvider === 'openrouter' ? 'card-title--orange' : (idx === 0 ? 'card-title--green' : '')}>
               {idx === 0 ? 'Submitter 1 (Main Submitter)' : `Submitter ${idx + 1}`}
-              {cfg.provider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
+              {effectiveProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
             </h5>
             
             <ModelSelector
@@ -1316,14 +1676,15 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               openrouterProv={cfg.openrouterProvider}
               fallback={cfg.lmStudioFallbackId}
               onProviderChange={(p) => handleSubmitterConfigChange(idx, 'provider', p)}
-              onModelChange={(m) => handleSubmitterConfigChange(idx, 'modelId', m)}
-              onOpenrouterProviderChange={(p) => handleSubmitterConfigChange(idx, 'openrouterProvider', p)}
+              onModelChange={(m) => handleSubmitterModelChange(idx, m)}
+              onOpenrouterProviderChange={(p) => handleSubmitterOpenRouterProviderChange(idx, p)}
               onFallbackChange={(f) => handleSubmitterConfigChange(idx, 'lmStudioFallbackId', f)}
               lmStudioModels={lmStudioModels}
               openRouterModels={openRouterModels}
               modelProviders={modelProviders}
               hasOpenRouterKey={hasOpenRouterKey}
               isRunning={isRunning}
+              lmStudioEnabled={lmStudioEnabled}
             />
 
             <div className="settings-row">
@@ -1354,6 +1715,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               />
             </div>
           </div>
+            );
+          })()
         ))}
       </div>
 
@@ -1371,6 +1734,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           localConfig={localConfig}
           handleProviderChange={handleProviderChange}
           handleModelChange={handleModelChange}
+          handleOpenRouterProviderChange={handleOpenRouterProviderChange}
           handleChange={handleChange}
           handleNumericBlur={handleNumericBlur}
           isRunning={isRunning}
@@ -1378,6 +1742,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           openRouterModels={openRouterModels}
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
+          lmStudioEnabled={lmStudioEnabled}
         />
       </div>
 
@@ -1396,6 +1761,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           localConfig={localConfig}
           handleProviderChange={handleProviderChange}
           handleModelChange={handleModelChange}
+          handleOpenRouterProviderChange={handleOpenRouterProviderChange}
           handleChange={handleChange}
           handleNumericBlur={handleNumericBlur}
           isRunning={isRunning}
@@ -1403,6 +1769,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           openRouterModels={openRouterModels}
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
+          lmStudioEnabled={lmStudioEnabled}
         />
 
         <RoleConfig
@@ -1413,6 +1780,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           localConfig={localConfig}
           handleProviderChange={handleProviderChange}
           handleModelChange={handleModelChange}
+          handleOpenRouterProviderChange={handleOpenRouterProviderChange}
           handleChange={handleChange}
           handleNumericBlur={handleNumericBlur}
           isRunning={isRunning}
@@ -1420,6 +1788,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           openRouterModels={openRouterModels}
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
+          lmStudioEnabled={lmStudioEnabled}
         />
 
         <RoleConfig
@@ -1430,6 +1799,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           localConfig={localConfig}
           handleProviderChange={handleProviderChange}
           handleModelChange={handleModelChange}
+          handleOpenRouterProviderChange={handleOpenRouterProviderChange}
           handleChange={handleChange}
           handleNumericBlur={handleNumericBlur}
           isRunning={isRunning}
@@ -1437,6 +1807,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           openRouterModels={openRouterModels}
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
+          lmStudioEnabled={lmStudioEnabled}
         />
       </div>
 
@@ -1477,6 +1848,184 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 </p>
               </div>
 
+              {showLean4Settings && (
+                <div style={{ marginBottom: '1.5rem' }}>
+                  <h4 className="form-group--compact">Lean 4 Proof Solver</h4>
+                  <small className="hint-text">
+                    Desktop-only controls for the automatic proof checker, manual proof runs, and certificate export.
+                  </small>
+
+                  <div className="settings-row">
+                    <label>Lean 4 Status</label>
+                    <div>
+                      <strong>{proofStatus?.lean4_enabled ? 'Enabled' : 'Disabled'}</strong>
+                      <small className="settings-hint" style={{ display: 'block', marginTop: '0.35rem' }}>
+                        Workspace: {proofStatus?.workspace_ready ? 'Ready' : 'Not ready yet'}
+                      </small>
+                    </div>
+                  </div>
+
+                  <div className="settings-row">
+                    <label>Lean Version</label>
+                    <div>{proofStatus?.lean4_version || 'Unavailable'}</div>
+                  </div>
+
+                  <div className="settings-row">
+                    <label>Mathlib Revision</label>
+                    <div>{proofStatus?.mathlib_commit || 'Unavailable'}</div>
+                  </div>
+
+                  <div className="settings-row">
+                    <label>Lean Binary</label>
+                    <div>{proofStatus?.lean4_path || 'Launcher-managed / not detected yet'}</div>
+                  </div>
+
+                  <div className="settings-row">
+                    <label>Workspace Directory</label>
+                    <div>{proofStatus?.lean4_workspace_dir || 'Unavailable'}</div>
+                  </div>
+
+                  <div className="settings-row">
+                    <label>Persistent LSP Status</label>
+                    <div>
+                      {proofStatus?.lsp_active
+                        ? 'Active'
+                        : proofStatus?.lsp_available
+                          ? 'Available'
+                          : 'Disabled'}
+                    </div>
+                  </div>
+
+                  <div className="settings-row">
+                    <label>Z3 Status</label>
+                    <div>
+                      <strong>{proofStatus?.smt_available ? 'Ready' : 'Unavailable'}</strong>
+                      <small className="settings-hint" style={{ display: 'block', marginTop: '0.35rem' }}>
+                        {proofStatus?.z3_version || 'No Z3 version detected yet'}
+                      </small>
+                    </div>
+                  </div>
+
+                  <label className="settings-checkbox-label settings-checkbox-label--stacked" style={{ cursor: isRunning ? 'not-allowed' : 'pointer', marginTop: '1rem' }}>
+                    <input
+                      type="checkbox"
+                      checked={proofSettingsEnabled}
+                      onChange={(e) => setProofSettingsEnabled(e.target.checked)}
+                      disabled={isRunning || savingProofSettings}
+                    />
+                    <span className="settings-option-copy">
+                      <span className="settings-option-title">Enable Lean 4 proof verification</span>
+                      <span className="settings-option-description">
+                        Turns on automatic proof checks after brainstorm and paper completion plus manual proof checks from the Proofs tab.
+                      </span>
+                    </span>
+                  </label>
+
+                  <label className="settings-checkbox-label settings-checkbox-label--stacked" style={{ cursor: isRunning ? 'not-allowed' : 'pointer', marginTop: '1rem' }}>
+                    <input
+                      type="checkbox"
+                      checked={proofSettingsLspEnabled}
+                      onChange={(e) => setProofSettingsLspEnabled(e.target.checked)}
+                      disabled={isRunning || savingProofSettings}
+                    />
+                    <span className="settings-option-copy">
+                      <span className="settings-option-title">Enable persistent Lean LSP mode</span>
+                      <span className="settings-option-description">
+                        Keeps a warm Lean server available for lower-latency proof verification while preserving subprocess fallback.
+                      </span>
+                    </span>
+                  </label>
+
+                  <div className="settings-row">
+                    <label>Proof Timeout (seconds)</label>
+                    <input
+                      type="number"
+                      value={proofSettingsTimeout}
+                      onChange={(e) => setProofSettingsTimeout(e.target.value)}
+                      disabled={isRunning || savingProofSettings}
+                      min={10}
+                      max={3600}
+                      step={5}
+                    />
+                  </div>
+
+                  <div className="settings-row">
+                    <label>LSP Idle Timeout (seconds)</label>
+                    <input
+                      type="number"
+                      value={proofSettingsLspIdleTimeout}
+                      onChange={(e) => setProofSettingsLspIdleTimeout(e.target.value)}
+                      disabled={isRunning || savingProofSettings}
+                      min={60}
+                      max={7200}
+                      step={30}
+                    />
+                  </div>
+
+                  <div style={{ marginTop: '1rem' }}>
+                    <h5 className="form-group--compact">SMT (Z3) Integration</h5>
+                    <small className="hint-text">
+                      Optional early theorem classification and Lean tactic hinting for arithmetic-friendly proof goals. Lean 4 remains authoritative for every stored proof.
+                    </small>
+                  </div>
+
+                  <label className="settings-checkbox-label settings-checkbox-label--stacked" style={{ cursor: isRunning ? 'not-allowed' : 'pointer', marginTop: '1rem' }}>
+                    <input
+                      type="checkbox"
+                      checked={proofSettingsSmtEnabled}
+                      onChange={(e) => setProofSettingsSmtEnabled(e.target.checked)}
+                      disabled={isRunning || savingProofSettings}
+                    />
+                    <span className="settings-option-copy">
+                      <span className="settings-option-title">Enable SMT-assisted proof guidance</span>
+                      <span className="settings-option-description">
+                        Runs Z3 on conservative SMT-amenable goals and feeds any successful result back into Lean proof prompting as hints only.
+                      </span>
+                    </span>
+                  </label>
+
+                  <div className="settings-row">
+                    <label>Z3 Binary Path</label>
+                    <input
+                      type="text"
+                      value={proofSettingsZ3Path}
+                      onChange={(e) => setProofSettingsZ3Path(e.target.value)}
+                      disabled={isRunning || savingProofSettings}
+                      placeholder="Optional explicit z3 path"
+                    />
+                  </div>
+
+                  <div className="settings-row">
+                    <label>SMT Timeout (seconds)</label>
+                    <input
+                      type="number"
+                      value={proofSettingsSmtTimeout}
+                      onChange={(e) => setProofSettingsSmtTimeout(e.target.value)}
+                      disabled={isRunning || savingProofSettings}
+                      min={1}
+                      max={600}
+                      step={1}
+                    />
+                  </div>
+
+                  <div className="actions-row">
+                    <button
+                      className="btn-success-sm"
+                      onClick={handleSaveProofSettings}
+                      disabled={isRunning || savingProofSettings}
+                    >
+                      {savingProofSettings ? 'Saving...' : 'Save Proof Settings'}
+                    </button>
+                  </div>
+
+                  {proofSettingsMessage && (
+                    <div className={`test-result-banner ${proofSettingsMessage.startsWith('Failed') ? 'test-result-banner--error' : 'test-result-banner--success'}`}>
+                      {proofSettingsMessage}
+                    </div>
+                  )}
+                </div>
+              )}
+
               <h4 className="form-group--compact">Wolfram Alpha Integration (Optional)</h4>
               <small className="hint-text">
                 Enable Wolfram Alpha API for computational verification in rigor mode. When selecting your key select "full results" for your key type, then copy your APP ID and save it here. This key is also shared with the manual compiler mode.
@@ -1512,12 +2061,22 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                       type="password"
                       value={wolframApiKey}
                       onChange={(e) => setWolframApiKey(e.target.value)}
-                      placeholder={hasStoredWolframKey && !wolframApiKey ? "Stored securely on backend. Enter a new App ID to replace it." : "Enter your Wolfram Alpha App ID"}
+                      placeholder={
+                        hasStoredWolframKey && !wolframApiKey
+                          ? (
+                            genericMode
+                              ? 'Loaded in the current backend session. Enter a new App ID to replace it.'
+                              : 'Stored securely on backend. Enter a new App ID to replace it.'
+                          )
+                          : 'Enter your Wolfram Alpha App ID'
+                      }
                       className="input-dark"
                     />
                     {hasStoredWolframKey && !wolframApiKey && (
                       <small className="hint-text">
-                        A Wolfram Alpha key is already stored securely on the backend for this machine.
+                        {genericMode
+                          ? 'A Wolfram Alpha key is already loaded in the current backend session.'
+                          : 'A Wolfram Alpha key is already stored securely on the backend for this machine.'}
                       </small>
                     )}
                   </div>
@@ -1558,11 +2117,11 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             {/* Tier 3 Final Answer Toggle */}
             <div className="settings-subsection settings-subsection--accent-danger">
               <div className="settings-subsection-header">
-                <h5 className="settings-subsection-title">Experimental / Ending Options</h5>
+                <h5 className="settings-subsection-title">Advanced / Ending Options</h5>
               </div>
               <h4 className="form-group--compact">Stage 3: Final Answer Generation</h4>
               <p className="settings-info">
-                Feature in construction. Enabling this is optional and not recommended. Stage 3 is a highly experimental mode. Most users should not enable this feature — it is expensive and wasteful at this current stage of development. When enabled, the system will automatically synthesize all completed Stage 2 papers into a final answer that is often book-length or greater. This feature is highly hallucinatory — Stage 2 papers are the recommended final output. Disabled by default; final paper quality is currently much lower than Stage 2 papers. Once optimized and better-functioning, this mode will be advertised more.
+                Feature in construction. Enabling this is optional and not recommended. Stage 3 is an in-development mode. Most users should not enable this feature — it is expensive and wasteful at this current stage of development. When enabled, the system will automatically synthesize all completed Stage 2 papers into a final answer that is often book-length or greater. This feature is highly hallucinatory — Stage 2 papers are the recommended final output. Disabled by default; final paper quality is currently much lower than Stage 2 papers. Once optimized and better-functioning, this mode will be advertised more.
               </p>
               <label className="settings-checkbox-label settings-checkbox-label--stacked" style={{ cursor: isRunning ? 'not-allowed' : 'pointer' }}>
                 <input
@@ -1572,7 +2131,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                   disabled={isRunning}
                 />
                 <span className="settings-option-copy">
-                  <span className="settings-option-title">Enable Stage 3 Final Answer Generation (Very Experimental)</span>
+                  <span className="settings-option-title">Enable Stage 3 Final Answer Generation (In Development)</span>
                   <span className="settings-option-description">
                     Allows the system to synthesize completed Stage 2 papers into a final answer after enough papers accumulate.
                   </span>
@@ -1703,10 +2262,13 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                     <span className="settings-option-copy">
                       <span className="settings-option-title">
                         Enable Free Model Looping
-                        <span
-                          title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits."
-                          className="help-hint"
-                        >(?)</span>
+                        <HelpTooltip
+                          label="Learn about free model looping"
+                          anchorClassName="help-tooltip-anchor--inline"
+                          popupStyle={{ top: 'auto', bottom: 'calc(100% + 10px)', left: 'calc(100% + 10px)', right: 'auto' }}
+                        >
+                          When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.
+                        </HelpTooltip>
                       </span>
                       <span className="settings-option-description">
                         Automatically rotate to the next selected free model when one hits a rate limit.
@@ -1725,10 +2287,13 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                     <span className="settings-option-copy">
                       <span className="settings-option-title">
                         Use OpenRouter Free Models Auto-Selector as Backup
-                        <span
-                          title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping."
-                          className="help-hint"
-                        >(?)</span>
+                        <HelpTooltip
+                          label="Learn about the free models auto-selector backup"
+                          anchorClassName="help-tooltip-anchor--inline"
+                          popupStyle={{ top: 'auto', bottom: 'calc(100% + 10px)', left: 'calc(100% + 10px)', right: 'auto' }}
+                        >
+                          When all selected free models are rate-limited, use OpenRouter&apos;s Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping.
+                        </HelpTooltip>
                       </span>
                       <span className="settings-option-description">
                         Falls back to OpenRouter&apos;s free router when every selected free model is temporarily exhausted.
diff --git a/frontend/src/components/autonomous/BrainstormList.jsx b/frontend/src/components/autonomous/BrainstormList.jsx
index 27f6447..5c10613 100644
--- a/frontend/src/components/autonomous/BrainstormList.jsx
+++ b/frontend/src/components/autonomous/BrainstormList.jsx
@@ -6,6 +6,7 @@ import React, { useState, useEffect, useRef } from 'react';
 import './AutonomousResearch.css';
 import { websocket } from '../../services/websocket';
 import LatexRenderer from '../LatexRenderer';
+import { useProofCheckRuntime } from '../../hooks/useProofCheckRuntime';
 import { prependDisclaimer } from '../../utils/disclaimerHelper';
 
 const BrainstormList = ({ brainstorms, onRefresh, api }) => {
@@ -18,6 +19,13 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
   const [showLatex, setShowLatex] = useState(true);
   const [userChoseLatex, setUserChoseLatex] = useState(false);
   const unsubscribeRef = useRef(null);
+  const [proofActionMessage, setProofActionMessage] = useState('');
+  const {
+    getSourceState,
+    manualCheckEnabled,
+    manualCheckReason,
+    queueManualProofCheck,
+  } = useProofCheckRuntime();
 
   // Auto-disable LaTeX rendering when brainstorm grows large (>50k chars).
   // Only fires if the user has not explicitly toggled the LaTeX checkbox.
@@ -129,6 +137,20 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
     URL.revokeObjectURL(url);
   };
 
+  // Queue a manual proof check for one brainstorm and report the outcome in the banner.
+  const handleProofCheck = async (e, brainstorm) => {
+    e.stopPropagation(); // do not let the click bubble to ancestor handlers
+    try {
+      setProofActionMessage(''); // clear any stale banner before the request
+      await queueManualProofCheck({ sourceType: 'brainstorm', sourceId: brainstorm.topic_id });
+      setProofActionMessage(`Queued proof check for brainstorm ${brainstorm.topic_id}.`);
+    } catch (error) {
+      // Rejections are not guaranteed to be Error objects; never render "undefined".
+      // The banner picks its error styling from the leading "Failed", so keep that prefix.
+      setProofActionMessage(`Failed to queue proof check: ${error?.message || String(error)}`);
+    }
+  };
+
   const formatDate = (dateStr) => {
     if (!dateStr) return 'N/A';
     return new Date(dateStr).toLocaleString();
@@ -165,6 +187,12 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
         (WARNING: Any given brainstorm idea may be pruned/deleted if the AI deems it to hurt the collective database quality. These brainstorms are the real powerhouse behind the ASI creativity! The brainstorms themselves often contain many great ideas that get turned into the stage 2 papers.)
       </div>
 
+      {proofActionMessage && (
+        <div className={`test-result-banner ${proofActionMessage.startsWith('Failed') ? 'test-result-banner--error' : 'test-result-banner--success'}`}>
+          {proofActionMessage}
+        </div>
+      )}
+
       {brainstorms.map((brainstorm) => (
         <div
           key={brainstorm.topic_id}
@@ -212,13 +240,39 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
                 </div>
               </div>
             ) : (
-              <button 
-                className="btn-delete-brainstorm"
-                onClick={(e) => handleDeleteClick(e, brainstorm.topic_id)}
-                title="Delete brainstorm and associated papers"
-              >
-                Delete
-              </button>
+              <>
+                {(() => {
+                  const proofCheckState = getSourceState('brainstorm', brainstorm.topic_id); // presumably falsy when no check is tracked - confirm in useProofCheckRuntime
+                  const proofCheckLabel = proofCheckState?.status === 'queued'
+                    ? 'Queueing Proof Check...'
+                    : proofCheckState?.status === 'running'
+                      ? `Proof Check Running${proofCheckState.candidateCount ? ` (${proofCheckState.candidateCount})` : '...'}`
+                      : 'Try to prove with Lean 4 theorem prover';
+                  const disabledReason = brainstorm.status !== 'complete' // an incomplete brainstorm takes priority over the runtime-level reason
+                    ? 'Manual proof checks require a completed brainstorm.'
+                    : manualCheckReason;
+                  return (
+                    <button
+                      className="btn-download-small"
+                      onClick={(e) => handleProofCheck(e, brainstorm)}
+                      disabled={!manualCheckEnabled || Boolean(proofCheckState) || brainstorm.status !== 'complete'}
+                      title={proofCheckState?.status === 'running'
+                        ? 'A proof verification is already running for this brainstorm.'
+                        : (proofCheckState?.status === 'queued' ? 'A proof check is already queued for this brainstorm.' : disabledReason || 'Queue a manual proof check for this brainstorm.')}
+                    >
+                      {proofCheckLabel}
+                    </button>
+                  );
+                })()}
+
+                <button 
+                  className="btn-delete-brainstorm"
+                  onClick={(e) => handleDeleteClick(e, brainstorm.topic_id)}
+                  title="Delete brainstorm and associated papers"
+                >
+                  Delete
+                </button>
+              </>
             )}
           </div>
 
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
index 398072f..8b700e5 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
@@ -291,7 +291,7 @@ function FinalAnswerLibrary() {
       {/* Header */}
       <div className="library-header">
         <h2>📚 Stage 3 Final Answers History</h2>
-        <p>If you have enabled Tier 3 experimental final answer generation, completed Stage 3 answers will appear here. Browse all completed research volumes and short-form answers from your autonomous research sessions.</p>
+        <p>If you have enabled Tier 3 final answer generation, completed Stage 3 answers will appear here. Browse all completed research volumes and short-form answers from your autonomous research sessions.</p>
         <div className="library-stats">
           <span className="stat-badge">
             {finalAnswers.length} {finalAnswers.length === 1 ? 'Answer' : 'Answers'}
diff --git a/frontend/src/components/autonomous/FinalAnswerView.jsx b/frontend/src/components/autonomous/FinalAnswerView.jsx
index 47bad41..55d0e2e 100644
--- a/frontend/src/components/autonomous/FinalAnswerView.jsx
+++ b/frontend/src/components/autonomous/FinalAnswerView.jsx
@@ -9,6 +9,7 @@ import LatexRenderer from '../LatexRenderer';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
 import PaperCritiqueModal from '../PaperCritiqueModal';
 import { autonomousAPI } from '../../services/api';
+import { getRuntimeDataPath } from '../../utils/runtimeConfig';
 import './AutonomousResearch.css';
 
 const FinalAnswerView = ({ api, isRunning, status }) => {
@@ -400,7 +401,7 @@ const FinalAnswerView = ({ api, isRunning, status }) => {
       <div className="tier3-section content-section">
         <h4>Final Answer Paper</h4>
         <div className="paper-library-file-location" style={{ fontSize: '0.75em', color: '#aaa', marginBottom: '0.75em', lineHeight: '1.5' }}>
-          📁 For manual file retrieval, the short-form final answer is saved at: <code>backend/data/auto_sessions/[session_folder]/final_answer/final_short_form_paper.txt</code>. Session folders are named after your research prompt and timestamp (e.g. <code>solve_riemann_hypothesis_2026-03-20_14-30/</code>).
+          📁 For manual file retrieval, the short-form final answer is saved at: <code>{getRuntimeDataPath('auto_sessions/[session_folder]/final_answer/final_short_form_paper.txt')}</code>. Session folders are named after your research prompt and timestamp (e.g. <code>solve_riemann_hypothesis_2026-03-20_14-30/</code>).
         </div>
         {shortFormPaper ? (
           <div className="paper-content-container" ref={containerRef}>
@@ -435,7 +436,7 @@ const FinalAnswerView = ({ api, isRunning, status }) => {
       <div className="tier3-section content-section">
         <h4>Volume Content</h4>
         <div className="paper-library-file-location" style={{ fontSize: '0.75em', color: '#aaa', marginBottom: '0.75em', lineHeight: '1.5' }}>
-          📁 For manual file retrieval, the long-form volume is saved at: <code>backend/data/auto_sessions/[session_folder]/final_answer/final_volume.txt</code>. Individual chapter papers are stored as <code>chapter_[index]_paper.txt</code> in the same directory. Session folders are named after your research prompt and timestamp (e.g. <code>solve_riemann_hypothesis_2026-03-20_14-30/</code>).
+          📁 For manual file retrieval, the long-form volume is saved at: <code>{getRuntimeDataPath('auto_sessions/[session_folder]/final_answer/final_volume.txt')}</code>. Individual chapter papers are stored as <code>chapter_[index]_paper.txt</code> in the same directory. Session folders are named after your research prompt and timestamp (e.g. <code>solve_riemann_hypothesis_2026-03-20_14-30/</code>).
         </div>
         {volumeContent && volumeContent.content ? (
           <div className="volume-content-container" ref={containerRef}>
@@ -611,7 +612,7 @@ const FinalAnswerView = ({ api, isRunning, status }) => {
                         disabled={(!shortFormPaper && !volumeContent)}
                         title="Ask validator to critique this final answer"
                         style={{
-                          background: 'linear-gradient(135deg, #9b59b6 0%, #8e44ad 100%)',
+                          background: 'linear-gradient(135deg, #18cc17 0%, #0f9110 100%)',
                           border: 'none',
                           color: '#fff',
                           padding: '0.5rem 1rem',
diff --git a/frontend/src/components/autonomous/LiveTier3Progress.jsx b/frontend/src/components/autonomous/LiveTier3Progress.jsx
index 4627349..504ed6e 100644
--- a/frontend/src/components/autonomous/LiveTier3Progress.jsx
+++ b/frontend/src/components/autonomous/LiveTier3Progress.jsx
@@ -401,8 +401,8 @@ const LiveTier3Progress = ({ api, status }) => {
         }
 
         .tier3-status-gray { background: #4a4a4a; color: #ccc; }
-        .tier3-status-blue { background: #1e40af; color: #93c5fd; }
-        .tier3-status-purple { background: #6b21a8; color: #d8b4fe; }
+        .tier3-status-blue { background: #0f5a10; color: #7dff6f; }
+        .tier3-status-purple { background: #0f5a10; color: #7dff6f; }
         .tier3-status-green { background: #166534; color: #86efac; }
         .tier3-status-gold { background: #0f5a10; color: #7dff6f; }
 
diff --git a/frontend/src/components/autonomous/MathematicalProofs.css b/frontend/src/components/autonomous/MathematicalProofs.css
new file mode 100644
index 0000000..f6ef116
--- /dev/null
+++ b/frontend/src/components/autonomous/MathematicalProofs.css
@@ -0,0 +1,400 @@
+.math-proofs-view {
+  padding: 1.5rem;
+  display: flex;
+  flex-direction: column;
+  gap: 1rem;
+  color: var(--text-primary, #e5e7eb);
+}
+
+.math-proofs-header {
+  display: flex;
+  justify-content: space-between;
+  gap: 1rem;
+  align-items: flex-start;
+  flex-wrap: wrap;
+}
+
+.math-proofs-header h2 {
+  margin: 0 0 0.35rem 0;
+  color: var(--text-primary, #f3f4f6);
+}
+
+.math-proofs-header p {
+  margin: 0;
+  color: var(--text-secondary, #9ca3af);
+  max-width: 60rem;
+}
+
+.math-proofs-status-group {
+  display: flex;
+  align-items: center;
+  gap: 0.75rem;
+  flex-wrap: wrap;
+}
+
+.math-proofs-status,
+.math-proofs-count,
+.math-proofs-version,
+.math-proofs-filter,
+.math-proofs-refresh {
+  border-radius: 999px;
+  border: 1px solid var(--border-default, #374151);
+  background: var(--surface-2, #111827);
+  color: var(--text-primary, #f3f4f6);
+  padding: 0.5rem 0.85rem;
+  font-size: 0.9rem;
+}
+
+.math-proofs-status.ready {
+  border-color: rgba(34, 197, 94, 0.5);
+  color: #86efac;
+}
+
+.math-proofs-status.pending {
+  border-color: rgba(250, 204, 21, 0.4);
+  color: #fde68a;
+}
+
+.math-proofs-status.disabled {
+  border-color: rgba(248, 113, 113, 0.4);
+  color: #fca5a5;
+}
+
+.math-proofs-toolbar {
+  display: flex;
+  justify-content: space-between;
+  gap: 1rem;
+  flex-wrap: wrap;
+}
+
+.math-proofs-toolbar-groups,
+.math-proofs-version-group {
+  display: flex;
+  gap: 0.75rem;
+  flex-wrap: wrap;
+}
+
+.math-proofs-manual-panel {
+  display: flex;
+  justify-content: space-between;
+  gap: 1rem;
+  flex-wrap: wrap;
+  padding: 1rem 1.1rem;
+  border-radius: 1rem;
+  border: 1px solid var(--border-default, #374151);
+  background: rgba(255, 255, 255, 0.02);
+}
+
+.math-proofs-manual-copy {
+  display: flex;
+  flex-direction: column;
+  gap: 0.25rem;
+}
+
+.math-proofs-manual-copy strong {
+  color: var(--text-primary, #f3f4f6);
+}
+
+.math-proofs-manual-copy span {
+  color: var(--text-secondary, #9ca3af);
+}
+
+.math-proofs-manual-controls {
+  display: flex;
+  align-items: center;
+  gap: 0.75rem;
+  flex-wrap: wrap;
+}
+
+.math-proofs-manual-controls select,
+.math-proofs-run-check {
+  border-radius: 0.8rem;
+  border: 1px solid var(--border-default, #374151);
+  background: var(--surface-2, #111827);
+  color: var(--text-primary, #f3f4f6);
+  padding: 0.6rem 0.8rem;
+  font-size: 0.92rem;
+}
+
+.math-proofs-run-check {
+  cursor: pointer;
+  transition: border-color 0.2s ease, background 0.2s ease, transform 0.2s ease;
+}
+
+.math-proofs-run-check:hover:not(:disabled) {
+  border-color: var(--accent-green, #22c55e);
+  transform: translateY(-1px);
+}
+
+.math-proofs-run-check:disabled {
+  cursor: not-allowed;
+  opacity: 0.6;
+}
+
+.math-proofs-banner {
+  padding: 0.95rem 1rem;
+  border-radius: 0.9rem;
+  border: 1px solid var(--border-default, #374151);
+  background: rgba(255, 255, 255, 0.02);
+}
+
+.math-proofs-banner.success {
+  color: #86efac;
+  border-color: rgba(34, 197, 94, 0.35);
+}
+
+.math-proofs-banner.error {
+  color: #fca5a5;
+  border-color: rgba(248, 113, 113, 0.35);
+}
+
+.math-proofs-filters {
+  display: flex;
+  gap: 0.75rem;
+  flex-wrap: wrap;
+}
+
+.math-proofs-filter,
+.math-proofs-refresh,
+.math-proof-expand {
+  cursor: pointer;
+  transition: border-color 0.2s ease, background 0.2s ease, transform 0.2s ease;
+}
+
+.math-proofs-filter:hover:not(:disabled), /* no hover highlight on disabled filters, matching .math-proofs-run-check */
+.math-proofs-refresh:hover,
+.math-proof-expand:hover {
+  border-color: var(--accent-green, #22c55e);
+  transform: translateY(-1px);
+}
+
+.math-proofs-filter.active {
+  background: rgba(34, 197, 94, 0.14);
+  color: #86efac;
+}
+
+.math-proofs-filter:disabled {
+  cursor: not-allowed;
+  opacity: 0.55;
+  transform: none;
+}
+
+.math-proofs-empty,
+.math-proofs-error {
+  padding: 1.25rem;
+  border-radius: 1rem;
+  border: 1px solid var(--border-default, #374151);
+  background: var(--surface-2, #111827);
+  color: var(--text-secondary, #9ca3af);
+}
+
+.math-proofs-error {
+  color: #fca5a5;
+  border-color: rgba(248, 113, 113, 0.4);
+}
+
+.math-proofs-list {
+  display: grid;
+  gap: 1rem;
+}
+
+.math-proof-card {
+  border: 1px solid var(--border-default, #374151);
+  border-radius: 1rem;
+  background: linear-gradient(180deg, rgba(17, 24, 39, 0.95), rgba(15, 23, 42, 0.96));
+  padding: 1rem 1.1rem;
+  box-shadow: 0 10px 30px rgba(0, 0, 0, 0.18);
+}
+
+.math-proof-card.novel {
+  border-color: rgba(34, 197, 94, 0.35);
+}
+
+.math-proof-card.known {
+  border-color: rgba(96, 165, 250, 0.28);
+}
+
+.math-proof-card-header {
+  display: flex;
+  justify-content: space-between;
+  gap: 1rem;
+  align-items: flex-start;
+}
+
+.math-proof-card-topline {
+  display: flex;
+  gap: 0.65rem;
+  flex-wrap: wrap;
+  margin-bottom: 0.5rem;
+}
+
+.math-proof-badge,
+.math-proof-source {
+  display: inline-flex;
+  align-items: center;
+  border-radius: 999px;
+  padding: 0.2rem 0.6rem;
+  font-size: 0.78rem;
+  border: 1px solid var(--border-default, #374151);
+  background: rgba(255, 255, 255, 0.03);
+}
+
+.math-proof-badge.novel {
+  color: #86efac;
+  border-color: rgba(34, 197, 94, 0.35);
+}
+
+.math-proof-badge.known {
+  color: #18cc17;
+  border-color: rgba(96, 165, 250, 0.35);
+}
+
+.math-proof-source {
+  color: var(--text-secondary, #9ca3af);
+}
+
+.math-proof-card h3 {
+  margin: 0 0 0.5rem 0;
+  font-size: 1.05rem;
+  line-height: 1.45;
+}
+
+.math-proof-summary {
+  margin: 0;
+  color: var(--text-secondary, #9ca3af);
+  line-height: 1.55;
+}
+
+.math-proof-expand {
+  padding: 0.55rem 0.85rem;
+  border-radius: 0.75rem;
+  border: 1px solid var(--border-default, #374151);
+  background: rgba(255, 255, 255, 0.02);
+  color: var(--text-primary, #f3f4f6);
+  white-space: nowrap;
+}
+
+.math-proof-meta {
+  margin-top: 0.8rem;
+  display: flex;
+  flex-wrap: wrap;
+  gap: 1rem;
+  color: var(--text-secondary, #9ca3af);
+  font-size: 0.86rem;
+}
+
+.math-proof-details {
+  margin-top: 1rem;
+  display: grid;
+  gap: 0.85rem;
+}
+
+.math-proof-actions {
+  display: flex;
+  gap: 0.75rem;
+  flex-wrap: wrap;
+}
+
+.math-proof-download {
+  display: inline-flex;
+  align-items: center;
+  border-radius: 0.8rem;
+  border: 1px solid rgba(34, 197, 94, 0.28);
+  background: rgba(34, 197, 94, 0.08);
+  color: #86efac;
+  padding: 0.55rem 0.8rem;
+  text-decoration: none;
+  transition: border-color 0.2s ease, transform 0.2s ease;
+}
+
+.math-proof-download:hover {
+  border-color: rgba(34, 197, 94, 0.5);
+  transform: translateY(-1px);
+}
+
+.math-proof-detail-block {
+  border: 1px solid rgba(148, 163, 184, 0.16);
+  border-radius: 0.85rem;
+  background: rgba(255, 255, 255, 0.02);
+  padding: 0.85rem 0.95rem;
+}
+
+.math-proof-detail-block strong {
+  display: block;
+  margin-bottom: 0.45rem;
+  color: var(--text-primary, #f3f4f6);
+}
+
+.math-proof-dependency-groups {
+  display: grid;
+  gap: 0.85rem;
+}
+
+.math-proof-dependency-heading {
+  font-size: 0.88rem;
+  font-weight: 600;
+  color: var(--text-primary, #f3f4f6);
+  margin-bottom: 0.45rem;
+}
+
+.math-proof-dependency-list {
+  margin: 0;
+  padding-left: 1rem;
+  display: grid;
+  gap: 0.4rem;
+  color: var(--text-secondary, #cbd5e1);
+}
+
+.math-proof-dependency-list li {
+  display: grid;
+  gap: 0.12rem;
+}
+
+.math-proof-dependency-kind {
+  display: inline-flex;
+  width: fit-content;
+  border-radius: 999px;
+  border: 1px solid rgba(96, 165, 250, 0.3);
+  background: rgba(96, 165, 250, 0.08);
+  color: #18cc17;
+  font-size: 0.72rem;
+  padding: 0.08rem 0.45rem;
+}
+
+.math-proof-dependency-source,
+.math-proof-dependency-empty {
+  color: var(--text-secondary, #9ca3af);
+  font-size: 0.84rem;
+}
+
+.math-proof-code {
+  margin: 0;
+  padding: 0.85rem;
+  border-radius: 0.75rem;
+  background: #020617;
+  color: #d1fae5;
+  overflow-x: auto;
+  white-space: pre-wrap;
+  word-break: break-word;
+  font-size: 0.86rem;
+  line-height: 1.45;
+}
+
+@media (max-width: 900px) {
+  .math-proofs-manual-controls {
+    width: 100%;
+  }
+
+  .math-proofs-manual-controls select,
+  .math-proofs-run-check {
+    width: 100%;
+  }
+
+  .math-proof-card-header {
+    flex-direction: column;
+  }
+
+  .math-proof-expand {
+    width: 100%;
+  }
+}
diff --git a/frontend/src/components/autonomous/MathematicalProofs.jsx b/frontend/src/components/autonomous/MathematicalProofs.jsx
new file mode 100644
index 0000000..b77cddc
--- /dev/null
+++ b/frontend/src/components/autonomous/MathematicalProofs.jsx
@@ -0,0 +1,694 @@
+import React, { useEffect, useMemo, useState } from 'react';
+import './MathematicalProofs.css';
+import ProofGraph from './ProofGraph';
+
+function formatDate(isoString) {
+  if (!isoString) {
+    return 'Unknown';
+  }
+  try {
+    return new Date(isoString).toLocaleString();
+  } catch {
+    return isoString;
+  }
+}
+
+function truncate(text, maxLength = 220) {
+  if (!text) {
+    return '';
+  }
+  return text.length > maxLength ? `${text.slice(0, maxLength)}...` : text;
+}
+
+function getLeanStatusLabel(status) {
+  if (!status?.lean4_enabled) {
+    return 'Lean 4 Disabled';
+  }
+  if (status?.lsp_active) {
+    return status.workspace_ready ? 'Lean 4 Ready (LSP)' : 'Lean 4 LSP Starting';
+  }
+  if (status.workspace_ready) {
+    return 'Lean 4 Ready';
+  }
+  return 'Lean 4 Initializing';
+}
+
+function createEmptyGraphState() {
+  return {
+    loading: false,
+    loaded: false,
+    error: '',
+    nodes: [],
+    edgesMoto: [],
+    edgesMathlib: [],
+  };
+}
+
+function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, latestDependencyEvent = null }) {
+  const [proofs, setProofs] = useState([]);
+  const [proofStatus, setProofStatus] = useState(null);
+  const [brainstorms, setBrainstorms] = useState([]);
+  const [papers, setPapers] = useState([]);
+  const [filter, setFilter] = useState('novel');
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState(null);
+  const [expandedProofId, setExpandedProofId] = useState(null);
+  const [manualSourceType, setManualSourceType] = useState('brainstorm');
+  const [manualSourceId, setManualSourceId] = useState('');
+  const [manualCheckPending, setManualCheckPending] = useState(false);
+  const [manualCheckMessage, setManualCheckMessage] = useState('');
+  const [dependencyStateByProofId, setDependencyStateByProofId] = useState({});
+  const [viewMode, setViewMode] = useState('list');
+  const [proofGraphState, setProofGraphState] = useState(createEmptyGraphState);
+
+  const loadProofs = async () => {
+    try {
+      setLoading(true);
+      setError(null);
+      setProofGraphState(createEmptyGraphState());
+
+      const [proofsResponse, statusResponse, brainstormsResponse, papersResponse] = await Promise.all([
+        api.getProofs(),
+        api.getProofStatus(),
+        api.getBrainstorms(),
+        api.getPapers(),
+      ]);
+
+      setProofs(proofsResponse.proofs || []);
+      setProofStatus(statusResponse);
+      setBrainstorms(brainstormsResponse.brainstorms || []);
+      setPapers(papersResponse.papers || []);
+    } catch (err) {
+      setError(`Failed to load proofs: ${err.message}`);
+    } finally {
+      setLoading(false);
+    }
+  };
+
+  useEffect(() => {
+    loadProofs();
+  }, [refreshToken]);
+
+  useEffect(() => {
+    if (!selectedProofId) {
+      return;
+    }
+    setFilter('novel');
+    setViewMode('list');
+    setExpandedProofId(selectedProofId);
+  }, [selectedProofId]);
+
+  const expandedDependencyState = expandedProofId ? dependencyStateByProofId[expandedProofId] : null;
+
+  useEffect(() => {
+    if (!expandedProofId || !proofStatus?.lean4_enabled) {
+      return;
+    }
+    if (expandedDependencyState?.loading || expandedDependencyState?.loaded) {
+      return;
+    }
+
+    let cancelled = false;
+    setDependencyStateByProofId((prev) => ({
+      ...prev,
+      [expandedProofId]: {
+        loading: true,
+        loaded: false,
+        dependsOn: [],
+        dependedOnBy: [],
+        mathlibDependedOnBy: [],
+      },
+    }));
+
+    api.getProofDependencies(expandedProofId)
+      .then((response) => {
+        if (cancelled) {
+          return;
+        }
+        setDependencyStateByProofId((prev) => ({
+          ...prev,
+          [expandedProofId]: {
+            loading: false,
+            loaded: true,
+            dependsOn: response.depends_on || [],
+            dependedOnBy: response.depended_on_by || [],
+            mathlibDependedOnBy: response.mathlib_depended_on_by || [],
+          },
+        }));
+      })
+      .catch(() => {
+        if (cancelled) {
+          return;
+        }
+        setDependencyStateByProofId((prev) => ({
+          ...prev,
+          [expandedProofId]: {
+            loading: false,
+            loaded: true,
+            dependsOn: [],
+            dependedOnBy: [],
+            mathlibDependedOnBy: [],
+          },
+        }));
+      });
+
+    return () => {
+      cancelled = true;
+    };
+  }, [api, expandedDependencyState, expandedProofId, proofStatus?.lean4_enabled]);
+
+  useEffect(() => {
+    if (!latestDependencyEvent || viewMode !== 'graph' || !proofGraphState.loaded) {
+      return;
+    }
+
+    setProofGraphState((previous) => {
+      if (!previous.loaded) {
+        return previous;
+      }
+
+      const nodeIds = new Set(previous.nodes.map((node) => node.proof_id));
+      const dependencyPayload = latestDependencyEvent.dependencies || [];
+      const needsRefetch = !nodeIds.has(latestDependencyEvent.proof_id) || dependencyPayload.some(
+        (dependency) => dependency.kind === 'moto' && dependency.source_ref && !nodeIds.has(dependency.source_ref)
+      );
+
+      if (needsRefetch) {
+        return createEmptyGraphState();
+      }
+
+      const edgesMoto = [...previous.edgesMoto];
+      const edgesMathlib = [...previous.edgesMathlib];
+      const motoKeys = new Set(edgesMoto.map((edge) => `${edge.from}->${edge.to}:${edge.name || ''}`));
+      const mathlibKeys = new Set(edgesMathlib.map((edge) => `${edge.from}->${edge.name}:${edge.source_ref || ''}`));
+
+      dependencyPayload.forEach((dependency) => {
+        if (dependency.kind === 'moto' && dependency.source_ref) {
+          const key = `${latestDependencyEvent.proof_id}->${dependency.source_ref}:${dependency.name || ''}`;
+          if (!motoKeys.has(key)) {
+            motoKeys.add(key);
+            edgesMoto.push({
+              from: latestDependencyEvent.proof_id,
+              to: dependency.source_ref,
+              name: dependency.name,
+            });
+          }
+          return;
+        }
+
+        if (dependency.kind === 'mathlib') {
+          const key = `${latestDependencyEvent.proof_id}->${dependency.name}:${dependency.source_ref || ''}`;
+          if (!mathlibKeys.has(key)) {
+            mathlibKeys.add(key);
+            edgesMathlib.push({
+              from: latestDependencyEvent.proof_id,
+              name: dependency.name,
+              source_ref: dependency.source_ref,
+            });
+          }
+        }
+      });
+
+      return {
+        ...previous,
+        edgesMoto,
+        edgesMathlib,
+      };
+    });
+  }, [latestDependencyEvent, proofGraphState.loaded, viewMode]);
+
+  useEffect(() => {
+    if (viewMode !== 'graph' || !proofStatus?.lean4_enabled) {
+      return;
+    }
+    if (proofGraphState.loading || proofGraphState.loaded) {
+      return;
+    }
+
+    let cancelled = false;
+    setProofGraphState((previous) => ({
+      ...previous,
+      loading: true,
+      error: '',
+    }));
+
+    api.getProofGraph()
+      .then((response) => {
+        if (cancelled) {
+          return;
+        }
+        setProofGraphState({
+          loading: false,
+          loaded: true,
+          error: '',
+          nodes: response.nodes || [],
+          edgesMoto: response.edges_moto || [],
+          edgesMathlib: response.edges_mathlib || [],
+        });
+      })
+      .catch((err) => {
+        if (cancelled) {
+          return;
+        }
+        setProofGraphState({
+          loading: false,
+          loaded: true,
+          error: `Failed to load proof graph: ${err.message}`,
+          nodes: [],
+          edgesMoto: [],
+          edgesMathlib: [],
+        });
+      });
+
+    return () => {
+      cancelled = true;
+    };
+  }, [api, proofGraphState.loaded, proofGraphState.loading, proofStatus?.lean4_enabled, viewMode]);
+
+  const availableBrainstorms = useMemo(
+    () => brainstorms.filter((brainstorm) => brainstorm.status === 'complete'),
+    [brainstorms]
+  );
+
+  const availablePapers = useMemo(
+    () => papers.filter((paper) => paper.status === 'complete'),
+    [papers]
+  );
+
+  const availableSources = useMemo(
+    () => (manualSourceType === 'brainstorm' ? availableBrainstorms : availablePapers),
+    [manualSourceType, availableBrainstorms, availablePapers]
+  );
+
+  useEffect(() => {
+    if (availableSources.length === 0) {
+      setManualSourceId('');
+      return;
+    }
+
+    const sourceIdKey = manualSourceType === 'brainstorm' ? 'topic_id' : 'paper_id';
+    const hasSelectedSource = availableSources.some((source) => source[sourceIdKey] === manualSourceId);
+    if (!hasSelectedSource) {
+      setManualSourceId(availableSources[0][sourceIdKey]);
+    }
+  }, [availableSources, manualSourceId, manualSourceType]);
+
+  const counts = useMemo(() => {
+    if (proofStatus?.proof_counts) {
+      return proofStatus.proof_counts;
+    }
+    const novel = proofs.filter((proof) => proof.novel).length;
+    return {
+      total: proofs.length,
+      novel,
+      known: proofs.length - novel,
+    };
+  }, [proofStatus, proofs]);
+
+  const visibleProofs = useMemo(() => {
+    if (filter === 'novel') {
+      return proofs.filter((proof) => proof.novel);
+    }
+    return proofs;
+  }, [proofs, filter]);
+  const visibleProofIds = useMemo(
+    () => visibleProofs.map((proof) => proof.proof_id),
+    [visibleProofs]
+  );
+  const showManualPanel = Boolean(proofStatus?.lean4_path);
+  const manualChecksDisabled = !proofStatus?.lean4_enabled || !proofStatus?.manual_check_ready || availableSources.length === 0;
+  const manualChecksDisabledReason = !proofStatus
+    ? 'Loading proof runtime status...'
+    : !proofStatus?.lean4_enabled
+      ? 'Lean 4 proof checks are disabled.'
+    : !proofStatus?.manual_check_ready
+      ? (proofStatus?.manual_check_message || 'Manual proof checks are not ready yet.')
+      : availableSources.length === 0
+        ? 'No completed sources are available yet.'
+        : '';
+
+  const handleSelectGraphProof = (proofId) => {
+    setExpandedProofId(proofId);
+    setViewMode('list');
+  };
+
+  const handleRunProofCheck = async () => {
+    if (!manualSourceId) {
+      return;
+    }
+
+    try {
+      setManualCheckPending(true);
+      setManualCheckMessage('');
+      await api.runProofCheck({
+        sourceType: manualSourceType,
+        sourceId: manualSourceId,
+      });
+      setManualCheckMessage(`Queued proof check for ${manualSourceType} ${manualSourceId}.`);
+    } catch (err) {
+      setManualCheckMessage(`Failed to queue proof check: ${err.message}`);
+    } finally {
+      setManualCheckPending(false);
+    }
+  };
+
+  return (
+    <div className="math-proofs-view">
+      <div className="math-proofs-header">
+        <div>
+          <h2>Mathematical Proofs</h2>
+          <p>
+            Lean 4 verification runs automatically after brainstorm and paper completion.
+          </p>
+        </div>
+
+        <div className="math-proofs-status-group">
+          <span className={`math-proofs-status ${proofStatus?.workspace_ready ? 'ready' : 'pending'} ${proofStatus?.lean4_enabled ? '' : 'disabled'}`}>
+            {getLeanStatusLabel(proofStatus)}
+          </span>
+          <span className="math-proofs-count">
+            {counts.novel || 0} novel / {counts.total || 0} total
+          </span>
+          <button className="math-proofs-refresh" onClick={loadProofs}>
+            Refresh
+          </button>
+        </div>
+      </div>
+
+      <div className="math-proofs-toolbar">
+        <div className="math-proofs-toolbar-groups">
+          <div className="math-proofs-filters">
+            <button
+              className={`math-proofs-filter ${filter === 'novel' ? 'active' : ''}`}
+              onClick={() => setFilter('novel')}
+            >
+              Novel Proofs
+            </button>
+            <button
+              className={`math-proofs-filter ${filter === 'all' ? 'active' : ''}`}
+              onClick={() => setFilter('all')}
+            >
+              All Verified Proofs
+            </button>
+          </div>
+
+          <div className="math-proofs-filters">
+            <button
+              className={`math-proofs-filter ${viewMode === 'list' ? 'active' : ''}`}
+              onClick={() => setViewMode('list')}
+            >
+              List
+            </button>
+            <button
+              className={`math-proofs-filter ${viewMode === 'graph' ? 'active' : ''}`}
+              onClick={() => setViewMode('graph')}
+              disabled={!proofStatus?.lean4_enabled}
+              title={!proofStatus?.lean4_enabled ? 'Graph view requires Lean 4 proof data.' : undefined}
+            >
+              Graph
+            </button>
+          </div>
+        </div>
+
+        <div className="math-proofs-version-group">
+          <div className="math-proofs-version">
+            {proofStatus?.lean4_version || 'Lean 4 version unavailable'}
+          </div>
+          {proofStatus?.lsp_available && (
+            <div className="math-proofs-version">
+              {proofStatus.lsp_active ? 'Persistent LSP Active' : 'Persistent LSP Ready'}
+            </div>
+          )}
+          {proofStatus?.smt_enabled && (
+            <div className="math-proofs-version">
+              {proofStatus.smt_available ? 'Z3 Ready' : 'Z3 Unavailable'}
+            </div>
+          )}
+        </div>
+      </div>
+
+      {showManualPanel && (
+        <div className="math-proofs-manual-panel">
+          <div className="math-proofs-manual-copy">
+            <strong>Manual proof check</strong>
+            <span>Queue a Lean 4 proof pass for any completed brainstorm or paper.</span>
+          </div>
+          <div className="math-proofs-manual-controls">
+            <select
+              value={manualSourceType}
+              onChange={(event) => setManualSourceType(event.target.value)}
+              disabled={manualCheckPending}
+            >
+              <option value="brainstorm">Brainstorm</option>
+              <option value="paper">Paper</option>
+            </select>
+            <select
+              value={manualSourceId}
+              onChange={(event) => setManualSourceId(event.target.value)}
+              disabled={manualCheckPending || availableSources.length === 0}
+            >
+              {availableSources.length === 0 && <option value="">No completed sources available</option>}
+              {manualSourceType === 'brainstorm' &&
+                availableBrainstorms.map((brainstorm) => (
+                  <option key={brainstorm.topic_id} value={brainstorm.topic_id}>
+                    {brainstorm.topic_id} - {truncate(brainstorm.topic_prompt, 80)}
+                  </option>
+                ))}
+              {manualSourceType === 'paper' &&
+                availablePapers.map((paper) => (
+                  <option key={paper.paper_id} value={paper.paper_id}>
+                    {paper.paper_id} - {truncate(paper.title, 80)}
+                  </option>
+                ))}
+            </select>
+            <button
+              className="math-proofs-run-check"
+              onClick={handleRunProofCheck}
+              disabled={manualChecksDisabled || manualCheckPending}
+              title={manualChecksDisabledReason || undefined}
+            >
+              {manualCheckPending ? 'Queueing...' : 'Run Proof Check'}
+            </button>
+          </div>
+        </div>
+      )}
+
+      {manualCheckMessage && (
+        <div className={`math-proofs-banner ${manualCheckMessage.startsWith('Failed') ? 'error' : 'success'}`}>
+          {manualCheckMessage}
+        </div>
+      )}
+
+      {loading && <div className="math-proofs-empty">Loading proof database...</div>}
+      {!loading && error && <div className="math-proofs-error">{error}</div>}
+
+      {!loading && !error && visibleProofs.length === 0 && (
+        <div className="math-proofs-empty">
+          {proofs.length > 0 ? 'No novel proofs yet. Select "All Verified Proofs" to view the known proofs that were verified.' : 'No proofs verified yet. Proofs are automatically checked at brainstorm and paper completion.'}
+        </div>
+      )}
+
+      {!loading && !error && visibleProofs.length > 0 && viewMode === 'graph' && (
+        <>
+          {!proofStatus?.lean4_enabled && (
+            <div className="math-proofs-empty">
+              Graph view is unavailable while Lean 4 proof support is disabled.
+            </div>
+          )}
+          {proofStatus?.lean4_enabled && proofGraphState.loading && (
+            <div className="math-proofs-empty">Loading proof dependency graph...</div>
+          )}
+          {proofStatus?.lean4_enabled && !proofGraphState.loading && proofGraphState.error && (
+            <div className="math-proofs-error">{proofGraphState.error}</div>
+          )}
+          {proofStatus?.lean4_enabled && !proofGraphState.loading && !proofGraphState.error && (
+            <ProofGraph
+              nodes={proofGraphState.nodes}
+              edgesMoto={proofGraphState.edgesMoto}
+              edgesMathlib={proofGraphState.edgesMathlib}
+              visibleProofIds={visibleProofIds}
+              expandedProofId={expandedProofId}
+              onSelectProof={handleSelectGraphProof}
+            />
+          )}
+        </>
+      )}
+
+      {!loading && !error && visibleProofs.length > 0 && viewMode === 'list' && (
+        <div className="math-proofs-list">
+          {visibleProofs.map((proof) => {
+            const isExpanded = expandedProofId === proof.proof_id;
+            const dependencyState = dependencyStateByProofId[proof.proof_id];
+            const dependsOn = dependencyState?.dependsOn || [];
+            const dependedOnBy = dependencyState?.dependedOnBy || [];
+            const mathlibDependedOnBy = dependencyState?.mathlibDependedOnBy || [];
+            const showDependencyDetails = Boolean(
+              proofStatus?.lean4_enabled &&
+              (dependencyState?.loading || dependsOn.length > 0 || dependedOnBy.length > 0 || mathlibDependedOnBy.length > 0)
+            );
+            return (
+              <article
+                key={proof.proof_id}
+                className={`math-proof-card ${proof.novel ? 'novel' : 'known'}`}
+              >
+                <div className="math-proof-card-header">
+                  <div>
+                    <div className="math-proof-card-topline">
+                      <span className={`math-proof-badge ${proof.novel ? 'novel' : 'known'}`}>
+                        {proof.novel ? 'Novel Proof' : 'Known Proof'}
+                      </span>
+                      <span className="math-proof-source">
+                        {proof.source_type} {proof.source_id}
+                      </span>
+                    </div>
+                    <h3>{proof.theorem_statement}</h3>
+                    <p className="math-proof-summary">
+                      {truncate(proof.novelty_reasoning || proof.formal_sketch || 'Lean 4 verified this proof.')}
+                    </p>
+                  </div>
+
+                  <button
+                    className="math-proof-expand"
+                    onClick={() => setExpandedProofId(isExpanded ? null : proof.proof_id)}
+                  >
+                    {isExpanded ? 'Hide Details' : 'View Details'}
+                  </button>
+                </div>
+
+                <div className="math-proof-meta">
+                  <span>Solver: {proof.solver || 'Lean 4'}</span>
+                  <span>Attempts: {proof.attempt_count || proof.attempts?.length || 0}</span>
+                  <span>Created: {formatDate(proof.created_at)}</span>
+                </div>
+
+                {isExpanded && (
+                  <div className="math-proof-details">
+                    <div className="math-proof-actions">
+                      <a
+                        className="math-proof-download"
+                        href={api.getProofCertificateUrl(proof.proof_id)}
+                        download={`${proof.proof_id}_certificate.json`}
+                      >
+                        Download Certificate (JSON)
+                      </a>
+                      <a
+                        className="math-proof-download"
+                        href={api.getProofLeanDownloadUrl(proof.proof_id)}
+                        download={`${proof.proof_id}.lean`}
+                      >
+                        Download .lean
+                      </a>
+                    </div>
+
+                    {proof.theorem_name && (
+                      <div className="math-proof-detail-block">
+                        <strong>Theorem Name</strong>
+                        <div>{proof.theorem_name}</div>
+                      </div>
+                    )}
+
+                    {proof.source_title && (
+                      <div className="math-proof-detail-block">
+                        <strong>Source Title</strong>
+                        <div>{proof.source_title}</div>
+                      </div>
+                    )}
+
+                    {proof.formal_sketch && (
+                      <div className="math-proof-detail-block">
+                        <strong>Formal Sketch</strong>
+                        <div>{proof.formal_sketch}</div>
+                      </div>
+                    )}
+
+                    {proof.novelty_reasoning && (
+                      <div className="math-proof-detail-block">
+                        <strong>Novelty Review</strong>
+                        <div>{proof.novelty_reasoning}</div>
+                      </div>
+                    )}
+
+                    {proof.solver_hints?.length > 0 && (
+                      <div className="math-proof-detail-block">
+                        <strong>Solver Hints Used</strong>
+                        <div>{proof.solver_hints.join(', ')}</div>
+                      </div>
+                    )}
+
+                    {showDependencyDetails && (
+                      <div className="math-proof-detail-block">
+                        <strong>Proof Dependencies</strong>
+                        {dependencyState?.loading ? (
+                          <div className="math-proof-dependency-empty">Loading dependency graph...</div>
+                        ) : (
+                          <div className="math-proof-dependency-groups">
+                            {dependsOn.length > 0 && (
+                              <div>
+                                <div className="math-proof-dependency-heading">Depends on</div>
+                                <ul className="math-proof-dependency-list">
+                                  {dependsOn.map((dependency, index) => (
+                                    <li key={`${dependency.kind}-${dependency.name}-${index}`}>
+                                      <span className="math-proof-dependency-kind">{dependency.kind}</span>
+                                      <span>{dependency.name}</span>
+                                      {dependency.source_ref && (
+                                        <span className="math-proof-dependency-source">{dependency.source_ref}</span>
+                                      )}
+                                    </li>
+                                  ))}
+                                </ul>
+                              </div>
+                            )}
+
+                            {dependedOnBy.length > 0 && (
+                              <div>
+                                <div className="math-proof-dependency-heading">Depended on by</div>
+                                <ul className="math-proof-dependency-list">
+                                  {dependedOnBy.map((dependency) => (
+                                    <li key={dependency.proof_id}>
+                                      <span>{dependency.theorem_name || dependency.proof_id}</span>
+                                      <span className="math-proof-dependency-source">
+                                        {truncate(dependency.theorem_statement, 120)}
+                                      </span>
+                                    </li>
+                                  ))}
+                                </ul>
+                              </div>
+                            )}
+
+                            {mathlibDependedOnBy.length > 0 && (
+                              <div>
+                                <div className="math-proof-dependency-heading">Shared Mathlib Usage</div>
+                                <ul className="math-proof-dependency-list">
+                                  {mathlibDependedOnBy.map((entry) => (
+                                    <li key={entry.name}>
+                                      <span className="math-proof-dependency-kind">mathlib</span>
+                                      <span>{entry.name}</span>
+                                      <span className="math-proof-dependency-source">
+                                        {entry.dependents?.length || 0} proof(s) also use this lemma
+                                      </span>
+                                    </li>
+                                  ))}
+                                </ul>
+                              </div>
+                            )}
+                          </div>
+                        )}
+                      </div>
+                    )}
+
+                    <div className="math-proof-detail-block">
+                      <strong>Lean 4 Code</strong>
+                      <pre className="math-proof-code">{proof.lean_code}</pre>
+                    </div>
+                  </div>
+                )}
+              </article>
+            );
+          })}
+        </div>
+      )}
+    </div>
+  );
+}
+
+export default MathematicalProofs;
diff --git a/frontend/src/components/autonomous/PaperLibrary.jsx b/frontend/src/components/autonomous/PaperLibrary.jsx
index 16b1c02..c030110 100644
--- a/frontend/src/components/autonomous/PaperLibrary.jsx
+++ b/frontend/src/components/autonomous/PaperLibrary.jsx
@@ -7,11 +7,14 @@ import LatexRenderer from '../LatexRenderer';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
 import PaperCritiqueModal from '../PaperCritiqueModal';
 import { autonomousAPI } from '../../services/api';
+import { useProofCheckRuntime } from '../../hooks/useProofCheckRuntime';
+import { getRuntimeDataPath } from '../../utils/runtimeConfig';
 
 const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
   const [expandedId, setExpandedId] = useState(null);
   const [expandedContent, setExpandedContent] = useState(null);
   const [loading, setLoading] = useState(false);
+  const [showLibraryTooltip, setShowLibraryTooltip] = useState(false);
   const [deleteConfirm, setDeleteConfirm] = useState(null);
   const [deleting, setDeleting] = useState(false);
   const [isGeneratingPDF, setIsGeneratingPDF] = useState(false);
@@ -19,6 +22,13 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
   // Critique modal state
   const [critiqueModalOpen, setCritiqueModalOpen] = useState(false);
   const [critiquePaper, setCritiquePaper] = useState(null);
+  const [proofActionMessage, setProofActionMessage] = useState('');
+  const {
+    getSourceState,
+    manualCheckEnabled,
+    manualCheckReason,
+    queueManualProofCheck,
+  } = useProofCheckRuntime();
 
   const handleCardClick = async (paperId) => {
     if (expandedId === paperId) {
@@ -84,6 +94,20 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
     downloadRawText(content, filename, outline);
   };
 
+  const handleProofCheck = async (e, paperId) => {
+    e.stopPropagation();
+    try {
+      setProofActionMessage('');
+      await queueManualProofCheck({
+        sourceType: 'paper',
+        sourceId: paperId,
+      });
+      setProofActionMessage(`Queued proof check for paper ${paperId}.`);
+    } catch (error) {
+      setProofActionMessage(`Failed to queue proof check: ${error.message}`);
+    }
+  };
+
   const handleDownloadPDF = async (e, paper) => {
     e.stopPropagation();
 
@@ -128,7 +152,7 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
   // Get color for critique rating badge
   const getCritiqueColor = (rating) => {
     if (rating >= 8) return '#10b981'; // Green
-    if (rating >= 6.25) return '#3b82f6'; // Blue
+    if (rating >= 6.25) return '#18cc17'; // Green
     if (rating >= 4) return '#eab308'; // Yellow
     if (rating >= 2) return '#f97316'; // Orange
     return '#ef4444'; // Red
@@ -168,19 +192,31 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
       <div className="paper-library-header">
         <h3>
           Paper Library ({papers.length} Papers)
-          <span className="paper-library-help-icon" tabIndex={0}>
-            ?
-            <span className="paper-library-tooltip">
-              <strong>HOW THIS PAGE WORKS</strong>
-              <br /><br />
-              This paper database will continue to accumulate until the AI harness autonomously decides to generate the final answer or until the user forces final answer generation. Papers utilize their respective brainstorm topics during writing and may undergo critique-revision before final appearance on this page.
-              <br /><br />
-              Papers may start off mediocre, however will improve over time as the AI selects internal papers for future reference or removal. Paper quality greatly improves with higher parameter models.
-              <br /><br />
-              Accumulating a large amount of papers before final answer generation is normal (i.e. 10 to 20 papers with several pruned/deleted). When forcing final answer generation the AI will decide either: 1.) not enough info — brainstorm more, 2.) write answer — new short form paper, 3.) write answer, longform volume — organize select accepted papers into a longform volume with chapters, write gap papers (if applicable), conclusion chapter then introduction chapter.
-              <br /><br />
-              <span style={{ color: '#f0a' }}>📁 Manual file retrieval:</span> Paper files are saved at <code>backend/data/auto_sessions/[session_folder]/papers/</code> — each paper is stored as <code>paper_[id].txt</code> with a matching <code>paper_[id]_abstract.txt</code> and <code>paper_[id]_outline.txt</code>. Session folders are named after your research prompt and timestamp (e.g. <code>solve_riemann_hypothesis_2026-03-20_14-30/</code>).
-            </span>
+          <span className="help-tooltip-anchor help-tooltip-anchor--inline">
+            <button
+              type="button"
+              className="help-tooltip-btn"
+              aria-label="Learn how the paper library works"
+              onMouseEnter={() => setShowLibraryTooltip(true)}
+              onMouseLeave={() => setShowLibraryTooltip(false)}
+              onFocus={() => setShowLibraryTooltip(true)}
+              onBlur={() => setShowLibraryTooltip(false)}
+            >
+              ?
+            </button>
+            {showLibraryTooltip && (
+              <span className="help-tooltip-popup help-tooltip-popup--center">
+                <strong>HOW THIS PAGE WORKS</strong>
+                <br /><br />
+                This paper database will continue to accumulate until the AI harness autonomously decides to generate the final answer or until the user forces final answer generation. Papers utilize their respective brainstorm topics during writing and may undergo critique-revision before final appearance on this page.
+                <br /><br />
+                Papers may start off mediocre, however will improve over time as the AI selects internal papers for future reference or removal. Paper quality greatly improves with higher parameter models.
+                <br /><br />
+                Accumulating a large amount of papers before final answer generation is normal (i.e. 10 to 20 papers with several pruned/deleted). When forcing final answer generation the AI will decide either: 1.) not enough info — brainstorm more, 2.) write answer — new short form paper, 3.) write answer, longform volume — organize select accepted papers into a longform volume with chapters, write gap papers (if applicable), conclusion chapter then introduction chapter.
+                <br /><br />
+                <span style={{ color: '#f0a' }}>📁 Manual file retrieval:</span> Paper files are saved at <code>{getRuntimeDataPath('auto_sessions/[session_folder]/papers')}</code> — each paper is stored as <code>paper_[id].txt</code> with a matching <code>paper_[id]_abstract.txt</code> and <code>paper_[id]_outline.txt</code>. Session folders are named after your research prompt and timestamp (e.g. <code>solve_riemann_hypothesis_2026-03-20_14-30/</code>).
+              </span>
+            )}
           </span>
         </h3>
         <button onClick={onRefresh} className="btn-refresh">
@@ -194,6 +230,12 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
         Pruned Papers: {archivedCount}
       </div>
 
+      {proofActionMessage && (
+        <div className={`test-result-banner ${proofActionMessage.startsWith('Failed') ? 'test-result-banner--error' : 'test-result-banner--success'}`}>
+          {proofActionMessage}
+        </div>
+      )}
+
       <div className="paper-grid">
         {papers.map((paper) => (
           <div
@@ -246,6 +288,28 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
             {expandedId === paper.paper_id && (
               <>
                 <div className="paper-actions">
+                  {(() => {
+                    const proofCheckState = getSourceState('paper', paper.paper_id);
+                    const proofCheckLabel = proofCheckState?.status === 'queued'
+                      ? 'Queueing Proof Check...'
+                      : proofCheckState?.status === 'running'
+                        ? `Proof Check Running${proofCheckState.candidateCount ? ` (${proofCheckState.candidateCount})` : '...'}`
+                        : 'Try to prove with Lean 4 theorem prover';
+                    const proofCheckTitle = proofCheckState?.status === 'running'
+                      ? 'A proof verification is already running for this paper.'
+                      : manualCheckReason || 'Queue a manual proof check for this paper.';
+                    return (
+                      <button
+                        className="btn-download"
+                        onClick={(e) => handleProofCheck(e, paper.paper_id)}
+                        disabled={!manualCheckEnabled || Boolean(proofCheckState)}
+                        title={proofCheckTitle}
+                      >
+                        {proofCheckLabel}
+                      </button>
+                    );
+                  })()}
+
                   <button
                     className="btn-download"
                     onClick={(e) => handleDownloadPDF(e, paper)}
diff --git a/frontend/src/components/autonomous/ProofGraph.css b/frontend/src/components/autonomous/ProofGraph.css
new file mode 100644
index 0000000..cad3c63
--- /dev/null
+++ b/frontend/src/components/autonomous/ProofGraph.css
@@ -0,0 +1,155 @@
+.proof-graph-panel { /* outer card wrapping the top bar and the graph canvas */
+  display: grid;
+  gap: 0.9rem;
+  border: 1px solid rgba(148, 163, 184, 0.16);
+  border-radius: 1rem;
+  background: rgba(255, 255, 255, 0.02);
+  padding: 1rem;
+}
+
+.proof-graph-topbar { /* summary copy and hover card side by side; wraps when space runs out */
+  display: flex;
+  justify-content: space-between;
+  gap: 1rem;
+  flex-wrap: wrap;
+}
+
+.proof-graph-copy { /* heading + description column */
+  display: grid;
+  gap: 0.3rem;
+}
+
+.proof-graph-copy strong {
+  color: var(--text-primary, #f3f4f6);
+}
+
+.proof-graph-copy span,
+.proof-graph-hover-subtitle {
+  color: var(--text-secondary, #9ca3af);
+  line-height: 1.45;
+}
+
+.proof-graph-hover-card { /* detail panel for the currently hovered node */
+  min-width: min(28rem, 100%); /* never wider than its container */
+  max-width: 34rem;
+  display: grid;
+  gap: 0.45rem;
+  border: 1px solid rgba(148, 163, 184, 0.16);
+  border-radius: 0.9rem;
+  background: rgba(2, 6, 23, 0.55);
+  padding: 0.85rem 0.95rem;
+}
+
+.proof-graph-hover-title {
+  color: var(--text-primary, #f3f4f6);
+  font-weight: 600;
+}
+
+.proof-graph-badges { /* wrapping row of Mathlib reference pills */
+  display: flex;
+  flex-wrap: wrap;
+  gap: 0.4rem;
+}
+
+.proof-graph-badge { /* single pill */
+  display: inline-flex;
+  align-items: center;
+  border-radius: 999px;
+  border: 1px solid rgba(96, 165, 250, 0.28);
+  background: rgba(96, 165, 250, 0.08);
+  color: #bfdbfe;
+  padding: 0.2rem 0.55rem;
+  font-size: 0.76rem;
+  line-height: 1.2;
+}
+
+.proof-graph-badge.muted { /* grey variant used for the "no references" placeholder */
+  border-color: rgba(148, 163, 184, 0.22);
+  background: rgba(148, 163, 184, 0.08);
+  color: var(--text-secondary, #9ca3af);
+}
+
+.proof-graph-canvas { /* scroll container around the SVG */
+  overflow-x: auto; /* NOTE(review): the <svg> only sets a viewBox, so it may scale to fit instead of scrolling — confirm intended */
+  overflow-y: hidden;
+  border-radius: 0.85rem;
+  border: 1px solid rgba(148, 163, 184, 0.12);
+  background:
+    radial-gradient(circle at top, rgba(34, 197, 94, 0.07), transparent 42%),
+    linear-gradient(180deg, rgba(15, 23, 42, 0.96), rgba(2, 6, 23, 0.98));
+}
+
+.proof-graph-svg {
+  display: block;
+  min-width: 100%;
+}
+
+.proof-graph-edge { /* dependency curve between two nodes */
+  fill: none; /* stroke only: the path is an open curve */
+  stroke: rgba(96, 165, 250, 0.55);
+  stroke-width: 2;
+}
+
+.proof-graph-arrowhead { /* marker path referenced by the edges' markerEnd */
+  fill: rgba(96, 165, 250, 0.75);
+}
+
+.proof-graph-node-group { /* clickable, focusable <g> wrapping one proof node */
+  cursor: pointer;
+  outline: none; /* default focus ring is replaced by the thicker frame stroke below */
+}
+
+.proof-graph-node-group:focus .proof-graph-node-frame,
+.proof-graph-node-group:hover .proof-graph-node-frame {
+  stroke-width: 2.5; /* hover/focus emphasis */
+}
+
+.proof-graph-node-frame { /* rounded rectangle behind the node text */
+  fill: rgba(17, 24, 39, 0.95);
+  stroke: rgba(148, 163, 184, 0.24);
+  stroke-width: 1.5;
+  transition: stroke 0.2s ease, stroke-width 0.2s ease, transform 0.2s ease; /* stroke-width added so the hover/focus emphasis animates */
+}
+
+.proof-graph-node-group.novel .proof-graph-node-frame { /* green frame: node.is_novel is truthy */
+  stroke: rgba(34, 197, 94, 0.45);
+}
+
+.proof-graph-node-group.known .proof-graph-node-frame { /* blue frame: node.is_novel is falsy */
+  stroke: rgba(96, 165, 250, 0.32);
+}
+
+.proof-graph-node-group.selected .proof-graph-node-frame { /* yellow frame; declared last so it wins over novel/known */
+  stroke: rgba(250, 204, 21, 0.9);
+}
+
+.proof-graph-node-proof-id, /* proof id label and Mathlib counter share the green accent */
+.proof-graph-node-mathlib {
+  fill: #18cc17;
+  font-size: 12px;
+}
+
+.proof-graph-node-title { /* wrapped theorem name lines */
+  fill: #f8fafc;
+  font-size: 14px;
+  font-weight: 600;
+}
+
+.proof-graph-node-source { /* "source_type source_id" footer line */
+  fill: #94a3b8;
+  font-size: 12px;
+}
+
+.proof-graph-empty { /* placeholder shown when no node passes the filter */
+  padding: 0.95rem 1rem;
+  border-radius: 0.85rem;
+  border: 1px solid rgba(148, 163, 184, 0.16);
+  background: rgba(255, 255, 255, 0.02);
+  color: var(--text-secondary, #9ca3af);
+}
+
+@media (max-width: 900px) { /* narrow viewports: hover card takes the full row */
+  .proof-graph-hover-card {
+    min-width: 100%;
+  }
+}
diff --git a/frontend/src/components/autonomous/ProofGraph.jsx b/frontend/src/components/autonomous/ProofGraph.jsx
new file mode 100644
index 0000000..8406d10
--- /dev/null
+++ b/frontend/src/components/autonomous/ProofGraph.jsx
@@ -0,0 +1,355 @@
+import React, { useMemo, useState } from 'react';
+import './ProofGraph.css';
+
+const NODE_WIDTH = 236;
+const NODE_HEIGHT = 110;
+const X_GAP = 72;
+const Y_GAP = 30;
+const PADDING = 28;
+
+function truncate(text, maxLength = 96) {
+  if (!text) {
+    return '';
+  }
+  return text.length > maxLength ? `${text.slice(0, maxLength - 3)}...` : text;
+}
+
+function wrapSvgText(text, maxCharsPerLine = 30, maxLines = 3) {
+  const normalized = String(text || '').replace(/\s+/g, ' ').trim();
+  if (!normalized) {
+    return ['Untitled proof'];
+  }
+
+  const words = normalized.split(' ');
+  const lines = [];
+  let currentLine = '';
+
+  for (const word of words) {
+    const candidate = currentLine ? `${currentLine} ${word}` : word;
+    if (candidate.length <= maxCharsPerLine) {
+      currentLine = candidate;
+      continue;
+    }
+
+    if (currentLine) {
+      lines.push(currentLine);
+    }
+    currentLine = word;
+
+    if (lines.length === maxLines - 1) {
+      break;
+    }
+  }
+
+  if (currentLine && lines.length < maxLines) {
+    lines.push(currentLine);
+  }
+
+  if (lines.length === maxLines && words.join(' ').length > lines.join(' ').length) {
+    const lastLine = lines[maxLines - 1];
+    lines[maxLines - 1] = truncate(lastLine, Math.max(8, maxCharsPerLine - 3));
+  }
+
+  return lines;
+}
+
+function ProofGraph({ // Layered SVG graph of proofs and their dependencies, plus a hover detail card.
+  nodes = [],
+  edgesMoto = [],
+  edgesMathlib = [],
+  visibleProofIds = [],
+  expandedProofId = null,
+  onSelectProof,
+}) {
+  const [hoveredProofId, setHoveredProofId] = useState(null);
+
+  const visibleIdSet = useMemo(() => new Set(visibleProofIds), [visibleProofIds]); // Set used for the membership tests below
+
+  const graphData = useMemo(() => { // derive filtered nodes/edges, layer assignment and pixel layout
+    const filteredNodes = nodes.filter((node) => visibleIdSet.has(node.proof_id));
+    const nodeById = new Map(filteredNodes.map((node) => [node.proof_id, node]));
+
+    const filteredMotoEdges = edgesMoto.filter( // keep only edges whose both endpoints are visible
+      (edge) => nodeById.has(edge.from) && nodeById.has(edge.to)
+    );
+
+    const mathlibByProofId = new Map(); // proof_id -> Mathlib reference edges originating at that proof
+    for (const edge of edgesMathlib) {
+      if (!nodeById.has(edge.from)) {
+        continue;
+      }
+      const entries = mathlibByProofId.get(edge.from) || [];
+      entries.push(edge);
+      mathlibByProofId.set(edge.from, entries);
+    }
+
+    const dependenciesByProofId = new Map(); // proof_id -> ids it depends on (edge.from depends on edge.to)
+    for (const node of filteredNodes) {
+      dependenciesByProofId.set(node.proof_id, []);
+    }
+    for (const edge of filteredMotoEdges) {
+      dependenciesByProofId.get(edge.from).push(edge.to);
+    }
+
+    const layerCache = new Map(); // memoized layer per proof_id
+    const visiting = new Set(); // ids on the current recursion path (cycle guard)
+    const getLayer = (proofId) => {
+      if (layerCache.has(proofId)) {
+        return layerCache.get(proofId);
+      }
+      if (visiting.has(proofId)) {
+        return 0; // cycle: treat the revisited node as layer 0 instead of recursing forever
+      }
+
+      visiting.add(proofId);
+      const dependencies = dependenciesByProofId.get(proofId) || [];
+      const layer = dependencies.length > 0 // layer = 1 + deepest dependency; nodes without dependencies sit in layer 0
+        ? 1 + Math.max(...dependencies.map((dependencyId) => getLayer(dependencyId)))
+        : 0;
+      visiting.delete(proofId);
+      layerCache.set(proofId, layer);
+      return layer;
+    };
+
+    const layers = new Map(); // layer number -> nodes in that layer
+    for (const node of filteredNodes) {
+      const layer = getLayer(node.proof_id);
+      const entries = layers.get(layer) || [];
+      entries.push(node);
+      layers.set(layer, entries);
+    }
+
+    const orderedLayers = Array.from(layers.entries()) // layers in ascending order, nodes within a layer sorted by display name
+      .sort((left, right) => left[0] - right[0])
+      .map(([layer, layerNodes]) => {
+        const sortedNodes = [...layerNodes].sort((left, right) => {
+          const leftName = left.theorem_name || left.theorem_statement || left.proof_id;
+          const rightName = right.theorem_name || right.theorem_statement || right.proof_id;
+          return leftName.localeCompare(rightName);
+        });
+        return { layer, nodes: sortedNodes };
+      });
+
+    const maxLayerHeight = Math.max( // pixel height of the tallest column, at least one node tall
+      ...orderedLayers.map(({ nodes: layerNodes }) => (
+        layerNodes.length * NODE_HEIGHT + Math.max(layerNodes.length - 1, 0) * Y_GAP
+      )),
+      NODE_HEIGHT
+    );
+
+    const width = Math.max( // viewBox width: one column per distinct layer, at least one column wide
+      PADDING * 2 + NODE_WIDTH,
+      PADDING * 2 + orderedLayers.length * NODE_WIDTH + Math.max(orderedLayers.length - 1, 0) * X_GAP
+    );
+    const height = PADDING * 2 + maxLayerHeight;
+
+    const positions = new Map(); // proof_id -> top-left corner of the node inside the viewBox
+    orderedLayers.forEach(({ layer, nodes: layerNodes }) => {
+      const layerHeight = layerNodes.length * NODE_HEIGHT + Math.max(layerNodes.length - 1, 0) * Y_GAP;
+      const startY = PADDING + Math.max((maxLayerHeight - layerHeight) / 2, 0); // vertically center shorter columns
+      const x = PADDING + layer * (NODE_WIDTH + X_GAP); // NOTE(review): uses the raw layer number while width counts distinct layers; a cycle could leave a gap and push nodes past the viewBox — confirm cycles cannot occur
+
+      layerNodes.forEach((node, index) => {
+        positions.set(node.proof_id, {
+          x,
+          y: startY + index * (NODE_HEIGHT + Y_GAP),
+        });
+      });
+    });
+
+    return {
+      filteredNodes,
+      filteredMotoEdges,
+      mathlibByProofId,
+      nodeById,
+      positions,
+      width,
+      height,
+    };
+  }, [nodes, edgesMathlib, edgesMoto, visibleIdSet]);
+
+  const hoveredNode = hoveredProofId ? graphData.nodeById.get(hoveredProofId) : null; // undefined if the hovered id was filtered out
+  const hoveredMathlibRefs = hoveredProofId
+    ? (graphData.mathlibByProofId.get(hoveredProofId) || [])
+    : [];
+
+  if (graphData.filteredNodes.length === 0) { // nothing visible: show the placeholder instead of an empty SVG
+    return (
+      <div className="proof-graph-empty">
+        No proofs match the current filter. Switch to "All Verified Proofs" to inspect the full graph.
+      </div>
+    );
+  }
+
+  return (
+    <div className="proof-graph-panel">
+      <div className="proof-graph-topbar">
+        <div className="proof-graph-copy">
+          <strong>Proof ancestry graph</strong>
+          <span>
+            Showing {graphData.filteredNodes.length} proof{graphData.filteredNodes.length === 1 ? '' : 's'}.
+            Solid arrows run from a dependency to the proof that uses it.
+          </span>
+        </div>
+
+        <div className="proof-graph-hover-card">
+          {hoveredNode ? (
+            <>
+              <div className="proof-graph-hover-title">
+                {hoveredNode.theorem_name || hoveredNode.proof_id}
+              </div>
+              <div className="proof-graph-hover-subtitle">
+                {truncate(hoveredNode.theorem_statement, 150)}
+              </div>
+              <div className="proof-graph-badges">
+                {hoveredMathlibRefs.length > 0 ? (
+                  hoveredMathlibRefs.slice(0, 8).map((reference, index) => (
+                    <span
+                      key={`${reference.from}-${reference.name}-${index}`}
+                      className="proof-graph-badge"
+                      title={reference.source_ref || reference.name}
+                    >
+                      {reference.name}
+                    </span>
+                  ))
+                ) : (
+                  <span className="proof-graph-badge muted">No Mathlib references tracked</span>
+                )}
+              </div>
+            </>
+          ) : (
+            <>
+              <div className="proof-graph-hover-title">Hover a node</div>
+              <div className="proof-graph-hover-subtitle">
+                Hover a proof node to inspect its tracked Mathlib references.
+              </div>
+            </>
+          )}
+        </div>
+      </div>
+
+      <div className="proof-graph-canvas">
+        <svg
+          className="proof-graph-svg"
+          viewBox={`0 0 ${graphData.width} ${graphData.height}`}
+          preserveAspectRatio="xMinYMin meet"
+        >
+          <defs>
+            <marker
+              id="proof-graph-arrowhead"
+              markerWidth="8"
+              markerHeight="8"
+              refX="7"
+              refY="4"
+              orient="auto"
+            >
+              <path d="M 0 0 L 8 4 L 0 8 z" className="proof-graph-arrowhead" />
+            </marker>
+          </defs>
+
+          {graphData.filteredMotoEdges.map((edge) => {
+            const dependencyPosition = graphData.positions.get(edge.to); // arrows start at the dependency (edge.to) ...
+            const proofPosition = graphData.positions.get(edge.from); // ... and end at the proof that uses it (edge.from)
+            if (!dependencyPosition || !proofPosition) {
+              return null;
+            }
+
+            const startX = dependencyPosition.x + NODE_WIDTH; // right edge, vertical middle of the dependency node
+            const startY = dependencyPosition.y + NODE_HEIGHT / 2;
+            const endX = proofPosition.x; // left edge, vertical middle of the dependent node
+            const endY = proofPosition.y + NODE_HEIGHT / 2;
+            const controlOffset = Math.max((endX - startX) / 2, 24); // horizontal pull of the Bezier control points, never less than 24
+            const path = [
+              `M ${startX} ${startY}`,
+              `C ${startX + controlOffset} ${startY}, ${endX - controlOffset} ${endY}, ${endX} ${endY}`,
+            ].join(' ');
+
+            return (
+              <path
+                key={`${edge.to}->${edge.from}`}
+                d={path}
+                className="proof-graph-edge"
+                markerEnd="url(#proof-graph-arrowhead)"
+              />
+            );
+          })}
+
+          {graphData.filteredNodes.map((node) => {
+            const position = graphData.positions.get(node.proof_id);
+            if (!position) {
+              return null;
+            }
+
+            const titleLines = wrapSvgText( // up to 3 rows of about 30 characters
+              node.theorem_name || node.theorem_statement || node.proof_id,
+              30,
+              3
+            );
+            const sourceLine = truncate(
+              `${node.source_type} ${node.source_id}`.trim(),
+              30
+            );
+            const mathlibCount = (graphData.mathlibByProofId.get(node.proof_id) || []).length;
+            const isSelected = node.proof_id === expandedProofId;
+
+            const handleActivate = () => { // onSelectProof is optional; do nothing when it is not a function
+              if (typeof onSelectProof === 'function') {
+                onSelectProof(node.proof_id);
+              }
+            };
+
+            const handleKeyDown = (event) => { // NOTE(review): only mouse events update the hover card; keyboard focus does not — confirm intended
+              if (event.key === 'Enter' || event.key === ' ') { // Enter/Space activate the node like a button
+                event.preventDefault();
+                handleActivate();
+              }
+            };
+
+            return (
+              <g
+                key={node.proof_id}
+                className={`proof-graph-node-group ${node.is_novel ? 'novel' : 'known'} ${isSelected ? 'selected' : ''}`}
+                transform={`translate(${position.x}, ${position.y})`}
+                onClick={handleActivate}
+                onKeyDown={handleKeyDown}
+                onMouseEnter={() => setHoveredProofId(node.proof_id)}
+                onMouseLeave={() => setHoveredProofId((current) => (current === node.proof_id ? null : current))}
+                role="button"
+                tabIndex={0}
+              >
+                <rect
+                  className="proof-graph-node-frame"
+                  width={NODE_WIDTH}
+                  height={NODE_HEIGHT}
+                  rx="18"
+                  ry="18"
+                />
+                <text className="proof-graph-node-proof-id" x="16" y="24">
+                  {node.proof_id}
+                </text>
+                {titleLines.map((line, index) => (
+                  <text
+                    key={`${node.proof_id}-line-${index}`}
+                    className="proof-graph-node-title"
+                    x="16"
+                    y={48 + index * 18}
+                  >
+                    {line}
+                  </text>
+                ))}
+                <text className="proof-graph-node-source" x="16" y={NODE_HEIGHT - 18}>
+                  {sourceLine || 'Source unavailable'}
+                </text>
+                <text className="proof-graph-node-mathlib" x={NODE_WIDTH - 16} y="24" textAnchor="end">
+                  {mathlibCount} mathlib
+                </text>
+              </g>
+            );
+          })}
+        </svg>
+      </div>
+    </div>
+  );
+}
+
+export default ProofGraph;
diff --git a/frontend/src/components/autonomous/ProofNotificationStack.jsx b/frontend/src/components/autonomous/ProofNotificationStack.jsx
new file mode 100644
index 0000000..8ff6b32
--- /dev/null
+++ b/frontend/src/components/autonomous/ProofNotificationStack.jsx
@@ -0,0 +1,128 @@
+import React from 'react';
+
+const ALERT_SCALE = 1.4;
+
+function scalePx(value) { // Multiply a pixel value by ALERT_SCALE, round it, and format it as a CSS "px" string.
+  return `${Math.round(value * ALERT_SCALE)}px`;
+}
+
+function truncate(text, maxLength = 120) {
+  if (!text) {
+    return '';
+  }
+  return text.length > maxLength ? `${text.slice(0, maxLength)}...` : text;
+}
+
+export default function ProofNotificationStack({ notifications, onDismiss, onClickNotification }) {
+  if (!notifications || notifications.length === 0) {
+    return null;
+  }
+
+  return (
+    <div
+      style={{
+        position: 'fixed',
+        bottom: scalePx(116),
+        right: '20px',
+        zIndex: 999998,
+        display: 'flex',
+        flexDirection: 'column',
+        gap: scalePx(8),
+        pointerEvents: 'none',
+      }}
+    >
+      {notifications.map((notification) => (
+        <div
+          key={notification.id}
+          onClick={() => onClickNotification(notification.proof_id)}
+          onKeyDown={(event) => {
+            if (event.key === 'Enter' || event.key === ' ') {
+              event.preventDefault();
+              onClickNotification(notification.proof_id);
+            }
+          }}
+          role="button"
+          tabIndex={0}
+          style={{
+            width: scalePx(320),
+            textAlign: 'left',
+            borderRadius: scalePx(14),
+            border: '1.5px solid #ffd65c',
+            background: 'linear-gradient(135deg, rgba(8, 35, 22, 0.96), rgba(15, 23, 42, 0.96))',
+            boxShadow:
+              '0 16px 36px rgba(0, 0, 0, 0.35), 0 0 12px rgba(255, 214, 92, 0.35), inset 0 0 0 1px rgba(255, 194, 57, 0.25)',
+            padding: `${scalePx(14)} ${scalePx(14)} ${scalePx(12)} ${scalePx(14)}`,
+            color: '#f8fafc',
+            cursor: 'pointer',
+            pointerEvents: 'auto',
+          }}
+        >
+          <div
+            style={{
+              display: 'flex',
+              justifyContent: 'space-between',
+              gap: scalePx(12),
+              alignItems: 'flex-start',
+            }}
+          >
+            <div>
+              <div
+                style={{
+                  fontSize: scalePx(10),
+                  letterSpacing: '0.08em',
+                  textTransform: 'uppercase',
+                  color: '#ffd65c',
+                  marginBottom: scalePx(6),
+                  fontWeight: 700,
+                }}
+              >
+                Congratulations! Novel Mathematical Proof Discovered
+              </div>
+              <div
+                style={{
+                  fontSize: scalePx(13),
+                  lineHeight: 1.45,
+                  color: '#e2e8f0',
+                  fontWeight: 500,
+                }}
+                title={notification.theorem_statement}
+              >
+                {truncate(notification.theorem_statement)}
+              </div>
+              <div
+                style={{
+                  marginTop: scalePx(8),
+                  fontSize: scalePx(11),
+                  lineHeight: 1.4,
+                  color: '#1eff1c',
+                  fontWeight: 600,
+                }}
+              >
+                Verified by Lean 4. Click to open Mathematical Proofs.
+              </div>
+            </div>
+
+            <button
+              type="button"
+              onClick={(event) => {
+                event.stopPropagation();
+                onDismiss(notification.id);
+              }}
+              style={{
+                border: 'none',
+                background: 'transparent',
+                color: '#94a3b8',
+                cursor: 'pointer',
+                fontSize: scalePx(16),
+                lineHeight: 1,
+                padding: 0,
+              }}
+            >
+              x
+            </button>
+          </div>
+        </div>
+      ))}
+    </div>
+  );
+}
diff --git a/frontend/src/components/autonomous/Stage2PaperHistory.jsx b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
index 4d53aa5..ab75a71 100644
--- a/frontend/src/components/autonomous/Stage2PaperHistory.jsx
+++ b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
@@ -4,13 +4,14 @@ import PaperCritiqueModal from '../PaperCritiqueModal';
 import { autonomousAPI } from '../../services/api';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
 import { buildResearchRunGroups } from '../../utils/researchRunHistory';
+import { useProofCheckRuntime } from '../../hooks/useProofCheckRuntime';
 import './FinalAnswerLibrary.css';
 import './AutonomousResearch.css';
 import './Stage2PaperHistory.css';
 
 function getCritiqueColor(rating) {
   if (rating >= 8) return '#10b981';
-  if (rating >= 6.25) return '#3b82f6';
+  if (rating >= 6.25) return '#18cc17';
   if (rating >= 4) return '#eab308';
   if (rating >= 2) return '#f97316';
   return '#ef4444';
@@ -41,6 +42,13 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
   const [generatingPdfId, setGeneratingPdfId] = useState(null);
   const [critiqueModalOpen, setCritiqueModalOpen] = useState(false);
   const [critiquePaper, setCritiquePaper] = useState(null);
+  const [proofActionMessage, setProofActionMessage] = useState('');
+  const {
+    getSourceState,
+    manualCheckEnabled,
+    manualCheckReason,
+    queueManualProofCheck,
+  } = useProofCheckRuntime();
 
   useEffect(() => {
     loadPaperHistory();
@@ -91,6 +99,20 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
     }
   };
 
+  const handleProofCheck = async (event, paper) => { // Queue a manual proof check for one history paper and report the outcome in the banner.
+    event.stopPropagation(); // keep the click from bubbling to ancestor click handlers
+    try {
+      setProofActionMessage(''); // clear any previous result before the request
+      await queueManualProofCheck({
+        sourceType: 'paper',
+        sourceId: paper.history_id, // NOTE(review): queued by history_id while the message below shows paper_id — confirm intended
+      });
+      setProofActionMessage(`Queued proof check for paper ${paper.paper_id}.`);
+    } catch (error) {
+      setProofActionMessage(`Failed to queue proof check: ${error.message}`); // the banner styles messages starting with 'Failed' as errors
+    }
+  };
+
   const runGroups = useMemo(() => (
     buildResearchRunGroups({
       sessionsResponse,
@@ -289,6 +311,12 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
         </div>
       </div>
 
+      {proofActionMessage && (
+        <div className={`test-result-banner ${proofActionMessage.startsWith('Failed') ? 'test-result-banner--error' : 'test-result-banner--success'}`}>
+          {proofActionMessage}
+        </div>
+      )}
+
       <div className="library-controls">
         <input
           type="text"
@@ -400,6 +428,28 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
                       {expandedId === paper.history_id && (
                         <>
                           <div className="paper-actions">
+                            {(() => {
+                              const proofCheckState = getSourceState('paper', paper.history_id);
+                              const proofCheckLabel = proofCheckState?.status === 'queued'
+                                ? 'Queueing Proof Check...'
+                                : proofCheckState?.status === 'running'
+                                  ? `Proof Check Running${proofCheckState.candidateCount ? ` (${proofCheckState.candidateCount})` : '...'}`
+                                  : 'Try to prove with Lean 4 theorem prover';
+                              const proofCheckTitle = proofCheckState?.status === 'running'
+                                ? 'A proof verification is already running for this paper.'
+                                : manualCheckReason || 'Queue a manual proof check for this paper.';
+                              return (
+                                <button
+                                  className="btn-download"
+                                  onClick={(e) => handleProofCheck(e, paper)}
+                                  disabled={!manualCheckEnabled || Boolean(proofCheckState)}
+                                  title={proofCheckTitle}
+                                >
+                                  {proofCheckLabel}
+                                </button>
+                              );
+                            })()}
+
                             <button
                               className="btn-download"
                               onClick={(e) => handleDownloadPDF(e, paper)}
diff --git a/frontend/src/components/autonomous/index.js b/frontend/src/components/autonomous/index.js
index ff55385..3d03683 100644
--- a/frontend/src/components/autonomous/index.js
+++ b/frontend/src/components/autonomous/index.js
@@ -9,4 +9,5 @@ export { default as AutonomousResearchSettings } from './AutonomousResearchSetti
 export { default as AutonomousResearchLogs } from './AutonomousResearchLogs';
 export { default as FinalAnswerView } from './FinalAnswerView';
 export { default as FinalAnswerLibrary } from './FinalAnswerLibrary';
+export { default as MathematicalProofs } from './MathematicalProofs';
 
diff --git a/frontend/src/components/compiler/CompilerInterface.jsx b/frontend/src/components/compiler/CompilerInterface.jsx
index 604921f..4b53975 100644
--- a/frontend/src/components/compiler/CompilerInterface.jsx
+++ b/frontend/src/components/compiler/CompilerInterface.jsx
@@ -2,8 +2,9 @@ import React, { useState, useEffect } from 'react';
 import { compilerAPI } from '../../services/api';
 import { websocket } from '../../services/websocket';
 import TextFileUploader from '../TextFileUploader';
+import { getRuntimeDataPath } from '../../utils/runtimeConfig';
 
-function CompilerInterface({ activeTab, anyWorkflowRunning = false }) {
+function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false }) {
   const [compilerPrompt, setCompilerPrompt] = useState('');
   const [status, setStatus] = useState({ is_running: false });
   const [isStarting, setIsStarting] = useState(false);
@@ -17,6 +18,33 @@ function CompilerInterface({ activeTab, anyWorkflowRunning = false }) {
   const [paperVersion, setPaperVersion] = useState(1);
   const [isSkipping, setIsSkipping] = useState(false);
   const [skipQueued, setSkipQueued] = useState(false);
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
+
+  // Coerce saved compiler settings to OpenRouter-only when LM Studio is disabled.
+  // A role already on OpenRouter keeps its model and host provider; any other
+  // role is reset to an empty OpenRouter selection. Returns the input object
+  // untouched when LM Studio is enabled, otherwise a normalized shallow copy.
+  const normalizeCompilerSettingsForCapabilities = (settings = {}) => {
+    if (lmStudioEnabled) {
+      return settings;
+    }
+
+    const roles = ['validator', 'highContext', 'highParam', 'critiqueSubmitter'];
+    const normalized = { ...settings };
+    for (const role of roles) {
+      const wasOpenRouter = normalized[`${role}Provider`] === 'openrouter';
+      const savedModel = normalized[`${role}Model`];
+      const savedHost = normalized[`${role}OpenrouterProvider`];
+
+      normalized[`${role}Provider`] = 'openrouter';
+      normalized[`${role}Model`] = wasOpenRouter && savedModel ? savedModel : '';
+      normalized[`${role}OpenrouterProvider`] = wasOpenRouter && savedHost ? savedHost : null;
+      // The LM Studio fallback is always cleared in this mode.
+      normalized[`${role}LmStudioFallback`] = null;
+    }
+
+    return normalized;
+  };
 
   useEffect(() => {
     loadStatus();
@@ -73,19 +101,22 @@ function CompilerInterface({ activeTab, anyWorkflowRunning = false }) {
     if (activeTab === 'compiler-interface') {
       loadSettings();
     }
-  }, [activeTab]);
+  }, [activeTab, lmStudioEnabled]);
 
   const loadSettings = () => {
     const savedSettings = localStorage.getItem('compiler_settings');
     if (savedSettings) {
       try {
-        const settings = JSON.parse(savedSettings);
+        const settings = normalizeCompilerSettingsForCapabilities(JSON.parse(savedSettings));
         if (settings.validatorContextSize) setValidatorContextSize(settings.validatorContextSize);
         if (settings.highContextContextSize) setHighContextContextSize(settings.highContextContextSize);
         if (settings.highParamContextSize) setHighParamContextSize(settings.highParamContextSize);
         if (settings.critiqueSubmitterContextSize) setCritiqueSubmitterContextSize(settings.critiqueSubmitterContextSize);
         // Store for use in handleStart
         window.compilerSettings = settings;
+        if (!lmStudioEnabled) {
+          localStorage.setItem('compiler_settings', JSON.stringify(settings));
+        }
       } catch (error) {
         console.error('Failed to load compiler settings:', error);
       }
@@ -147,31 +178,35 @@ function CompilerInterface({ activeTab, anyWorkflowRunning = false }) {
       await compilerAPI.start({
         compiler_prompt: compilerPrompt,
         // Validator config with OpenRouter support
-        validator_provider: settings.validatorProvider || 'lm_studio',
+        validator_provider: lmStudioEnabled ? (settings.validatorProvider || 'lm_studio') : 'openrouter',
         validator_model: settings.validatorModel,
         validator_openrouter_provider: settings.validatorOpenrouterProvider || null,
-        validator_lm_studio_fallback: settings.validatorLmStudioFallback || null,
+        validator_lm_studio_fallback: lmStudioEnabled ? (settings.validatorLmStudioFallback || null) : null,
         validator_context_size: settings.validatorContextSize || validatorContextSize,
         validator_max_output_tokens: settings.validatorMaxOutput || 25000,
         // High-context submitter config with OpenRouter support
-        high_context_provider: settings.highContextProvider || 'lm_studio',
+        high_context_provider: lmStudioEnabled ? (settings.highContextProvider || 'lm_studio') : 'openrouter',
         high_context_model: settings.highContextModel,
         high_context_openrouter_provider: settings.highContextOpenrouterProvider || null,
-        high_context_lm_studio_fallback: settings.highContextLmStudioFallback || null,
+        high_context_lm_studio_fallback: lmStudioEnabled ? (settings.highContextLmStudioFallback || null) : null,
         high_context_context_size: settings.highContextContextSize || highContextContextSize,
         high_context_max_output_tokens: settings.highContextMaxOutput || 25000,
         // High-param submitter config with OpenRouter support
-        high_param_provider: settings.highParamProvider || 'lm_studio',
+        high_param_provider: lmStudioEnabled ? (settings.highParamProvider || 'lm_studio') : 'openrouter',
         high_param_model: settings.highParamModel,
         high_param_openrouter_provider: settings.highParamOpenrouterProvider || null,
-        high_param_lm_studio_fallback: settings.highParamLmStudioFallback || null,
+        high_param_lm_studio_fallback: lmStudioEnabled ? (settings.highParamLmStudioFallback || null) : null,
         high_param_context_size: settings.highParamContextSize || highParamContextSize,
         high_param_max_output_tokens: settings.highParamMaxOutput || 25000,
         // Critique submitter config with OpenRouter support
-        critique_submitter_provider: settings.critiqueSubmitterProvider || 'lm_studio',
+        critique_submitter_provider: lmStudioEnabled
+          ? (settings.critiqueSubmitterProvider || 'lm_studio')
+          : 'openrouter',
         critique_submitter_model: settings.critiqueSubmitterModel,
         critique_submitter_openrouter_provider: settings.critiqueSubmitterOpenrouterProvider || null,
-        critique_submitter_lm_studio_fallback: settings.critiqueSubmitterLmStudioFallback || null,
+        critique_submitter_lm_studio_fallback: lmStudioEnabled
+          ? (settings.critiqueSubmitterLmStudioFallback || null)
+          : null,
         critique_submitter_context_window: settings.critiqueSubmitterContextSize || critiqueSubmitterContextSize,
         critique_submitter_max_tokens: settings.critiqueSubmitterMaxOutput || 25000
       });
@@ -372,7 +407,7 @@ function CompilerInterface({ activeTab, anyWorkflowRunning = false }) {
       <div className="info-section">
         <h3>Aggregator Database</h3>
         <p>The compiler will read from the aggregator's accepted submissions database.</p>
-        <p>Location: <code>backend/data/rag_shared_training.txt</code></p>
+        <p>Location: <code>{getRuntimeDataPath('rag_shared_training.txt')}</code></p>
       </div>
     </div>
   );
diff --git a/frontend/src/components/compiler/CompilerLogs.jsx b/frontend/src/components/compiler/CompilerLogs.jsx
index ca7bb79..0d56f57 100644
--- a/frontend/src/components/compiler/CompilerLogs.jsx
+++ b/frontend/src/components/compiler/CompilerLogs.jsx
@@ -138,6 +138,9 @@ function CompilerLogs() {
     websocket.on('phase_transition', handleCompilerEvent);
     websocket.on('phase_completion_signal', handleCompilerEvent);
 
+    // Wolfram Alpha tool call events (Phase 3) - main writer invoked Wolfram
+    websocket.on('compiler_wolfram_call', handleCompilerEvent);
+
     return () => {
       clearInterval(interval);
       clearInterval(recoveryInterval);
@@ -173,6 +176,9 @@ function CompilerLogs() {
       // Phase transition events cleanup
       websocket.off('phase_transition', handleCompilerEvent);
       websocket.off('phase_completion_signal', handleCompilerEvent);
+
+      // Wolfram tool cleanup
+      websocket.off('compiler_wolfram_call', handleCompilerEvent);
     };
   }, []);
 
@@ -196,7 +202,7 @@ function CompilerLogs() {
 
   const loadRecoveryStatus = async () => {
     try {
-      const response = await fetch('http://localhost:8000/api/compiler/status/recovery');
+      const response = await fetch('/api/compiler/status/recovery');
       if (response.ok) {
         const data = await response.json();
         setRecoveryStatus(data);
@@ -323,6 +329,16 @@ function CompilerLogs() {
       return `Outline updated`;
     }
 
+    // Wolfram Alpha tool call (Phase 3)
+    if (type === 'compiler_wolfram_call') {
+      const n = data.calls_used ?? '?';
+      const cap = data.max_calls ?? 20;
+      const query = (data.query || '').substring(0, 80);
+      const preview = (data.result_preview || '').substring(0, 80);
+      const previewSuffix = preview ? ` - ${preview}` : '';
+      return `[Wolfram ${n}/${cap}] ${query}${previewSuffix}`;
+    }
+
     // Default: show raw JSON
     return JSON.stringify(data, null, 2);
   };
@@ -338,6 +354,9 @@ function CompilerLogs() {
     if (type?.includes('critique') || type?.includes('phase') || type?.includes('rewrite')) {
       return 'event-info';
     }
+    if (type === 'compiler_wolfram_call') {
+      return 'event-info';
+    }
     if (type?.includes('decline') || type?.includes('skipped')) {
       return 'event-warning';
     }
diff --git a/frontend/src/components/compiler/CompilerSettings.jsx b/frontend/src/components/compiler/CompilerSettings.jsx
index e22f2c2..c6c4bba 100644
--- a/frontend/src/components/compiler/CompilerSettings.jsx
+++ b/frontend/src/components/compiler/CompilerSettings.jsx
@@ -1,10 +1,17 @@
 import React, { useState, useEffect } from 'react';
 import { openRouterAPI, api, aggregatorAPI, compilerAPI } from '../../services/api';
+import {
+  computeOpenRouterAutoSettings,
+  findOpenRouterModel,
+  getProviderNames,
+  hasEndpointMetadata,
+} from '../../utils/openRouterSelection';
+import HelpTooltip from '../HelpTooltip';
 import '../settings-common.css';
 
 const SETTINGS_KEY = 'compiler_settings';
 
-function CompilerSettings() {
+function CompilerSettings({ capabilities }) {
   // LM Studio and OpenRouter models
   const [lmStudioModels, setLmStudioModels] = useState([]);
   const [openRouterModels, setOpenRouterModels] = useState([]);
@@ -62,6 +69,18 @@ function CompilerSettings() {
   const [customCritiquePrompt, setCustomCritiquePrompt] = useState('');
   const [critiquePromptSaved, setCritiquePromptSaved] = useState(false);
   const [defaultCritiquePrompt, setDefaultCritiquePrompt] = useState('');
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
+  const genericMode = Boolean(capabilities?.genericMode);
+
+  // Build the OpenRouter-only state for one role: the model and host provider
+  // survive only if the role was already configured for OpenRouter.
+  const normalizeRoleState = (provider, model, openrouterProvider) => {
+    const wasOpenRouter = provider === 'openrouter';
+    const nextModel = wasOpenRouter && model ? model : '';
+    const nextHost = wasOpenRouter && openrouterProvider ? openrouterProvider : null;
+    // The LM Studio fallback is always cleared.
+    return { provider: 'openrouter', model: nextModel, openrouterProvider: nextHost, lmStudioFallback: null };
+  };
 
   // Load settings from localStorage on mount
   useEffect(() => {
@@ -78,11 +97,15 @@ function CompilerSettings() {
       }
 
       // Fetch LM Studio models
-      try {
-        const models = await api.getModels();
-        setLmStudioModels(models);
-      } catch (err) {
-        console.error('Failed to fetch LM Studio models:', err);
+      if (lmStudioEnabled) {
+        try { // api.getModels() may yield a bare array or a { models: [...] } envelope
+          const models = await api.getModels();
+          setLmStudioModels(Array.isArray(models) ? models : (Array.isArray(models?.models) ? models.models : []));
+        } catch (err) {
+          console.error('Failed to fetch LM Studio models:', err);
+        }
+      } else {
+        setLmStudioModels([]);
       }
 
       // Load saved settings
@@ -148,7 +171,84 @@ function CompilerSettings() {
     };
 
     loadSettings();
-  }, []);
+  }, [lmStudioEnabled]);
+
+  useEffect(() => { // Force every compiler role onto OpenRouter while LM Studio is disabled.
+    if (lmStudioEnabled) {
+      return; // nothing to normalize when LM Studio is available
+    }
+    // LM Studio is unavailable: drop any cached LM Studio model list.
+    setLmStudioModels([]);
+    // Compute the OpenRouter-only target state for each of the four roles.
+    const nextValidator = normalizeRoleState(
+      validatorProvider,
+      validatorModel,
+      validatorOpenrouterProvider
+    );
+    const nextHighContext = normalizeRoleState(
+      highContextProvider,
+      highContextModel,
+      highContextOpenrouterProvider
+    );
+    const nextHighParam = normalizeRoleState(
+      highParamProvider,
+      highParamModel,
+      highParamOpenrouterProvider
+    );
+    const nextCritique = normalizeRoleState(
+      critiqueSubmitterProvider,
+      critiqueSubmitterModel,
+      critiqueSubmitterOpenrouterProvider
+    );
+    // Setters run only when a value differs: this effect depends on the same state it writes.
+    if (validatorProvider !== nextValidator.provider) setValidatorProvider(nextValidator.provider);
+    if (validatorModel !== nextValidator.model) setValidatorModel(nextValidator.model);
+    if (validatorOpenrouterProvider !== nextValidator.openrouterProvider) {
+      setValidatorOpenrouterProvider(nextValidator.openrouterProvider);
+    }
+    if (validatorLmStudioFallback !== null) setValidatorLmStudioFallback(null);
+
+    if (highContextProvider !== nextHighContext.provider) setHighContextProvider(nextHighContext.provider);
+    if (highContextModel !== nextHighContext.model) setHighContextModel(nextHighContext.model);
+    if (highContextOpenrouterProvider !== nextHighContext.openrouterProvider) {
+      setHighContextOpenrouterProvider(nextHighContext.openrouterProvider);
+    }
+    if (highContextLmStudioFallback !== null) setHighContextLmStudioFallback(null);
+
+    if (highParamProvider !== nextHighParam.provider) setHighParamProvider(nextHighParam.provider);
+    if (highParamModel !== nextHighParam.model) setHighParamModel(nextHighParam.model);
+    if (highParamOpenrouterProvider !== nextHighParam.openrouterProvider) {
+      setHighParamOpenrouterProvider(nextHighParam.openrouterProvider);
+    }
+    if (highParamLmStudioFallback !== null) setHighParamLmStudioFallback(null);
+
+    if (critiqueSubmitterProvider !== nextCritique.provider) {
+      setCritiqueSubmitterProvider(nextCritique.provider);
+    }
+    if (critiqueSubmitterModel !== nextCritique.model) setCritiqueSubmitterModel(nextCritique.model);
+    if (critiqueSubmitterOpenrouterProvider !== nextCritique.openrouterProvider) {
+      setCritiqueSubmitterOpenrouterProvider(nextCritique.openrouterProvider);
+    }
+    if (critiqueSubmitterLmStudioFallback !== null) setCritiqueSubmitterLmStudioFallback(null);
+  }, [
+    lmStudioEnabled,
+    validatorProvider,
+    validatorModel,
+    validatorOpenrouterProvider,
+    validatorLmStudioFallback,
+    highContextProvider,
+    highContextModel,
+    highContextOpenrouterProvider,
+    highContextLmStudioFallback,
+    highParamProvider,
+    highParamModel,
+    highParamOpenrouterProvider,
+    highParamLmStudioFallback,
+    critiqueSubmitterProvider,
+    critiqueSubmitterModel,
+    critiqueSubmitterOpenrouterProvider,
+    critiqueSubmitterLmStudioFallback,
+  ]);
 
   // Fetch providers for any OpenRouter models after settings are loaded
   useEffect(() => {
@@ -269,15 +369,37 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   }, []);
 
   const fetchProvidersForModel = async (modelId) => {
-    if (!modelId || modelProviders[modelId]) return;
+    if (!modelId) return null;
+
+    const cachedProviderData = modelProviders[modelId];
+    if (hasEndpointMetadata(cachedProviderData)) {
+      return cachedProviderData;
+    }
+
     try {
       const result = await openRouterAPI.getProviders(modelId);
-      setModelProviders(prev => ({ ...prev, [modelId]: result.providers || [] }));
+      const providerData = {
+        providers: result.providers || [],
+        endpoints: result.endpoints || [],
+      };
+      setModelProviders(prev => ({ ...prev, [modelId]: providerData }));
+      return providerData;
     } catch (err) {
       console.error(`Failed to fetch providers for ${modelId}:`, err);
+      return cachedProviderData || null;
     }
   };
 
+  // Resolve the auto-computed settings for an OpenRouter model, or null when
+  // findOpenRouterModel finds no match for modelId among openRouterModels.
+  const getAutoSettingsForModel = async (modelId, selectedProvider = null) => {
+    const matchedModel = findOpenRouterModel(openRouterModels, modelId);
+    if (!matchedModel) return null;
+    // Provider data is awaited first so it can feed the computation.
+    const endpointInfo = await fetchProvidersForModel(modelId);
+    return computeOpenRouterAutoSettings(matchedModel, endpointInfo, selectedProvider);
+  };
+
   // Critique prompt handlers
   const handleSaveCritiquePrompt = () => {
     localStorage.setItem('compiler_critique_custom_prompt', customCritiquePrompt);
@@ -340,6 +462,11 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
   // Handler for "Use Aggregator Models" button
   const handleUseAggregatorModels = async () => {
+    if (!lmStudioEnabled) {
+      alert('Use Aggregator Models is unavailable when this deployment disables LM Studio.');
+      return;
+    }
+
     try {
       const response = await aggregatorAPI.getSettings();
       const settings = response.data;
@@ -388,53 +515,62 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     maxOutput, setMaxOutput,
     borderColor = '#333'
   }) => {
-    const models = provider === 'openrouter' ? openRouterModels : lmStudioModels;
-    const providers = model && provider === 'openrouter' ? (modelProviders[model] || []) : [];
+    const effectiveProvider = lmStudioEnabled ? provider : 'openrouter';
+    const models = effectiveProvider === 'openrouter' ? openRouterModels : lmStudioModels;
+    const providers = model && effectiveProvider === 'openrouter'
+      ? getProviderNames(modelProviders[model])
+      : [];
 
     return (
       <div
-        className={`role-config-card role-config-card--highlight${provider === 'openrouter' ? ' role-config-card--openrouter' : ''}`}
-        style={{ borderColor: provider === 'openrouter' ? undefined : borderColor, padding: '1.5rem' }}
+        className={`role-config-card role-config-card--highlight${effectiveProvider === 'openrouter' ? ' role-config-card--openrouter' : ''}`}
+        style={{ borderColor: effectiveProvider === 'openrouter' ? undefined : borderColor, padding: '1.5rem' }}
       >
-        <h3 style={{ margin: '0 0 0.5rem 0', color: provider === 'openrouter' ? '#a29bfe' : borderColor }}>
+        <h3 style={{ margin: '0 0 0.5rem 0', color: effectiveProvider === 'openrouter' ? '#18cc17' : borderColor }}>
           {title}
-          {provider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
+          {effectiveProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
         </h3>
         <small className="role-description">{description}</small>
 
         {/* Provider Toggle */}
         <div className="form-group">
           <label>Provider</label>
-          <div className="provider-toggle-group">
-            <button
-              type="button"
-              onClick={() => {
-                setProvider('lm_studio');
-                setModel('');
-                setOpenrouterProv(null);
-                setFallback(null);
-              }}
-              className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
-            >
-              LM Studio
-            </button>
-            <button
-              type="button"
-              onClick={() => {
-                if (hasOpenRouterKey) {
-                  setProvider('openrouter');
+          {lmStudioEnabled ? (
+            <div className="provider-toggle-group">
+              <button
+                type="button"
+                onClick={() => {
+                  setProvider('lm_studio');
                   setModel('');
                   setOpenrouterProv(null);
                   setFallback(null);
-                }
-              }}
-              disabled={!hasOpenRouterKey}
-              className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
-              title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
-            >
-              OpenRouter
-            </button>
-          </div>
+                }}
+                className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
+              >
+                LM Studio
+              </button>
+              <button
+                type="button"
+                onClick={() => {
+                  if (hasOpenRouterKey) {
+                    setProvider('openrouter');
+                    setModel('');
+                    setOpenrouterProv(null);
+                    setFallback(null);
+                  }
+                }}
+                disabled={!hasOpenRouterKey}
+                className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
+                title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
+              >
+                OpenRouter
+              </button>
+            </div>
+          ) : (
+            <small className="hint-text hint-text--dim">
+              OpenRouter is required in this deployment.
+            </small>
+          )}
         </div>
 
         {/* Model Selection */}
@@ -442,17 +578,22 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           <label>Model</label>
           <select
             value={model || ''}
-            onChange={(e) => {
+            onChange={async (e) => {
               const m = e.target.value;
               setModel(m);
-              if (provider === 'openrouter' && m) {
-                fetchProvidersForModel(m);
+              setOpenrouterProv(null);
+              if (effectiveProvider === 'openrouter' && m) {
+                const autoSettings = await getAutoSettingsForModel(m, null);
+                if (autoSettings) {
+                  setContextSize(autoSettings.contextWindow);
+                  setMaxOutput(autoSettings.maxOutputTokens);
+                }
               }
             }}
           >
             <option value="">Select model...</option>
             {models.map(m => {
-              const isFree = provider === 'openrouter' && 
+              const isFree = effectiveProvider === 'openrouter' && 
                             m.pricing?.prompt === "0" && 
                             m.pricing?.completion === "0";
               const displayName = m.name || m.id;
@@ -468,12 +609,20 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         </div>
 
         {/* OpenRouter Provider (if OpenRouter) */}
-        {provider === 'openrouter' && model && (
+        {effectiveProvider === 'openrouter' && model && (
           <div className="form-group">
             <label>Host Provider (optional)</label>
             <select
               value={openrouterProv || ''}
-              onChange={(e) => setOpenrouterProv(e.target.value || null)}
+              onChange={async (e) => {
+                const providerName = e.target.value || null;
+                setOpenrouterProv(providerName);
+                const autoSettings = await getAutoSettingsForModel(model, providerName);
+                if (autoSettings) {
+                  setContextSize(autoSettings.contextWindow);
+                  setMaxOutput(autoSettings.maxOutputTokens);
+                }
+              }}
             >
               <option value="">Auto (let OpenRouter choose)</option>
               {providers.map(p => (
@@ -484,7 +633,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         )}
 
         {/* LM Studio Fallback (if OpenRouter) */}
-        {provider === 'openrouter' && (
+        {effectiveProvider === 'openrouter' && lmStudioEnabled && (
           <div className="form-group">
             <label className="label--muted">LM Studio Fallback (optional)</label>
             <select
@@ -614,21 +763,25 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       <div className="settings-panel settings-panel--blue">
         <h3 style={{ marginBottom: '1rem' }}>Model Management</h3>
         <div className="model-refresh-controls">
-          <button 
-            onClick={handleUseAggregatorModels}
-            className="secondary btn-primary-blue"
-          >
-            Use Aggregator Models
-          </button>
-          <button 
-            onClick={async () => {
-              const models = await api.getModels();
-              setLmStudioModels(models);
-            }} 
-            className="secondary"
-          >
-            Refresh LM Studio Models
-          </button>
+          {lmStudioEnabled && (
+            <>
+              <button 
+                onClick={handleUseAggregatorModels}
+                className="secondary btn-primary-blue"
+              >
+                Use Aggregator Models
+              </button>
+              <button 
+                onClick={async () => {
+                  const models = await api.getModels(); // bare array or { models: [...] } envelope
+                  setLmStudioModels(Array.isArray(models) ? models : (Array.isArray(models?.models) ? models.models : []));
+                }}
+                className="secondary"
+              >
+                Refresh LM Studio Models
+              </button>
+            </>
+          )}
           {hasOpenRouterKey && (
             <>
               <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary">
@@ -653,10 +806,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                     }}
                   />
                   Enable Free Model Looping
-                  <span
-                    title="When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits."
-                    className="help-hint"
-                  >(?)</span>
+                  <HelpTooltip
+                    label="Learn about free model looping"
+                    anchorClassName="help-tooltip-anchor--inline"
+                  >
+                    When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.
+                  </HelpTooltip>
                 </label>
                 <label className="settings-checkbox-label">
                   <input
@@ -668,17 +823,21 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                     }}
                   />
                   Use OpenRouter Free Models Auto-Selector as Backup
-                  <span
-                    title="When all selected free models are rate-limited, use OpenRouter's Free Models Router (openrouter/free) as a last resort backup. Works independently of Free Model Looping."
-                    className="help-hint"
-                  >(?)</span>
+                  <HelpTooltip
+                    label="Learn about the free models auto-selector backup"
+                    anchorClassName="help-tooltip-anchor--inline"
+                  >
+                    When all selected free models are rate-limited, use OpenRouter&apos;s Free Models Router (`openrouter/free`) as a last resort backup. Works independently of Free Model Looping.
+                  </HelpTooltip>
                 </label>
               </div>
             </>
           )}
         </div>
         <small className="hint-text" style={{ marginTop: '0.75rem' }}>
-          "Use Aggregator Models" copies your aggregator's model selection to all compiler roles.
+          {lmStudioEnabled
+            ? '"Use Aggregator Models" copies your aggregator\'s model selection to all compiler roles.'
+            : 'LM Studio tools are hidden in hosted mode. Configure compiler roles directly with OpenRouter models below.'}
         </small>
       </div>
 
@@ -714,13 +873,23 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 type="password"
                 value={wolframApiKey}
                 onChange={(e) => setWolframApiKey(e.target.value)}
-                placeholder={hasStoredWolframKey && !wolframApiKey ? "Stored securely on backend. Enter a new App ID to replace it." : "Enter your Wolfram Alpha App ID"}
+                placeholder={
+                  hasStoredWolframKey && !wolframApiKey
+                    ? (
+                      genericMode
+                        ? 'Loaded in the current backend session. Enter a new App ID to replace it.'
+                        : 'Stored securely on backend. Enter a new App ID to replace it.'
+                    )
+                    : 'Enter your Wolfram Alpha App ID'
+                }
                 className="input-dark"
                 style={{ marginBottom: '0.5rem' }}
               />
               {hasStoredWolframKey && !wolframApiKey && (
                 <small className="hint-text">
-                  A Wolfram Alpha key is already stored securely on the backend for this machine.
+                  {genericMode
+                    ? 'A Wolfram Alpha key is already loaded in the current backend session.'
+                    : 'A Wolfram Alpha key is already stored securely on the backend for this machine.'}
                 </small>
               )}
             </div>
diff --git a/frontend/src/components/critique-modal.css b/frontend/src/components/critique-modal.css
index 3c6a656..c2f9210 100644
--- a/frontend/src/components/critique-modal.css
+++ b/frontend/src/components/critique-modal.css
@@ -475,14 +475,14 @@
 
 /* Rating color classes (text) */
 .critique-color--emerald { color: #34d399; }
-.critique-color--blue    { color: #60a5fa; }
+.critique-color--blue    { color: #18cc17; }
 .critique-color--yellow  { color: #facc15; }
 .critique-color--orange  { color: #fb923c; }
 .critique-color--red     { color: #f87171; }
 
 /* Rating color classes (bar fill) */
 .critique-bg--emerald { background-color: #10b981; }
-.critique-bg--blue    { background-color: #3b82f6; }
+.critique-bg--blue    { background-color: #18cc17; }
 .critique-bg--yellow  { background-color: #eab308; }
 .critique-bg--orange  { background-color: #f97316; }
 .critique-bg--red     { background-color: #ef4444; }
diff --git a/frontend/src/components/settings-common.css b/frontend/src/components/settings-common.css
index df7573a..8845e5e 100644
--- a/frontend/src/components/settings-common.css
+++ b/frontend/src/components/settings-common.css
@@ -41,7 +41,7 @@
 }
 
 .provider-toggle-btn.active-or {
-  background: #6c5ce7;
+  background: #18cc17;
 }
 
 .provider-toggle-btn.active-or-orange {
@@ -148,8 +148,8 @@
 
 /* OpenRouter status banner */
 .openrouter-banner {
-  background: rgba(108, 92, 231, 0.08);
-  border: 1px solid rgba(108, 92, 231, 0.35);
+  background: rgba(24, 204, 23, 0.08);
+  border: 1px solid rgba(24, 204, 23, 0.35);
   border-radius: var(--radius-md);
   padding: 1rem;
   margin-bottom: 1.5rem;
@@ -161,7 +161,7 @@
 }
 
 .openrouter-banner__text {
-  color: #a29bfe;
+  color: #18cc17;
   margin: 0;
 }
 
@@ -185,7 +185,7 @@
 }
 
 .role-config-card--openrouter {
-  border-color: rgba(108, 92, 231, 0.35);
+  border-color: #18cc17;
   background: rgba(26, 26, 56, 0.8);
 }
 
@@ -208,7 +208,7 @@
 
 /* Card title colours */
 .card-title--green { color: var(--accent-green); }
-.card-title--purple { color: #a29bfe; }
+.card-title--purple { color: #18cc17; }
 .card-title--orange { color: #FF6700; }
 
 /* Inline provider badge */
@@ -416,7 +416,7 @@
 /* Purple accent button */
 .btn-accent-purple {
   padding: 0.5rem 1.5rem;
-  background: #9b59b6;
+  background: #18cc17;
   border: none;
   border-radius: var(--radius-sm);
   color: #fff;
@@ -573,7 +573,7 @@
 }
 
 .tag-badge--purple {
-  background: #9b59b6;
+  background: #18cc17;
   color: #fff;
 }
 
@@ -679,86 +679,6 @@
 .model-item--silver { border-left: 5px solid #c0c0c0; }
 .model-item--bronze { border-left: 5px solid #cd7f32; }
 
-/* Info tooltip button (? circle) */
-.info-tooltip-btn {
-  background: transparent;
-  padding: 0;
-  border-radius: var(--radius-sm);
-  cursor: pointer;
-  font-weight: bold;
-  display: flex;
-  align-items: center;
-  justify-content: center;
-  transition: all var(--transition-fast);
-}
-
-.info-tooltip-btn--orange {
-  border: 2px solid #FF6700;
-  color: #FF6700;
-  font-size: 0.7rem;
-  width: 16px;
-  height: 16px;
-}
-
-.info-tooltip-btn--gold {
-  border: 2px solid #f4c430;
-  color: #ffd54a;
-  box-shadow: 0 0 8px rgba(255, 204, 51, 0.22);
-  font-size: 0.8rem;
-  width: 20px;
-  height: 20px;
-}
-
-.info-tooltip-btn:hover {
-  filter: brightness(1.3);
-}
-
-/* Tooltip popup */
-.tooltip-popup {
-  background: var(--surface-2);
-  border: 2px solid #FF6700;
-  border-radius: var(--radius-sm);
-  padding: 12px 16px;
-  font-size: 0.85rem;
-  color: #FF6700;
-  font-weight: 500;
-  box-shadow: var(--shadow-lg);
-  pointer-events: none;
-  z-index: 1000;
-}
-
-.tooltip-popup--absolute {
-  position: absolute;
-  top: calc(100% + 8px);
-  left: 50%;
-  transform: translateX(-50%);
-}
-
-.tooltip-popup--fixed {
-  position: fixed;
-}
-
-/*
- * sidebar-escape tooltip: uses position:fixed instead of absolute so it can
- * break out of the narrow 322px left sidebar without being clipped or squished.
- * left: 326px sits flush against the sidebar's right edge (322px wide + 4px gap).
- * top: 62px aligns it with roughly where the "?" button sits in the sidebar header.
- * Adjust top if the header height ever changes.
- */
-.tooltip-popup--sidebar-escape {
-  position: fixed;
-  left: 276px;
-  top: 112px;
-  width: 340px;
-  z-index: 9999;
-}
-
-/* Tooltip anchor wrapper */
-.tooltip-anchor {
-  position: relative;
-  display: inline-block;
-}
-
 /* Modal overlay and content (shared by inline modals) */
 .inline-modal-overlay {
   position: fixed;
diff --git a/frontend/src/hooks/useProofCheckRuntime.js b/frontend/src/hooks/useProofCheckRuntime.js
new file mode 100644
index 0000000..32f6a82
--- /dev/null
+++ b/frontend/src/hooks/useProofCheckRuntime.js
@@ -0,0 +1,151 @@
+import { useCallback, useEffect, useMemo, useState } from 'react';
+import { autonomousAPI } from '../services/api';
+import { websocket } from '../services/websocket';
+
+/** Build the map key that identifies one proof-check source. */
+function buildSourceKey(sourceType, sourceId) {
+  return `${sourceType}:${sourceId}`;
+}
+
+/**
+ * Return `map` without `key`. Hands back the very same object when the key is
+ * not set, so state updaters can use it without creating a new reference.
+ */
+function omitKey(map, key) {
+  if (!map[key]) {
+    return map;
+  }
+  const next = { ...map };
+  delete next[key];
+  return next;
+}
+
+/**
+ * Track Lean 4 proof-check runtime state: the status payload returned by
+ * `autonomousAPI.getProofStatus()` plus per-source queued/running checks
+ * driven by the `proof_check_*` websocket events.
+ */
+export function useProofCheckRuntime() {
+  const [proofStatus, setProofStatus] = useState(null);
+  const [runtimeError, setRuntimeError] = useState('');
+  const [activeChecks, setActiveChecks] = useState({});
+  const [queuedChecks, setQueuedChecks] = useState({});
+
+  // Fetch the latest status; resolves to null and records the error on failure.
+  const refreshProofStatus = useCallback(async () => {
+    try {
+      const status = await autonomousAPI.getProofStatus();
+      setProofStatus(status);
+      setRuntimeError('');
+      return status;
+    } catch (err) {
+      setRuntimeError(err.message || 'Failed to load proof status');
+      return null;
+    }
+  }, []);
+
+  useEffect(() => {
+    refreshProofStatus();
+  }, [refreshProofStatus]);
+
+  useEffect(() => {
+    const unsubscribeStarted = websocket.on('proof_check_started', (data) => {
+      const sourceKey = buildSourceKey(data.source_type, data.source_id);
+      setActiveChecks((prev) => ({
+        ...prev,
+        [sourceKey]: {
+          status: 'running',
+          candidateCount: prev[sourceKey]?.candidateCount ?? null,
+        },
+      }));
+      // A check that has started is no longer merely queued.
+      setQueuedChecks((prev) => omitKey(prev, sourceKey));
+    });
+
+    const unsubscribeCandidates = websocket.on('proof_check_candidates_found', (data) => {
+      const sourceKey = buildSourceKey(data.source_type, data.source_id);
+      setActiveChecks((prev) => ({
+        ...prev,
+        [sourceKey]: {
+          status: 'running',
+          candidateCount: data.count ?? null,
+        },
+      }));
+    });
+
+    const unsubscribeComplete = websocket.on('proof_check_complete', (data) => {
+      const sourceKey = buildSourceKey(data.source_type, data.source_id);
+      setActiveChecks((prev) => omitKey(prev, sourceKey));
+      setQueuedChecks((prev) => omitKey(prev, sourceKey));
+      // Reload the status payload once a check finishes.
+      refreshProofStatus();
+    });
+
+    return () => {
+      unsubscribeStarted();
+      unsubscribeCandidates();
+      unsubscribeComplete();
+    };
+  }, [refreshProofStatus]);
+
+  // Mark the source as queued up front, then request the check; the marker is
+  // rolled back (and the error rethrown) if the request rejects.
+  const queueManualProofCheck = useCallback(async ({ sourceType, sourceId }) => {
+    const sourceKey = buildSourceKey(sourceType, sourceId);
+    setQueuedChecks((prev) => ({
+      ...prev,
+      [sourceKey]: true,
+    }));
+
+    try {
+      return await autonomousAPI.runProofCheck({ sourceType, sourceId });
+    } catch (err) {
+      setQueuedChecks((prev) => omitKey(prev, sourceKey));
+      throw err;
+    }
+  }, []);
+
+  // Running state takes precedence over queued; null means no check is tracked.
+  const getSourceState = useCallback((sourceType, sourceId) => {
+    const sourceKey = buildSourceKey(sourceType, sourceId);
+    if (activeChecks[sourceKey]) {
+      return activeChecks[sourceKey];
+    }
+    if (queuedChecks[sourceKey]) {
+      return {
+        status: 'queued',
+        candidateCount: null,
+      };
+    }
+    return null;
+  }, [activeChecks, queuedChecks]);
+
+  const isSourceBusy = useCallback((sourceType, sourceId) => {
+    return Boolean(getSourceState(sourceType, sourceId));
+  }, [getSourceState]);
+
+  // Human-readable reason manual checks are unavailable; '' when they are ready.
+  const manualCheckReason = useMemo(() => {
+    if (!proofStatus) {
+      return 'Loading proof runtime status...';
+    }
+    if (!proofStatus.lean4_enabled) {
+      return 'Lean 4 proof checks are disabled.';
+    }
+    if (!proofStatus.manual_check_ready) {
+      return proofStatus.manual_check_message || 'Manual proof checks are not ready yet.';
+    }
+    return '';
+  }, [proofStatus]);
+
+  return {
+    proofStatus,
+    runtimeError,
+    refreshProofStatus,
+    queueManualProofCheck,
+    getSourceState,
+    isSourceBusy,
+    manualCheckEnabled: Boolean(proofStatus?.lean4_enabled && proofStatus?.manual_check_ready),
+    manualCheckReason,
+  };
+}
diff --git a/frontend/src/index.css b/frontend/src/index.css
index d27e9cc..6666081 100644
--- a/frontend/src/index.css
+++ b/frontend/src/index.css
@@ -16,8 +16,8 @@
 
   /* Semantic accent colours (unchanged hues, new aliases) */
   --accent-green: #4CAF50;
-  --accent-blue: #2196F3;
-  --accent-purple: #9C27B0;
+  --accent-blue: #18cc17;
+  --accent-purple: #18cc17;
   --accent-red: #f44336;
   --accent-orange: #ff9800;
 
@@ -61,6 +61,14 @@
   box-sizing: border-box;
 }
 
+/* Always reserve vertical scrollbar space on the page itself, so switching
+   between tabs whose content height crosses the viewport threshold does not
+   shift centered elements (banner, logo) horizontally as the scrollbar
+   appears/disappears. */
+html {
+  scrollbar-gutter: stable;
+}
+
 body {
   font-family: 'Inter', -apple-system, BlinkMacSystemFont, 'Segoe UI', 'Roboto', 'Oxygen',
     'Ubuntu', 'Cantarell', 'Fira Sans', 'Droid Sans', 'Helvetica Neue',
@@ -178,7 +186,7 @@ code {
 }
 
 .banner-variant {
-  color: #ffa726;
+  color: #18cc17;
   font-size: 0.95rem;
   margin: 0.85rem 0 0 0;
   font-weight: 500;
@@ -242,17 +250,17 @@ code {
 .mode-switch-control {
   min-width: 250px;
   padding: 0.7rem 0.8rem 0.8rem;
-  background: rgba(11, 11, 15, 0.92);
-  border: 1px solid var(--border-default);
+  background: linear-gradient(180deg, rgba(13, 18, 14, 0.92), rgba(11, 11, 15, 0.94));
+  border: 1px solid rgba(30, 255, 28, 0.16);
   border-radius: var(--radius-md);
-  box-shadow: var(--shadow-md);
+  box-shadow: 0 10px 24px rgba(0, 0, 0, 0.34);
   backdrop-filter: blur(8px);
 }
 
 .mode-switch-label {
   display: block;
   margin-bottom: 0.45rem;
-  color: var(--text-secondary);
+  color: rgba(255, 255, 255, 0.9);
   font-size: 0.72rem;
   font-weight: 700;
   letter-spacing: 0.08em;
@@ -260,11 +268,18 @@ code {
 }
 
 .mode-switch-select {
+  appearance: none;
+  -webkit-appearance: none;
   min-width: 0;
-  padding: 0.6rem 0.8rem;
-  background: linear-gradient(180deg, var(--surface-2), var(--surface-1));
-  border: 1px solid var(--border-strong);
-  color: var(--text-primary);
+  width: 100%;
+  padding: 0.6rem 2.2rem 0.6rem 0.8rem;
+  background:
+    url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='14' height='14' viewBox='0 0 14 14'%3E%3Cpath d='M3 5.25L7 9l4-3.75' fill='none' stroke='%231eff1c' stroke-width='1.8' stroke-linecap='round' stroke-linejoin='round'/%3E%3C/svg%3E")
+      no-repeat right 0.8rem center / 14px,
+    linear-gradient(180deg, rgba(22, 27, 23, 0.98), rgba(15, 18, 16, 0.98));
+  border: 1px solid rgba(30, 255, 28, 0.22);
+  border-radius: var(--radius-sm);
+  color: #fff;
   font-size: 0.9rem;
   font-weight: 600;
   cursor: pointer;
@@ -272,7 +287,15 @@ code {
 }
 
 .mode-switch-select:hover {
-  border-color: rgba(30, 255, 28, 0.28);
+  border-color: rgba(30, 255, 28, 0.34);
+}
+
+.mode-switch-select:focus-visible {
+  outline: none;
+  border-color: rgba(30, 255, 28, 0.45);
+  box-shadow:
+    inset 0 1px 0 rgba(255, 255, 255, 0.04),
+    0 0 0 3px rgba(30, 255, 28, 0.12);
 }
 
 .mode-switch-select option {
@@ -281,22 +304,226 @@ code {
 }
 
 .boost-btn {
-  background: linear-gradient(135deg, var(--gold) 0%, #7dff6f 100%);
-  color: #000;
-  border: none;
-  padding: 0.5rem 1rem;
+  min-height: 34px;
+  background: linear-gradient(180deg, rgba(20, 37, 22, 0.92), rgba(11, 16, 13, 0.96));
+  color: #fff;
+  border: 1px solid rgba(30, 255, 28, 0.24);
+  padding: 0.5rem 0.95rem;
   border-radius: var(--radius-sm);
-  font-size: 0.9rem;
-  font-weight: 700;
+  font-size: 0.84rem;
+  font-weight: 600;
   cursor: pointer;
-  box-shadow: var(--shadow-gold);
+  box-shadow: 0 8px 18px rgba(0, 0, 0, 0.26);
   transition: all var(--transition-fast);
   white-space: nowrap;
 }
 
 .boost-btn:hover {
-  transform: translateY(-2px);
-  box-shadow: 0 6px 20px rgba(30, 255, 28, 0.35);
+  transform: translateY(-1px);
+  border-color: rgba(30, 255, 28, 0.38);
+  box-shadow: 0 10px 22px rgba(0, 0, 0, 0.3);
+}
+
+.boost-control-row {
+  display: flex;
+  align-items: center;
+  gap: 0.5rem;
+}
+
+.app-header-tooltip-anchor,
+.help-tooltip-anchor {
+  position: relative;
+  display: inline-flex;
+  align-items: center;
+}
+
+.help-tooltip-anchor--inline {
+  margin-left: 8px;
+  vertical-align: middle;
+}
+
+.app-header-help-btn,
+.help-tooltip-btn {
+  width: 18px;
+  height: 18px;
+  padding: 0;
+  border: 1px solid rgba(30, 255, 28, 0.24);
+  border-radius: 999px;
+  background: linear-gradient(180deg, rgba(20, 37, 22, 0.92), rgba(11, 16, 13, 0.96));
+  color: #fff;
+  font-size: 0.75rem;
+  font-weight: 700;
+  line-height: 1;
+  font-family: inherit;
+  display: inline-flex;
+  align-items: center;
+  justify-content: center;
+  cursor: help;
+  appearance: none;
+  box-shadow: 0 8px 18px rgba(0, 0, 0, 0.22);
+  transition:
+    border-color var(--transition-fast),
+    filter var(--transition-fast),
+    transform var(--transition-fast),
+    box-shadow var(--transition-fast);
+}
+
+.help-tooltip-btn--green {
+  border-color: #4caf50;
+  background: rgba(14, 30, 18, 0.96);
+  color: #4caf50;
+}
+
+.app-header-help-btn:hover,
+.app-header-help-btn:focus-visible,
+.help-tooltip-btn:hover,
+.help-tooltip-btn:focus-visible {
+  border-color: rgba(30, 255, 28, 0.38);
+  filter: brightness(1.08);
+  transform: translateY(-1px);
+  box-shadow: 0 10px 20px rgba(0, 0, 0, 0.26);
+}
+
+.app-header-help-btn:focus-visible,
+.help-tooltip-btn:focus-visible {
+  outline: 1px solid rgba(30, 255, 28, 0.45);
+  outline-offset: 2px;
+}
+
+.help-tooltip-btn--green:focus-visible {
+  outline-color: rgba(30, 255, 28, 0.45);
+}
+
+.app-header-tooltip-popup,
+.help-tooltip-popup {
+  position: absolute;
+  top: calc(100% + 10px);
+  right: 0;
+  width: min(360px, calc(100vw - 96px));
+  padding: 0.8rem 0.9rem;
+  background: linear-gradient(180deg, rgba(14, 18, 15, 0.98), rgba(11, 11, 15, 0.99));
+  border: 1px solid rgba(30, 255, 28, 0.28);
+  border-radius: var(--radius-sm);
+  box-shadow: var(--shadow-lg);
+  color: #fff;
+  font-size: 0.8rem;
+  line-height: 1.45;
+  white-space: normal;
+  box-sizing: border-box;
+  z-index: 1002;
+  pointer-events: none;
+}
+
+.app-header-tooltip-popup::before,
+.help-tooltip-popup::before {
+  content: '';
+  position: absolute;
+  top: -7px;
+  right: 16px;
+  width: 12px;
+  height: 12px;
+  background: rgba(13, 16, 14, 0.99);
+  border-top: 1px solid rgba(30, 255, 28, 0.28);
+  border-left: 1px solid rgba(30, 255, 28, 0.28);
+  transform: rotate(45deg);
+}
+
+.help-tooltip-popup--center {
+  left: 50%;
+  right: auto;
+  width: min(380px, calc(100vw - 96px));
+  transform: translateX(-50%);
+}
+
+.help-tooltip-popup--center::before {
+  left: 50%;
+  right: auto;
+  transform: translateX(-50%) rotate(45deg);
+}
+
+.help-tooltip-popup--fixed {
+  position: fixed;
+}
+
+.help-tooltip-popup--fixed::before,
+.help-tooltip-popup--sidebar-escape::before {
+  display: none;
+}
+
+.help-tooltip-popup--sidebar-escape {
+  position: fixed;
+  left: 276px;
+  right: auto;
+  top: 112px;
+  width: min(360px, calc(100vw - 96px));
+  z-index: 9999;
+}
+
+.help-tooltip-popup code {
+  background: rgba(255, 255, 255, 0.07);
+  border: 1px solid rgba(255, 255, 255, 0.12);
+  border-radius: 3px;
+  padding: 0.1em 0.3em;
+  font-size: 0.85em;
+  color: #d2d8e3;
+  font-family: 'Consolas', 'Monaco', monospace;
+}
+
+.header-status-chip {
+  min-height: 34px;
+  display: inline-flex;
+  align-items: center;
+  margin-left: 0.5rem;
+  padding: 0.42rem 0.78rem;
+  border-radius: var(--radius-sm);
+  background: rgba(16, 21, 18, 0.94);
+  border: 1px solid rgba(30, 255, 28, 0.16);
+  box-shadow: 0 8px 18px rgba(0, 0, 0, 0.24);
+  color: #fff;
+  font-size: 0.82rem;
+  font-weight: 600;
+  line-height: 1;
+  white-space: nowrap;
+}
+
+button.header-status-chip {
+  cursor: pointer;
+  transition: all var(--transition-fast);
+}
+
+button.header-status-chip:hover,
+button.header-status-chip:focus-visible {
+  transform: translateY(-1px);
+  background: rgba(20, 30, 22, 0.96);
+  border-color: rgba(30, 255, 28, 0.36);
+}
+
+button.header-status-chip:focus-visible {
+  outline: 1px solid rgba(30, 255, 28, 0.45);
+  outline-offset: 2px;
+}
+
+.header-status-chip--ready {
+  background: rgba(23, 43, 26, 0.8);
+  border-color: rgba(30, 255, 28, 0.32);
+}
+
+.header-status-chip--inactive {
+  background: rgba(18, 22, 19, 0.92);
+  border-color: rgba(255, 255, 255, 0.08);
+  color: rgba(255, 255, 255, 0.88);
+}
+
+.header-status-chip--hosted {
+  background: rgba(18, 22, 19, 0.92);
+  border-color: rgba(30, 255, 28, 0.18);
+}
+
+.header-status-chip--pending {
+  background: rgba(22, 22, 32, 0.92);
+  border-color: rgba(255, 255, 255, 0.16);
+  color: rgba(255, 255, 255, 0.62);
+  opacity: 0.9;
 }
 
 .tabs {
@@ -376,6 +603,7 @@ code {
   flex: 1;
   padding: 2rem 3rem;
   overflow-y: auto;
+  scrollbar-gutter: stable;
   max-width: 100%;
 }
 
@@ -582,7 +810,7 @@ button.danger:hover {
 }
 
 .event-info {
-  background: rgba(33, 150, 243, 0.08);
+  background: rgba(24, 204, 23, 0.08);
   border-left: 3px solid var(--accent-blue);
   border-radius: var(--radius-sm);
 }
@@ -1282,13 +1510,13 @@ button.danger:hover {
 }
 
 .tab-compiler.active {
-  color: #2196F3;
-  border-bottom-color: #2196F3;
+  color: #18cc17;
+  border-bottom-color: #18cc17;
 }
 
 .tab-autonomous.active {
-  color: #9C27B0;
-  border-bottom-color: #9C27B0;
+  color: #18cc17;
+  border-bottom-color: #18cc17;
 }
 
 .tab-boost.active {
@@ -1298,9 +1526,9 @@ button.danger:hover {
 
 /* Tier 3 Final Answer Tab Special Styling */
 .tab-tier3-active {
-  background: linear-gradient(135deg, rgba(52, 152, 219, 0.2), rgba(155, 89, 182, 0.2)) !important;
+  background: linear-gradient(135deg, rgba(24, 204, 23, 0.2), rgba(24, 204, 23, 0.2)) !important;
   animation: tier3-tab-pulse 2s infinite;
-  border-bottom: 2px solid #3498db !important;
+  border-bottom: 2px solid #18cc17 !important;
 }
 
 .tab-tier3-complete {
@@ -1439,12 +1667,12 @@ button.danger:hover {
 }
 
 .activity-icon.topic {
-  background: rgba(156, 39, 176, 0.12);
+  background: rgba(24, 204, 23, 0.12);
   color: var(--accent-purple);
 }
 
 .activity-icon.paper {
-  background: rgba(33, 150, 243, 0.12);
+  background: rgba(24, 204, 23, 0.12);
   color: var(--accent-blue);
 }
 
@@ -1491,7 +1719,7 @@ button.danger:hover {
 }
 
 .brainstorm-topic-id {
-  color: #9C27B0;
+  color: #18cc17;
   font-family: monospace;
   font-size: 0.85rem;
 }
@@ -1543,7 +1771,7 @@ button.danger:hover {
 }
 
 .brainstorm-paper-link {
-  color: #2196F3;
+  color: #18cc17;
   font-size: 0.9rem;
   text-decoration: none;
   cursor: pointer;
@@ -1574,7 +1802,7 @@ button.danger:hover {
 }
 
 .paper-card:hover {
-  border-color: rgba(33, 150, 243, 0.35);
+  border-color: rgba(24, 204, 23, 0.35);
   transform: translateY(-3px);
   box-shadow: var(--shadow-md);
 }
@@ -1930,6 +2158,61 @@ button.danger:hover {
   }
 }
 
+/* ── Update Notice Banner ── */
+.update-notice-banner {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  gap: 1rem;
+  padding: 0.6rem 1.2rem;
+  background: linear-gradient(135deg, rgba(30, 255, 28, 0.12) 0%, rgba(30, 200, 28, 0.08) 100%);
+  border-bottom: 1px solid rgba(30, 255, 28, 0.35);
+  color: #c8ffc7;
+  font-size: 0.88rem;
+  line-height: 1.45;
+  z-index: 50;
+}
+
+.update-notice-content {
+  display: flex;
+  align-items: center;
+  gap: 0.6rem;
+  flex: 1;
+  min-width: 0;
+}
+
+.update-notice-icon {
+  font-size: 1.15rem;
+  color: #1eff1c;
+  flex-shrink: 0;
+}
+
+.update-notice-text strong {
+  color: #1eff1c;
+}
+
+.update-notice-detail {
+  color: #a0d89e;
+}
+
+.update-notice-dismiss {
+  flex-shrink: 0;
+  background: none;
+  border: 1px solid rgba(30, 255, 28, 0.3);
+  border-radius: 4px;
+  color: #1eff1c;
+  font-size: 0.95rem;
+  cursor: pointer;
+  padding: 0.2rem 0.55rem;
+  line-height: 1;
+  transition: background 0.15s, border-color 0.15s;
+}
+
+.update-notice-dismiss:hover {
+  background: rgba(30, 255, 28, 0.15);
+  border-color: rgba(30, 255, 28, 0.6);
+}
+
 .disclaimer-modal {
   position: fixed;
   top: 50%;
@@ -1938,9 +2221,12 @@ button.danger:hover {
   background: var(--surface-2);
   border: 1px solid var(--gold-dim);
   border-radius: var(--radius-lg);
-  padding: 2.5rem;
+  padding: 2rem;
   max-width: 620px;
-  width: 90%;
+  width: min(90vw, 620px);
+  max-height: 90vh;
+  overflow-y: auto;
+  overscroll-behavior: contain;
   z-index: 9999;
   box-shadow: 0 16px 48px rgba(0, 0, 0, 0.6), 0 0 40px var(--gold-glow);
 }
@@ -2015,12 +2301,13 @@ button.danger:hover {
 
 .footer-content {
   display: flex;
-  justify-content: space-between;
+  flex-direction: column;
+  justify-content: center;
   align-items: center;
   max-width: 1920px;
   margin: 0 auto;
   flex-wrap: wrap;
-  gap: 1rem;
+  gap: 0.75rem;
 }
 
 .footer-section {
@@ -2051,6 +2338,8 @@ button.danger:hover {
 .footer-links {
   display: flex;
   gap: 1.5rem;
+  justify-content: center;
+  flex-wrap: wrap;
 }
 
 .footer-link {
diff --git a/frontend/src/index.jsx b/frontend/src/index.jsx
index 46457ed..ca42421 100644
--- a/frontend/src/index.jsx
+++ b/frontend/src/index.jsx
@@ -2,6 +2,9 @@ import React from 'react'
 import ReactDOM from 'react-dom/client'
 import App from './App'
 import './index.css'
+import { installNamespacedLocalStorage } from './utils/runtimeConfig'
+
+installNamespacedLocalStorage()
 
 ReactDOM.createRoot(document.getElementById('root')).render(
   <React.StrictMode>
diff --git a/frontend/src/services/api.js b/frontend/src/services/api.js
index c878b51..8280637 100644
--- a/frontend/src/services/api.js
+++ b/frontend/src/services/api.js
@@ -2,7 +2,74 @@
  * API service for backend communication
  */
 
-const API_BASE = '/api';
+const API_BASE = import.meta.env.VITE_MOTO_API_BASE || '/api';
+
+/**
+ * Extract the most useful human-readable message from a non-ok fetch Response.
+ *
+ * The backend returns FastAPI-style `{ "detail": "..." }` on errors, but:
+ *   - `detail` may be a string, or a list/object (e.g. 422 validation errors)
+ *   - proxies / dev servers can return HTML or empty bodies on 502/504
+ *   - `response.json()` throws on any non-JSON body, which is how the old
+ *     wrappers ended up surfacing a generic "Failed to ..." fallback even
+ *     when the backend had a perfectly clear error to report
+ *
+ * Returns a string containing the HTTP status + the best available reason.
+ */
+async function extractErrorMessage(response, fallbackMessage) {
+  const status = response.status;
+  const statusText = response.statusText || '';
+  const prefix = `HTTP ${status}${statusText ? ` ${statusText}` : ''}`;
+
+  let bodyText = '';
+  try {
+    bodyText = await response.text();
+  } catch {
+    return `${prefix} (no response body): ${fallbackMessage}`;
+  }
+
+  if (!bodyText.trim()) {
+    return `${prefix}: ${fallbackMessage}`;
+  }
+
+  let parsed = null;
+  try {
+    parsed = JSON.parse(bodyText);
+  } catch {
+    const snippet = bodyText.trim().slice(0, 500);
+    return `${prefix}: ${snippet || fallbackMessage}`;
+  }
+
+  let detail = parsed && typeof parsed === 'object' ? parsed.detail : null;
+  if (detail == null && parsed && typeof parsed === 'object') {
+    detail = parsed.message || parsed.error || null;
+  }
+
+  if (typeof detail === 'string' && detail.trim()) {
+    return `${prefix}: ${detail.trim()}`;
+  }
+  if (detail != null) {
+    try {
+      return `${prefix}: ${JSON.stringify(detail)}`;
+    } catch {
+      // fall through to fallback
+    }
+  }
+  return `${prefix}: ${fallbackMessage}`;
+}
+
+/**
+ * Throw an Error whose `.message` is the most informative reason we can
+ * synthesize from a non-ok Response. Attaches `.status` and `.statusText` so
+ * callers can inspect them programmatically.
+ */
+async function throwFromResponse(response, fallbackMessage) {
+  const message = await extractErrorMessage(response, fallbackMessage);
+  const err = new Error(message);
+  err.status = response.status;
+  err.statusText = response.statusText;
+  throw err;
+}
 
 // Aggregator API
 export const api = {
@@ -13,6 +80,20 @@ export const api = {
     return response.json();
   },
 
+  // Get shared runtime feature flags and build identity
+  async getFeatures() {
+    const response = await fetch(`${API_BASE}/features`);
+    if (!response.ok) throw new Error('Failed to fetch features');
+    return response.json();
+  },
+
+  // Get update notice written by the launcher (if any)
+  async getUpdateNotice() {
+    const response = await fetch(`${API_BASE}/update-notice`);
+    if (!response.ok) return { update_available: false };
+    return response.json();
+  },
+
   // Start aggregator
   async startAggregator(config) {
     const response = await fetch(`${API_BASE}/aggregator/start`, {
@@ -391,6 +472,94 @@ export const autonomousAPI = {
     return response.json();
   },
 
+  // Get all verified proofs
+  async getProofs() {
+    const response = await fetch(`${API_BASE}/proofs`);
+    if (!response.ok) throw new Error('Failed to get proofs');
+    return response.json();
+  },
+
+  // Get only novel verified proofs
+  async getNovelProofs() {
+    const response = await fetch(`${API_BASE}/proofs/novel`);
+    if (!response.ok) throw new Error('Failed to get novel proofs');
+    return response.json();
+  },
+
+  // Get Lean 4 proof system status
+  async getProofStatus() {
+    const response = await fetch(`${API_BASE}/proofs/status`);
+    if (!response.ok) throw new Error('Failed to get proof status');
+    return response.json();
+  },
+
+  // Update runtime Lean 4 proof settings; rejects with the backend's error detail
+  async updateProofSettings(settings) {
+    const response = await fetch(`${API_BASE}/proofs/settings`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify(settings),
+    });
+    if (!response.ok) {
+      const detail = (await response.json().catch(() => ({})))?.detail; // string, { message }, or structured data
+      throw new Error(detail?.message || (typeof detail === 'string' ? detail : detail && JSON.stringify(detail)) || 'Failed to update proof settings');
+    }
+    return response.json();
+  },
+
+  // Queue a manual proof check for one brainstorm or paper; rejects with the backend's error detail
+  async runProofCheck({ sourceType, sourceId }) {
+    const response = await fetch(`${API_BASE}/proofs/check`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify({
+        source_type: sourceType,
+        source_id: sourceId,
+      }),
+    });
+    if (!response.ok) {
+      const detail = (await response.json().catch(() => ({})))?.detail; // string, { message }, or structured data
+      throw new Error(detail?.message || (typeof detail === 'string' ? detail : detail && JSON.stringify(detail)) || 'Failed to queue proof check');
+    }
+    return response.json();
+  },
+
+  // Get one proof with full Lean code
+  async getProof(proofId) {
+    const response = await fetch(`${API_BASE}/proofs/${encodeURIComponent(proofId)}`);
+    if (!response.ok) throw new Error(`Failed to get proof ${proofId}`);
+    return response.json();
+  },
+
+  // Get dependency edges for one proof; rejects with the backend's error detail
+  async getProofDependencies(proofId) {
+    const response = await fetch(`${API_BASE}/proofs/${encodeURIComponent(proofId)}/dependencies`);
+    if (!response.ok) {
+      const detail = (await response.json().catch(() => ({})))?.detail; // string, { message }, or structured data
+      throw new Error(detail?.message || (typeof detail === 'string' ? detail : detail && JSON.stringify(detail)) || `Failed to get proof dependencies for ${proofId}`);
+    }
+    return response.json();
+  },
+
+  // Get the full proof dependency graph in one payload; rejects with the backend's error detail
+  async getProofGraph() {
+    const response = await fetch(`${API_BASE}/proofs/graph`);
+    if (!response.ok) {
+      const detail = (await response.json().catch(() => ({})))?.detail; // string, { message }, or structured data
+      throw new Error(detail?.message || (typeof detail === 'string' ? detail : detail && JSON.stringify(detail)) || 'Failed to get proof graph');
+    }
+    return response.json();
+  },
+
+  // Download URLs for machine-readable proof certificates
+  getProofCertificateUrl(proofId) {
+    return `${API_BASE}/proofs/${encodeURIComponent(proofId)}/certificate`;
+  },
+
+  getProofLeanDownloadUrl(proofId) {
+    return `${API_BASE}/proofs/${encodeURIComponent(proofId)}/certificate.lean`;
+  },
+
   // Get current paper progress (in-progress paper during Tier 2)
   async getCurrentPaperProgress() {
     const response = await fetch(`${API_BASE}/auto-research/current-paper-progress`);
@@ -900,7 +1069,7 @@ export const openRouterAPI = {
   // Get API key status (has_key, enabled)
   async getApiKeyStatus() {
     const response = await fetch(`${API_BASE}/openrouter/api-key-status`);
-    if (!response.ok) throw new Error('Failed to get API key status');
+    if (!response.ok) await throwFromResponse(response, 'Failed to get API key status');
     return response.json();
   },
 
@@ -911,10 +1080,7 @@ export const openRouterAPI = {
       headers: { 'Content-Type': 'application/json' },
       body: JSON.stringify({ api_key: apiKey }),
     });
-    if (!response.ok) {
-      const errorData = await response.json();
-      throw new Error(errorData.detail || 'Failed to set API key');
-    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to set API key');
     return response.json();
   },
 
@@ -923,7 +1089,7 @@ export const openRouterAPI = {
     const response = await fetch(`${API_BASE}/openrouter/api-key`, {
       method: 'DELETE',
     });
-    if (!response.ok) throw new Error('Failed to clear API key');
+    if (!response.ok) await throwFromResponse(response, 'Failed to clear API key');
     return response.json();
   },
 
@@ -934,10 +1100,7 @@ export const openRouterAPI = {
       headers: { 'Content-Type': 'application/json' },
       body: JSON.stringify({ api_key: apiKey }),
     });
-    if (!response.ok) {
-      const errorData = await response.json();
-      throw new Error(errorData.detail || 'Failed to test connection');
-    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to test connection');
     return response.json();
   },
 
@@ -949,10 +1112,7 @@ export const openRouterAPI = {
     
     const url = `${API_BASE}/openrouter/models${params.toString() ? '?' + params.toString() : ''}`;
     const response = await fetch(url);
-    if (!response.ok) {
-      const errorData = await response.json();
-      throw new Error(errorData.detail || 'Failed to fetch models');
-    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to fetch models');
     return response.json();
   },
 
@@ -962,19 +1122,13 @@ export const openRouterAPI = {
     const response = await fetch(url, {
       headers: apiKey ? { 'Authorization': `Bearer ${apiKey}` } : {}
     });
-    if (!response.ok) {
-      const errorData = await response.json();
-      throw new Error(errorData.detail || 'Failed to fetch providers');
-    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to fetch providers');
     return response.json();
   },
 
   async getFreeModelSettings() {
     const response = await fetch(`${API_BASE}/openrouter/free-model-settings`);
-    if (!response.ok) {
-      const errorData = await response.json();
-      throw new Error(errorData.detail || 'Failed to fetch free model settings');
-    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to fetch free model settings');
     return response.json();
   },
 
@@ -987,10 +1141,7 @@ export const openRouterAPI = {
         auto_selector_enabled: autoSelectorEnabled,
       }),
     });
-    if (!response.ok) {
-      const errorData = await response.json();
-      throw new Error(errorData.detail || 'Failed to update free model settings');
-    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to update free model settings');
     return response.json();
   },
 
@@ -998,10 +1149,7 @@ export const openRouterAPI = {
     const response = await fetch(`${API_BASE}/openrouter/reset-exhaustion`, {
       method: 'POST',
     });
-    if (!response.ok) {
-      const errorData = await response.json();
-      throw new Error(errorData.detail || 'Failed to reset credit exhaustion');
-    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to reset credit exhaustion');
     return response.json();
   },
 };
@@ -1013,19 +1161,13 @@ api.post = async (url, data) => {
     headers: { 'Content-Type': 'application/json' },
     body: data ? JSON.stringify(data) : undefined,
   });
-  if (!response.ok) {
-    const errorData = await response.json();
-    throw new Error(errorData.detail || 'Request failed');
-  }
+  if (!response.ok) await throwFromResponse(response, 'Request failed');
   return response.json();
 };
 
 api.get = async (url) => {
   const response = await fetch(url);
-  if (!response.ok) {
-    const errorData = await response.json();
-    throw new Error(errorData.detail || 'Request failed');
-  }
+  if (!response.ok) await throwFromResponse(response, 'Request failed');
   return response.json();
 };
 
diff --git a/frontend/src/services/websocket.js b/frontend/src/services/websocket.js
index 5db9688..55d36c7 100644
--- a/frontend/src/services/websocket.js
+++ b/frontend/src/services/websocket.js
@@ -12,7 +12,8 @@ class WebSocketService {
 
   connect() {
     const protocol = window.location.protocol === 'https:' ? 'wss:' : 'ws:';
-    const wsUrl = `${protocol}//${window.location.host}/ws`;
+    const wsPath = import.meta.env.VITE_MOTO_WS_PATH || '/ws';
+    const wsUrl = `${protocol}//${window.location.host}${wsPath}`;
     
     this.ws = new WebSocket(wsUrl);
     
diff --git a/frontend/src/utils/autonomousProfiles.js b/frontend/src/utils/autonomousProfiles.js
index 9895087..94a0c90 100644
--- a/frontend/src/utils/autonomousProfiles.js
+++ b/frontend/src/utils/autonomousProfiles.js
@@ -6,9 +6,13 @@ export const STARTUP_PROVIDER_CHOICE_STORAGE_KEY = 'startup_provider_choice';
 export const LM_STUDIO_STARTUP_CHOICE = 'lm_studio';
 export const RECOMMENDED_PROFILE_KEY = 'recommended_slower_affordable_higher_knowledge';
 export const RECOMMENDED_ALTERNATE_PROFILE_KEY = 'recommended_fast_affordable_mid';
+export const RECOMMENDED_LAB_FAST_PROFILE_KEY = 'recommended_lab_fast_costly_extra_high';
+export const RECOMMENDED_LAB_MAX_PROFILE_KEY = 'recommended_lab_slow_costly_max';
 export const RECOMMENDED_PROFILE_KEYS = [
   RECOMMENDED_PROFILE_KEY,
   RECOMMENDED_ALTERNATE_PROFILE_KEY,
+  RECOMMENDED_LAB_FAST_PROFILE_KEY,
+  RECOMMENDED_LAB_MAX_PROFILE_KEY,
 ];
 
 const DEFAULT_SUBMITTER_CONFIG = {
@@ -21,62 +25,10 @@ const DEFAULT_SUBMITTER_CONFIG = {
   maxOutputTokens: 25000,
 };
 
-const DEFAULT_OPENROUTER_SUBMITTER_CONFIGS = [
-  {
-    submitterId: 1,
-    provider: 'openrouter',
-    modelId: 'openai/gpt-oss-120b',
-    openrouterProvider: 'Google',
-    lmStudioFallbackId: null,
-    contextWindow: 131072,
-    maxOutputTokens: 25000,
-  },
-  {
-    submitterId: 2,
-    provider: 'openrouter',
-    modelId: 'openai/gpt-oss-20b',
-    openrouterProvider: 'Groq',
-    lmStudioFallbackId: null,
-    contextWindow: 131072,
-    maxOutputTokens: 25000,
-  },
-  {
-    submitterId: 3,
-    provider: 'openrouter',
-    modelId: 'openai/gpt-oss-120b',
-    openrouterProvider: 'Google',
-    lmStudioFallbackId: null,
-    contextWindow: 131072,
-    maxOutputTokens: 25000,
-  },
-];
-
-const DEFAULT_LOCAL_CONFIG = {
-  validator_provider: 'openrouter',
-  validator_model: 'openai/gpt-oss-120b',
-  validator_openrouter_provider: 'Google',
-  validator_lm_studio_fallback: null,
-  validator_context_window: 131072,
-  validator_max_tokens: 25000,
-  high_context_provider: 'openrouter',
-  high_context_model: 'openai/gpt-oss-120b',
-  high_context_openrouter_provider: 'Google',
-  high_context_lm_studio_fallback: null,
-  high_context_context_window: 131072,
-  high_context_max_tokens: 25000,
-  high_param_provider: 'openrouter',
-  high_param_model: 'openai/gpt-oss-120b',
-  high_param_openrouter_provider: 'Google',
-  high_param_lm_studio_fallback: null,
-  high_param_context_window: 131072,
-  high_param_max_tokens: 25000,
-  critique_submitter_provider: 'openrouter',
-  critique_submitter_model: 'openai/gpt-oss-120b',
-  critique_submitter_openrouter_provider: 'Google',
-  critique_submitter_lm_studio_fallback: null,
-  critique_submitter_context_window: 131072,
-  critique_submitter_max_tokens: 25000,
-};
+// NOTE: DEFAULT_OPENROUTER_SUBMITTER_CONFIGS and DEFAULT_LOCAL_CONFIG are derived
+// from RECOMMENDED_PROFILES[RECOMMENDED_PROFILE_KEY] further below so the "default"
+// startup configuration and the selectable recommended profile stay in sync.
+// Update the recommended profile below to change what a fresh install runs with.
 
 const DEFAULT_LM_LOCAL_CONFIG = {
   validator_provider: 'lm_studio',
@@ -113,21 +65,9 @@ const createDefaultSubmitterConfigs = (modelId = '') => (
   }))
 );
 
-const DEFAULT_AUTONOMOUS_SETTINGS = {
-  numSubmitters: 3,
-  submitterConfigs: DEFAULT_OPENROUTER_SUBMITTER_CONFIGS,
-  localConfig: DEFAULT_LOCAL_CONFIG,
-  freeOnly: false,
-  freeModelLooping: true,
-  freeModelAutoSelector: true,
-  tier3Enabled: false,
-  modelProviders: {},
-  selectedProfile: '',
-};
-
 export const RECOMMENDED_PROFILES = {
   [RECOMMENDED_PROFILE_KEY]: {
-    name: 'Slower, less affordable, higher knowledge',
+    name: 'Slow, less affordable, higher knowledge',
     numSubmitters: 3,
     submitters: [
       {
@@ -139,7 +79,7 @@ export const RECOMMENDED_PROFILES = {
         maxOutputTokens: 65500,
       },
       {
-        modelId: 'moonshotai/kimi-k2.5',
+        modelId: 'moonshotai/kimi-k2.6',
         provider: 'openrouter',
         openrouterProvider: null,
         lmStudioFallbackId: null,
@@ -147,16 +87,16 @@ export const RECOMMENDED_PROFILES = {
         maxOutputTokens: 40000,
       },
       {
-        modelId: 'deepseek/deepseek-v3.2',
+        modelId: 'deepseek/deepseek-v4-pro',
         provider: 'openrouter',
-        openrouterProvider: 'AtlasCloud',
+        openrouterProvider: null,
         lmStudioFallbackId: null,
-        contextWindow: 163800,
-        maxOutputTokens: 30000,
+        contextWindow: 1048576,
+        maxOutputTokens: 65500,
       },
     ],
     validator: {
-      modelId: 'moonshotai/kimi-k2.5',
+      modelId: 'moonshotai/kimi-k2.6',
       provider: 'openrouter',
       openrouterProvider: null,
       lmStudioFallbackId: null,
@@ -190,12 +130,12 @@ export const RECOMMENDED_PROFILES = {
   },
   [RECOMMENDED_ALTERNATE_PROFILE_KEY]: {
     name: 'Fast, affordable, mid-tier knowledge',
-    numSubmitters: 3,
+    numSubmitters: 4,
     submitters: [
       {
-        modelId: 'moonshotai/kimi-k2.5',
+        modelId: 'moonshotai/kimi-k2.6',
         provider: 'openrouter',
-        openrouterProvider: 'SiliconFlow',
+        openrouterProvider: null,
         lmStudioFallbackId: null,
         contextWindow: 262000,
         maxOutputTokens: 40000,
@@ -209,26 +149,34 @@ export const RECOMMENDED_PROFILES = {
         maxOutputTokens: 25000,
       },
       {
-        modelId: 'deepseek/deepseek-v3.2',
+        modelId: 'deepseek/deepseek-v4-pro',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 1048576,
+        maxOutputTokens: 65500,
+      },
+      {
+        modelId: 'inception/mercury-2',
         provider: 'openrouter',
-        openrouterProvider: 'AtlasCloud',
+        openrouterProvider: null,
         lmStudioFallbackId: null,
-        contextWindow: 163800,
-        maxOutputTokens: 30000,
+        contextWindow: 128000,
+        maxOutputTokens: 25000,
       },
     ],
     validator: {
-      modelId: 'qwen/qwen3.5-flash-02-23',
+      modelId: 'x-ai/grok-4.1-fast',
       provider: 'openrouter',
       openrouterProvider: null,
       lmStudioFallbackId: null,
-      contextWindow: 1048576,
-      maxOutputTokens: 65500,
+      contextWindow: 2000000,
+      maxOutputTokens: 30000,
     },
     highContext: {
-      modelId: 'moonshotai/kimi-k2.5',
+      modelId: 'moonshotai/kimi-k2.6',
       provider: 'openrouter',
-      openrouterProvider: 'SiliconFlow',
+      openrouterProvider: null,
       lmStudioFallbackId: null,
       contextWindow: 262000,
       maxOutputTokens: 40000,
@@ -250,6 +198,197 @@ export const RECOMMENDED_PROFILES = {
       maxOutputTokens: 65500,
     },
   },
+  [RECOMMENDED_LAB_FAST_PROFILE_KEY]: {
+    name: 'Lab grade, fast, costly (starts at ~$10 per hour), extra-high knowledge',
+    numSubmitters: 3,
+    submitters: [
+      {
+        modelId: 'openai/gpt-5.5',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 1050000,
+        maxOutputTokens: 128000,
+      },
+      {
+        modelId: 'moonshotai/kimi-k2.6',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 262000,
+        maxOutputTokens: 40000,
+      },
+      {
+        modelId: 'deepseek/deepseek-v4-pro',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 1048576,
+        maxOutputTokens: 65500,
+      },
+    ],
+    validator: {
+      modelId: 'x-ai/grok-4.1-fast',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 2000000,
+      maxOutputTokens: 30000,
+    },
+    highContext: {
+      modelId: 'openai/gpt-5.5',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1050000,
+      maxOutputTokens: 128000,
+    },
+    highParam: {
+      modelId: 'anthropic/claude-opus-4.7',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1000000,
+      maxOutputTokens: 128000,
+    },
+    critique: {
+      modelId: 'google/gemini-3.1-pro-preview',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+  },
+  [RECOMMENDED_LAB_MAX_PROFILE_KEY]: {
+    name: 'Lab grade, SOTA models, slower, costly (starts at ~$20 per hour), max knowledge',
+    numSubmitters: 4,
+    submitters: [
+      {
+        modelId: 'anthropic/claude-opus-4.7',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 1000000,
+        maxOutputTokens: 128000,
+      },
+      {
+        modelId: 'openai/gpt-5.5-pro',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 1050000,
+        maxOutputTokens: 128000,
+      },
+      {
+        modelId: 'x-ai/grok-4.20-multi-agent',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 2000000,
+        maxOutputTokens: 65500,
+      },
+      {
+        modelId: 'moonshotai/kimi-k2.6',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 262000,
+        maxOutputTokens: 40000,
+      },
+    ],
+    validator: {
+      modelId: 'openai/gpt-5.5-pro',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1050000,
+      maxOutputTokens: 128000,
+    },
+    highContext: {
+      modelId: 'anthropic/claude-opus-4.7',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1000000,
+      maxOutputTokens: 128000,
+    },
+    highParam: {
+      modelId: 'anthropic/claude-opus-4.7',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1000000,
+      maxOutputTokens: 128000,
+    },
+    critique: {
+      modelId: 'x-ai/grok-4.20-multi-agent',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 2000000,
+      maxOutputTokens: 65500,
+    },
+  },
+};
+
+// Derive the startup/fallback OpenRouter defaults directly from the default
+// recommended profile so there is a single source of truth. Changing the
+// RECOMMENDED_PROFILE_KEY profile above automatically updates what a fresh
+// install (or any settings reset) runs with.
+const DEFAULT_RECOMMENDED_PROFILE = RECOMMENDED_PROFILES[RECOMMENDED_PROFILE_KEY];
+
+const submitterFromRecommended = (submitter, submitterId) => ({
+  submitterId,
+  provider: submitter.provider || 'openrouter',
+  modelId: submitter.modelId || '',
+  openrouterProvider: submitter.openrouterProvider || null,
+  lmStudioFallbackId: submitter.lmStudioFallbackId || null,
+  contextWindow: submitter.contextWindow,
+  maxOutputTokens: submitter.maxOutputTokens,
+});
+
+const DEFAULT_OPENROUTER_SUBMITTER_CONFIGS = DEFAULT_RECOMMENDED_PROFILE.submitters.map(
+  (submitter, index) => submitterFromRecommended(submitter, index + 1)
+);
+
+const DEFAULT_LOCAL_CONFIG = {
+  validator_provider: DEFAULT_RECOMMENDED_PROFILE.validator.provider || 'openrouter',
+  validator_model: DEFAULT_RECOMMENDED_PROFILE.validator.modelId || '',
+  validator_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.validator.openrouterProvider || null,
+  validator_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.validator.lmStudioFallbackId || null,
+  validator_context_window: DEFAULT_RECOMMENDED_PROFILE.validator.contextWindow,
+  validator_max_tokens: DEFAULT_RECOMMENDED_PROFILE.validator.maxOutputTokens,
+  high_context_provider: DEFAULT_RECOMMENDED_PROFILE.highContext.provider || 'openrouter',
+  high_context_model: DEFAULT_RECOMMENDED_PROFILE.highContext.modelId || '',
+  high_context_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.highContext.openrouterProvider || null,
+  high_context_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.highContext.lmStudioFallbackId || null,
+  high_context_context_window: DEFAULT_RECOMMENDED_PROFILE.highContext.contextWindow,
+  high_context_max_tokens: DEFAULT_RECOMMENDED_PROFILE.highContext.maxOutputTokens,
+  high_param_provider: DEFAULT_RECOMMENDED_PROFILE.highParam.provider || 'openrouter',
+  high_param_model: DEFAULT_RECOMMENDED_PROFILE.highParam.modelId || '',
+  high_param_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.highParam.openrouterProvider || null,
+  high_param_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.highParam.lmStudioFallbackId || null,
+  high_param_context_window: DEFAULT_RECOMMENDED_PROFILE.highParam.contextWindow,
+  high_param_max_tokens: DEFAULT_RECOMMENDED_PROFILE.highParam.maxOutputTokens,
+  critique_submitter_provider: DEFAULT_RECOMMENDED_PROFILE.critique.provider || 'openrouter',
+  critique_submitter_model: DEFAULT_RECOMMENDED_PROFILE.critique.modelId || '',
+  critique_submitter_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.critique.openrouterProvider || null,
+  critique_submitter_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.critique.lmStudioFallbackId || null,
+  critique_submitter_context_window: DEFAULT_RECOMMENDED_PROFILE.critique.contextWindow,
+  critique_submitter_max_tokens: DEFAULT_RECOMMENDED_PROFILE.critique.maxOutputTokens,
+};
+
+const DEFAULT_AUTONOMOUS_SETTINGS = {
+  numSubmitters: DEFAULT_RECOMMENDED_PROFILE.numSubmitters || DEFAULT_OPENROUTER_SUBMITTER_CONFIGS.length,
+  submitterConfigs: DEFAULT_OPENROUTER_SUBMITTER_CONFIGS,
+  localConfig: DEFAULT_LOCAL_CONFIG,
+  freeOnly: false,
+  freeModelLooping: true,
+  freeModelAutoSelector: true,
+  tier3Enabled: false,
+  modelProviders: {},
+  selectedProfile: RECOMMENDED_PROFILE_KEY,
 };
 
 function normalizeStoredSettings(settings = {}) {
@@ -275,7 +414,7 @@ function normalizeStoredSettings(settings = {}) {
     freeModelAutoSelector: settings.freeModelAutoSelector ?? DEFAULT_AUTONOMOUS_SETTINGS.freeModelAutoSelector,
     tier3Enabled: settings.tier3Enabled ?? DEFAULT_AUTONOMOUS_SETTINGS.tier3Enabled,
     modelProviders: settings.modelProviders || DEFAULT_AUTONOMOUS_SETTINGS.modelProviders,
-    selectedProfile: settings.selectedProfile || '',
+    selectedProfile: settings.selectedProfile ?? DEFAULT_AUTONOMOUS_SETTINGS.selectedProfile,
   };
 }
 
diff --git a/frontend/src/utils/disclaimerHelper.js b/frontend/src/utils/disclaimerHelper.js
index 6ecb910..52ec907 100644
--- a/frontend/src/utils/disclaimerHelper.js
+++ b/frontend/src/utils/disclaimerHelper.js
@@ -13,7 +13,7 @@ export const PAPER_DISCLAIMER =
   `${SEPARATOR}\n` +
   'DISCLAIMER\n' +
   '\n' +
-  'This content is provided for informational and experimental purposes only.\n' +
+  'This content is provided for informational purposes only.\n' +
   'This paper was autonomously generated with the novelty-seeking MOTO harness\n' +
   'without peer review or user oversight beyond the original prompt. It may\n' +
   'contain incorrect, incomplete, misleading, or fabricated claims presented\n' +
@@ -28,7 +28,7 @@ export const BRAINSTORM_DISCLAIMER =
   `${SEPARATOR}\n` +
   'DISCLAIMER\n' +
   '\n' +
-  'This content is provided for informational and experimental purposes only.\n' +
+  'This content is provided for informational purposes only.\n' +
   'This brainstorm database was autonomously generated with the novelty-seeking\n' +
   'MOTO harness without peer review or user oversight beyond the original\n' +
   'prompt. It may contain incorrect, incomplete, misleading, or\n' +
diff --git a/frontend/src/utils/openRouterSelection.js b/frontend/src/utils/openRouterSelection.js
new file mode 100644
index 0000000..11eded4
--- /dev/null
+++ b/frontend/src/utils/openRouterSelection.js
@@ -0,0 +1,121 @@
+const DEFAULT_CONTEXT_WINDOW = 131072;
+const CONTEXT_BUFFER_TOKENS = 500;
+
+function toPositiveInteger(value) {
+  const parsed = Number(value);
+  if (!Number.isFinite(parsed) || parsed <= 0) {
+    return null;
+  }
+  return Math.floor(parsed);
+}
+
+export function findOpenRouterModel(models, modelId) {
+  if (!Array.isArray(models) || !modelId) {
+    return null;
+  }
+  return models.find((model) => model.id === modelId) || null;
+}
+
+export function hasEndpointMetadata(providerData) {
+  return Boolean(
+    providerData &&
+    !Array.isArray(providerData) &&
+    Array.isArray(providerData.endpoints)
+  );
+}
+
+export function normalizeProviderData(providerData) {
+  if (Array.isArray(providerData)) {
+    return {
+      providers: providerData,
+      endpoints: [],
+    };
+  }
+
+  if (!providerData || typeof providerData !== 'object') {
+    return {
+      providers: [],
+      endpoints: [],
+    };
+  }
+
+  return {
+    providers: Array.isArray(providerData.providers) ? providerData.providers : [],
+    endpoints: Array.isArray(providerData.endpoints) ? providerData.endpoints : [],
+  };
+}
+
+export function getProviderNames(providerData) {
+  return normalizeProviderData(providerData).providers;
+}
+
+export function computeOpenRouterAutoSettings(model, providerData, selectedProvider = null) {
+  const { endpoints } = normalizeProviderData(providerData);
+
+  const relevantEndpoints = selectedProvider
+    ? endpoints.filter((endpoint) => endpoint?.provider_name === selectedProvider)
+    : endpoints;
+
+  if (relevantEndpoints.length === 0) {
+    return null;
+  }
+
+  const hasCompleteEndpointContexts = relevantEndpoints.every(
+    (endpoint) => toPositiveInteger(endpoint?.context_length) !== null
+  );
+  const hasCompleteEndpointOutputCaps = relevantEndpoints.every(
+    (endpoint) => toPositiveInteger(endpoint?.max_completion_tokens) !== null
+  );
+
+  if (!hasCompleteEndpointContexts || !hasCompleteEndpointOutputCaps) {
+    return null;
+  }
+
+  const endpointContexts = relevantEndpoints
+    .map((endpoint) => toPositiveInteger(endpoint?.context_length))
+    .filter((value) => value !== null);
+
+  const endpointOutputCaps = relevantEndpoints
+    .map((endpoint) => toPositiveInteger(endpoint?.max_completion_tokens))
+    .filter((value) => value !== null);
+
+  const endpointPromptCaps = relevantEndpoints
+    .map((endpoint) => toPositiveInteger(endpoint?.max_prompt_tokens))
+    .filter((value) => value !== null);
+
+  const smallestEndpointContext = Math.min(...endpointContexts);
+  const smallestEndpointOutputCap = Math.min(...endpointOutputCaps);
+  const smallestEndpointPromptCap = endpointPromptCaps.length > 0
+    ? Math.min(...endpointPromptCaps)
+    : null;
+
+  let contextWindow = smallestEndpointContext;
+  let twentyPercentOutputCap = Math.max(1, Math.floor(contextWindow * 0.2));
+
+  if (smallestEndpointPromptCap !== null) {
+    const promptLimitedOutputCap = Math.max(
+      1,
+      Math.floor((smallestEndpointPromptCap + CONTEXT_BUFFER_TOKENS) / 4)
+    );
+    twentyPercentOutputCap = Math.min(twentyPercentOutputCap, promptLimitedOutputCap);
+  }
+
+  const maxOutputTokens = Math.min(smallestEndpointOutputCap, twentyPercentOutputCap);
+
+  if (smallestEndpointPromptCap !== null) {
+    contextWindow = Math.min(
+      contextWindow,
+      smallestEndpointPromptCap + maxOutputTokens + CONTEXT_BUFFER_TOKENS
+    );
+  }
+
+  return {
+    contextWindow,
+    maxOutputTokens,
+    twentyPercentOutputCap,
+    smallestEndpointOutputCap,
+    smallestEndpointContext,
+    smallestEndpointPromptCap,
+    fallbackModelContext: toPositiveInteger(model?.context_length) || DEFAULT_CONTEXT_WINDOW,
+  };
+}
diff --git a/frontend/src/utils/researchRunHistory.js b/frontend/src/utils/researchRunHistory.js
index a06cc24..a87c334 100644
--- a/frontend/src/utils/researchRunHistory.js
+++ b/frontend/src/utils/researchRunHistory.js
@@ -24,11 +24,48 @@ function compareStage3Answers(a, b) {
   return toTimestamp(b.completion_date) - toTimestamp(a.completion_date);
 }
 
+const UNKNOWN_RESEARCH_QUESTION = 'Unknown research question';
+
+function normalizePrompt(value) {
+  return typeof value === 'string' ? value.trim() : '';
+}
+
+function derivePromptFromSessionId(sessionId) {
+  if (sessionId === 'legacy') {
+    return 'Legacy research session';
+  }
+
+  const promptSlug = String(sessionId || '').replace(/_\d{4}-\d{2}-\d{2}_\d{2}-\d{2}$/, '');
+  const prompt = promptSlug.replace(/_/g, ' ').trim();
+
+  if (!prompt) {
+    return UNKNOWN_RESEARCH_QUESTION;
+  }
+
+  return prompt.charAt(0).toUpperCase() + prompt.slice(1);
+}
+
+function resolvePrompt(sessionId, ...candidates) {
+  for (const candidate of candidates) {
+    const prompt = normalizePrompt(candidate);
+    if (prompt && prompt !== UNKNOWN_RESEARCH_QUESTION) {
+      return prompt;
+    }
+  }
+
+  return derivePromptFromSessionId(sessionId);
+}
+
+function shouldUpgradePrompt(currentPrompt) {
+  const prompt = normalizePrompt(currentPrompt);
+  return !prompt || prompt === UNKNOWN_RESEARCH_QUESTION;
+}
+
 function buildFallbackRun(sessionId, seedItem = null) {
   return {
     sessionId,
     displaySessionId: sessionId === 'legacy' ? 'Legacy' : sessionId,
-    userPrompt: seedItem?.user_prompt || (sessionId === 'legacy' ? 'Legacy research session' : 'Unknown research question'),
+    userPrompt: resolvePrompt(sessionId, seedItem?.user_prompt, seedItem?.user_research_prompt),
     createdAt: seedItem?.created_at || seedItem?.completion_date || null,
     brainstormCount: null,
     sessionPaperCount: null,
@@ -64,7 +101,13 @@ export function buildResearchRunGroups({
       ? {
           sessionId,
           displaySessionId: sessionId === 'legacy' ? 'Legacy' : sessionId,
-          userPrompt: session.user_prompt || seedItem?.user_prompt || 'Unknown research question',
+          userPrompt: resolvePrompt(
+            sessionId,
+            session.user_prompt,
+            session.user_research_prompt,
+            seedItem?.user_prompt,
+            seedItem?.user_research_prompt,
+          ),
           createdAt: session.created_at || seedItem?.created_at || seedItem?.completion_date || null,
           brainstormCount: session.brainstorm_count ?? null,
           sessionPaperCount: session.paper_count ?? null,
@@ -82,8 +125,8 @@ export function buildResearchRunGroups({
   for (const paper of stage2Papers) {
     const group = ensureGroup(paper.session_id, paper);
     group.stage2Papers.push(paper);
-    if (!group.userPrompt && paper.user_prompt) {
-      group.userPrompt = paper.user_prompt;
+    if (shouldUpgradePrompt(group.userPrompt)) {
+      group.userPrompt = resolvePrompt(group.sessionId, paper.user_prompt, paper.user_research_prompt);
     }
     if (!group.createdAt) {
       group.createdAt = paper.created_at || null;
@@ -93,8 +136,8 @@ export function buildResearchRunGroups({
   for (const answer of stage3Answers) {
     const group = ensureGroup(answer.session_id, answer);
     group.stage3Answers.push(answer);
-    if (!group.userPrompt && answer.user_prompt) {
-      group.userPrompt = answer.user_prompt;
+    if (shouldUpgradePrompt(group.userPrompt)) {
+      group.userPrompt = resolvePrompt(group.sessionId, answer.user_prompt, answer.user_research_prompt);
     }
     if (!group.createdAt) {
       group.createdAt = answer.completion_date || null;
diff --git a/frontend/src/utils/runtimeConfig.js b/frontend/src/utils/runtimeConfig.js
new file mode 100644
index 0000000..77f1818
--- /dev/null
+++ b/frontend/src/utils/runtimeConfig.js
@@ -0,0 +1,59 @@
+const storagePrefix = (import.meta.env.VITE_MOTO_STORAGE_PREFIX || '').trim();
+const instanceId = (import.meta.env.VITE_MOTO_INSTANCE_ID || '').trim();
+const dataRootDisplay = (import.meta.env.VITE_MOTO_DATA_ROOT_DISPLAY || '').trim();
+
+function toScopedKey(key) {
+  if (!storagePrefix || typeof key !== 'string' || key.length === 0) {
+    return key;
+  }
+  return `${storagePrefix}:${key}`;
+}
+
+export function installNamespacedLocalStorage() {
+  if (typeof window === 'undefined' || !storagePrefix) {
+    return;
+  }
+
+  if (window.__motoStorageNamespacePatched) {
+    return;
+  }
+
+  const storageProto = Object.getPrototypeOf(window.localStorage);
+  const originalGetItem = storageProto.getItem;
+  const originalSetItem = storageProto.setItem;
+  const originalRemoveItem = storageProto.removeItem;
+
+  storageProto.getItem = function patchedGetItem(key) {
+    if (this === window.localStorage) {
+      return originalGetItem.call(this, toScopedKey(key));
+    }
+    return originalGetItem.call(this, key);
+  };
+
+  storageProto.setItem = function patchedSetItem(key, value) {
+    if (this === window.localStorage) {
+      return originalSetItem.call(this, toScopedKey(key), value);
+    }
+    return originalSetItem.call(this, key, value);
+  };
+
+  storageProto.removeItem = function patchedRemoveItem(key) {
+    if (this === window.localStorage) {
+      return originalRemoveItem.call(this, toScopedKey(key));
+    }
+    return originalRemoveItem.call(this, key);
+  };
+
+  window.__motoStorageNamespacePatched = true;
+}
+
+export function getRuntimeDataPath(relativePath = '') {
+  const normalizedRelativePath = String(relativePath || '').replace(/^[/\\]+/, '');
+  const basePath = dataRootDisplay || 'this instance data root';
+  return normalizedRelativePath ? `${basePath}/${normalizedRelativePath}` : basePath;
+}
+
+export function getRuntimeInstanceId() {
+  return instanceId || 'default';
+}
+
diff --git a/frontend/vite.config.js b/frontend/vite.config.js
index 9577236..63f7f2a 100644
--- a/frontend/vite.config.js
+++ b/frontend/vite.config.js
@@ -1,22 +1,58 @@
-import { defineConfig } from 'vite'
+import { defineConfig, loadEnv, createLogger } from 'vite'
 import react from '@vitejs/plugin-react'
 
-export default defineConfig({
-  plugins: [react()],
-  server: {
-    port: 5173,
-    strictPort: true,
-    open: false,
-    proxy: {
-      '/api': {
-        target: 'http://localhost:8000',
-        changeOrigin: true,
-      },
-      '/ws': {
-        target: 'ws://localhost:8000',
-        ws: true,
+export default defineConfig(({ mode }) => {
+  const env = loadEnv(mode, process.cwd(), '')
+  const backendPort = env.MOTO_BACKEND_PORT || env.PORT || '8000'
+  const backendUrl = env.VITE_MOTO_BACKEND_URL || `http://localhost:${backendPort}`
+  const backendWsUrl = env.VITE_MOTO_BACKEND_WS_URL || backendUrl.replace(/^http/i, 'ws')
+  const frontendPort = Number(env.VITE_MOTO_FRONTEND_PORT || env.MOTO_FRONTEND_PORT || env.FRONTEND_PORT || 5173)
+  const frontendHost = env.VITE_MOTO_FRONTEND_HOST || '127.0.0.1' // loopback by default so the /api and /ws proxy is not exposed to the LAN; set VITE_MOTO_FRONTEND_HOST=0.0.0.0 to opt in
+
+  const logger = createLogger()
+  const originalError = logger.error.bind(logger)
+  logger.error = (msg, options) => {
+    if (typeof msg === 'string' && /proxy error/i.test(msg) && /ECONNREFUSED|ECONNRESET|ETIMEDOUT/i.test(msg)) {
+      return
+    }
+    originalError(msg, options)
+  }
+
+  return {
+    customLogger: logger,
+    plugins: [react()],
+    server: {
+      host: frontendHost,
+      port: frontendPort,
+      strictPort: true,
+      open: false,
+      proxy: {
+        '/api': {
+          target: backendUrl,
+          changeOrigin: true,
+          configure: (proxy) => {
+            proxy.on('error', (err, _req, res) => {
+              const code = err && err.code
+              if (code === 'ECONNREFUSED' || code === 'ECONNRESET' || code === 'ETIMEDOUT') {
+                if (res && !res.headersSent && typeof res.writeHead === 'function') {
+                  try {
+                    res.writeHead(503, { 'Content-Type': 'application/json' })
+                    res.end('{"error":"backend_unavailable"}')
+                  } catch (_) {}
+                }
+              }
+            })
+          },
+        },
+        '/ws': {
+          target: backendWsUrl,
+          ws: true,
+          configure: (proxy) => {
+            proxy.on('error', () => {})
+          },
+        },
       },
     },
-  },
+  }
 })
 
diff --git a/moto-update-manifest.json b/moto-update-manifest.json
new file mode 100644
index 0000000..df18b1d
--- /dev/null
+++ b/moto-update-manifest.json
@@ -0,0 +1,7 @@
+{
+  "manifest_version": 1,
+  "version": "1.0.7",
+  "build_commit": "d352090d687bd3475acfee17f29f7f0cfb17264e",
+  "update_channel": "main",
+  "api_contract_version": "build5-v1"
+}
diff --git a/moto_launcher.py b/moto_launcher.py
new file mode 100644
index 0000000..1c6d5e0
--- /dev/null
+++ b/moto_launcher.py
@@ -0,0 +1,1563 @@
+"""
+MOTO System Launcher (Python)
+This is an internal script. Use "Click To Launch MOTO.bat" on Windows or "Launch MOTO.sh" on Ubuntu 24.04.
+"""
+from __future__ import annotations
+
+from dataclasses import dataclass
+from datetime import datetime
+import json
+import os
+from pathlib import Path
+import platform
+from random import randint
+import re
+import socket
+import shlex
+from shutil import which
+import subprocess
+import sys
+import tarfile
+import time
+from typing import Sequence
+from urllib.error import URLError
+from urllib.request import Request, urlopen
+import webbrowser
+import zipfile
+
+from moto_updater import (
+    apply_update,
+    build_update_prompt,
+    build_warning_message,
+    check_for_updates,
+    cleanup_launcher_state,
+    cleanup_path,
+    consume_internal_launcher_args,
+    load_last_instance_record,
+    register_active_instance,
+    save_last_instance_record,
+    show_yes_no_dialog,
+    write_update_notice,
+)
+
+SCRIPT_DIR = Path(__file__).resolve().parent
+
+CYAN = "\033[96m"
+GREEN = "\033[92m"
+YELLOW = "\033[93m"
+RED = "\033[91m"
+WHITE = "\033[97m"
+RESET = "\033[0m"
+
+
+@dataclass(frozen=True)
+class InstanceRuntime:
+    """Immutable description of the runtime resolved for a single launch."""
+
+    # Sanitized identifier of this instance; the literal "default" marks the
+    # default instance.
+    instance_id: str
+    # Host and port handed to the backend service.
+    backend_host: str
+    backend_port: int
+    # Port handed to the frontend dev server.
+    frontend_port: int
+    # Absolute directories used for data and logs.
+    data_root: str
+    log_root: str
+    # None means the shared (un-namespaced) secret store / storage prefix.
+    secret_namespace: str | None
+    storage_prefix: str | None
+    # True exactly when instance_id == "default".
+    is_default: bool
+    # True when the caller used MOTO_INSTANCE_ID / MOTO_DATA_ROOT / etc. to
+    # override the default runtime. Explicit launches are treated as one-off
+    # overrides: we NEVER persist them to `.moto_last_instance.json`, so a
+    # plain subsequent launch still points back at the user's stable default
+    # / previously-recorded isolated instance.
+    explicit_override: bool
+
+
+@dataclass(frozen=True)
+class LaunchedService:
+    """Record of one child service process started by the launcher."""
+
+    # Human-readable service title (also used as the window/terminal title).
+    title: str
+    # PID of the process the launcher spawned (the console/terminal wrapper
+    # when one is used).
+    pid: int
+    # How the service was started: "window", "terminal" or "background".
+    mode: str
+    # Log file receiving the service output; only set for background launches.
+    log_path: str | None = None
+
+
+def _enable_ansi_on_windows() -> None:
+    """Best-effort switch of the Windows console into ANSI escape mode.
+
+    Does nothing on other platforms. Any failure is swallowed on purpose so
+    that missing colour support can never block the launcher.
+    """
+    if sys.platform == "win32":
+        try:
+            import ctypes
+
+            console_api = ctypes.windll.kernel32
+            # -11 is STD_OUTPUT_HANDLE; mode 7 combines processed output,
+            # wrap-at-EOL and virtual-terminal processing.
+            stdout_handle = console_api.GetStdHandle(-11)
+            console_api.SetConsoleMode(stdout_handle, 7)
+        except Exception:
+            pass
+
+
+def cprint(message: str, colour: str = RESET) -> None:
+    """Print *message* wrapped in the given ANSI colour code, then reset."""
+    coloured = "{}{}{}".format(colour, message, RESET)
+    print(coloured)
+
+
+def exit_with_pause(code: int = 0) -> None:
+    """Wait for the user to press Enter, then exit the process with *code*."""
+    print()
+    cprint("Press Enter to close...", YELLOW)
+    try:
+        input()
+    except EOFError:
+        # stdin is closed or not interactive: exit without waiting.
+        pass
+    raise SystemExit(code)
+
+
+def resolve_command(*names: str) -> str | None:
+    """Return the PATH location of the first of *names* that resolves.
+
+    Names are tried in the order given; None is returned when none of them
+    can be found.
+    """
+    return next((location for location in map(which, names) if location), None)
+
+
+def command_exists(name: str) -> bool:
+    """Report whether *name* can be resolved on PATH."""
+    located = resolve_command(name)
+    return located is not None
+
+
+def get_python_command() -> str:
+    """Return the interpreter used for child Python processes.
+
+    Prefers the running interpreter, then a PATH lookup of ``python3`` /
+    ``python``, and finally falls back to the bare name ``"python"``.
+    """
+    if sys.executable:
+        return sys.executable
+    located = resolve_command("python3", "python")
+    return located if located else "python"
+
+
+def _path_is_within(root: Path, candidate: str | Path) -> bool:
+    """Return True when *candidate* resolves to *root* or a path beneath it.
+
+    Resolution errors and paths outside *root* both yield False.
+    """
+    try:
+        resolved_candidate = Path(candidate).resolve()
+        resolved_candidate.relative_to(root.resolve())
+    except (OSError, ValueError):
+        return False
+    else:
+        return True
+
+
+def using_repo_local_venv() -> bool:
+    """Report whether the launcher's interpreter lives inside the repo ``.venv``."""
+    venv_root = SCRIPT_DIR / ".venv"
+    interpreter = get_python_command()
+    return _path_is_within(venv_root, interpreter)
+
+
+def is_linux() -> bool:
+    """Return True when the current platform identifier starts with ``linux``."""
+    platform_name = sys.platform
+    return platform_name.startswith("linux")
+
+
+def shell_join(args: Sequence[str]) -> str:
+    """Render *args* as a single POSIX-shell-quoted command string."""
+    quoted_parts = [shlex.quote(argument) for argument in args]
+    return " ".join(quoted_parts)
+
+
+def get_node_command() -> str | None:
+    """Locate the Node.js executable, trying ``node.exe`` first on Windows."""
+    candidates = ("node.exe", "node") if sys.platform == "win32" else ("node",)
+    return resolve_command(*candidates)
+
+
+def get_npm_command() -> str | None:
+    """Locate npm, trying ``npm.cmd`` and ``npm.exe`` first on Windows."""
+    candidates = ("npm.cmd", "npm.exe", "npm") if sys.platform == "win32" else ("npm",)
+    return resolve_command(*candidates)
+
+
+def get_lean_command() -> str | None:
+    """Locate the ``lean`` executable, trying ``lean.exe`` first on Windows."""
+    candidates = ("lean.exe", "lean") if sys.platform == "win32" else ("lean",)
+    return resolve_command(*candidates)
+
+
+def get_lake_command() -> str | None:
+    """Locate the ``lake`` executable, trying ``lake.exe`` first on Windows."""
+    candidates = ("lake.exe", "lake") if sys.platform == "win32" else ("lake",)
+    return resolve_command(*candidates)
+
+
+def get_z3_command() -> str | None:
+    """Locate the ``z3`` executable, trying ``z3.exe`` first on Windows."""
+    candidates = ("z3.exe", "z3") if sys.platform == "win32" else ("z3",)
+    return resolve_command(*candidates)
+
+
+def port_in_use(port: int) -> bool:
+    """Report whether TCP *port* cannot currently be bound on 127.0.0.1.
+
+    The probe socket is closed again before returning, so a False result
+    does not reserve the port.
+    """
+    probe = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
+    with probe:
+        try:
+            probe.bind(("127.0.0.1", port))
+        except OSError:
+            return True
+        return False
+
+
+def find_free_port(start: int, exclude: set[int] | None = None) -> int:
+    """Return the first bindable port in a 2000-port window starting at *start*.
+
+    Args:
+        start: First port number to probe.
+        exclude: Ports that must never be returned even if they are free.
+
+    Returns:
+        The lowest port in the window that is neither excluded nor in use.
+
+    Raises:
+        RuntimeError: If no port in the window qualifies.
+    """
+    blocked_ports = exclude or set()
+    # Valid TCP ports end at 65535. Probing beyond that makes socket.bind
+    # raise OverflowError (not OSError), which would escape the probe instead
+    # of ending in the RuntimeError below, so clamp the window.
+    upper_bound = min(start + 2000, 65536)
+    for candidate in range(start, upper_bound):
+        if candidate in blocked_ports:
+            continue
+        if not port_in_use(candidate):
+            return candidate
+    raise RuntimeError(f"Could not find a free port starting from {start}.")
+
+
+def resolve_launcher_path(raw: str | None) -> str | None:
+    """Turn an optional path setting into an absolute, resolved path string.
+
+    Missing or blank values yield None. Relative paths are anchored at the
+    directory containing the launcher script.
+    """
+    if not (raw and raw.strip()):
+        return None
+    requested = Path(raw)
+    anchored = requested if requested.is_absolute() else SCRIPT_DIR / requested
+    return str(anchored.resolve())
+
+
+def sanitize_instance_id(raw: str | None) -> str | None:
+    """Normalize an identifier to the characters ``A-Z a-z 0-9 . _ -``.
+
+    Every other character becomes ``_`` and leading/trailing underscores are
+    trimmed. Missing, blank, or fully stripped input yields None.
+    """
+    if not (raw and raw.strip()):
+        return None
+    cleaned = re.sub(r"[^A-Za-z0-9._-]", "_", raw).strip("_")
+    return cleaned or None
+
+
+def new_instance_id() -> str:
+    """Build a fresh id shaped ``instance_<YYYYmmdd>_<HHMMSS>_<4 digits>``.
+
+    The timestamp is local time and the trailing number is a random integer
+    between 1000 and 9999 inclusive.
+    """
+    stamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+    return "instance_{}_{}".format(stamp, randint(1000, 9999))
+
+
+def clear_console() -> None:
+    """Clear the terminal with the platform's shell command (``cls``/``clear``)."""
+    clear_command = "clear"
+    if sys.platform == "win32":
+        clear_command = "cls"
+    os.system(clear_command)
+
+
+def print_banner() -> None:
+    """Print the framed launcher title in cyan, followed by a blank line."""
+    rule = "================================================================"
+    for banner_line in (rule, "  MOTO System Launcher", rule):
+        cprint(banner_line, CYAN)
+    print()
+
+
+def resolve_instance_runtime() -> InstanceRuntime:
+    """Resolve identity, storage roots, ports and namespaces for this launch.
+
+    Inputs are the ``MOTO_*`` environment variables (with ``HOST`` / ``PORT`` /
+    ``FRONTEND_PORT`` as fallbacks) and, when none of the identity, root,
+    port, or namespace overrides is set, the persisted last-instance record.
+
+    Returns:
+        The fully resolved, immutable ``InstanceRuntime``.
+
+    Raises:
+        ValueError: If a port environment variable is not an integer.
+        RuntimeError: If an explicitly requested port is already in use, if
+            the explicit frontend port equals the backend port, or if no
+            free port can be found.
+    """
+    explicit_id = sanitize_instance_id(os.environ.get("MOTO_INSTANCE_ID"))
+    explicit_data = resolve_launcher_path(os.environ.get("MOTO_DATA_ROOT"))
+    explicit_log = resolve_launcher_path(os.environ.get("MOTO_LOG_ROOT"))
+    explicit_secret = sanitize_instance_id(os.environ.get("MOTO_SECRET_NAMESPACE"))
+    explicit_storage = sanitize_instance_id(os.environ.get("MOTO_FRONTEND_STORAGE_PREFIX"))
+
+    # The host is not counted as an "explicit runtime" override below.
+    backend_host = os.environ.get("MOTO_BACKEND_HOST") or os.environ.get("HOST") or "0.0.0.0"
+
+    # First non-empty variable wins; int() raises ValueError on bad input.
+    explicit_backend_port = None
+    for variable in ("MOTO_BACKEND_PORT", "PORT"):
+        value = os.environ.get(variable)
+        if value:
+            explicit_backend_port = int(value)
+            break
+
+    explicit_frontend_port = None
+    for variable in ("MOTO_FRONTEND_PORT", "FRONTEND_PORT"):
+        value = os.environ.get(variable)
+        if value:
+            explicit_frontend_port = int(value)
+            break
+
+    default_data = str((SCRIPT_DIR / "backend" / "data").resolve())
+    default_log = str((SCRIPT_DIR / "backend" / "logs").resolve())
+    default_backend = 8000
+    default_frontend = 5173
+
+    # Any single override marks the whole launch as explicit.
+    has_explicit_runtime = any(
+        value is not None
+        for value in (
+            explicit_id,
+            explicit_data,
+            explicit_log,
+            explicit_backend_port,
+            explicit_frontend_port,
+            explicit_secret,
+            explicit_storage,
+        )
+    )
+
+    # ------------------------------------------------------------------
+    # CRITICAL: keyring namespace stability across every relaunch.
+    #
+    # Previously, a "fresh" launch with free default ports would mint
+    # `instance_id="default"` with `secret_namespace=None` but never record
+    # that choice. If the very next launch happened to find default ports
+    # busy (e.g. Windows TIME_WAIT on 8000/5173), the launcher fell back to
+    # minting a brand-new timestamped instance_id and therefore a brand-new
+    # keyring service name, which made the saved OpenRouter / Wolfram keys
+    # look like they had disappeared. A third launch would flip back to the
+    # default namespace and "rediscover" the original key. This is the
+    # 1/3-startup key-loss symptom.
+    #
+    # Fix: `save_last_instance_record` is invoked for EVERY non-explicit
+    # launch (including default), and here on every non-explicit relaunch we
+    # prefer the recorded runtime when it is not currently live — regardless
+    # of whether the default ports are free. This keeps the keyring service
+    # name and data root perfectly stable across restarts.
+    # ------------------------------------------------------------------
+    reused_record: dict | None = None
+    blocked_record_instance_id: str | None = None
+    if not has_explicit_runtime:
+        last_record = load_last_instance_record()
+        if last_record is not None:
+            candidate_id = sanitize_instance_id(last_record.get("instance_id")) or "default"
+            # Instance ids the launcher state currently reports as active.
+            live_instance_ids = {
+                str(active.get("instance_id") or "").strip()
+                for active in cleanup_launcher_state()
+                if isinstance(active, dict)
+            }
+            if candidate_id not in live_instance_ids:
+                reused_record = {
+                    "instance_id": candidate_id,
+                    "data_root": last_record.get("data_root") or None,
+                    "log_root": last_record.get("log_root") or None,
+                    "secret_namespace": last_record.get("secret_namespace"),
+                    "storage_prefix": last_record.get("storage_prefix"),
+                }
+            else:
+                # The recorded instance is still running; do not share it.
+                blocked_record_instance_id = candidate_id
+
+    # Decide the instance identity.
+    if has_explicit_runtime:
+        instance_id = explicit_id or new_instance_id()
+    elif reused_record is not None:
+        instance_id = reused_record["instance_id"]
+    else:
+        # No reusable record: either there is no recorded runtime yet, or the
+        # recorded instance is currently live.
+        # Only "adopt" the default instance if the default ports are
+        # currently free AND the recorded live instance is not already using
+        # the default identity. Otherwise mint a fresh namespace so we do not
+        # collide with an active default data root/keyring namespace, or with
+        # whatever process is holding 8000/5173.
+        defaults_free = not port_in_use(default_backend) and not port_in_use(default_frontend)
+        instance_id = (
+            "default"
+            if defaults_free and blocked_record_instance_id != "default"
+            else new_instance_id()
+        )
+
+    is_default_instance = instance_id == "default"
+
+    # Resolve data / log roots.
+    # Precedence in both branches: explicit env value, then recorded value,
+    # then the built-in location.
+    if is_default_instance:
+        data_root = explicit_data or (reused_record or {}).get("data_root") or default_data
+        log_root = explicit_log or (reused_record or {}).get("log_root") or default_log
+    else:
+        instance_root = (SCRIPT_DIR / ".moto_instances" / instance_id).resolve()
+        data_root = (
+            explicit_data
+            or (reused_record or {}).get("data_root")
+            or str(instance_root / "data")
+        )
+        log_root = (
+            explicit_log
+            or (reused_record or {}).get("log_root")
+            or str(instance_root / "logs")
+        )
+
+    # Resolve ports. We always pick a free port; ports are not part of the
+    # keyring namespace, so changing them between launches is safe.
+    if explicit_backend_port is not None:
+        if port_in_use(explicit_backend_port):
+            raise RuntimeError(f"Requested backend port {explicit_backend_port} is already in use.")
+        backend_port = explicit_backend_port
+    else:
+        backend_port = default_backend if not port_in_use(default_backend) else find_free_port(default_backend)
+
+    if explicit_frontend_port is not None:
+        if explicit_frontend_port == backend_port:
+            raise RuntimeError(f"Frontend port cannot match backend port ({backend_port}).")
+        if port_in_use(explicit_frontend_port):
+            raise RuntimeError(f"Requested frontend port {explicit_frontend_port} is already in use.")
+        frontend_port = explicit_frontend_port
+    else:
+        if not port_in_use(default_frontend) and default_frontend != backend_port:
+            frontend_port = default_frontend
+        else:
+            frontend_port = find_free_port(default_frontend, exclude={backend_port})
+
+    # Resolve secret namespace / storage prefix.
+    # Default instance: explicit shared "no namespace" → keyring service
+    # name has no suffix (legacy). Non-default instance: namespace is the
+    # instance_id unless explicitly overridden or reused from a record that
+    # stored an explicit override.
+    if is_default_instance:
+        secret_namespace = explicit_secret or (reused_record or {}).get("secret_namespace")
+        storage_prefix = explicit_storage or (reused_record or {}).get("storage_prefix")
+    else:
+        recorded_secret = (reused_record or {}).get("secret_namespace")
+        recorded_storage = (reused_record or {}).get("storage_prefix")
+        secret_namespace = (
+            explicit_secret
+            or (sanitize_instance_id(recorded_secret) if recorded_secret else None)
+            or instance_id
+        )
+        storage_prefix = (
+            explicit_storage
+            or (sanitize_instance_id(recorded_storage) if recorded_storage else None)
+            or instance_id
+        )
+
+    return InstanceRuntime(
+        instance_id=instance_id,
+        backend_host=backend_host,
+        backend_port=backend_port,
+        frontend_port=frontend_port,
+        data_root=str(Path(data_root).resolve()),
+        log_root=str(Path(log_root).resolve()),
+        secret_namespace=secret_namespace,
+        storage_prefix=storage_prefix,
+        is_default=is_default_instance,
+        explicit_override=has_explicit_runtime,
+    )
+
+
+def run_visible(args: list[str], cwd: str | None = None, check: bool = True) -> int:
+    """Run *args* with inherited stdio and return the process exit code.
+
+    Args:
+        args: Command and arguments, executed without a shell.
+        cwd: Working directory for the child process, if any.
+        check: Accepted for backward compatibility only. A failing command
+            has always been reported through the return value rather than
+            an exception, so this flag does not change the outcome.
+
+    Returns:
+        The child's exit code; callers decide how to react to non-zero.
+    """
+    # The former `if check and returncode != 0` branch returned the very same
+    # value as the fall-through path, so it has been folded away.
+    return subprocess.run(args, cwd=cwd, check=False).returncode
+
+
+def run_silent(args: list[str], cwd: str | None = None) -> int:
+    """Run *args* with stdout and stderr discarded and return the exit code."""
+    completed = subprocess.run(
+        args,
+        cwd=cwd,
+        check=False,
+        stdout=subprocess.DEVNULL,
+        stderr=subprocess.DEVNULL,
+    )
+    return completed.returncode
+
+
+def has_desktop_session() -> bool:
+    """Report whether ``DISPLAY`` or ``WAYLAND_DISPLAY`` is set and non-empty."""
+    display_variables = ("DISPLAY", "WAYLAND_DISPLAY")
+    return any(os.environ.get(variable) for variable in display_variables)
+
+
+def resolve_linux_terminal() -> tuple[str, str] | None:
+    """Pick the first available terminal emulator for a Linux desktop session.
+
+    Returns:
+        ``(terminal_name, resolved_path)`` for the first candidate found on
+        PATH, or None when not on Linux, no display variable is set, or no
+        candidate is installed.
+    """
+    if is_linux() and has_desktop_session():
+        for terminal_name in ("x-terminal-emulator", "gnome-terminal", "konsole", "xterm"):
+            terminal_path = resolve_command(terminal_name)
+            if terminal_path:
+                return terminal_name, terminal_path
+    return None
+
+
+def build_linux_terminal_command(
+    terminal_name: str,
+    terminal_path: str,
+    title: str,
+    args: Sequence[str],
+    cwd: str,
+) -> list[str]:
+    """Build the argv that opens a titled terminal running *args* in *cwd*.
+
+    The service command always runs through ``bash -lc``; only the
+    terminal-specific title/exec flags in front of it differ.
+    """
+    shell_command = f"cd {shlex.quote(cwd)} && exec {shell_join(args)}"
+    shell_tail = ["bash", "-lc", shell_command]
+    if terminal_name == "gnome-terminal":
+        terminal_prefix = [terminal_path, f"--title={title}", "--"]
+    elif terminal_name == "konsole":
+        terminal_prefix = [terminal_path, "-p", f"tabtitle={title}", "-e"]
+    else:
+        # x-terminal-emulator, xterm and anything else share this form.
+        terminal_prefix = [terminal_path, "-T", title, "-e"]
+    return terminal_prefix + shell_tail
+
+
+def resolve_windows_console_executable(executable: str) -> str:
+    """Prefer a PATH-safe executable name when building cmd.exe command text.
+
+    On Windows, an absolute path is shortened to its bare file name when a
+    PATH lookup of that name resolves to the very same file. In every other
+    case the stripped input is returned unchanged.
+    """
+    candidate = str(executable or "").strip()
+    is_windows_absolute = sys.platform == "win32" and bool(candidate) and os.path.isabs(candidate)
+    if not is_windows_absolute:
+        return candidate
+
+    target = Path(candidate)
+    on_path = resolve_command(target.name)
+    if on_path:
+        try:
+            same_file = Path(on_path).resolve() == target.resolve()
+        except OSError:
+            same_file = False
+        if same_file:
+            return target.name
+
+    return candidate
+
+
+def windows_service_requires_direct_launch(args: Sequence[str]) -> bool:
+    """Return True when cmd.exe quoting would be unsafe for this command.
+
+    That is the case only on Windows, for an absolute executable path that
+    contains whitespace and cannot be shortened to a PATH-safe name.
+    """
+    if sys.platform == "win32" and args:
+        launcher = str(args[0] or "").strip()
+        if launcher and os.path.isabs(launcher):
+            unchanged = resolve_windows_console_executable(launcher) == launcher
+            return unchanged and any(character.isspace() for character in launcher)
+    return False
+
+
+def build_windows_service_command(title: str, args: Sequence[str]) -> str:
+    """Build a cmd.exe-safe command string for a titled service window.
+
+    The executable (first argument) is replaced by its PATH-safe name when
+    possible; the result is ``title <title> && <quoted command line>``.
+    """
+    command_parts = list(args)
+    if command_parts:
+        first, *rest = command_parts
+        command_parts = [resolve_windows_console_executable(str(first)), *rest]
+    rendered = subprocess.list2cmdline(command_parts)
+    return f"title {title} && {rendered}"
+
+
+def launch_windows_service(title: str, args: Sequence[str], cwd: str, env: dict[str, str]) -> LaunchedService:
+    """Start a service in its own console window and describe the process.
+
+    The command normally runs through ``cmd /k`` so the window carries
+    *title*; it is started directly when cmd.exe quoting would be unsafe.
+    """
+    # Some Windows tools (notably npm.cmd under "Program Files") break when a
+    # quoted absolute path is embedded inside a `cmd /k` string, so such
+    # commands bypass cmd.exe entirely.
+    if windows_service_requires_direct_launch(args):
+        popen_args = list(args)
+    else:
+        popen_args = ["cmd", "/k", build_windows_service_command(title, args)]
+
+    process = subprocess.Popen(
+        popen_args,
+        cwd=cwd,
+        env=env,
+        # Falls back to 0 where the flag is not defined (non-Windows builds).
+        creationflags=getattr(subprocess, "CREATE_NEW_CONSOLE", 0),
+    )
+    return LaunchedService(title=title, pid=process.pid, mode="window")
+
+
+def launch_linux_terminal_service(
+    title: str,
+    args: Sequence[str],
+    cwd: str,
+    env: dict[str, str],
+) -> LaunchedService | None:
+    """Start a service inside a new terminal emulator window on Linux.
+
+    Returns:
+        The launched-service record, or None when no terminal emulator is
+        available or the terminal could not be started.
+    """
+    located_terminal = resolve_linux_terminal()
+    if located_terminal is not None:
+        terminal_name, terminal_path = located_terminal
+        try:
+            process = subprocess.Popen(
+                build_linux_terminal_command(terminal_name, terminal_path, title, args, cwd),
+                cwd=cwd,
+                env=env,
+                start_new_session=True,
+            )
+        except OSError:
+            # Fall through so the caller can pick another launch mode.
+            pass
+        else:
+            return LaunchedService(title=title, pid=process.pid, mode="terminal")
+    return None
+
+
+def launch_background_service(
+    title: str,
+    service_slug: str,
+    args: Sequence[str],
+    cwd: str,
+    env: dict[str, str],
+    log_root: str,
+) -> LaunchedService:
+    """Start a service detached from any window, logging its output to a file.
+
+    Args:
+        title: Human-readable service name written to the log header.
+        service_slug: Short name used in the log file name
+            (``launcher_<slug>.log``).
+        args: Command and arguments, executed without a shell.
+        cwd: Working directory for the child process.
+        env: Environment for the child process.
+        log_root: Directory that receives the log file (created if missing).
+
+    Returns:
+        A ``LaunchedService`` in ``"background"`` mode carrying the log path.
+
+    Raises:
+        OSError: If the log file cannot be opened or the process cannot be
+            started.
+    """
+    log_path = Path(log_root) / f"launcher_{service_slug}.log"
+    log_path.parent.mkdir(parents=True, exist_ok=True)
+    # The context manager closes the launcher's handle even when a write or
+    # Popen fails; previously the handle leaked on any such error. The child
+    # keeps its own inherited copy of the descriptor.
+    with log_path.open("a", encoding="utf-8") as stream:
+        stream.write(f"\n=== {title} ({datetime.now().isoformat(timespec='seconds')}) ===\n")
+        stream.write(f"Command: {shell_join(args)}\n\n")
+        # Flush the header before the child starts appending its own output.
+        stream.flush()
+        process = subprocess.Popen(
+            list(args),
+            cwd=cwd,
+            env=env,
+            stdout=stream,
+            stderr=subprocess.STDOUT,
+            start_new_session=True,
+        )
+    return LaunchedService(title=title, pid=process.pid, mode="background", log_path=str(log_path))
+
+
+def launch_service(
+    title: str,
+    service_slug: str,
+    args: Sequence[str],
+    cwd: str,
+    env: dict[str, str],
+    log_root: str,
+) -> LaunchedService:
+    """Start a service using the best launch mode for the platform.
+
+    Windows always gets a console window. Linux tries a terminal emulator
+    first. Everything else, including a failed Linux terminal launch, falls
+    back to a detached background process with a log file.
+    """
+    if sys.platform == "win32":
+        return launch_windows_service(title, args, cwd, env)
+
+    launched = launch_linux_terminal_service(title, args, cwd, env) if is_linux() else None
+    if launched is None:
+        launched = launch_background_service(title, service_slug, args, cwd, env, log_root)
+    return launched
+
+
+def cleanup_relaunch_artifacts(cleanup_paths: list[Path]) -> None:
+    """Hand every path in *cleanup_paths* to ``cleanup_path``; no-op if empty."""
+    for stale_path in cleanup_paths or ():
+        cleanup_path(stale_path)
+
+
+def handle_available_updates(launcher_args: list[str]) -> bool:
+    """Check for an update, report the outcome and optionally apply it.
+
+    Args:
+        launcher_args: Arguments forwarded to ``apply_update`` when the user
+            accepts the update.
+
+    Returns:
+        False only when ``apply_update`` reported success; True in every
+        other case (check failed, already current, update not applicable,
+        user declined, or applying failed).
+        NOTE(review): presumably the caller continues the normal launch on
+        True and stops on False - confirm against the call site.
+    """
+    cprint("[Update] Checking for main-branch updates...", YELLOW)
+    result = check_for_updates()
+
+    if result.install_state.active_instance_count:
+        count = result.install_state.active_instance_count
+        suffix = "s" if count != 1 else ""
+        cprint(f"[Update] Detected {count} launcher-managed instance{suffix} from this install.", YELLOW)
+
+    # A failed check is not fatal: record the notice and keep going.
+    if result.error:
+        cprint(f"[Update] Skipping update check: {result.error}", YELLOW)
+        write_update_notice(result)
+        print()
+        return True
+
+    if result.warning:
+        cprint(f"[Update] {result.warning}", YELLOW)
+
+    if not result.update_available:
+        write_update_notice(result)
+        cprint(
+            f"[Update] Launcher is already on {result.local_manifest.version} ({result.local_manifest.short_commit}).",
+            GREEN,
+        )
+        print()
+        return True
+
+    remote_manifest = result.remote_manifest
+    # Guards the attribute access below; note that asserts are stripped
+    # when Python runs with -O.
+    assert remote_manifest is not None
+    cprint(
+        f"[Update] Found {remote_manifest.version} ({remote_manifest.short_commit}) on GitHub main.",
+        YELLOW,
+    )
+
+    if not result.can_apply_update:
+        # Avoid repeating the reason when a warning was already printed above.
+        if not result.warning:
+            cprint(f"[Update] {result.install_state.reason}", YELLOW)
+        write_update_notice(result)
+        cprint("[Update] Update notice saved — the app will show an in-app banner.", YELLOW)
+        print()
+        return True
+
+    if not show_yes_no_dialog("MOTO Update Available", build_update_prompt(result)):
+        cprint("[Update] Continuing without applying the update.", YELLOW)
+        write_update_notice(result)
+        print()
+        return True
+
+    applied, message = apply_update(result, launcher_args, os.environ)
+    cprint(f"[Update] {message}", GREEN if applied else YELLOW)
+    print()
+    return not applied
+
+
+def check_python_installation() -> None:
+    """Step 1/8: report the Python interpreter the launcher will use.
+
+    Prints the interpreter version and path and, on Linux, whether the
+    repo-local ``.venv`` is in use. Exits via ``exit_with_pause(1)`` when no
+    interpreter command is available.
+
+    Raises:
+        OSError / subprocess.CalledProcessError: If running
+            ``<python> --version`` fails.
+    """
+    cprint("[1/8] Checking Python installation...", YELLOW)
+    python_cmd = get_python_command()
+    # NOTE(review): get_python_command() falls back to the literal "python",
+    # so it never returns an empty value and this branch looks unreachable;
+    # a missing interpreter would instead surface from check_output below.
+    if not python_cmd:
+        print()
+        cprint("============================================================", RED)
+        cprint("ERROR: Python 3.8+ is required to run the launcher", RED)
+        cprint("============================================================", RED)
+        print()
+        if is_linux():
+            cprint("Install Python 3 and python3-venv, then launch via `Launch MOTO.sh`.", YELLOW)
+            cprint("Example: sudo apt install python3 python3-venv", YELLOW)
+        else:
+            cprint("Please install Python 3.8+ from:", YELLOW)
+            cprint("https://www.python.org/downloads/", YELLOW)
+            print()
+            cprint("IMPORTANT: Check 'Add Python to PATH' during installation", YELLOW)
+        exit_with_pause(1)
+
+    version = subprocess.check_output([python_cmd, "--version"], text=True).strip()
+    cprint(version, GREEN)
+    cprint(f"Interpreter: {python_cmd}", WHITE)
+    if is_linux():
+        if using_repo_local_venv():
+            cprint("Using repo-local .venv for Ubuntu-safe package installs.", GREEN)
+        else:
+            cprint("Tip: `Launch MOTO.sh` is the recommended Ubuntu 24.04 entrypoint because it keeps Python packages inside the repo-local .venv.", YELLOW)
+    print()
+
+
+def check_node_installation() -> None:
+    """Step 2/8: verify that Node.js and npm are available and print versions.
+
+    Exits via ``exit_with_pause(1)`` with installation guidance when either
+    ``node`` or ``npm`` cannot be found on PATH.
+
+    Raises:
+        OSError / subprocess.CalledProcessError: If running
+            ``node --version`` or ``npm --version`` fails.
+    """
+    cprint("[2/8] Checking Node.js installation...", YELLOW)
+    node_cmd = get_node_command()
+    if not node_cmd:
+        print()
+        cprint("============================================================", RED)
+        cprint("ERROR: Node.js is not installed or not in PATH", RED)
+        cprint("============================================================", RED)
+        print()
+        if is_linux():
+            cprint("Install Node.js 16+ from nodejs.org or your Ubuntu package source, then retry.", YELLOW)
+        else:
+            cprint("Please install Node.js 16+ from:", YELLOW)
+            cprint("https://nodejs.org/", YELLOW)
+        exit_with_pause(1)
+
+    # node was found; npm is looked up separately and can still be missing.
+    npm_cmd = get_npm_command()
+    if not npm_cmd:
+        print()
+        cprint("============================================================", RED)
+        cprint("ERROR: npm is not available in PATH", RED)
+        cprint("============================================================", RED)
+        print()
+        cprint("Node.js appears to be installed, but npm could not be found.", YELLOW)
+        if is_linux():
+            cprint("Reinstall Node.js and ensure both `node` and `npm` are available in PATH.", YELLOW)
+        else:
+            cprint("Reinstall Node.js from https://nodejs.org/ and ensure npm is included in PATH.", YELLOW)
+        exit_with_pause(1)
+
+    node_version = subprocess.check_output([node_cmd, "--version"], text=True).strip()
+    npm_version = subprocess.check_output([npm_cmd, "--version"], text=True).strip()
+    cprint(f"Node: {node_version}", GREEN)
+    cprint(f"npm: {npm_version}", GREEN)
+    print()
+
+
+def prepare_runtime_and_environment() -> tuple[InstanceRuntime, str, str, dict[str, str]]:
+    """Step 3/8: resolve the runtime, create its directories and build the env.
+
+    Returns:
+        ``(runtime, frontend_url, backend_url, env)`` where ``env`` is a copy
+        of the current environment extended with the ``MOTO_*`` / ``VITE_*``
+        variables (plus ``HOST`` / ``PORT`` / ``FRONTEND_PORT``) describing
+        the resolved runtime. Note that the frontend URL comes before the
+        backend URL.
+
+    Raises:
+        ValueError / RuntimeError: Propagated from
+            ``resolve_instance_runtime``.
+    """
+    cprint("[3/8] Resolving instance runtime...", YELLOW)
+    runtime = resolve_instance_runtime()
+    frontend_url = f"http://localhost:{runtime.frontend_port}"
+    backend_url = f"http://localhost:{runtime.backend_port}"
+    user_uploads = os.path.join(runtime.data_root, "user_uploads")
+
+    for directory in (runtime.data_root, runtime.log_root, user_uploads):
+        os.makedirs(directory, exist_ok=True)
+
+    # Used only to choose the status message printed below.
+    last_record = load_last_instance_record()
+    reused_from_record = (
+        last_record is not None
+        and sanitize_instance_id(last_record.get("instance_id")) == runtime.instance_id
+        and not runtime.explicit_override
+    )
+
+    if runtime.explicit_override:
+        cprint(
+            "Explicit instance overrides detected (MOTO_INSTANCE_ID / MOTO_DATA_ROOT / "
+            "MOTO_SECRET_NAMESPACE). This launch will NOT update the persisted last-instance "
+            "record so a plain relaunch still points back at your default setup.",
+            YELLOW,
+        )
+    elif runtime.is_default:
+        if reused_from_record:
+            cprint(
+                "Reusing the default instance runtime (shared keyring namespace, stable data root).",
+                GREEN,
+            )
+        else:
+            cprint("Using default instance storage (shared keyring namespace).", GREEN)
+    else:
+        if reused_from_record:
+            cprint(
+                "Reusing previously launched instance runtime (same secret namespace, same data root).",
+                GREEN,
+            )
+        else:
+            cprint("Launching an isolated instance with its own data root and keyring namespace.", GREEN)
+
+    cprint(f"Instance ID: {runtime.instance_id}", CYAN)
+    cprint(f"Backend URL: {backend_url}", GREEN)
+    cprint(f"Frontend URL: {frontend_url}", GREEN)
+    cprint(f"Data root: {runtime.data_root}", WHITE)
+    cprint(f"Log root: {runtime.log_root}", WHITE)
+    if runtime.secret_namespace:
+        cprint(f"Secret namespace: {runtime.secret_namespace}", WHITE)
+    else:
+        cprint("Secret namespace: shared default store", WHITE)
+    print()
+
+    # Child services receive the resolved runtime through their environment;
+    # both the MOTO_-prefixed and the generic variable names are set.
+    env = os.environ.copy()
+    env["MOTO_INSTANCE_ID"] = runtime.instance_id
+    env["MOTO_DATA_ROOT"] = runtime.data_root
+    env["MOTO_LOG_ROOT"] = runtime.log_root
+    env["MOTO_BACKEND_HOST"] = runtime.backend_host
+    env["HOST"] = runtime.backend_host
+    env["MOTO_BACKEND_PORT"] = str(runtime.backend_port)
+    env["PORT"] = str(runtime.backend_port)
+    env["MOTO_FRONTEND_PORT"] = str(runtime.frontend_port)
+    env["FRONTEND_PORT"] = str(runtime.frontend_port)
+    env["VITE_MOTO_FRONTEND_PORT"] = str(runtime.frontend_port)
+    env["VITE_MOTO_BACKEND_URL"] = backend_url
+    env["VITE_MOTO_INSTANCE_ID"] = runtime.instance_id
+    env["VITE_MOTO_DATA_ROOT_DISPLAY"] = runtime.data_root
+
+    # Drop inherited values when the runtime uses the shared defaults, so a
+    # stale variable from the parent environment cannot leak into children.
+    if runtime.storage_prefix:
+        env["MOTO_FRONTEND_STORAGE_PREFIX"] = runtime.storage_prefix
+        env["VITE_MOTO_STORAGE_PREFIX"] = runtime.storage_prefix
+    else:
+        env.pop("MOTO_FRONTEND_STORAGE_PREFIX", None)
+        env.pop("VITE_MOTO_STORAGE_PREFIX", None)
+
+    if runtime.secret_namespace:
+        env["MOTO_SECRET_NAMESPACE"] = runtime.secret_namespace
+    else:
+        env.pop("MOTO_SECRET_NAMESPACE", None)
+
+    return runtime, frontend_url, backend_url, env
+
+
+def install_python_dependencies() -> None:
+    """Step 4/8: upgrade pip and install ``requirements.txt`` with pip.
+
+    Both commands run from the launcher directory with the launcher's
+    interpreter. A failed requirements install prints troubleshooting hints
+    and exits via ``exit_with_pause(1)``.
+    """
+    cprint("[4/8] Installing Python dependencies...", YELLOW)
+    cprint("Upgrading pip and checking packages...", YELLOW)
+    print()
+    python_cmd = get_python_command()
+    # The pip self-upgrade is best-effort: output and exit code are ignored.
+    run_silent([python_cmd, "-m", "pip", "install", "--upgrade", "pip"], cwd=str(SCRIPT_DIR))
+    result = run_visible(
+        [python_cmd, "-m", "pip", "install", "--upgrade", "-r", "requirements.txt"],
+        cwd=str(SCRIPT_DIR),
+        check=False,
+    )
+    if result != 0:
+        print()
+        cprint("============================================================", RED)
+        cprint("ERROR: Failed to install Python dependencies", RED)
+        cprint("============================================================", RED)
+        print()
+        cprint("Please check:", YELLOW)
+        cprint("- Internet connection is working", YELLOW)
+        cprint("- You have permission to install packages", YELLOW)
+        if is_linux():
+            cprint("- On Ubuntu 24.04, prefer launching via `Launch MOTO.sh` so installs stay inside the repo-local .venv", YELLOW)
+            cprint("- If venv creation fails, install `python3-venv` first", YELLOW)
+        exit_with_pause(1)
+    cprint("Python dependencies up to date", GREEN)
+    print()
+
+
+def install_playwright_browser() -> None:
+    """Step 4b/8: install the Playwright Chromium browser used for PDFs.
+
+    Unlike the dependency install, a failure here is non-fatal: a warning
+    with a manual retry command is printed and startup continues.
+    """
+    cprint("[4b/8] Installing Playwright Chromium browser for PDF generation...", YELLOW)
+    cprint("This is a one-time download (~150MB) and may take a few minutes...", YELLOW)
+    print()
+    python_cmd = get_python_command()
+    result = run_visible([python_cmd, "-m", "playwright", "install", "chromium"], cwd=str(SCRIPT_DIR), check=False)
+    if result != 0:
+        print()
+        cprint("WARNING: Playwright Chromium install failed.", YELLOW)
+        cprint("PDF generation will not be available until resolved.", YELLOW)
+        cprint(f"Retry manually: {python_cmd} -m playwright install chromium", YELLOW)
+        if is_linux():
+            cprint("Ubuntu 24.04 may also require desktop/browser system libraries before Playwright can launch Chromium successfully.", YELLOW)
+        cprint("Continuing startup anyway...", YELLOW)
+    else:
+        cprint("Playwright Chromium ready!", GREEN)
+    print()
+
+
+def _prepend_path_entry(path_entry: str, env: dict[str, str]) -> None:
+    """Prepend a directory to PATH for the current process and child services.
+
+    The entry is added to ``os.environ["PATH"]`` only when its resolved form
+    is not already present; ``env["PATH"]`` is then synchronised with the
+    process PATH. An empty *path_entry* leaves everything untouched.
+    """
+    if not path_entry:
+        return
+
+    def _resolved(raw_path: str) -> str:
+        # Fall back to the raw text when the path cannot be resolved.
+        try:
+            return str(Path(raw_path).resolve())
+        except OSError:
+            return raw_path
+
+    existing_path = os.environ.get("PATH", "")
+    known_entries = {_resolved(part) for part in existing_path.split(os.pathsep) if part}
+    wanted_entry = _resolved(path_entry)
+    if wanted_entry not in known_entries:
+        os.environ["PATH"] = wanted_entry + os.pathsep + os.environ.get("PATH", "")
+    env["PATH"] = os.environ.get("PATH", "")
+
+
+def _write_lean_workspace_files(workspace_dir: Path) -> None:
+    """Create the reusable Lean 4 Mathlib workspace files.
+
+    Writes ``lean-toolchain``, ``lakefile.lean`` and
+    ``MOTOProofWorkspace.lean`` into *workspace_dir* (created if needed).
+    Files that already exist are left untouched.
+    """
+    workspace_dir.mkdir(parents=True, exist_ok=True)
+
+    lakefile_text = (
+        "\n".join(
+            [
+                "import Lake",
+                "open Lake DSL",
+                "",
+                "package «moto_proof_workspace» where",
+                "",
+                "require mathlib from git",
+                '  "https://github.com/leanprover-community/mathlib4.git"',
+            ]
+        )
+        + "\n"
+    )
+    seed_files = (
+        ("lean-toolchain", "leanprover/lean4:stable\n"),
+        ("lakefile.lean", lakefile_text),
+        ("MOTOProofWorkspace.lean", "import Mathlib\n"),
+    )
+    for file_name, contents in seed_files:
+        target = workspace_dir / file_name
+        if not target.exists():
+            target.write_text(contents, encoding="utf-8")
+
+
+def _download_file(url: str, destination: Path) -> None:
+    """Download ``url`` to ``destination`` using only the standard library.
+
+    The payload is streamed into a sibling ``<name>.part`` file and moved to
+    ``destination`` only after the transfer completes. Callers in this file
+    treat an existing ``destination`` as a finished, cached download, so an
+    interrupted transfer must never leave a truncated file under the final
+    name.
+
+    Raises:
+        Whatever ``urlopen`` or the file operations raise (for example
+        ``URLError`` / ``OSError``); the partial file is removed first.
+    """
+    destination.parent.mkdir(parents=True, exist_ok=True)
+    partial_path = destination.with_name(destination.name + ".part")
+    request = Request(url, headers={"User-Agent": "MOTO Launcher"})
+    try:
+        with urlopen(request, timeout=120) as response, partial_path.open("wb") as handle:
+            while True:
+                chunk = response.read(1024 * 1024)
+                if not chunk:
+                    break
+                handle.write(chunk)
+        # Same-directory rename, so the final name only ever holds a full file.
+        os.replace(partial_path, destination)
+    except BaseException:
+        # Also covers Ctrl+C mid-download: never leave a stale partial behind.
+        try:
+            partial_path.unlink()
+        except OSError:
+            pass
+        raise
+
+
+def _extract_archive(archive_path: Path, destination: Path) -> None:
+    """Extract a zip or gzip-compressed tarball into ``destination``.
+
+    The format is chosen from the archive's (case-insensitive) file name.
+    Tarballs are extracted with the ``"data"`` extraction filter when the
+    running Python provides it; on older interpreters every member path is
+    checked first so nothing can be written outside ``destination``.
+
+    Raises:
+        RuntimeError: the extension is not ``.zip``, ``.tar.gz`` or ``.tgz``,
+            or (fallback path) a tar member would escape ``destination``.
+    """
+    destination.mkdir(parents=True, exist_ok=True)
+    archive_name = archive_path.name.lower()
+    if archive_name.endswith(".zip"):
+        # ZipFile.extractall already strips absolute paths and ".." components.
+        with zipfile.ZipFile(archive_path) as archive:
+            archive.extractall(destination)
+        return
+    if archive_name.endswith((".tar.gz", ".tgz")):
+        with tarfile.open(archive_path, "r:gz") as archive:
+            if hasattr(tarfile, "data_filter"):
+                # Extraction filters reject traversal, absolute paths and
+                # device files, and avoid the 3.12+ deprecation warning.
+                archive.extractall(destination, filter="data")
+            else:
+                root = destination.resolve()
+                for member in archive.getmembers():
+                    target = (root / member.name).resolve()
+                    if target != root and root not in target.parents:
+                        raise RuntimeError(
+                            f"Refusing to extract unsafe archive member: {member.name}"
+                        )
+                archive.extractall(destination)
+        return
+    raise RuntimeError(f"Unsupported archive format: {archive_path.name}")
+
+
+def _detect_z3_asset_name() -> tuple[str, tuple[str, ...]]:
+    """Return ``(platform_marker, arch_markers)`` for matching Z3 assets.
+
+    ``platform_marker`` is ``"win"`` on Windows and ``"glibc"`` on Linux;
+    ``arch_markers`` lists the acceptable architecture substrings.
+
+    Raises:
+        RuntimeError: the CPU architecture or the platform is unsupported.
+    """
+    x64_markers = ("x64",)
+    arm_markers = ("arm64", "aarch64")
+    markers_by_machine = {
+        "x86_64": x64_markers,
+        "amd64": x64_markers,
+        "aarch64": arm_markers,
+        "arm64": arm_markers,
+    }
+
+    machine = platform.machine().lower()
+    arch_markers = markers_by_machine.get(machine)
+    if arch_markers is None:
+        raise RuntimeError(f"Unsupported architecture for automatic Z3 install: {machine}")
+
+    if sys.platform == "win32":
+        return "win", arch_markers
+    if is_linux():
+        return "glibc", arch_markers
+    raise RuntimeError(f"Automatic Z3 install is unsupported on platform: {sys.platform}")
+
+
+def _select_z3_asset(assets: list[dict[str, str]]) -> dict[str, str]:
+    """Return the first release asset that fits this platform and CPU.
+
+    An asset qualifies when it is a dict with a name and a download URL, is
+    not a ``.sig`` file, mentions one of the architecture markers and the
+    platform marker, and is a ``.zip`` / ``.tar.gz`` / ``.tgz`` archive.
+
+    Raises:
+        RuntimeError: no asset qualifies; the message lists the asset names.
+    """
+    platform_marker, arch_markers = _detect_z3_asset_name()
+    archive_suffixes = (".zip", ".tar.gz", ".tgz")
+
+    # Pass 1: keep well-formed, unsigned assets for this architecture.
+    usable = []
+    for entry in assets:
+        if not isinstance(entry, dict):
+            continue
+        if not (entry.get("name") and entry.get("browser_download_url")):
+            continue
+        lowered = entry["name"].lower()
+        if ".sig" in lowered:
+            continue
+        if any(marker in lowered for marker in arch_markers):
+            usable.append(entry)
+
+    # Pass 2: the first archive for this platform wins.
+    for entry in usable:
+        lowered = entry["name"].lower()
+        if platform_marker in lowered and lowered.endswith(archive_suffixes):
+            return entry
+
+    names = [entry.get("name", "<unknown>") for entry in assets if isinstance(entry, dict)]
+    readable_assets = ", ".join(names)
+    raise RuntimeError(f"Could not find a matching Z3 release asset. Available assets: {readable_assets}")
+
+
+def _find_z3_binary(search_root: Path) -> Path | None:
+    """Search ``search_root`` recursively for the Z3 executable.
+
+    On Windows ``z3.exe`` is looked for before ``z3``; elsewhere only ``z3``.
+    Returns the first regular file found, or ``None`` when there is none.
+    """
+    if sys.platform == "win32":
+        executable_names = ("z3.exe", "z3")
+    else:
+        executable_names = ("z3",)
+
+    matches = (
+        found
+        for executable_name in executable_names
+        for found in search_root.rglob(executable_name)
+        if found.is_file()
+    )
+    return next(matches, None)
+
+
+def _select_elan_windows_asset(assets: list[dict[str, str]]) -> dict[str, str]:
+    """Choose the Windows elan release zip that best fits this machine.
+
+    Upstream elan no longer publishes a bare ``elan-init.exe``; it ships
+    per-platform zip archives (for example ``elan-x86_64-pc-windows-msvc.zip``)
+    with ``elan-init.exe`` inside. The native architecture is tried first;
+    ARM64 hosts then fall back to the x86_64 build so they can still
+    bootstrap via emulation.
+
+    Raises:
+        RuntimeError: no zip asset matches; the message lists the asset names.
+    """
+    x86_markers = ("x86_64-pc-windows", "amd64-pc-windows")
+    arm_markers = ("aarch64-pc-windows", "arm64-pc-windows")
+    if platform.machine().lower() in {"aarch64", "arm64"}:
+        marker_tiers = (arm_markers, x86_markers)
+    else:
+        # Every non-ARM host only ever considers the x86_64 build.
+        marker_tiers = (x86_markers, ())
+
+    zip_assets = []
+    for entry in assets:
+        if not isinstance(entry, dict):
+            continue
+        if not (entry.get("name") and entry.get("browser_download_url")):
+            continue
+        lowered = entry["name"].lower()
+        if lowered.endswith(".zip") and ".sig" not in lowered:
+            zip_assets.append(entry)
+
+    for tier in marker_tiers:
+        match = next(
+            (
+                entry
+                for entry in zip_assets
+                if any(marker in entry["name"].lower() for marker in tier)
+            ),
+            None,
+        )
+        if match is not None:
+            return match
+
+    names = [entry.get("name", "<unknown>") for entry in assets if isinstance(entry, dict)]
+    readable_assets = ", ".join(names)
+    raise RuntimeError(
+        f"Could not find a matching elan release asset for Windows. Available assets: {readable_assets}"
+    )
+
+
+def _find_elan_installer(search_root: Path) -> Path | None:
+    """Find the extracted ``elan-init`` installer below ``search_root``.
+
+    The file name is ``elan-init.exe`` on Windows and ``elan-init`` elsewhere.
+    Returns ``None`` when ``search_root`` is missing or holds no such file.
+    """
+    if not search_root.exists():
+        return None
+
+    installer_name = "elan-init.exe" if sys.platform == "win32" else "elan-init"
+    for found in search_root.rglob(installer_name):
+        if found.is_file():
+            return found
+    return None
+
+
+def _set_lean_env_flags(
+    env: dict[str, str],
+    *,
+    enabled: bool,
+    lean_path: str = "",
+    workspace_dir: str = "",
+) -> None:
+    """Write the ``MOTO_LEAN4_*`` settings into ``env``.
+
+    Timeouts already present in ``env`` (non-blank after stripping) are kept,
+    otherwise defaults of 120 s (proof) and 600 s (LSP idle) are used. An
+    existing LSP flag is honoured only while Lean is enabled; with Lean
+    disabled the LSP flag is forced to ``"0"``.
+    """
+
+    def _existing(key: str) -> str:
+        return env.get(key, "").strip()
+
+    on_off = "1" if enabled else "0"
+
+    env["MOTO_LEAN4_ENABLED"] = on_off
+    env["MOTO_LEAN4_PATH"] = lean_path
+    env["MOTO_LEAN4_WORKSPACE_DIR"] = workspace_dir
+    env["MOTO_LEAN4_PROOF_TIMEOUT"] = _existing("MOTO_LEAN4_PROOF_TIMEOUT") or "120"
+
+    lsp_override = _existing("MOTO_LEAN4_LSP_ENABLED")
+    if enabled and lsp_override:
+        env["MOTO_LEAN4_LSP_ENABLED"] = lsp_override
+    else:
+        env["MOTO_LEAN4_LSP_ENABLED"] = on_off
+
+    env["MOTO_LEAN4_LSP_IDLE_TIMEOUT"] = _existing("MOTO_LEAN4_LSP_IDLE_TIMEOUT") or "600"
+
+
+def _set_smt_env_flags(
+    env: dict[str, str],
+    *,
+    enabled: bool,
+    z3_path: str = "",
+) -> None:
+    """Write the SMT / Z3 settings into ``env``.
+
+    A non-blank ``MOTO_SMT_TIMEOUT`` already in ``env`` is kept (stripped);
+    otherwise the timeout defaults to ``"30"``.
+    """
+    configured_timeout = env.get("MOTO_SMT_TIMEOUT", "").strip()
+    env.update(
+        {
+            "MOTO_SMT_ENABLED": "1" if enabled else "0",
+            "MOTO_Z3_PATH": z3_path,
+            "MOTO_SMT_TIMEOUT": configured_timeout if configured_timeout else "30",
+        }
+    )
+
+
+def _install_elan_windows(runtime: InstanceRuntime) -> None:
+    """Download the latest elan release zip and run its ``elan-init.exe``.
+
+    The archive is cached under ``<data_root>/elan/downloads`` and unpacked
+    into ``<data_root>/elan/current``. Any download, extraction or installer
+    failure raises; ``install_lean4`` turns that into a non-fatal warning.
+    """
+    managed_root = Path(runtime.data_root) / "elan"
+    release_request = Request(
+        "https://api.github.com/repos/leanprover/elan/releases/latest",
+        headers={
+            "User-Agent": "MOTO Launcher",
+            "Accept": "application/vnd.github+json",
+        },
+    )
+    with urlopen(release_request, timeout=60) as response:
+        release_payload = json.loads(response.read().decode("utf-8"))
+
+    asset = _select_elan_windows_asset(list(release_payload.get("assets") or []))
+    archive_path = managed_root / "downloads" / asset["name"]
+    install_root = managed_root / "current"
+
+    if not archive_path.exists():
+        _download_file(asset["browser_download_url"], archive_path)
+
+    installer_path = _find_elan_installer(install_root)
+    if installer_path is None:
+        try:
+            _extract_archive(archive_path, install_root)
+        except Exception:
+            # A truncated or corrupt cached archive would otherwise be reused
+            # on every launch; drop it so the next run downloads a fresh copy.
+            try:
+                archive_path.unlink()
+            except OSError:
+                pass
+            raise
+        installer_path = _find_elan_installer(install_root)
+
+    if installer_path is None:
+        raise RuntimeError(
+            "elan archive extracted successfully, but elan-init.exe could not be located."
+        )
+
+    install_result = run_visible(
+        [
+            str(installer_path),
+            "-y",
+            "--default-toolchain",
+            "leanprover/lean4:stable",
+        ],
+        cwd=str(SCRIPT_DIR),
+        check=False,
+    )
+    if install_result != 0:
+        raise RuntimeError("elan installer exited with a non-zero status.")
+
+
+def _install_elan_posix() -> None:
+    """Run the upstream elan install script through ``curl | sh``."""
+    install_result = subprocess.run(
+        [
+            "sh",
+            "-c",
+            "curl https://elan.lean-lang.org/install.sh -sSf | sh -s -- -y --default-toolchain leanprover/lean4:stable",
+        ],
+        cwd=str(SCRIPT_DIR),
+        check=False,
+    ).returncode
+    if install_result != 0:
+        raise RuntimeError("elan install script exited with a non-zero status.")
+
+
+def install_lean4(runtime: InstanceRuntime, env: dict[str, str]) -> None:
+    """
+    Ensure Lean 4 / elan is available for proof verification.
+
+    When ``get_lean_command()`` finds nothing, elan is installed once (release
+    zip on Windows, upstream install script elsewhere). ``~/.elan/bin`` is
+    then put on PATH, ``lean --version`` is run as a smoke test, and the
+    Mathlib workspace files are seeded under ``<data_root>/lean4_workspace``.
+    The outcome is recorded in ``env`` through ``_set_lean_env_flags``.
+
+    This step is intentionally non-fatal: if installation fails, MOTO still
+    launches and simply skips automated proof verification.
+    """
+    cprint("[4c/8] Checking Lean 4 / elan for proof verification...", YELLOW)
+    print()
+
+    elan_bin_dir = Path.home() / ".elan" / "bin"
+    lean_cmd = get_lean_command()
+
+    if lean_cmd and elan_bin_dir.exists():
+        _prepend_path_entry(str(elan_bin_dir), env)
+
+    if not lean_cmd:
+        cprint("Lean 4 not detected. Attempting one-time elan installation...", YELLOW)
+        try:
+            if sys.platform == "win32":
+                _install_elan_windows(runtime)
+            else:
+                _install_elan_posix()
+        except Exception as exc:
+            print()
+            cprint("WARNING: Lean 4 not available -- proof verification will be skipped.", YELLOW)
+            cprint(str(exc), YELLOW)
+            _set_lean_env_flags(env, enabled=False)
+            print()
+            return
+
+    # A fresh elan install lands in ~/.elan/bin, which may not be on PATH yet.
+    if elan_bin_dir.exists():
+        _prepend_path_entry(str(elan_bin_dir), env)
+
+    # Re-detect after the PATH update; both lean and lake are required.
+    lean_cmd = get_lean_command()
+    lake_cmd = get_lake_command()
+    if not lean_cmd or not lake_cmd:
+        cprint("WARNING: Lean 4 tooling is incomplete -- proof verification will be skipped.", YELLOW)
+        _set_lean_env_flags(env, enabled=False)
+        print()
+        return
+
+    try:
+        lean_version = subprocess.check_output([lean_cmd, "--version"], text=True).strip()
+        cprint(f"Lean 4 ready: {lean_version}", GREEN)
+    except Exception as exc:
+        cprint("WARNING: Lean 4 verification failed during version check -- proof verification will be skipped.", YELLOW)
+        cprint(str(exc), YELLOW)
+        _set_lean_env_flags(env, enabled=False)
+        print()
+        return
+
+    workspace_dir = Path(runtime.data_root) / "lean4_workspace"
+    try:
+        _write_lean_workspace_files(workspace_dir)
+    except Exception as exc:
+        # Best effort: Lean stays enabled even if the workspace seed failed.
+        cprint("WARNING: Lean 4 workspace files could not be prepared; proof verification may fail later.", YELLOW)
+        cprint(str(exc), YELLOW)
+
+    _set_lean_env_flags(
+        env,
+        enabled=True,
+        lean_path=str(Path(lean_cmd).resolve()),
+        workspace_dir=str(workspace_dir.resolve()),
+    )
+    cprint(f"Lean 4 workspace: {workspace_dir}", GREEN)
+    print()
+
+
+def install_z3(runtime: InstanceRuntime, env: dict[str, str]) -> None:
+    """
+    Ensure Z3 is available for optional SMT workflows.
+
+    Resolution order: the command reported by ``get_z3_command()``, then a
+    binary previously extracted under ``<data_root>/z3``, then a one-time
+    download of the latest GitHub release asset matching this platform. The
+    outcome is recorded in ``env`` through ``_set_smt_env_flags``.
+
+    This step is intentionally non-fatal: if installation fails, MOTO still
+    launches and simply disables SMT-related runtime wiring.
+    """
+    cprint("[4d/8] Checking optional Z3 / SMT solver...", YELLOW)
+    print()
+
+    managed_root = Path(runtime.data_root) / "z3"
+    z3_cmd = get_z3_command()
+
+    # Reuse a copy that an earlier launch already downloaded and unpacked.
+    if not z3_cmd and managed_root.exists():
+        managed_binary = _find_z3_binary(managed_root)
+        if managed_binary is not None:
+            _prepend_path_entry(str(managed_binary.parent), env)
+            z3_cmd = str(managed_binary.resolve())
+
+    if not z3_cmd:
+        cprint("Z3 not detected. Attempting one-time download...", YELLOW)
+        try:
+            release_request = Request(
+                "https://api.github.com/repos/Z3Prover/z3/releases/latest",
+                headers={
+                    "User-Agent": "MOTO Launcher",
+                    "Accept": "application/vnd.github+json",
+                },
+            )
+            with urlopen(release_request, timeout=60) as response:
+                release_payload = json.loads(response.read().decode("utf-8"))
+
+            asset = _select_z3_asset(list(release_payload.get("assets") or []))
+            archive_path = managed_root / "downloads" / asset["name"]
+            install_root = managed_root / "current"
+
+            if not archive_path.exists():
+                _download_file(asset["browser_download_url"], archive_path)
+
+            if not install_root.exists() or _find_z3_binary(install_root) is None:
+                try:
+                    _extract_archive(archive_path, install_root)
+                except Exception:
+                    # A truncated or corrupt cached archive would otherwise be
+                    # reused on every launch; drop it so the next run
+                    # downloads a fresh copy.
+                    try:
+                        archive_path.unlink()
+                    except OSError:
+                        pass
+                    raise
+
+            managed_binary = _find_z3_binary(install_root)
+            if managed_binary is None:
+                raise RuntimeError("Z3 archive extracted successfully, but the z3 binary could not be located.")
+
+            if sys.platform != "win32":
+                # Zip extraction does not restore the executable bit.
+                managed_binary.chmod(managed_binary.stat().st_mode | 0o111)
+
+            _prepend_path_entry(str(managed_binary.parent), env)
+            z3_cmd = str(managed_binary.resolve())
+        except Exception as exc:
+            print()
+            cprint("WARNING: Z3 is not available -- SMT integration will remain disabled.", YELLOW)
+            cprint(str(exc), YELLOW)
+            _set_smt_env_flags(env, enabled=False)
+            print()
+            return
+
+    try:
+        z3_version = subprocess.check_output(
+            [z3_cmd, "-version"],
+            text=True,
+            stderr=subprocess.STDOUT,
+        ).strip()
+        cprint(f"Z3 ready: {z3_version}", GREEN)
+    except Exception as exc:
+        cprint("WARNING: Z3 failed during version check -- SMT integration will remain disabled.", YELLOW)
+        cprint(str(exc), YELLOW)
+        _set_smt_env_flags(env, enabled=False)
+        print()
+        return
+
+    _set_smt_env_flags(
+        env,
+        enabled=True,
+        z3_path=str(Path(z3_cmd).resolve()),
+    )
+    cprint(f"Z3 binary: {z3_cmd}", GREEN)
+    print()
+
+
+def _npm_reported_vulnerabilities(npm_output: str) -> bool:
+    """Return True when npm's install summary reports at least one vulnerability.
+
+    Recognises the legacy ``N vulnerabilities found`` wording as well as the
+    current summaries (``3 vulnerabilities (1 low, 2 high)``,
+    ``1 high severity vulnerability``). ``found 0 vulnerabilities`` does not
+    count.
+    """
+    import re
+
+    lowered = npm_output.lower()
+    if "vulnerabilities found" in lowered:
+        return True
+    nonzero_summary = re.search(
+        r"(?<![\w.])[1-9]\d*\s+(?:(?:info|low|moderate|high|critical)\s+severity\s+)?vulnerabilit(?:y|ies)\b",
+        lowered,
+    )
+    return nonzero_summary is not None
+
+
+def install_frontend_dependencies() -> tuple[str, bool]:
+    """Run ``npm install`` inside ``frontend/`` and report the outcome.
+
+    npm's combined stdout/stderr is captured and echoed once the command
+    finishes, so the summary can be scanned for vulnerability warnings.
+    A missing ``frontend`` directory, missing npm, or a failing install ends
+    the launcher through ``exit_with_pause(1)``.
+
+    Returns:
+        ``(npm_cmd, vulnerability_warning)``: the npm command that was used
+        and whether npm reported vulnerabilities during the install.
+    """
+    cprint("[5/8] Checking Node.js dependencies...", YELLOW)
+    frontend_path = str(SCRIPT_DIR / "frontend")
+    if not os.path.isdir(frontend_path):
+        print()
+        cprint("============================================================", RED)
+        cprint("ERROR: frontend directory not found!", RED)
+        cprint("============================================================", RED)
+        print()
+        cprint("Make sure you're running this from the project root directory.", YELLOW)
+        exit_with_pause(1)
+
+    npm_cmd = get_npm_command()
+    if not npm_cmd:
+        print()
+        cprint("============================================================", RED)
+        cprint("ERROR: npm is not available in PATH", RED)
+        cprint("============================================================", RED)
+        print()
+        cprint("Reinstall Node.js from https://nodejs.org/ and ensure npm is included in PATH.", YELLOW)
+        exit_with_pause(1)
+
+    npm_result = subprocess.run(
+        [npm_cmd, "install"],
+        cwd=frontend_path,
+        stdout=subprocess.PIPE,
+        stderr=subprocess.STDOUT,
+        text=True,
+        check=False,
+    )
+    npm_output = npm_result.stdout or ""
+    print(npm_output, end="")
+
+    if npm_result.returncode != 0:
+        print()
+        cprint("============================================================", RED)
+        cprint("ERROR: Failed to install Node.js dependencies", RED)
+        cprint("============================================================", RED)
+        print()
+        cprint("Please check:", YELLOW)
+        cprint("- Internet connection is working", YELLOW)
+        cprint("- package.json exists in frontend directory", YELLOW)
+        exit_with_pause(1)
+
+    # The old substring test missed npm's current "N vulnerabilities (...)"
+    # summary, so the warning never surfaced on modern npm.
+    vulnerability_warning = _npm_reported_vulnerabilities(npm_output)
+    if vulnerability_warning:
+        print()
+        cprint("NOTE: npm reported vulnerability warnings during install.", YELLOW)
+        cprint("Build 1 no longer auto-runs `npm audit fix` because that can dirty a clean checkout and break updater eligibility.", YELLOW)
+        cprint("If you want to mutate dependencies intentionally, run `npm audit fix` manually inside `frontend/`.", YELLOW)
+
+    cprint("Node.js dependencies up to date", GREEN)
+    print()
+    return npm_cmd, vulnerability_warning
+
+
+def check_lm_studio() -> None:
+    """Probe the local LM Studio server and print guidance when it is absent.
+
+    Purely informational: the launcher continues either way. Any ``URLError``
+    or ``OSError`` from the probe (including HTTP error statuses) is treated
+    as "not detected".
+    """
+    cprint("[6/8] Checking LM Studio...", YELLOW)
+    print()
+    lm_available = False
+    try:
+        # Use the response as a context manager so the probe connection is
+        # closed right away instead of lingering until garbage collection.
+        with urlopen("http://127.0.0.1:1234/v1/models", timeout=3):
+            lm_available = True
+    except (URLError, OSError):
+        pass
+
+    if lm_available:
+        cprint("LM Studio is running and responding!", GREEN)
+    else:
+        cprint("================================================================", CYAN)
+        cprint("NOTE: LM Studio is not detected on http://127.0.0.1:1234", CYAN)
+        cprint("================================================================", CYAN)
+        print()
+        cprint("This is OK! You have two options for AI models:", YELLOW)
+        print()
+        cprint("  Option 1: LM Studio (Local)", YELLOW)
+        cprint("    - Download from: https://lmstudio.ai/", WHITE)
+        cprint("    - Load a model and start the Local Server", WHITE)
+        print()
+        cprint("  Option 2: OpenRouter (Cloud API)", YELLOW)
+        cprint("    - Get an API key from: https://openrouter.ai/", WHITE)
+        cprint("    - Configure in Settings tab after launch", WHITE)
+        print()
+        cprint("The system will still start with isolated instance settings.", GREEN)
+    print()
+
+
+def check_secure_keyring() -> None:
+    """Report which OS keyring backend is active, warning when none is usable.
+
+    Any failure while importing or inspecting ``keyring`` is downgraded to a
+    warning; this check never stops the launcher.
+    """
+    cprint("[6b/8] Checking secure credential storage...", YELLOW)
+    try:
+        import keyring
+
+        backend_cls = keyring.get_keyring().__class__
+        module_name = backend_cls.__module__
+        backend_name = f"{module_name}.{backend_cls.__name__}"
+        if not module_name.startswith("keyring.backends.fail"):
+            cprint(f"Keyring backend: {backend_name}", GREEN)
+        else:
+            # keyring resolved to its "fail" backend: nothing can be stored.
+            cprint("WARNING: No OS keyring backend is available right now.", YELLOW)
+            if is_linux():
+                cprint("Saved OpenRouter and Wolfram keys will not persist until a Secret Service compatible keyring is available in your desktop session.", YELLOW)
+                cprint("Ubuntu users typically resolve this by enabling a desktop keyring such as `gnome-keyring`.", YELLOW)
+            else:
+                cprint("Saved provider keys will not persist until the OS keyring becomes available.", YELLOW)
+    except Exception as exc:
+        cprint(f"WARNING: Could not inspect OS keyring availability: {exc}", YELLOW)
+    print()
+
+
+def verify_instance_ports(runtime: InstanceRuntime) -> None:
+    """Re-check that the instance's backend and frontend ports are still free.
+
+    Raises:
+        RuntimeError: either port is in use again right before launch.
+    """
+    cprint("[7/8] Final launch checks...", YELLOW)
+    for label, port in (
+        ("Backend", runtime.backend_port),
+        ("Frontend", runtime.frontend_port),
+    ):
+        if port_in_use(port):
+            raise RuntimeError(f"{label} port {port} became occupied before launch.")
+    cprint("Instance resources are ready.", GREEN)
+    print()
+
+
+def is_pid_running(pid: int) -> bool:
+    """Return True when a process with ``pid`` currently exists.
+
+    Non-positive pids are rejected up front because ``os.kill`` would treat
+    them as process groups rather than a single process.
+
+    On Windows ``os.kill(pid, 0)`` is not a harmless probe: signal 0 is
+    ``CTRL_C_EVENT`` there, so the process is queried through the Win32 API
+    instead. On POSIX a ``PermissionError`` means the process exists but
+    belongs to another user, which still counts as running.
+    """
+    if pid <= 0:
+        return False
+
+    if sys.platform == "win32":
+        import ctypes
+
+        process_query_limited_information = 0x1000
+        error_access_denied = 5
+        still_active = 259
+
+        # Private WinDLL instance so the prototypes set here stay local.
+        kernel32 = ctypes.WinDLL("kernel32", use_last_error=True)
+        kernel32.OpenProcess.restype = ctypes.c_void_p
+        kernel32.OpenProcess.argtypes = [ctypes.c_ulong, ctypes.c_int, ctypes.c_ulong]
+        handle = kernel32.OpenProcess(process_query_limited_information, 0, pid)
+        if not handle:
+            # Access denied still proves that the process exists.
+            return ctypes.get_last_error() == error_access_denied
+        try:
+            exit_code = ctypes.c_ulong()
+            queried = kernel32.GetExitCodeProcess(ctypes.c_void_p(handle), ctypes.byref(exit_code))
+            return bool(queried) and exit_code.value == still_active
+        finally:
+            kernel32.CloseHandle(ctypes.c_void_p(handle))
+
+    try:
+        os.kill(pid, 0)
+    except ProcessLookupError:
+        return False
+    except PermissionError:
+        return True
+    except OSError:
+        return False
+    return True
+
+
+def start_services(
+    runtime: InstanceRuntime,
+    env: dict[str, str],
+    frontend_url: str,
+    backend_url: str,
+    npm_cmd: str,
+) -> tuple[LaunchedService, LaunchedService]:
+    """Launch the backend, then the frontend, register the instance, open the browser.
+
+    Each service gets a fixed grace period (5 s backend, 8 s frontend) after
+    launch; a service not running in a "window" whose pid has already gone by
+    then aborts the launch.
+
+    Returns:
+        ``(backend_service, frontend_service)`` as returned by ``launch_service``.
+
+    Raises:
+        RuntimeError: a non-window service exited during its grace period.
+    """
+
+    def _ensure_started(service: LaunchedService) -> None:
+        # "window" services are not probed by pid; everything else must be alive.
+        if service.mode == "window" or is_pid_running(service.pid):
+            return
+        log_hint = f" Check {service.log_path} for details." if service.log_path else ""
+        raise RuntimeError(f"{service.title} exited during startup.{log_hint}")
+
+    separator = "================================================================"
+
+    cprint("[8/8] Starting services...", YELLOW)
+    print()
+    for banner_line in (
+        separator,
+        f"  Starting MOTO instance '{runtime.instance_id}'",
+        separator,
+    ):
+        cprint(banner_line, CYAN)
+    print()
+    cprint(f"Backend API will run on: {backend_url}", GREEN)
+    cprint(f"Frontend UI will run on: {frontend_url}", GREEN)
+    print()
+
+    if is_linux():
+        terminal = resolve_linux_terminal()
+        if terminal is None:
+            cprint("No desktop terminal emulator was detected. Services will run in the background and write logs under the active log root.", YELLOW)
+            if not has_desktop_session():
+                cprint("No DISPLAY/WAYLAND desktop session is active, so you may need to open the frontend URL manually.", YELLOW)
+        else:
+            cprint(f"Launcher will open separate Linux service terminals via {terminal[0]}.", GREEN)
+        print()
+
+    cprint("Starting services automatically in 3 seconds...", YELLOW)
+    time.sleep(3)
+    print()
+
+    uvicorn_args = [get_python_command(), "-m", "uvicorn", "backend.api.main:app"]
+    uvicorn_args += ["--host", runtime.backend_host]
+    uvicorn_args += ["--port", str(runtime.backend_port)]
+    uvicorn_args.append("--no-access-log")
+    backend_service = launch_service(
+        title=f"MOTO Backend [{runtime.instance_id}]",
+        service_slug="backend",
+        args=uvicorn_args,
+        cwd=str(SCRIPT_DIR),
+        env=env,
+        log_root=runtime.log_root,
+    )
+
+    cprint("Waiting for backend to initialize...", YELLOW)
+    time.sleep(5)
+    _ensure_started(backend_service)
+
+    frontend_service = launch_service(
+        title=f"MOTO Frontend [{runtime.instance_id}]",
+        service_slug="frontend",
+        args=[npm_cmd, "run", "dev"],
+        cwd=str(SCRIPT_DIR / "frontend"),
+        env=env,
+        log_root=runtime.log_root,
+    )
+
+    cprint("Waiting for frontend to initialize...", YELLOW)
+    time.sleep(8)
+    _ensure_started(frontend_service)
+
+    register_active_instance(
+        instance_id=runtime.instance_id,
+        backend_window_pid=backend_service.pid,
+        frontend_window_pid=frontend_service.pid,
+        backend_port=runtime.backend_port,
+        frontend_port=runtime.frontend_port,
+        data_root=runtime.data_root,
+        log_root=runtime.log_root,
+        secret_namespace=runtime.secret_namespace,
+        storage_prefix=runtime.storage_prefix,
+    )
+
+    # Remember this runtime so the next relaunch reuses the same
+    # secret_namespace / data_root / storage_prefix. "default" launches are
+    # recorded too: skipping them used to let the keyring namespace flip
+    # between None and a freshly minted timestamp whenever the default ports
+    # were busy between runs, which made saved OpenRouter / Wolfram Alpha
+    # keys appear to vanish on roughly every other launch.
+    #
+    # Explicit overrides (MOTO_INSTANCE_ID / MOTO_DATA_ROOT /
+    # MOTO_SECRET_NAMESPACE etc.) are deliberately NOT recorded. They are
+    # one-off by design; persisting them would silently point the next plain
+    # launch at the override's data root and keyring namespace, as if the
+    # user's default instance had disappeared.
+    if not runtime.explicit_override:
+        try:
+            save_last_instance_record(
+                instance_id=runtime.instance_id,
+                data_root=runtime.data_root,
+                log_root=runtime.log_root,
+                secret_namespace=runtime.secret_namespace,
+                storage_prefix=runtime.storage_prefix,
+            )
+        except OSError as exc:
+            cprint(f"Warning: could not persist last-instance record: {exc}", YELLOW)
+
+    cprint("Opening browser...", GREEN)
+    webbrowser.open(frontend_url)
+    return backend_service, frontend_service
+
+
+def print_success_footer(
+    runtime: InstanceRuntime,
+    frontend_url: str,
+    vulnerability_warning: bool,
+    backend_service: LaunchedService,
+    frontend_service: LaunchedService,
+) -> None:
+    """Print the closing summary: what started, where, and how to stop it."""
+    separator = "================================================================"
+    modes = (backend_service.mode, frontend_service.mode)
+
+    print()
+    for header_line in (separator, "  INSTANCE STARTED", separator):
+        cprint(header_line, CYAN)
+    print()
+
+    if modes == ("window", "window"):
+        intro = "Two service windows have opened:"
+    elif modes == ("terminal", "terminal"):
+        intro = "Two service terminals have opened:"
+    else:
+        intro = "MOTO started the following launcher-managed services:"
+    cprint(intro, GREEN)
+    cprint(f"  - MOTO Backend [{runtime.instance_id}] on port {runtime.backend_port}", GREEN)
+    cprint(f"  - MOTO Frontend [{runtime.instance_id}] on port {runtime.frontend_port}", GREEN)
+
+    # Log paths are only shown for services that actually have one.
+    for label, service in (("Backend", backend_service), ("Frontend", frontend_service)):
+        if service.log_path:
+            cprint(f"    {label} log: {service.log_path}", WHITE)
+    print()
+
+    cprint("Browser opened automatically to:", GREEN)
+    cprint(f"  {frontend_url}", CYAN)
+    print()
+
+    if vulnerability_warning:
+        cprint("npm install reported vulnerability warnings earlier. Build 1 leaves that decision manual so updater-safe checkouts stay clean.", YELLOW)
+        print()
+
+    if "background" in modes:
+        stop_hint = f"To stop this instance: stop the launcher-managed backend/frontend processes for {runtime.instance_id}."
+    else:
+        stop_hint = f"To stop this instance: close both service terminals/windows for {runtime.instance_id}."
+    cprint(stop_hint, YELLOW)
+    print()
+    cprint("This launcher window will close automatically.", GREEN)
+    print()
+
+
+def main() -> int:
+    """Run the launcher pipeline end to end and return a process exit code.
+
+    Steps run in order: relaunch cleanup, update handling, Python/Node checks,
+    runtime preparation, dependency installs (Python, Playwright, Lean 4, Z3,
+    npm), environment checks, port verification, service start.
+
+    Returns:
+        0 when the instance started, or when ``handle_available_updates``
+        asked the launcher to stop; 1 if the fatal-error path is reached and
+        ``exit_with_pause`` returns instead of terminating the process.
+    """
+    launcher_args, cleanup_targets = consume_internal_launcher_args(sys.argv[1:])
+    _enable_ansi_on_windows()
+
+    try:
+        cleanup_relaunch_artifacts(cleanup_targets)
+        clear_console()
+        print_banner()
+
+        if not handle_available_updates(launcher_args):
+            return 0
+
+        check_python_installation()
+        check_node_installation()
+        runtime, frontend_url, backend_url, env = prepare_runtime_and_environment()
+        install_python_dependencies()
+        install_playwright_browser()
+        install_lean4(runtime, env)
+        install_z3(runtime, env)
+        npm_cmd, vulnerability_warning = install_frontend_dependencies()
+        check_lm_studio()
+        check_secure_keyring()
+        verify_instance_ports(runtime)
+        backend_service, frontend_service = start_services(runtime, env, frontend_url, backend_url, npm_cmd)
+        print_success_footer(runtime, frontend_url, vulnerability_warning, backend_service, frontend_service)
+        return 0
+    except Exception as exc:
+        print()
+        cprint("============================================================", RED)
+        cprint(f"FATAL ERROR: {exc}", RED)
+        cprint("============================================================", RED)
+        print()
+        import traceback
+
+        cprint("Stack Trace:", YELLOW)
+        traceback.print_exc()
+        exit_with_pause(1)
+    # Only reachable after a fatal error, so never report success from here.
+    return 1
+
+
+# Script entry point: main()'s return value becomes the process exit status.
+if __name__ == "__main__":
+    sys.exit(main())
diff --git a/moto_updater.py b/moto_updater.py
new file mode 100644
index 0000000..ae8d996
--- /dev/null
+++ b/moto_updater.py
@@ -0,0 +1,924 @@
+"""
+Build 1/2 updater helpers for the MOTO launcher.
+"""
+from __future__ import annotations
+
+from dataclasses import dataclass
+import json
+import os
+from pathlib import Path
+import shutil
+import subprocess
+import sys
+import tempfile
+import urllib.error
+import urllib.request
+import zipfile
+
+
+REPO_ROOT = Path(__file__).resolve().parent  # directory that contains this module; treated as the install root
+PACKAGE_JSON_PATH = REPO_ROOT / "package.json"  # read for "version" and "repository"
+LOCAL_MANIFEST_PATH = REPO_ROOT / "moto-update-manifest.json"  # local build manifest, read by load_local_manifest()
+LAUNCHER_STATE_PATH = REPO_ROOT / ".moto_launcher_state.json"  # {"instances": [...]} registry of launched instances
+LAUNCHER_LAST_INSTANCE_PATH = REPO_ROOT / ".moto_last_instance.json"  # record written by save_last_instance_record()
+LAUNCHER_ENTRYPOINT_ENV = "MOTO_LAUNCHER_ENTRYPOINT"  # env var naming the script used to relaunch after an update
+
+_DEFAULT_MANIFEST = {  # fallback field values used by _coerce_manifest() when nothing overrides them
+    "manifest_version": 1,
+    "version": "0.0.0-dev",
+    "build_commit": "dev",
+    "update_channel": "main",
+    "api_contract_version": "build5-v1",
+}
+
+_DEFAULT_PRESERVED_ROOTS = {  # repo-relative directories a ZIP update never writes into (see _is_preserved)
+    ".git",
+    ".moto_instances",
+    "backend/data",
+    "backend/logs",
+    "frontend/node_modules",
+    "frontend/dist",
+    ".venv",
+    "venv",
+    "env",
+    "ENV",
+}
+_DEFAULT_PRESERVED_FILES = {  # repo-relative files a ZIP update never overwrites
+    ".env",
+    ".env.local",
+    ".moto_launcher_state.json",
+    ".moto_last_instance.json",
+    "frontend/.env",
+    "frontend/.env.local",
+}
+_WINDOWS_YES = 6  # MessageBoxW return value that show_yes_no_dialog() treats as "yes"
+
+
+@dataclass(frozen=True)
+class BuildManifest:  # Immutable description of one MOTO build (local or remote).
+    version: str  # human-readable version; _coerce_manifest seeds it from package.json
+    build_commit: str  # commit identifier; compared for inequality to detect updates and used in the archive URL
+    update_channel: str  # used as the branch segment of the GitHub raw/branches URLs
+    api_contract_version: str  # carried through unchanged; not interpreted in this module
+    manifest_version: int = 1
+
+    @property
+    def short_commit(self) -> str:  # first 7 characters of build_commit, or "unknown" when it is empty
+        return self.build_commit[:7] if self.build_commit else "unknown"
+
+
+@dataclass(frozen=True)
+class InstallState:  # Immutable classification of this install, as produced by classify_install_state().
+    kind: str  # "zip_install", "clean_git_clone" or "dirty_git_checkout"; apply_update() dispatches on it
+    label: str  # display text used in prompts and in the update notice
+    can_auto_apply: bool  # False blocks automatic update-apply (see UpdateCheckResult.can_apply_update)
+    reason: str  # explanation shown to the user, notably when auto-apply is refused
+    active_instance_count: int = 0  # number of launcher-state records that still have a running PID
+    git_branch: str | None = None  # the git_* fields are only filled on the git-checkout paths
+    git_upstream: str | None = None
+    git_remote_url: str | None = None
+
+
+@dataclass(frozen=True)
+class UpdateCheckResult:  # Immutable outcome of check_for_updates().
+    local_manifest: BuildManifest
+    remote_manifest: BuildManifest | None  # None when no remote build information could be fetched
+    install_state: InstallState
+    error: str | None = None  # set when the remote lookup failed
+    warning: str | None = None  # set when only the branch-head fallback succeeded
+    metadata_source: str = "none"  # "manifest", "branch_head_fallback", or "none"
+
+    @property
+    def update_available(self) -> bool:  # True when a remote manifest exists and its commit differs from the local one
+        if self.remote_manifest is None:
+            return False
+        return self.remote_manifest.build_commit != self.local_manifest.build_commit  # inequality only; no ordering
+
+    @property
+    def can_apply_update(self) -> bool:  # True only for a manifest-sourced update on an install that allows auto-apply
+        return (
+            self.update_available
+            and self.remote_manifest is not None
+            and self.metadata_source == "manifest"  # branch-head fallback results are never auto-applied
+            and self.install_state.can_auto_apply
+        )
+
+
+@dataclass
+class _CopyJournal:  # Record of what sync_snapshot_into_install() changed, consumed by restore_snapshot_from_backup().
+    created_files: list[str]  # relative paths (forward slashes) that did not exist before the sync
+    overwritten_files: list[str]  # relative paths of files that were backed up before being replaced
+    overwritten_directories: list[str]  # relative paths of directories that were backed up before being replaced
+
+    def __init__(self) -> None:  # explicit no-argument constructor: every journal starts with its own empty lists
+        self.created_files = []
+        self.overwritten_files = []
+        self.overwritten_directories = []
+
+
+def _read_json(path: Path) -> dict | None:  # Parse *path* as UTF-8 JSON; None when it is missing, unreadable, or invalid JSON.
+    try:
+        return json.loads(path.read_text(encoding="utf-8"))  # may yield any JSON value, so callers isinstance-check for dict
+    except (FileNotFoundError, json.JSONDecodeError, OSError):
+        return None
+
+
+def _write_json(path: Path, payload: dict) -> None:  # Overwrite *path* with *payload* as 2-space-indented UTF-8 JSON.
+    path.write_text(json.dumps(payload, indent=2), encoding="utf-8")  # direct write; no temp-file/rename step
+
+
+def _load_package_json() -> dict:  # Contents of PACKAGE_JSON_PATH, or {} when it cannot be read as a JSON object.
+    payload = _read_json(PACKAGE_JSON_PATH)
+    return payload if isinstance(payload, dict) else {}
+
+
+def _coerce_manifest(payload: dict | None) -> BuildManifest:  # Build a manifest from defaults, then package.json version, then *payload* fields.
+    data = dict(_DEFAULT_MANIFEST)  # copy so the module-level defaults are never mutated
+    package_json = _load_package_json()
+    version = str(package_json.get("version") or "").strip()  # `or ""` keeps a JSON null from becoming the string "None"
+    if version:
+        data["version"] = version
+
+    if isinstance(payload, dict):
+        for key in ("version", "build_commit", "update_channel", "api_contract_version"):
+            value = str(payload.get(key) or "").strip()  # null or empty values leave the current default in place
+            if value:
+                data[key] = value
+        try:
+            data["manifest_version"] = int(payload.get("manifest_version", data["manifest_version"]))
+        except (TypeError, ValueError):
+            data["manifest_version"] = int(_DEFAULT_MANIFEST["manifest_version"])  # unparseable value falls back to the default
+
+    return BuildManifest(
+        version=str(data["version"]),
+        build_commit=str(data["build_commit"]),
+        update_channel=str(data["update_channel"]),
+        api_contract_version=str(data["api_contract_version"]),
+        manifest_version=int(data["manifest_version"]),
+    )
+
+
+def load_local_manifest() -> BuildManifest:  # Manifest for this install; a missing/invalid manifest file yields the defaults.
+    return _coerce_manifest(_read_json(LOCAL_MANIFEST_PATH))
+
+
+def _normalize_repo_slug(url: str) -> str | None:  # Reduce a repository URL to "owner/repo"; None if fewer than two path parts remain.
+    raw = (url or "").strip()
+    if not raw:
+        return None
+
+    cleaned = raw.rstrip("/")
+    for prefix in ("git+https://", "https://", "http://", "ssh://git@"):  # strip at most one scheme prefix
+        if cleaned.startswith(prefix):
+            cleaned = cleaned[len(prefix):]
+            break
+
+    if cleaned.startswith("git@github.com:"):  # scp-style remote, e.g. git@github.com:owner/repo.git
+        cleaned = cleaned[len("git@github.com:") :]
+    elif cleaned.startswith("github.com/"):
+        cleaned = cleaned[len("github.com/") :]
+
+    cleaned = cleaned.removesuffix(".git")
+    parts = [part for part in cleaned.split("/") if part]  # drop empty segments
+    if len(parts) >= 2:
+        return f"{parts[-2]}/{parts[-1]}"  # last two segments, whatever host preceded them
+    return None
+
+
+def _sanitize_instance_id(raw: str | None) -> str | None:  # Make *raw* safe as a directory name; None when nothing usable remains.
+    normalized = (raw or "").strip()
+    if not normalized:
+        return None
+    cleaned = []
+    for character in normalized:
+        if character.isalnum() or character in "._-":  # keep alphanumerics plus '.', '_' and '-'
+            cleaned.append(character)
+        else:
+            cleaned.append("_")  # every other character becomes an underscore
+    collapsed = "".join(cleaned).strip("_")  # trims leading/trailing underscores only; inner runs are kept
+    return collapsed or None
+
+
+def _official_repo_slug() -> str:  # "owner/repo" from package.json's "repository"; raises RuntimeError when it cannot be derived.
+    package_json = _load_package_json()
+    repository = package_json.get("repository", {})
+    if isinstance(repository, dict):  # object form: {"url": "..."}
+        repo_url = str(repository.get("url", "")).strip()
+    else:  # any other form (e.g. a plain string) is used as the URL itself
+        repo_url = str(repository or "").strip()
+
+    repo_slug = _normalize_repo_slug(repo_url)
+    if not repo_slug:
+        raise RuntimeError("Could not determine the official GitHub repository URL from package.json.")
+    return repo_slug
+
+
+def _manifest_url_for_channel(update_channel: str) -> str:  # Raw-content URL of moto-update-manifest.json on the channel branch.
+    repo_slug = _official_repo_slug()  # may raise RuntimeError
+    channel = (update_channel or "main").strip() or "main"  # empty or whitespace-only channel falls back to "main"
+    return f"https://raw.githubusercontent.com/{repo_slug}/{channel}/moto-update-manifest.json"
+
+
+def _package_json_url_for_channel(update_channel: str) -> str:  # Raw-content URL of package.json on the channel branch.
+    repo_slug = _official_repo_slug()  # may raise RuntimeError
+    channel = (update_channel or "main").strip() or "main"  # empty or whitespace-only channel falls back to "main"
+    return f"https://raw.githubusercontent.com/{repo_slug}/{channel}/package.json"
+
+
+def _branch_api_url_for_channel(update_channel: str) -> str:  # GitHub API URL describing the channel branch.
+    repo_slug = _official_repo_slug()  # may raise RuntimeError
+    channel = (update_channel or "main").strip() or "main"  # empty or whitespace-only channel falls back to "main"
+    return f"https://api.github.com/repos/{repo_slug}/branches/{channel}"
+
+
+def archive_url_for_manifest(manifest: BuildManifest) -> str:  # GitHub ZIP-archive URL for the manifest's build_commit.
+    repo_slug = _official_repo_slug()  # may raise RuntimeError
+    return f"https://github.com/{repo_slug}/archive/{manifest.build_commit}.zip"
+
+
+def _fetch_json_url(url: str, timeout_seconds: int) -> dict:  # GET *url* and return its JSON object; RuntimeError if the body is not an object.
+    request = urllib.request.Request(
+        url,
+        headers={"User-Agent": "MOTO-Build1-Updater"},
+    )
+    with urllib.request.urlopen(request, timeout=timeout_seconds) as response:  # network/HTTP errors propagate to the caller
+        payload = json.loads(response.read().decode("utf-8"))
+
+    if not isinstance(payload, dict):
+        raise RuntimeError(f"Unexpected JSON payload from {url}")
+    return payload
+
+
+def fetch_remote_manifest(local_manifest: BuildManifest, timeout_seconds: int = 10) -> BuildManifest:  # Download the manifest published on the local manifest's update channel.
+    payload = _fetch_json_url(_manifest_url_for_channel(local_manifest.update_channel), timeout_seconds)
+    return _coerce_manifest(payload)  # fields missing remotely fall back to defaults and the local package.json version
+
+
+def fetch_branch_head_fallback(local_manifest: BuildManifest, timeout_seconds: int = 10) -> BuildManifest:  # Synthesize a remote manifest from the branch's package.json and head commit; RuntimeError when no SHA is available.
+    package_payload = _fetch_json_url(_package_json_url_for_channel(local_manifest.update_channel), timeout_seconds)
+    branch_payload = _fetch_json_url(_branch_api_url_for_channel(local_manifest.update_channel), timeout_seconds)
+
+    version = str(package_payload.get("version") or "").strip() or local_manifest.version  # null/missing version keeps the local one
+    commit = str(branch_payload["commit"].get("sha") or "").strip() if isinstance(branch_payload.get("commit"), dict) else ""  # malformed "commit" becomes the RuntimeError below, not an AttributeError
+    if not commit:
+        raise RuntimeError("GitHub branch metadata did not include a branch-head commit SHA.")
+
+    return BuildManifest(
+        version=version,
+        build_commit=commit,
+        update_channel=local_manifest.update_channel,  # channel, contract and manifest version are copied from the local manifest
+        api_contract_version=local_manifest.api_contract_version,
+        manifest_version=local_manifest.manifest_version,
+    )
+
+
+def cleanup_path(path: Path) -> None:  # Delete *path* if it exists: directories recursively, anything else via unlink.
+    if not path.exists():
+        return
+    if path.is_dir():
+        shutil.rmtree(path, ignore_errors=True)  # best effort: failures while removing the tree are ignored
+    else:
+        try:
+            path.unlink()
+        except FileNotFoundError:  # removed between the exists() check and unlink(); other OSErrors propagate
+            return
+
+
+def consume_internal_launcher_args(argv: list[str]) -> tuple[list[str], list[Path]]:  # Split argv into (pass-through args, paths named by --moto-cleanup-update).
+    passthrough: list[str] = []
+    cleanup_paths: list[Path] = []
+    index = 0
+    while index < len(argv):
+        arg = argv[index]
+        if arg == "--moto-cleanup-update":  # internal flag: always consumed, never forwarded
+            if index + 1 < len(argv):
+                cleanup_paths.append(Path(argv[index + 1]))
+            index += 2  # skip the flag and its value; a trailing flag without a value is simply dropped
+            continue
+        passthrough.append(arg)
+        index += 1
+    return passthrough, cleanup_paths
+
+
+def _is_pid_running(pid: int | None) -> bool:  # Probe *pid* with os.kill(pid, 0); False for None/non-positive pids or when the call raises.
+    if not pid or pid <= 0:
+        return False
+    try:
+        os.kill(pid, 0)  # NOTE(review): Python docs give os.kill different semantics on Windows (0 is CTRL_C_EVENT there) — confirm this probe is side-effect free on Windows
+    except (OSError, SystemError):  # any OSError counts as "not running"
+        return False
+    return True
+
+
+def _load_launcher_state() -> dict:  # Read LAUNCHER_STATE_PATH and return {"instances": list}; malformed content becomes an empty list.
+    payload = _read_json(LAUNCHER_STATE_PATH)
+    if not isinstance(payload, dict):
+        return {"instances": []}
+    instances = payload.get("instances", [])
+    if not isinstance(instances, list):
+        instances = []
+    return {"instances": instances}  # any other top-level keys in the file are dropped
+
+
+def _save_launcher_state(payload: dict) -> None:  # Persist the launcher state, deleting the file instead when no instances remain.
+    if not payload.get("instances"):
+        cleanup_path(LAUNCHER_STATE_PATH)  # an empty registry is represented by the absence of the file
+        return
+    _write_json(LAUNCHER_STATE_PATH, payload)
+
+
+def cleanup_launcher_state() -> list[dict]:  # Prune instance records whose PIDs are both dead, save the rest, and return them.
+    payload = _load_launcher_state()
+    active_instances: list[dict] = []
+    for instance in payload.get("instances", []):
+        if not isinstance(instance, dict):  # non-dict entries are discarded
+            continue
+        backend_pid = _coerce_int(instance.get("backend_window_pid"))
+        frontend_pid = _coerce_int(instance.get("frontend_window_pid"))
+        if _is_pid_running(backend_pid) or _is_pid_running(frontend_pid):  # one live PID is enough to keep the record
+            active_instances.append(instance)
+
+    _save_launcher_state({"instances": active_instances})  # side effect: rewrites or deletes the state file on every call
+    return active_instances
+
+
+def register_active_instance(  # Append a record for a newly launched instance to the launcher state file (keyword-only arguments).
+    *,
+    instance_id: str,
+    backend_window_pid: int,
+    frontend_window_pid: int,
+    backend_port: int,
+    frontend_port: int,
+    data_root: str,
+    log_root: str,
+    secret_namespace: str | None,
+    storage_prefix: str | None,
+) -> None:
+    active_instances = cleanup_launcher_state()  # prune dead records first so only live ones are kept
+    active_instances.append(
+        {
+            "instance_id": instance_id,
+            "backend_window_pid": backend_window_pid,  # the two *_window_pid values are what cleanup_launcher_state() probes
+            "frontend_window_pid": frontend_window_pid,
+            "backend_port": backend_port,
+            "frontend_port": frontend_port,
+            "data_root": data_root,  # data_root/log_root are read back by collect_preserved_relatives()
+            "log_root": log_root,
+            "secret_namespace": secret_namespace,
+            "storage_prefix": storage_prefix,
+        }
+    )
+    _save_launcher_state({"instances": active_instances})
+
+
+def load_last_instance_record() -> dict | None:
+    """Return the most recently launched non-default instance record, or None.
+
+    Used to preserve a stable secret_namespace / data_root / storage_prefix across
+    relaunches when the default ports are temporarily busy. Without this the
+    launcher would mint a fresh timestamped instance_id on every relaunch, which
+    changes the OS-keyring service name and makes the saved OpenRouter / Wolfram
+    Alpha API keys look "missing" on startup.
+    """
+    payload = _read_json(LAUNCHER_LAST_INSTANCE_PATH)
+    if not isinstance(payload, dict):  # missing, unreadable, or non-object file
+        return None
+    instance_id = payload.get("instance_id")
+    if not isinstance(instance_id, str) or not instance_id.strip():  # a usable record needs a non-blank string id
+        return None
+    return payload  # returned as stored; the other keys are not validated here
+
+
+def save_last_instance_record(
+    *,
+    instance_id: str,
+    data_root: str,
+    log_root: str,
+    secret_namespace: str | None,
+    storage_prefix: str | None,
+) -> None:
+    """Persist the last launched non-default instance so it can be reused on relaunch."""
+    _write_json(  # overwrites any earlier record at LAUNCHER_LAST_INSTANCE_PATH
+        LAUNCHER_LAST_INSTANCE_PATH,
+        {
+            "instance_id": instance_id,  # load_last_instance_record() requires this to be a non-blank string
+            "data_root": data_root,
+            "log_root": log_root,
+            "secret_namespace": secret_namespace,
+            "storage_prefix": storage_prefix,
+        },
+    )
+
+
+def _coerce_int(value: object) -> int | None:  # int(value), or None when the conversion raises TypeError/ValueError.
+    try:
+        return int(value)  # type: ignore[arg-type]
+    except (TypeError, ValueError):
+        return None
+
+
+def _git_output(args: list[str]) -> tuple[int, str, str]:  # Run `git <args>` in REPO_ROOT; return (exit code, stripped stdout, stripped stderr).
+    try:
+        result = subprocess.run(
+            ["git", *args],
+            cwd=str(REPO_ROOT),
+            capture_output=True,
+            text=True,
+            check=False,  # a non-zero exit is reported through the return code, never raised
+        )
+    except OSError as exc:  # e.g. the git executable could not be started
+        return 1, "", str(exc)
+    return result.returncode, result.stdout.strip(), result.stderr.strip()
+
+
+def _git_checkout_matches_repo() -> bool:  # True only when git reports a work-tree top level that resolves to REPO_ROOT.
+    code, output, _ = _git_output(["rev-parse", "--show-toplevel"])
+    if code != 0 or not output:
+        return False
+    try:
+        return Path(output).resolve() == REPO_ROOT.resolve()  # False when REPO_ROOT merely sits inside a larger checkout
+    except OSError:
+        return False
+
+
+def classify_install_state(active_instances: list[dict]) -> InstallState:  # Classify this install as zip_install, clean_git_clone or dirty_git_checkout.
+    active_count = len(active_instances)
+    active_reason = ""
+    if active_count:  # running instances block auto-apply and take priority as the displayed reason
+        plural = "s are" if active_count != 1 else " is"
+        active_reason = (
+            f"{active_count} MOTO instance{plural} still running from this install. "
+            "Close both launcher-managed MOTO services before applying an update."
+        )
+
+    has_git_metadata = (REPO_ROOT / ".git").exists()
+    if not _git_checkout_matches_repo():
+        if has_git_metadata:  # .git is present but git could not confirm REPO_ROOT as the work-tree root
+            return InstallState(
+                kind="dirty_git_checkout",
+                label="Git checkout",
+                can_auto_apply=False,
+                reason=active_reason or "This install has git metadata, but the checkout could not be inspected safely for automatic updates.",
+                active_instance_count=active_count,
+            )
+        reason = active_reason or "ZIP / extracted consumer install."
+        return InstallState(  # no usable git checkout: treated as an extracted ZIP install
+            kind="zip_install",
+            label="ZIP / extracted consumer install",
+            can_auto_apply=active_count == 0,
+            reason=reason,
+            active_instance_count=active_count,
+        )
+
+    code, branch, _ = _git_output(["rev-parse", "--abbrev-ref", "HEAD"])
+    if code != 0:
+        return InstallState(
+            kind="dirty_git_checkout",
+            label="Git checkout",
+            can_auto_apply=False,
+            reason=active_reason or "Could not determine the current git branch for this checkout.",
+            active_instance_count=active_count,
+        )
+
+    _, upstream, _ = _git_output(["rev-parse", "--abbrev-ref", "--symbolic-full-name", "@{u}"])  # exit codes ignored: a failure leaves the value empty
+    _, status_output, _ = _git_output(["status", "--porcelain", "--untracked-files=no"])  # tracked-file changes only
+    _, remote_url, _ = _git_output(["remote", "get-url", "origin"])
+    official_slug = _official_repo_slug()  # may raise RuntimeError when package.json has no usable repository URL
+    remote_matches = _normalize_repo_slug(remote_url) == official_slug
+    dirty_checkout = bool(status_output.strip())
+    clean_checkout = branch == "main" and upstream == "origin/main" and remote_matches and not dirty_checkout
+    if clean_checkout:
+        return InstallState(
+            kind="clean_git_clone",
+            label="Clean git clone on main",
+            can_auto_apply=active_count == 0,
+            reason=active_reason or "Clean git checkout tracking origin/main.",
+            active_instance_count=active_count,
+            git_branch=branch,
+            git_upstream=upstream,
+            git_remote_url=remote_url,
+        )
+
+    reason_parts = []  # collect every reason the checkout is not a clean clone of main
+    if active_reason:
+        reason_parts.append(active_reason)
+    if branch != "main":
+        reason_parts.append(f"Current branch is '{branch}', not 'main'.")
+    if upstream != "origin/main":
+        reason_parts.append("This checkout does not track origin/main.")
+    if remote_url and not remote_matches:  # an empty remote URL adds no message here
+        reason_parts.append("This checkout's origin remote does not match the official MOTO repository.")
+    if dirty_checkout:
+        reason_parts.append("Tracked files have local modifications.")
+    if not reason_parts:  # e.g. origin URL is empty while every other check passed
+        reason_parts.append("This git checkout is not a safe fast-forward target for automatic updates.")
+
+    return InstallState(
+        kind="dirty_git_checkout",
+        label="Dirty or non-standard git checkout",
+        can_auto_apply=False,
+        reason=" ".join(reason_parts),
+        active_instance_count=active_count,
+        git_branch=branch,
+        git_upstream=upstream or None,
+        git_remote_url=remote_url or None,
+    )
+
+
+def check_for_updates() -> UpdateCheckResult:  # Compare the local build with the remote channel; lookup failures are returned in .error, not raised.
+    local_manifest = load_local_manifest()
+    active_instances = cleanup_launcher_state()
+    install_state = classify_install_state(active_instances)  # NOTE(review): runs outside the try below, so a RuntimeError from _official_repo_slug() would propagate
+    try:
+        remote_manifest = fetch_remote_manifest(local_manifest)
+        return UpdateCheckResult(
+            local_manifest,
+            remote_manifest,
+            install_state,
+            metadata_source="manifest",  # the only source for which can_apply_update can be True
+        )
+    except urllib.error.HTTPError as exc:
+        if exc.code == 404:  # manifest not published: fall back to package.json plus the branch-head commit
+            try:
+                fallback_manifest = fetch_branch_head_fallback(local_manifest)
+                return UpdateCheckResult(
+                    local_manifest,
+                    fallback_manifest,
+                    install_state,
+                    warning=(
+                        "GitHub main is reachable, but `moto-update-manifest.json` is not published there yet. "
+                        "The launcher can compare branch-head builds, but automatic update-apply stays disabled until the manifest exists on main."
+                    ),
+                    metadata_source="branch_head_fallback",
+                )
+            except (RuntimeError, urllib.error.URLError, TimeoutError, OSError, json.JSONDecodeError) as fallback_exc:
+                return UpdateCheckResult(
+                    local_manifest,
+                    None,
+                    install_state,
+                    error=(
+                        f"{exc}. The fallback branch-head lookup also failed: {fallback_exc}"
+                    ),
+                )
+        return UpdateCheckResult(local_manifest, None, install_state, error=str(exc))  # any other HTTP status
+    except (RuntimeError, urllib.error.URLError, TimeoutError, OSError, json.JSONDecodeError) as exc:
+        return UpdateCheckResult(local_manifest, None, install_state, error=str(exc))
+
+
+def show_yes_no_dialog(title: str, message: str) -> bool:  # Ask a yes/no question: native message box on Windows, console prompt otherwise.
+    if sys.platform == "win32":
+        try:
+            import ctypes
+
+            response = ctypes.windll.user32.MessageBoxW(None, message, title, 0x00000004 | 0x00000040)  # presumably MB_YESNO | MB_ICONINFORMATION — confirm against WinAPI docs
+            return response == _WINDOWS_YES
+        except Exception:  # deliberate best effort: any failure falls through to the console prompt
+            pass
+
+    print()
+    print(message)  # *title* is not shown on the console path
+    choice = input("Apply update now? [y/N]: ").strip().lower()  # prompt text is fixed regardless of *title*
+    return choice in {"y", "yes"}
+
+
+def show_info_dialog(title: str, message: str) -> None:  # Print "title: message" to stdout; no GUI dialog is opened on any platform.
+    print()
+    print(f"{title}: {message}")
+
+
+UPDATE_NOTICE_PATH = REPO_ROOT / ".moto_update_notice.json"  # written or removed by write_update_notice()
+
+
+def write_update_notice(result: UpdateCheckResult) -> None:
+    """Persist a short update-notice payload so the backend can serve it as an in-app banner."""
+    if not result.update_available or result.remote_manifest is None:
+        cleanup_path(UPDATE_NOTICE_PATH)  # no update: remove any stale notice file
+        return
+
+    payload = {
+        "update_available": True,
+        "installed_version": result.local_manifest.version,
+        "installed_commit": result.local_manifest.short_commit,
+        "available_version": result.remote_manifest.version,
+        "available_commit": result.remote_manifest.short_commit,
+        "install_layout": result.install_state.label,
+        "can_auto_apply": result.can_apply_update,
+        "message": build_warning_message(result) if not result.can_apply_update else build_update_prompt(result),  # warning text when auto-apply is blocked
+    }
+    _write_json(UPDATE_NOTICE_PATH, payload)
+
+
+def build_update_prompt(result: UpdateCheckResult) -> str:  # Text asking the user to apply an available update.
+    if result.remote_manifest is None:
+        return "Update information is unavailable."
+
+    return (
+        "A newer MOTO build is available from GitHub main.\n\n"
+        f"Installed: {result.local_manifest.version} ({result.local_manifest.short_commit})\n"
+        f"Available: {result.remote_manifest.version} ({result.remote_manifest.short_commit})\n"
+        f"Install layout: {result.install_state.label}\n\n"
+        "If you continue, MOTO will preserve runtime data/log roots, instance-scoped local storage namespaces, and OS keyring namespaces."
+    )
+
+
+def build_warning_message(result: UpdateCheckResult) -> str:  # Text explaining why an available update cannot be applied automatically.
+    if result.remote_manifest is None:
+        return result.error or "Update information is unavailable."
+
+    details = []
+    if result.warning:
+        details.append(result.warning)
+    if not result.install_state.can_auto_apply:
+        details.append(result.install_state.reason)
+    detail_text = "\n\n".join(details) if details else result.install_state.reason  # with no details, fall back to the install-state reason
+
+    return (
+        "A newer MOTO build is available from GitHub main, but this install cannot auto-apply it.\n\n"
+        f"Installed: {result.local_manifest.version} ({result.local_manifest.short_commit})\n"
+        f"Available: {result.remote_manifest.version} ({result.remote_manifest.short_commit})\n"
+        f"Install layout: {result.install_state.label}\n\n"
+        f"{detail_text}"
+    )
+
+
+def _relative_if_inside_repo(path: Path) -> str | None:  # Forward-slash path of *path* relative to REPO_ROOT, or None when it lies outside.
+    try:
+        relative = path.resolve().relative_to(REPO_ROOT.resolve())
+    except ValueError:  # raised by relative_to() when *path* is not under REPO_ROOT
+        return None
+    return str(relative).replace("\\", "/")  # note: REPO_ROOT itself yields "." rather than an empty string
+
+
+def _resolve_repo_relative_path(raw: str | None) -> Path | None:  # Resolve *raw* to an absolute path, anchoring relative values at REPO_ROOT; None when blank.
+    if not raw or not raw.strip():
+        return None
+    candidate = Path(raw)
+    if not candidate.is_absolute():
+        candidate = REPO_ROOT / candidate
+    try:
+        return candidate.resolve()
+    except OSError:
+        return None
+
+
+def collect_preserved_relatives(env: dict[str, str] | os._Environ[str], active_instances: list[dict] | None = None) -> set[str]:  # Repo-relative paths a ZIP update must not overwrite.
+    preserved = set(_DEFAULT_PRESERVED_ROOTS) | set(_DEFAULT_PRESERVED_FILES)
+
+    active_instances = active_instances if active_instances is not None else cleanup_launcher_state()  # default: re-read (and prune) the launcher state
+    for instance in active_instances:
+        if not isinstance(instance, dict):
+            continue
+        for key in ("data_root", "log_root"):
+            value = str(instance.get(key, "")).strip()
+            if not value:
+                continue
+            relative = _relative_if_inside_repo(Path(value))  # roots outside the repo need no protection
+            if relative:
+                preserved.add(relative)
+
+    for env_name in ("MOTO_DATA_ROOT", "MOTO_LOG_ROOT"):  # roots configured through the environment
+        resolved = _resolve_repo_relative_path(env.get(env_name))
+        if resolved:
+            relative = _relative_if_inside_repo(resolved)
+            if relative:
+                preserved.add(relative)
+
+    explicit_instance_id = _sanitize_instance_id(env.get("MOTO_INSTANCE_ID"))
+    if explicit_instance_id:
+        instance_root = REPO_ROOT / ".moto_instances" / explicit_instance_id
+        relative = _relative_if_inside_repo(instance_root)
+        if relative:
+            preserved.add(relative)
+
+    return {path.replace("\\", "/").strip("/") for path in preserved if path}  # normalized to forward slashes without edge slashes
+
+
+def _is_preserved(relative_path: str, preserved_relatives: set[str]) -> bool:  # True when the path equals a preserved entry or lies beneath one.
+    normalized = relative_path.replace("\\", "/").strip("/")
+    for preserved in preserved_relatives:
+        if normalized == preserved or normalized.startswith(f"{preserved}/"):  # the "/" suffix stops "env" from matching "environment"
+            return True
+    return False
+
+
+def _ensure_backup_for_destination(destination: Path, backup_root: Path, relative_path: str, journal: _CopyJournal) -> None:  # Copy an existing destination into the backup tree once and record it in *journal*.
+    backup_target = backup_root / relative_path
+    if destination.is_dir():
+        if relative_path in journal.overwritten_directories:  # already backed up during this sync
+            return
+        backup_target.parent.mkdir(parents=True, exist_ok=True)
+        shutil.copytree(destination, backup_target, dirs_exist_ok=True)
+        journal.overwritten_directories.append(relative_path)
+        return
+
+    if relative_path in journal.overwritten_files:  # already backed up during this sync
+        return
+    backup_target.parent.mkdir(parents=True, exist_ok=True)
+    shutil.copy2(destination, backup_target)
+    journal.overwritten_files.append(relative_path)
+
+
+def sync_snapshot_into_install(  # Copy every non-preserved file from *source_root* into *destination_root*, backing up whatever it replaces.
+    source_root: Path,
+    destination_root: Path,
+    preserved_relatives: set[str],
+    backup_root: Path,
+) -> _CopyJournal:
+    journal = _CopyJournal()
+    for source_path in source_root.rglob("*"):
+        if source_path.is_dir():  # only files are copied; parent directories are created on demand below
+            continue
+
+        relative_path = str(source_path.relative_to(source_root)).replace("\\", "/")
+        if _is_preserved(relative_path, preserved_relatives):
+            continue
+
+        destination_path = destination_root / relative_path
+        destination_path.parent.mkdir(parents=True, exist_ok=True)
+
+        if destination_path.exists():
+            _ensure_backup_for_destination(destination_path, backup_root, relative_path, journal)
+            if destination_path.is_dir():  # a directory sits where the snapshot has a file: remove it after the backup
+                shutil.rmtree(destination_path)
+        else:
+            journal.created_files.append(relative_path)
+
+        shutil.copy2(source_path, destination_path)
+
+    return journal  # files that exist only in the destination are left untouched; nothing is deleted
+
+
+def restore_snapshot_from_backup(destination_root: Path, backup_root: Path, journal: _CopyJournal) -> None:  # Undo a sync using the journal and the backup tree.
+    for relative_path in reversed(journal.created_files):  # delete files the sync created, newest first
+        cleanup_path(destination_root / relative_path)
+        _remove_empty_parents((destination_root / relative_path).parent)
+
+    for relative_path in journal.overwritten_files:  # put back the original contents of replaced files
+        destination_path = destination_root / relative_path
+        backup_path = backup_root / relative_path
+        cleanup_path(destination_path)
+        destination_path.parent.mkdir(parents=True, exist_ok=True)
+        shutil.copy2(backup_path, destination_path)
+
+    for relative_path in journal.overwritten_directories:  # put back directories that were replaced by files
+        destination_path = destination_root / relative_path
+        backup_path = backup_root / relative_path
+        cleanup_path(destination_path)
+        shutil.copytree(backup_path, destination_path, dirs_exist_ok=True)
+
+
+def _remove_empty_parents(path: Path) -> None:  # Remove *path* and successive parents while rmdir succeeds, stopping at REPO_ROOT.
+    current = path
+    while current != REPO_ROOT:  # compares against REPO_ROOT, not the destination root the caller used
+        try:
+            current.rmdir()
+        except OSError:  # rmdir failed (e.g. the directory is not empty): stop climbing
+            return
+        current = current.parent
+
+
+def _download_archive(manifest: BuildManifest, destination: Path) -> None:  # Stream the build's ZIP archive into *destination*; network errors propagate.
+    request = urllib.request.Request(
+        archive_url_for_manifest(manifest),
+        headers={"User-Agent": "MOTO-Build1-Updater"},
+    )
+    with urllib.request.urlopen(request, timeout=30) as response, destination.open("wb") as output:
+        shutil.copyfileobj(response, output)  # copied in chunks rather than read into memory at once
+
+
+def _extract_archive(archive_path: Path, destination: Path) -> Path:  # Unzip into *destination* and return the directory that holds the extracted tree.
+    with zipfile.ZipFile(archive_path) as archive:
+        archive.extractall(destination)
+
+    children = list(destination.iterdir())  # materialize once; replaces the identity comprehension
+    if len(children) == 1 and children[0].is_dir():  # a single wrapper folder: descend into it
+        return children[0]
+    return destination
+
+
+def _resolve_entrypoint_path(raw: str | None) -> Path | None:  # Resolve a launcher entrypoint path, anchoring relative values at REPO_ROOT; None when blank.
+    if not raw or not raw.strip():
+        return None
+    candidate = Path(raw)
+    if not candidate.is_absolute():
+        candidate = REPO_ROOT / candidate
+    try:
+        return candidate.resolve()
+    except OSError:
+        return None
+
+
+def _build_relaunch_command(env: dict[str, str]) -> list[str]:  # argv prefix used to restart the launcher after an update.
+    entrypoint = _resolve_entrypoint_path(env.get(LAUNCHER_ENTRYPOINT_ENV))
+    if entrypoint and entrypoint.exists():  # prefer the script named by MOTO_LAUNCHER_ENTRYPOINT when it exists
+        suffix = entrypoint.suffix.lower()
+        if suffix == ".sh":
+            return ["bash", str(entrypoint)]
+        if suffix in {".bat", ".cmd"}:
+            return ["cmd", "/c", str(entrypoint)]
+        if suffix == ".ps1":
+            return ["powershell", "-ExecutionPolicy", "Bypass", "-File", str(entrypoint)]
+        return [str(entrypoint)]  # any other suffix: execute the file directly
+
+    return [sys.executable, str(REPO_ROOT / "moto_launcher.py")]  # fallback: current interpreter running moto_launcher.py
+
+
+def _relaunch_launcher(launcher_args: list[str], cleanup_paths: list[Path], env: dict[str, str]) -> None:  # Start a new launcher process in REPO_ROOT without waiting for it.
+    command = _build_relaunch_command(env)
+    command.extend(launcher_args)
+    for target in cleanup_paths:  # renamed from `cleanup_path`, which shadowed the module-level cleanup_path() function
+        command.extend(["--moto-cleanup-update", str(target)])  # the new process parses these in consume_internal_launcher_args()
+    subprocess.Popen(command, cwd=str(REPO_ROOT), env=env)
+
+
+def apply_zip_update(  # Download the remote build's ZIP, copy it over this install, and relaunch; returns (success, message).
+    *,
+    remote_manifest: BuildManifest,
+    launcher_args: list[str],
+    env: dict[str, str],
+) -> tuple[bool, str]:
+    active_instances = cleanup_launcher_state()
+    preserved_relatives = collect_preserved_relatives(env, active_instances)
+    work_root = Path(tempfile.mkdtemp(prefix="moto-update-"))  # holds the downloaded archive and its extraction
+    extract_root = work_root / "extract"
+    archive_path = work_root / "update.zip"
+    backup_root = Path(tempfile.mkdtemp(prefix="moto-update-backup-"))  # holds copies of everything the sync overwrites
+    journal = _CopyJournal()  # stays empty if the failure happens before or during the sync call
+
+    try:
+        _download_archive(remote_manifest, archive_path)
+        extracted_source = _extract_archive(archive_path, extract_root)
+        journal = sync_snapshot_into_install(extracted_source, REPO_ROOT, preserved_relatives, backup_root)
+        _relaunch_launcher(launcher_args, [backup_root, work_root], env)  # temp dirs are passed to the new process as cleanup targets, not removed here
+        return True, "Update applied successfully. Relaunching MOTO with the new build."
+    except Exception as exc:
+        restore_snapshot_from_backup(REPO_ROOT, backup_root, journal)  # NOTE(review): an exception raised here propagates and skips the cleanup below
+        cleanup_path(work_root)
+        cleanup_path(backup_root)
+        return False, f"Update failed and the previous install was restored: {exc}"
+
+
+def _safe_fast_forward_possible() -> tuple[bool, str]:  # Fetch origin/main and report (True, "") only when HEAD is strictly behind it; otherwise (False, reason).
+    fetch_code, _, fetch_stderr = _git_output(["fetch", "origin", "main", "--quiet"])
+    if fetch_code != 0:
+        return False, fetch_stderr or "Failed to fetch origin/main."
+
+    code, divergence_output, divergence_stderr = _git_output(["rev-list", "--left-right", "--count", "HEAD...origin/main"])
+    if code != 0:
+        return False, divergence_stderr or "Failed to compare HEAD against origin/main."
+
+    try:
+        ahead_str, behind_str = divergence_output.split()  # output is expected to hold two counts: HEAD-only, then origin/main-only
+        ahead = int(ahead_str)
+        behind = int(behind_str)
+    except (ValueError, TypeError):  # wrong number of fields or non-numeric values
+        return False, "Failed to parse git divergence counts for origin/main."
+
+    if ahead != 0:
+        return False, "This checkout is ahead of origin/main and cannot be fast-forwarded automatically."
+    if behind == 0:
+        return False, "This checkout is already at the latest origin/main commit."
+    return True, ""
+
+
+def apply_git_update(  # Fast-forward this checkout to origin/main and relaunch; returns (success, message).
+    *,
+    launcher_args: list[str],
+    env: dict[str, str],
+) -> tuple[bool, str]:
+    code, previous_head, stderr = _git_output(["rev-parse", "HEAD"])  # remembered so a failed relaunch can be rolled back
+    if code != 0 or not previous_head:
+        return False, stderr or "Failed to determine the current git HEAD."
+
+    safe_to_update, reason = _safe_fast_forward_possible()
+    if not safe_to_update:
+        return False, reason
+
+    merge_code, _, merge_stderr = _git_output(["merge", "--ff-only", "origin/main"])
+    if merge_code != 0:
+        return False, merge_stderr or "Fast-forward merge from origin/main failed."
+
+    try:
+        _relaunch_launcher(launcher_args, [], env)  # nothing to clean up on the git path
+        return True, "Git checkout fast-forwarded successfully. Relaunching MOTO with the new build."
+    except Exception as exc:
+        _git_output(["reset", "--hard", previous_head])  # roll back to the recorded HEAD; the reset's own exit code is not checked
+        return False, f"Update was rolled back after relaunch failed: {exc}"
+
+
+def apply_update(  # Apply an available update using the strategy that matches the install kind; returns (success, message).
+    result: UpdateCheckResult,
+    launcher_args: list[str],
+    env: dict[str, str] | os._Environ[str],
+) -> tuple[bool, str]:
+    if result.remote_manifest is None:
+        return False, result.error or "Update information is unavailable."
+    if result.metadata_source != "manifest":  # branch-head fallback results are never applied
+        return False, result.warning or "Automatic update-apply is disabled until the official main-branch manifest is published."
+
+    env_copy = dict(env)  # plain-dict snapshot of the environment for the relaunched process
+    if result.install_state.kind == "clean_git_clone":
+        return apply_git_update(launcher_args=launcher_args, env=env_copy)
+    if result.install_state.kind == "zip_install":
+        return apply_zip_update(remote_manifest=result.remote_manifest, launcher_args=launcher_args, env=env_copy)
+    return False, result.install_state.reason  # any other kind (e.g. "dirty_git_checkout") is refused with its reason
diff --git a/package.json b/package.json
index 3687c44..57dcba0 100644
--- a/package.json
+++ b/package.json
@@ -1,12 +1,12 @@
 {
   "name": "moto-math-variant",
-  "version": "1.0.6",
+  "version": "1.0.7",
   "description": "MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "scripts": {
-    "dev:backend": "cd backend && uvicorn api.main:app --reload --host 0.0.0.0 --port 8000",
-    "dev:frontend": "cd frontend && npm run dev",
-    "install:frontend": "cd frontend && npm install",
-    "build:frontend": "cd frontend && npm run build"
+    "dev:backend": "python -c \"import os, uvicorn; uvicorn.run('backend.api.main:app', host=os.getenv('MOTO_BACKEND_HOST', os.getenv('HOST', '0.0.0.0')), port=int(os.getenv('MOTO_BACKEND_PORT', os.getenv('PORT', '8000'))), reload=True, access_log=False)\"",
+    "dev:frontend": "npm --prefix frontend run dev",
+    "install:frontend": "npm --prefix frontend install",
+    "build:frontend": "npm --prefix frontend run build"
   },
   "keywords": [
     "ai",
diff --git a/requirements-generic.txt b/requirements-generic.txt
new file mode 100644
index 0000000..b9a3e1e
--- /dev/null
+++ b/requirements-generic.txt
@@ -0,0 +1,3 @@
+-r requirements.txt
+fastembed>=0.3.6
+onnxruntime>=1.18.0,<2.0
diff --git a/tests/test_compiler_marker_visibility.py b/tests/test_compiler_marker_visibility.py
new file mode 100644
index 0000000..37a1e09
--- /dev/null
+++ b/tests/test_compiler_marker_visibility.py
@@ -0,0 +1,251 @@
+import unittest
+import tempfile
+from pathlib import Path
+
+from backend.compiler.core import compiler_coordinator as coordinator_module
+from backend.compiler.core.compiler_coordinator import CompilerCoordinator
+from backend.compiler.agents.high_context_submitter import (
+    _strip_paper_markers_for_llm as strip_for_high_context,
+)
+from backend.compiler.agents.high_param_submitter import (
+    _strip_paper_markers_for_llm as strip_for_high_param,
+)
+from backend.compiler.memory.paper_memory import (
+    APPENDIX_EMPTY_PLACEHOLDER,
+    CONCLUSION_PLACEHOLDER,
+    PAPER_ANCHOR,
+    THEOREMS_APPENDIX_END,
+    THEOREMS_APPENDIX_START,
+    paper_memory,
+)
+from backend.compiler.validation.compiler_validator import CompilerValidator
+from backend.shared.models import CompilerSubmission, CompilerValidationResult
+
+
+class CompilerMarkerVisibilityTests(unittest.TestCase):  # marker stripping helpers and validator exact-match pre-validation
+    def test_submitter_paper_view_preserves_appendix_markers_for_exact_matching(self) -> None:
+        paper = (
+            "Body text.\n\n"
+            f"{THEOREMS_APPENDIX_START}\n"
+            "[Theorems appendix - verified Lean 4 theorems not placed inline will appear here]\n"
+            f"{THEOREMS_APPENDIX_END}\n\n"
+            f"{PAPER_ANCHOR}"
+        )
+
+        for strip_for_llm in (strip_for_high_context, strip_for_high_param):  # same expectations for both submitter modules
+            with self.subTest(strip_for_llm=strip_for_llm.__module__):
+                visible_paper = strip_for_llm(paper)
+
+                self.assertIn(THEOREMS_APPENDIX_START, visible_paper)
+                self.assertIn(THEOREMS_APPENDIX_END, visible_paper)
+                self.assertIn(PAPER_ANCHOR, visible_paper)
+
+    def test_replace_old_string_with_appendix_marker_suffix_is_trimmed_safely(self) -> None:
+        validator = CompilerValidator(model_name="test-model", user_prompt="Write.")
+        old_section = "\\section{Conclusion}\n\nOld conclusion text."
+        paper = (
+            f"{old_section}\n\n"
+            f"{THEOREMS_APPENDIX_START}\n"
+            f"{APPENDIX_EMPTY_PLACEHOLDER}\n"
+            f"{THEOREMS_APPENDIX_END}\n\n"
+            f"{PAPER_ANCHOR}"
+        )
+        submission = CompilerSubmission(
+            submission_id="sub-marker-trim",
+            mode="construction",
+            content="\\section{Conclusion}\n\nNew conclusion text.",
+            operation="replace",
+            old_string=(  # overruns the section into the appendix start marker and placeholder
+                f"{old_section}\n\n"
+                f"{THEOREMS_APPENDIX_START}\n"
+                f"{APPENDIX_EMPTY_PLACEHOLDER}"
+            ),
+            new_string="\\section{Conclusion}\n\nNew conclusion text.",
+            reasoning="Replace conclusion.",
+        )
+
+        result = validator._pre_validate_exact_string_match(submission, paper, "Outline")
+
+        self.assertIsNone(result)  # pre-validation returned no result object
+        self.assertEqual(submission.old_string, old_section)  # submission was mutated down to the section text only
+
+    def test_delete_old_string_crossing_appendix_marker_is_rejected(self) -> None:
+        validator = CompilerValidator(model_name="test-model", user_prompt="Write.")
+        paper = (
+            "Conclusion text.\n\n"
+            f"{THEOREMS_APPENDIX_START}\n"
+            f"{APPENDIX_EMPTY_PLACEHOLDER}\n"
+            f"{THEOREMS_APPENDIX_END}\n\n"
+            f"{PAPER_ANCHOR}"
+        )
+        submission = CompilerSubmission(
+            submission_id="sub-marker-delete",
+            mode="construction",
+            content="",
+            operation="delete",
+            old_string=f"Conclusion text.\n\n{THEOREMS_APPENDIX_START}",  # delete span ends on the appendix start marker
+            new_string="",
+            reasoning="Delete stale conclusion.",
+        )
+
+        result = validator._pre_validate_exact_string_match(submission, paper, "Outline")
+
+        self.assertIsNotNone(result)
+        self.assertEqual(result.decision, "reject")
+        self.assertIn("PROTECTED_MARKER_BOUNDARY", result.reasoning)  # rejection reasoning must name this code
+
+
+class CompilerCoordinatorMarkerTests(unittest.IsolatedAsyncioTestCase):  # runs the coordinator with fake submitter/validator
+    async def test_conclusion_phase_without_placeholder_applies_validated_edit(self) -> None:
+        old_path = paper_memory.file_path  # snapshot module-level state so `finally` can restore it
+        old_initialized = paper_memory._initialized
+        old_rechunk_callback = paper_memory.rechunk_callback
+        old_add_acceptance = coordinator_module.compiler_rejection_log.add_acceptance
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                paper_memory.file_path = Path(tmpdir) / "paper.txt"  # redirect paper storage into the temp dir
+                paper_memory._initialized = True
+                paper_memory.rechunk_callback = None
+
+                old_conclusion = "\\section{Conclusion}\n\nOld conclusion."
+                new_conclusion = "\\section{Conclusion}\n\nNew conclusion."
+                await paper_memory.update_paper(  # paper already has a conclusion and no CONCLUSION_PLACEHOLDER
+                    f"Body text.\n\n"
+                    f"{old_conclusion}\n\n"
+                    f"{THEOREMS_APPENDIX_START}\n"
+                    f"{APPENDIX_EMPTY_PLACEHOLDER}\n"
+                    f"{THEOREMS_APPENDIX_END}\n\n"
+                    f"{PAPER_ANCHOR}"
+                )
+
+                submission = CompilerSubmission(
+                    submission_id="sub-conclusion-existing",
+                    mode="construction",
+                    content=new_conclusion,
+                    operation="replace",
+                    old_string=old_conclusion,
+                    new_string=new_conclusion,
+                    reasoning="Refresh existing conclusion.",
+                    section_complete=False,
+                )
+
+                class FakeSubmitter:  # always hands back the prepared submission
+                    async def submit_construction(self, **_kwargs):
+                        return submission
+
+                class FakeValidator:  # unconditionally accepts
+                    async def validate_submission(self, *_args, **_kwargs):
+                        return CompilerValidationResult(
+                            submission_id=submission.submission_id,
+                            decision="accept",
+                            reasoning="Accepted.",
+                            coherence_check=True,
+                            rigor_check=True,
+                            placement_check=True,
+                        )
+
+                async def fake_add_acceptance(*_args, **_kwargs):  # no-op stand-in for the acceptance log
+                    return None
+
+                coordinator_module.compiler_rejection_log.add_acceptance = fake_add_acceptance
+
+                coordinator = CompilerCoordinator()
+                coordinator.autonomous_mode = True
+                coordinator.autonomous_section_phase = "conclusion"
+                coordinator.high_context_submitter = FakeSubmitter()
+                coordinator.validator = FakeValidator()
+
+                accepted, rejection_reason = await coordinator._submit_and_validate_construction()
+
+                paper = await paper_memory.get_paper()
+                self.assertTrue(accepted)
+                self.assertIsNone(rejection_reason)
+                self.assertIn(new_conclusion, paper)
+                self.assertNotIn(old_conclusion, paper)
+                self.assertIn(THEOREMS_APPENDIX_START, paper)  # appendix markers must survive the edit
+                self.assertIn(THEOREMS_APPENDIX_END, paper)
+            finally:
+                paper_memory.file_path = old_path
+                paper_memory._initialized = old_initialized
+                paper_memory.rechunk_callback = old_rechunk_callback
+                coordinator_module.compiler_rejection_log.add_acceptance = old_add_acceptance
+
+    async def test_phase_full_content_with_placeholder_replaces_placeholder_not_whole_paper(self) -> None:
+        old_path = paper_memory.file_path  # snapshot module-level state so `finally` can restore it
+        old_initialized = paper_memory._initialized
+        old_rechunk_callback = paper_memory.rechunk_callback
+        old_add_acceptance = coordinator_module.compiler_rejection_log.add_acceptance
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                paper_memory.file_path = Path(tmpdir) / "paper.txt"  # redirect paper storage into the temp dir
+                paper_memory._initialized = True
+                paper_memory.rechunk_callback = None
+
+                new_conclusion = "\\section{Conclusion}\n\nNew conclusion."
+                await paper_memory.update_paper(  # this time the paper still holds CONCLUSION_PLACEHOLDER
+                    "Body text.\n\n"
+                    f"{CONCLUSION_PLACEHOLDER}\n\n"
+                    f"{THEOREMS_APPENDIX_START}\n"
+                    f"{APPENDIX_EMPTY_PLACEHOLDER}\n"
+                    f"{THEOREMS_APPENDIX_END}\n\n"
+                    f"{PAPER_ANCHOR}"
+                )
+
+                submission = CompilerSubmission(
+                    submission_id="sub-conclusion-full-content",
+                    mode="construction",
+                    content=new_conclusion,
+                    operation="full_content",
+                    old_string="Body text.",  # asserted below to still be present after the edit
+                    new_string=new_conclusion,
+                    reasoning="Write conclusion.",
+                    section_complete=False,
+                )
+
+                class FakeSubmitter:  # always hands back the prepared submission
+                    async def submit_construction(self, **_kwargs):
+                        return submission
+
+                class FakeValidator:  # unconditionally accepts
+                    async def validate_submission(self, *_args, **_kwargs):
+                        return CompilerValidationResult(
+                            submission_id=submission.submission_id,
+                            decision="accept",
+                            reasoning="Accepted.",
+                            coherence_check=True,
+                            rigor_check=True,
+                            placement_check=True,
+                        )
+
+                async def fake_add_acceptance(*_args, **_kwargs):  # no-op stand-in for the acceptance log
+                    return None
+
+                coordinator_module.compiler_rejection_log.add_acceptance = fake_add_acceptance
+
+                coordinator = CompilerCoordinator()
+                coordinator.autonomous_mode = True
+                coordinator.autonomous_section_phase = "conclusion"
+                coordinator.high_context_submitter = FakeSubmitter()
+                coordinator.validator = FakeValidator()
+
+                accepted, rejection_reason = await coordinator._submit_and_validate_construction()
+
+                paper = await paper_memory.get_paper()
+                self.assertTrue(accepted)
+                self.assertIsNone(rejection_reason)
+                self.assertIn("Body text.", paper)  # body must not be overwritten by the full_content operation
+                self.assertIn(new_conclusion, paper)
+                self.assertNotIn(CONCLUSION_PLACEHOLDER, paper)
+                self.assertIn(THEOREMS_APPENDIX_START, paper)
+                self.assertIn(THEOREMS_APPENDIX_END, paper)
+            finally:
+                paper_memory.file_path = old_path
+                paper_memory._initialized = old_initialized
+                paper_memory.rechunk_callback = old_rechunk_callback
+                coordinator_module.compiler_rejection_log.add_acceptance = old_add_acceptance
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_compiler_wolfram_tracking.py b/tests/test_compiler_wolfram_tracking.py
new file mode 100644
index 0000000..febe929
--- /dev/null
+++ b/tests/test_compiler_wolfram_tracking.py
@@ -0,0 +1,51 @@
+import unittest
+
+from backend.autonomous.memory.paper_model_tracker import PaperModelTracker
+from backend.compiler.core.compiler_coordinator import CompilerCoordinator
+from backend.shared.models import CompilerSubmission
+
+
+def _submission_with_wolfram_calls() -> CompilerSubmission:
+    # Fixture: a construction submission whose metadata records two Wolfram calls.
+    wolfram_calls = [
+        {"query": "2+2", "result": "4"},
+        {"query": "integrate x", "result": "x^2/2"},
+    ]
+    return CompilerSubmission(
+        submission_id="sub-wolfram",
+        mode="construction",
+        content="content",
+        operation="full_content",
+        old_string="",
+        new_string="content",
+        reasoning="accepted construction",
+        metadata={"wolfram_calls": wolfram_calls},
+    )
+
+
+class CompilerWolframTrackingTests(unittest.TestCase):  # which tracker receives a submission's wolfram_calls
+    def test_manual_mode_tracks_accepted_wolfram_calls(self) -> None:
+        coordinator = CompilerCoordinator()
+        tracker = PaperModelTracker(user_prompt="prompt", paper_title="paper")
+        coordinator._paper_model_tracker = tracker
+
+        coordinator._track_submission_wolfram_calls(_submission_with_wolfram_calls())
+
+        self.assertEqual(tracker.get_wolfram_call_count(), 2)  # the fixture submission carries two calls
+
+    def test_autonomous_mode_tracks_on_current_paper_tracker(self) -> None:
+        coordinator = CompilerCoordinator()
+        coordinator.enable_autonomous_mode()
+        manual_tracker = PaperModelTracker(user_prompt="manual", paper_title="manual")
+        autonomous_tracker = PaperModelTracker(user_prompt="auto", paper_title="auto")
+        coordinator._paper_model_tracker = manual_tracker
+        coordinator._current_paper_tracker = autonomous_tracker
+
+        coordinator._track_submission_wolfram_calls(_submission_with_wolfram_calls())
+
+        self.assertEqual(manual_tracker.get_wolfram_call_count(), 0)  # manual tracker must stay untouched
+        self.assertEqual(autonomous_tracker.get_wolfram_call_count(), 2)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_lean4_client.py b/tests/test_lean4_client.py
new file mode 100644
index 0000000..d5b97ac
--- /dev/null
+++ b/tests/test_lean4_client.py
@@ -0,0 +1,142 @@
+import asyncio
+import tempfile
+import unittest
+from pathlib import Path
+
+from backend.shared.lean4_client import (
+    Lean4Client,
+    _deduplicate_leading_import,
+    _strip_markdown_fences,
+)
+
+
+class Lean4ClientWorkspaceTests(unittest.IsolatedAsyncioTestCase):  # ensure_workspace() with _run_process replaced by a fake
+    async def test_cache_fetch_retries_after_removing_failed_ltar_archive(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            root = Path(tmpdir)
+            workspace = root / "workspace"
+            mathlib_pkg = workspace / ".lake" / "packages" / "mathlib"
+            mathlib_pkg.mkdir(parents=True)
+            lake_path = root / "lake.exe"  # empty placeholder file next to the (nonexistent) lean.exe path
+            lake_path.write_text("", encoding="utf-8")
+
+            failed_archive = root / ".cache" / "mathlib" / "bad.ltar"
+            failed_archive.parent.mkdir(parents=True)
+            failed_archive.write_bytes(b"partial archive")
+
+            client = Lean4Client(lean_path=str(root / "lean.exe"), workspace_dir=str(workspace))
+            calls: list[list[str]] = []  # every argv the client tries to run, in order
+
+            async def fake_run_process(args: list[str], *, cwd: Path, timeout: int) -> tuple[int, str, str]:
+                calls.append(args)
+                if args[1:] == ["update"]:
+                    return 0, "updated", ""
+                if len(calls) == 2:  # second invocation fails and names the archive path in stderr
+                    return (
+                        101,
+                        "",
+                        f"Decompression error: leantar exited with code 101 ({failed_archive})",
+                    )
+                return 0, "cache ok", ""  # any later invocation succeeds
+
+            client._run_process = fake_run_process  # type: ignore[method-assign]
+
+            self.assertTrue(await client.ensure_workspace())
+            self.assertFalse(failed_archive.exists())  # archive named in the error must have been removed
+            self.assertEqual(
+                [call[1:] for call in calls],  # drop argv[0] (the executable) before comparing
+                [
+                    ["update"],
+                    ["exe", "cache", "get"],
+                    ["exe", "cache", "get"],
+                ],
+            )
+
+    async def test_workspace_bootstrap_is_serialized(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            root = Path(tmpdir)
+            workspace = root / "workspace"
+            (workspace / ".lake" / "packages" / "mathlib").mkdir(parents=True)
+            lake_path = root / "lake.exe"
+            lake_path.write_text("", encoding="utf-8")
+
+            client = Lean4Client(lean_path=str(root / "lean.exe"), workspace_dir=str(workspace))
+            calls: list[list[str]] = []
+
+            async def fake_run_process(args: list[str], *, cwd: Path, timeout: int) -> tuple[int, str, str]:
+                calls.append(args)
+                await asyncio.sleep(0.01)  # suspend so the two concurrent callers get a chance to interleave
+                return 0, "ok", ""
+
+            client._run_process = fake_run_process  # type: ignore[method-assign]
+
+            results = await asyncio.gather(client.ensure_workspace(), client.ensure_workspace())
+
+            self.assertEqual(results, [True, True])
+            self.assertEqual(
+                [call[1:] for call in calls],  # one update + one cache fetch in total across both callers
+                [
+                    ["update"],
+                    ["exe", "cache", "get"],
+                ],
+            )
+
+
+class Lean4ExtractionTests(unittest.IsolatedAsyncioTestCase):  # NOTE(review): no async tests here; plain TestCase may suffice — confirm
+    def _client(self) -> Lean4Client:
+        return Lean4Client(lean_path="", workspace_dir=tempfile.gettempdir())
+
+    def test_strip_markdown_fences_removes_lean_fence(self) -> None:
+        fence = "`" * 3  # three backticks, i.e. a Markdown code fence
+        code = f"{fence}lean\nimport Mathlib\ntheorem t : 1 = 1 := rfl\n{fence}"
+        result = _strip_markdown_fences(code)
+        self.assertNotIn(fence, result)
+        self.assertIn("import Mathlib", result)
+        self.assertIn("theorem t : 1 = 1 := rfl", result)
+
+    def test_strip_markdown_fences_noop_when_no_fences(self) -> None:
+        code = "import Mathlib\ntheorem t : 1 = 1 := rfl"
+        self.assertEqual(_strip_markdown_fences(code), code)
+
+    def test_deduplicate_leading_import_collapses_duplicates(self) -> None:
+        code = "import Mathlib\nimport Mathlib\ntheorem t : 1 = 1 := rfl"
+        result = _deduplicate_leading_import(code)
+        self.assertEqual(result.count("import Mathlib"), 1)
+        self.assertIn("theorem t", result)
+
+    def test_prepare_lean_code_strips_fences_and_adds_import(self) -> None:
+        client = self._client()
+        fence = "`" * 3  # three backticks, i.e. a Markdown code fence
+        code = f"{fence}\ntheorem t : 1 = 1 := rfl\n{fence}"  # input has no import line of its own
+        prepared = client._prepare_lean_code(code)
+        self.assertNotIn(fence, prepared)
+        self.assertTrue(prepared.startswith("import Mathlib"))
+        self.assertIn("theorem t : 1 = 1 := rfl", prepared)
+
+    def test_has_no_goals_diagnostic_detects_error(self) -> None:
+        self.assertTrue(
+            Lean4Client._has_no_goals_diagnostic(
+                "file.lean:43:9: error: No goals to be solved"
+            )
+        )
+        self.assertFalse(
+            Lean4Client._has_no_goals_diagnostic(
+                "file.lean:10:3: error: unknown identifier 'foo'"
+            )
+        )
+
+    def test_annotate_no_goals_hint_prepends_hint_once(self) -> None:
+        raw = "file.lean:43:9: error: No goals to be solved"
+        annotated = Lean4Client._annotate_no_goals_hint(raw)
+        self.assertIn("HINT:", annotated)
+        self.assertIn("no goals to be solved", annotated.lower())  # original diagnostic text is kept (case-insensitive)
+        annotated_twice = Lean4Client._annotate_no_goals_hint(annotated)
+        self.assertEqual(annotated_twice.count("HINT:"), 1)  # re-annotating must not add a second hint
+
+    def test_annotate_no_goals_hint_skips_unrelated_error(self) -> None:
+        raw = "file.lean:10:3: error: unknown identifier 'foo'"
+        self.assertEqual(Lean4Client._annotate_no_goals_hint(raw), raw)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_moto_launcher.py b/tests/test_moto_launcher.py
new file mode 100644
index 0000000..3408cdd
--- /dev/null
+++ b/tests/test_moto_launcher.py
@@ -0,0 +1,263 @@
+import os
+from pathlib import Path
+import tempfile
+import unittest
+from unittest import mock
+
+import moto_launcher
+
+
+class ResolveInstanceRuntimeTests(unittest.TestCase):  # resolve_instance_runtime() with env, last record and port probe mocked
+    def test_defaults_free_uses_default_instance(self) -> None:
+        with mock.patch.dict(os.environ, {}, clear=True):  # clear=True: run with an empty environment
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=None):
+                with mock.patch.object(moto_launcher, "port_in_use", return_value=False):
+                    runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.instance_id, "default")
+        self.assertEqual(runtime.backend_port, 8000)
+        self.assertEqual(runtime.frontend_port, 5173)
+        self.assertTrue(runtime.is_default)
+        self.assertFalse(runtime.explicit_override)
+        self.assertIsNone(runtime.secret_namespace)
+        self.assertTrue(runtime.data_root.endswith("backend\\data") or runtime.data_root.endswith("backend/data"))  # either separator
+        self.assertTrue(runtime.log_root.endswith("backend\\logs") or runtime.log_root.endswith("backend/logs"))
+
+    def test_occupied_defaults_allocate_isolated_instance(self) -> None:
+        def fake_port_in_use(port: int) -> bool:  # only the two default ports report busy
+            return port in {8000, 5173}
+
+        with mock.patch.dict(os.environ, {}, clear=True):
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=None):
+                with mock.patch.object(moto_launcher, "port_in_use", side_effect=fake_port_in_use):
+                    with mock.patch.object(moto_launcher, "new_instance_id", return_value="instance_test_1234"):
+                        runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.instance_id, "instance_test_1234")
+        self.assertEqual(runtime.backend_port, 8001)
+        self.assertEqual(runtime.frontend_port, 5174)
+        self.assertFalse(runtime.is_default)
+        self.assertIn(".moto_instances", runtime.data_root)
+        self.assertIn("instance_test_1234", runtime.data_root)
+        self.assertIn(".moto_instances", runtime.log_root)
+        self.assertEqual(runtime.secret_namespace, "instance_test_1234")
+        self.assertEqual(runtime.storage_prefix, "instance_test_1234")
+        self.assertFalse(runtime.explicit_override)
+
+    def test_last_record_default_is_reused_when_ports_busy(self) -> None:
+        """
+        Regression test for the 1/3-startup keyring namespace drift bug.
+
+        Previous behaviour: a fresh "default" launch never recorded itself,
+        so if the second launch found the default ports busy (Windows
+        TIME_WAIT is extremely common for this), the launcher would mint a
+        brand-new timestamped instance_id with a brand-new keyring service
+        name, and the OpenRouter/Wolfram keys would look like they had
+        disappeared. Now a recorded "default" identity is reused even when
+        the default ports are temporarily occupied — only the ports change.
+        """
+        def fake_port_in_use(port: int) -> bool:  # only the two default ports report busy
+            return port in {8000, 5173}
+
+        saved_record = {
+            "instance_id": "default",
+            "data_root": None,
+            "log_root": None,
+            "secret_namespace": None,
+            "storage_prefix": None,
+        }
+        with mock.patch.dict(os.environ, {}, clear=True):
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=saved_record):
+                with mock.patch.object(moto_launcher, "cleanup_launcher_state", return_value=[]):  # no live instances reported
+                    with mock.patch.object(moto_launcher, "port_in_use", side_effect=fake_port_in_use):
+                        runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.instance_id, "default")
+        self.assertTrue(runtime.is_default)
+        # The saved default namespace has None → keyring service name keeps
+        # its legacy, suffix-free form so previously-saved keys stay visible.
+        self.assertIsNone(runtime.secret_namespace)
+        # Ports are allowed to shift because they are not part of the keyring
+        # namespace — stability of `secret_namespace` is all that matters.
+        self.assertNotEqual(runtime.backend_port, 8000)
+        self.assertNotEqual(runtime.frontend_port, 5173)
+
+    def test_last_record_isolated_instance_is_reused_even_when_default_ports_are_free(self) -> None:
+        """A prior isolated launch must keep its namespace even when default ports become free."""
+        saved_record = {
+            "instance_id": "instance_20260101_000000_1111",
+            "data_root": r"C:\\custom\\data",  # NOTE(review): raw string keeps both backslashes of each pair — confirm intended
+            "log_root": r"C:\\custom\\logs",
+            "secret_namespace": "instance_20260101_000000_1111",
+            "storage_prefix": "instance_20260101_000000_1111",
+        }
+        with mock.patch.dict(os.environ, {}, clear=True):
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=saved_record):
+                with mock.patch.object(moto_launcher, "cleanup_launcher_state", return_value=[]):
+                    with mock.patch.object(moto_launcher, "port_in_use", return_value=False):
+                        runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.instance_id, "instance_20260101_000000_1111")
+        self.assertFalse(runtime.is_default)
+        self.assertEqual(runtime.secret_namespace, "instance_20260101_000000_1111")
+        self.assertEqual(runtime.storage_prefix, "instance_20260101_000000_1111")
+
+    def test_live_instance_is_not_reused_to_avoid_data_root_collision(self) -> None:
+        """A recorded identity currently live in another process must be avoided."""
+        saved_record = {
+            "instance_id": "instance_20260101_000000_1111",
+            "data_root": None,
+            "log_root": None,
+            "secret_namespace": "instance_20260101_000000_1111",
+            "storage_prefix": "instance_20260101_000000_1111",
+        }
+        live_record = [{"instance_id": "instance_20260101_000000_1111"}]  # same id as saved_record, reported as live
+
+        def fake_port_in_use(port: int) -> bool:
+            return port in {8000, 5173}
+
+        with mock.patch.dict(os.environ, {}, clear=True):
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=saved_record):
+                with mock.patch.object(moto_launcher, "cleanup_launcher_state", return_value=live_record):
+                    with mock.patch.object(moto_launcher, "port_in_use", side_effect=fake_port_in_use):
+                        with mock.patch.object(moto_launcher, "new_instance_id", return_value="instance_test_freshly_minted"):
+                            runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.instance_id, "instance_test_freshly_minted")
+        self.assertNotEqual(runtime.instance_id, saved_record["instance_id"])
+        self.assertFalse(runtime.is_default)
+
+    def test_live_default_instance_is_not_recreated_when_ports_look_free(self) -> None:
+        """A live recorded default instance must block fallback to the default identity."""
+        saved_record = {
+            "instance_id": "default",
+            "data_root": None,
+            "log_root": None,
+            "secret_namespace": None,
+            "storage_prefix": None,
+        }
+        live_record = [{"instance_id": "default"}]  # the default identity is reported as live
+
+        with mock.patch.dict(os.environ, {}, clear=True):
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=saved_record):
+                with mock.patch.object(moto_launcher, "cleanup_launcher_state", return_value=live_record):
+                    with mock.patch.object(moto_launcher, "port_in_use", return_value=False):
+                        with mock.patch.object(moto_launcher, "new_instance_id", return_value="instance_safe_parallel"):
+                            runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.instance_id, "instance_safe_parallel")
+        self.assertFalse(runtime.is_default)
+        self.assertEqual(runtime.secret_namespace, "instance_safe_parallel")
+        self.assertEqual(runtime.storage_prefix, "instance_safe_parallel")
+
+    def test_explicit_override_does_not_read_last_record(self) -> None:
+        """Explicit env overrides must never be replaced by a stored record."""
+        saved_record = {
+            "instance_id": "default",
+            "data_root": None,
+            "log_root": None,
+            "secret_namespace": None,
+            "storage_prefix": None,
+        }
+        with mock.patch.dict(os.environ, {"MOTO_INSTANCE_ID": "explicit_run"}, clear=True):
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=saved_record) as loader:
+                with mock.patch.object(moto_launcher, "port_in_use", return_value=False):
+                    runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.instance_id, "explicit_run")
+        self.assertTrue(runtime.explicit_override)
+        self.assertEqual(runtime.secret_namespace, "explicit_run")
+        # We must not even consult the stored last-instance record when the
+        # caller provided explicit overrides.
+        loader.assert_not_called()
+
+
+class WindowsLauncherStrategyTests(unittest.TestCase):  # sys.platform is patched to "win32" for each test
+    def test_build_windows_service_command_prefers_path_safe_executable_name(self) -> None:
+        npm_path = r"C:\Program Files\nodejs\npm.cmd"  # absolute path containing a space
+
+        with mock.patch.object(moto_launcher.sys, "platform", "win32"):
+            with mock.patch.object(moto_launcher, "resolve_command", return_value=npm_path):
+                command = moto_launcher.build_windows_service_command(
+                    "MOTO Frontend [default]",
+                    [npm_path, "run", "dev"],
+                )
+
+        self.assertIn("npm.cmd run dev", command)  # bare executable name is used in the command string
+        self.assertNotIn(npm_path, command)  # the absolute path itself must not appear
+
+    def test_launch_windows_service_falls_back_to_direct_launch_for_unsafe_absolute_path(self) -> None:
+        tool_path = r"C:\Program Files\Custom Tools\frontend.cmd"
+        process = mock.Mock(pid=5150)
+
+        with mock.patch.object(moto_launcher.sys, "platform", "win32"):
+            with mock.patch.object(moto_launcher, "resolve_command", return_value=None):  # tool cannot be resolved by name
+                with mock.patch.object(moto_launcher.subprocess, "Popen", return_value=process) as popen:
+                    service = moto_launcher.launch_windows_service(
+                        "MOTO Frontend [default]",
+                        [tool_path, "run", "dev"],
+                        cwd=r"C:\repo",
+                        env={},
+                    )
+
+        self.assertEqual(service.mode, "window")
+        self.assertEqual(service.pid, 5150)
+        popen.assert_called_once()
+        self.assertEqual(popen.call_args.args[0], [tool_path, "run", "dev"])  # Popen got the original argv list unchanged
+
+
+class LinuxLauncherStrategyTests(unittest.TestCase):  # venv detection plus launch_service() with Popen mocked
+    def test_using_repo_local_venv_detects_repo_scoped_interpreter(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            repo_root = Path(temp_dir)
+            python_path = repo_root / ".venv" / "bin" / "python"
+            python_path.parent.mkdir(parents=True)
+            python_path.write_text("", encoding="utf-8")  # empty placeholder standing in for the interpreter
+
+            with mock.patch.object(moto_launcher, "SCRIPT_DIR", repo_root):
+                with mock.patch.object(moto_launcher, "get_python_command", return_value=str(python_path)):
+                    self.assertTrue(moto_launcher.using_repo_local_venv())
+
+    def test_launch_service_uses_linux_terminal_when_available(self) -> None:
+        process = mock.Mock(pid=3210)
+        with mock.patch.object(moto_launcher.sys, "platform", "linux"):
+            with mock.patch.object(moto_launcher, "resolve_linux_terminal", return_value=("gnome-terminal", "/usr/bin/gnome-terminal")):
+                with mock.patch.object(moto_launcher.subprocess, "Popen", return_value=process) as popen:
+                    service = moto_launcher.launch_service(
+                        title="MOTO Backend [default]",
+                        service_slug="backend",
+                        args=["python3", "-m", "uvicorn"],
+                        cwd="/tmp/project",
+                        env={},
+                        log_root="/tmp/project/logs",
+                    )
+
+        self.assertEqual(service.mode, "terminal")
+        self.assertEqual(service.pid, 3210)
+        self.assertIsNone(service.log_path)  # terminal mode reports no log file
+        popen.assert_called_once()
+
+    def test_launch_service_falls_back_to_background_when_no_linux_terminal(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            process = mock.Mock(pid=4242)
+            with mock.patch.object(moto_launcher.sys, "platform", "linux"):
+                with mock.patch.object(moto_launcher, "resolve_linux_terminal", return_value=None):  # no terminal found
+                    with mock.patch.object(moto_launcher.subprocess, "Popen", return_value=process) as popen:
+                        service = moto_launcher.launch_service(
+                            title="MOTO Backend [default]",
+                            service_slug="backend",
+                            args=["python3", "-m", "http.server"],
+                            cwd=temp_dir,
+                            env={},
+                            log_root=temp_dir,
+                        )
+
+        self.assertEqual(service.mode, "background")
+        self.assertEqual(service.pid, 4242)
+        self.assertIsNotNone(service.log_path)
+        self.assertTrue(service.log_path.endswith("launcher_backend.log"))  # log name includes the "backend" service_slug
+        popen.assert_called_once()
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_moto_updater.py b/tests/test_moto_updater.py
new file mode 100644
index 0000000..cfe67ef
--- /dev/null
+++ b/tests/test_moto_updater.py
@@ -0,0 +1,204 @@
+import json
+from pathlib import Path
+import tempfile
+import unittest
+import urllib.error
+from unittest import mock
+
+import moto_updater
+
+
+class RepoSlugTests(unittest.TestCase):
+    def test_normalize_repo_slug_handles_common_github_formats(self) -> None:
+        cases = {
+            "https://github.com/Intrafere/MOTO-Autonomous-ASI": "Intrafere/MOTO-Autonomous-ASI",
+            "https://github.com/Intrafere/MOTO-Autonomous-ASI.git": "Intrafere/MOTO-Autonomous-ASI",
+            "git@github.com:Intrafere/MOTO-Autonomous-ASI.git": "Intrafere/MOTO-Autonomous-ASI",
+            "git+https://github.com/Intrafere/MOTO-Autonomous-ASI.git": "Intrafere/MOTO-Autonomous-ASI",
+        }
+        for raw, expected in cases.items():
+            with self.subTest(raw=raw):
+                self.assertEqual(moto_updater._normalize_repo_slug(raw), expected)
+
+
+class InstallStateTests(unittest.TestCase):
+    def test_classify_zip_install_when_repo_has_no_git_metadata(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            repo_root = Path(temp_dir)
+            with mock.patch.object(moto_updater, "REPO_ROOT", repo_root):
+                with mock.patch.object(moto_updater, "_git_checkout_matches_repo", return_value=False):
+                    state = moto_updater.classify_install_state([])
+
+        self.assertEqual(state.kind, "zip_install")
+        self.assertTrue(state.can_auto_apply)
+
+    def test_classify_clean_git_clone_when_checkout_is_safe(self) -> None:
+        git_outputs = [
+            (0, "main", ""),
+            (0, "origin/main", ""),
+            (0, "", ""),
+            (0, "https://github.com/Intrafere/MOTO-Autonomous-ASI.git", ""),
+        ]
+
+        with mock.patch.object(moto_updater, "_git_checkout_matches_repo", return_value=True):
+            with mock.patch.object(moto_updater, "_official_repo_slug", return_value="Intrafere/MOTO-Autonomous-ASI"):
+                with mock.patch.object(moto_updater, "_git_output", side_effect=git_outputs):
+                    state = moto_updater.classify_install_state([])
+
+        self.assertEqual(state.kind, "clean_git_clone")
+        self.assertTrue(state.can_auto_apply)
+        self.assertEqual(state.git_branch, "main")
+        self.assertEqual(state.git_upstream, "origin/main")
+
+    def test_check_for_updates_falls_back_to_branch_head_when_manifest_missing(self) -> None:
+        local_manifest = moto_updater.BuildManifest(
+            version="1.0.7",
+            build_commit="localcommit",
+            update_channel="main",
+            api_contract_version="build5-v1",
+        )
+        fallback_manifest = moto_updater.BuildManifest(
+            version="1.0.6",
+            build_commit="remotecommit",
+            update_channel="main",
+            api_contract_version="build5-v1",
+        )
+        http_404 = urllib.error.HTTPError(
+            url="https://raw.githubusercontent.com/example/main/moto-update-manifest.json",
+            code=404,
+            msg="Not Found",
+            hdrs=None,
+            fp=None,
+        )
+
+        with mock.patch.object(moto_updater, "load_local_manifest", return_value=local_manifest):
+            with mock.patch.object(moto_updater, "cleanup_launcher_state", return_value=[]):
+                with mock.patch.object(
+                    moto_updater,
+                    "classify_install_state",
+                    return_value=moto_updater.InstallState(
+                        kind="zip_install",
+                        label="ZIP / extracted consumer install",
+                        can_auto_apply=True,
+                        reason="ZIP / extracted consumer install.",
+                    ),
+                ):
+                    with mock.patch.object(moto_updater, "fetch_remote_manifest", side_effect=http_404):
+                        with mock.patch.object(moto_updater, "fetch_branch_head_fallback", return_value=fallback_manifest):
+                            result = moto_updater.check_for_updates()
+
+        self.assertTrue(result.update_available)
+        self.assertEqual(result.metadata_source, "branch_head_fallback")
+        self.assertIsNone(result.error)
+        self.assertIsNotNone(result.warning)
+        self.assertFalse(result.can_apply_update)
+
+
+class LauncherStateTests(unittest.TestCase):
+    def test_cleanup_launcher_state_removes_dead_instances(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            state_path = Path(temp_dir) / ".moto_launcher_state.json"
+            state_path.write_text(
+                json.dumps(
+                    {
+                        "instances": [
+                            {"instance_id": "alive", "backend_window_pid": 100, "frontend_window_pid": 101},
+                            {"instance_id": "dead", "backend_window_pid": 200, "frontend_window_pid": 201},
+                        ]
+                    }
+                ),
+                encoding="utf-8",
+            )
+
+            def fake_is_pid_running(pid: int | None) -> bool:
+                return pid in {100, 101}
+
+            with mock.patch.object(moto_updater, "LAUNCHER_STATE_PATH", state_path):
+                with mock.patch.object(moto_updater, "_is_pid_running", side_effect=fake_is_pid_running):
+                    instances = moto_updater.cleanup_launcher_state()
+
+            self.assertEqual(len(instances), 1)
+            self.assertEqual(instances[0]["instance_id"], "alive")
+
+
+class SnapshotSyncTests(unittest.TestCase):
+    def test_collect_preserved_relatives_includes_explicit_instance_runtime_paths(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            repo_root = Path(temp_dir)
+            instance_data = repo_root / ".moto_instances" / "instance_alpha" / "data"
+            instance_logs = repo_root / ".moto_instances" / "instance_alpha" / "logs"
+            instance_data.mkdir(parents=True)
+            instance_logs.mkdir(parents=True)
+
+            env = {
+                "MOTO_INSTANCE_ID": "instance_alpha",
+                "MOTO_DATA_ROOT": str(instance_data),
+                "MOTO_LOG_ROOT": str(instance_logs),
+            }
+            with mock.patch.object(moto_updater, "REPO_ROOT", repo_root):
+                preserved = moto_updater.collect_preserved_relatives(env, active_instances=[])
+
+        self.assertIn(".moto_instances", preserved)
+        self.assertIn(".moto_instances/instance_alpha", preserved)
+        self.assertIn(".moto_instances/instance_alpha/data", preserved)
+        self.assertIn(".moto_instances/instance_alpha/logs", preserved)
+
+    def test_sync_snapshot_preserves_runtime_roots_and_can_restore(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            temp_root = Path(temp_dir)
+            source_root = temp_root / "source"
+            destination_root = temp_root / "destination"
+            backup_root = temp_root / "backup"
+
+            (source_root / "backend" / "data").mkdir(parents=True)
+            (source_root / "docs").mkdir(parents=True)
+            (source_root / "moto_launcher.py").write_text("new launcher\n", encoding="utf-8")
+            (source_root / "docs" / "guide.txt").write_text("new docs\n", encoding="utf-8")
+            (source_root / "backend" / "data" / "keep.txt").write_text("new data\n", encoding="utf-8")
+
+            (destination_root / "backend" / "data").mkdir(parents=True)
+            (destination_root / "docs").mkdir(parents=True)
+            (destination_root / "moto_launcher.py").write_text("old launcher\n", encoding="utf-8")
+            (destination_root / "backend" / "data" / "keep.txt").write_text("original data\n", encoding="utf-8")
+
+            journal = moto_updater.sync_snapshot_into_install(
+                source_root=source_root,
+                destination_root=destination_root,
+                preserved_relatives={"backend/data"},
+                backup_root=backup_root,
+            )
+
+            self.assertEqual((destination_root / "moto_launcher.py").read_text(encoding="utf-8"), "new launcher\n")
+            self.assertEqual((destination_root / "docs" / "guide.txt").read_text(encoding="utf-8"), "new docs\n")
+            self.assertEqual((destination_root / "backend" / "data" / "keep.txt").read_text(encoding="utf-8"), "original data\n")
+            self.assertIn("moto_launcher.py", journal.overwritten_files)
+            self.assertIn("docs/guide.txt", journal.created_files)
+
+            moto_updater.restore_snapshot_from_backup(destination_root, backup_root, journal)
+
+            self.assertEqual((destination_root / "moto_launcher.py").read_text(encoding="utf-8"), "old launcher\n")
+            self.assertFalse((destination_root / "docs" / "guide.txt").exists())
+            self.assertEqual((destination_root / "backend" / "data" / "keep.txt").read_text(encoding="utf-8"), "original data\n")
+
+
+class RelaunchCommandTests(unittest.TestCase):
+    def test_build_relaunch_command_prefers_linux_entrypoint_when_provided(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            entrypoint = Path(temp_dir) / "Launch MOTO.sh"
+            entrypoint.write_text("#!/usr/bin/env bash\n", encoding="utf-8")
+
+            command = moto_updater._build_relaunch_command(
+                {moto_updater.LAUNCHER_ENTRYPOINT_ENV: str(entrypoint)}
+            )
+
+        self.assertEqual(command, ["bash", str(entrypoint.resolve())])
+
+    def test_build_relaunch_command_falls_back_to_python_launcher(self) -> None:
+        command = moto_updater._build_relaunch_command({})
+
+        self.assertEqual(command[0], moto_updater.sys.executable)
+        self.assertTrue(command[1].endswith("moto_launcher.py"))
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_paper_memory_appendix.py b/tests/test_paper_memory_appendix.py
new file mode 100644
index 0000000..d9cf2ef
--- /dev/null
+++ b/tests/test_paper_memory_appendix.py
@@ -0,0 +1,78 @@
+import tempfile
+import unittest
+from pathlib import Path
+
+from backend.compiler.memory.paper_memory import (
+    APPENDIX_EMPTY_PLACEHOLDER,
+    ABSTRACT_PLACEHOLDER,
+    CONCLUSION_PLACEHOLDER,
+    INTRO_PLACEHOLDER,
+    PAPER_ANCHOR,
+    THEOREMS_APPENDIX_END,
+    THEOREMS_APPENDIX_START,
+    PaperMemory,
+)
+from backend.shared.config import system_config
+
+
+class PaperMemoryAppendixTests(unittest.IsolatedAsyncioTestCase):
+    async def test_appendix_entries_replace_placeholder_and_append_in_order(self) -> None:
+        old_paper_file = system_config.compiler_paper_file
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.compiler_paper_file = str(Path(tmpdir) / "paper.txt")
+                memory = PaperMemory()
+                await memory.initialize()
+                await memory.initialize_with_placeholders("II. Body\n\nBody text.")
+
+                first = "### Theorem A\nVerified with Lean 4.\n```lean\ntheorem a : True := by trivial\n```"
+                second = "### Theorem B\nVerified with Lean 4.\n```lean\ntheorem b : True := by trivial\n```"
+
+                self.assertTrue(await memory.append_to_theorems_appendix(first))
+                self.assertTrue(await memory.append_to_theorems_appendix(second))
+
+                paper = await memory.get_paper()
+                self.assertIn(THEOREMS_APPENDIX_START, paper)
+                self.assertIn(THEOREMS_APPENDIX_END, paper)
+                self.assertIn(first, paper)
+                self.assertIn(second, paper)
+                self.assertNotIn(APPENDIX_EMPTY_PLACEHOLDER, paper)
+                self.assertLess(paper.index(first), paper.index(second))
+                self.assertTrue(paper.rstrip().endswith(PAPER_ANCHOR))
+            finally:
+                system_config.compiler_paper_file = old_paper_file
+
+    async def test_latex_conclusion_content_removes_stale_placeholder(self) -> None:
+        old_paper_file = system_config.compiler_paper_file
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.compiler_paper_file = str(Path(tmpdir) / "paper.txt")
+                memory = PaperMemory()
+                await memory.initialize()
+
+                conclusion = "This is real conclusion content. " * 20
+                await memory.update_paper(
+                    f"{ABSTRACT_PLACEHOLDER}\n\n"
+                    f"{INTRO_PLACEHOLDER}\n\n"
+                    "\\section{Preliminaries}\n\nBody text.\n\n"
+                    f"\\section{{Conclusion}}\n\n{conclusion}\n\n"
+                    f"{CONCLUSION_PLACEHOLDER}\n\n"
+                    f"{THEOREMS_APPENDIX_START}\n"
+                    f"{APPENDIX_EMPTY_PLACEHOLDER}\n"
+                    f"{THEOREMS_APPENDIX_END}\n\n"
+                    f"{PAPER_ANCHOR}"
+                )
+
+                self.assertTrue(await memory.ensure_placeholders_exist())
+
+                paper = await memory.get_paper()
+                self.assertIn("\\section{Conclusion}", paper)
+                self.assertNotIn(CONCLUSION_PLACEHOLDER, paper)
+                self.assertIn(ABSTRACT_PLACEHOLDER, paper)
+                self.assertIn(INTRO_PLACEHOLDER, paper)
+            finally:
+                system_config.compiler_paper_file = old_paper_file
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_rigor_lean_placement_validator.py b/tests/test_rigor_lean_placement_validator.py
new file mode 100644
index 0000000..411d69f
--- /dev/null
+++ b/tests/test_rigor_lean_placement_validator.py
@@ -0,0 +1,76 @@
+import json
+import unittest
+
+from backend.compiler.validation import compiler_validator as validator_module
+from backend.compiler.validation.compiler_validator import CompilerValidator
+from backend.shared.models import CompilerSubmission
+
+
+class LeanPlacementValidatorTests(unittest.IsolatedAsyncioTestCase):
+    async def test_lean_placement_prompt_and_forced_rigor_check(self) -> None:
+        validator = CompilerValidator(model_name="test-model", user_prompt="Write a paper.")
+        submission = CompilerSubmission(
+            submission_id="sub-lean-placement",
+            mode="rigor",
+            content="Anchor paragraph.\n\nTheorem text. Verified with Lean 4.",
+            operation="insert_after",
+            old_string="Anchor paragraph.",
+            new_string="Theorem text. Verified with Lean 4.",
+            reasoning="Place the theorem after the anchor.",
+            metadata={
+                "rigor_mode": "lean_placement",
+                "theorem_statement": "theorem t : True",
+                "lean_code": "theorem t : True := by trivial",
+                "placement_attempt": 1,
+            },
+        )
+
+        captured_prompt = {}
+
+        async def fake_ensure_markers_intact() -> bool:
+            return False
+
+        async def fake_generate_completion(**kwargs):
+            captured_prompt["text"] = kwargs["messages"][0]["content"]
+            return {
+                "choices": [
+                    {
+                        "message": {
+                            "content": json.dumps(
+                                {
+                                    "decision": "reject",
+                                    "reasoning": "Placement needs a better narrative bridge.",
+                                    "coherence_check": True,
+                                    "rigor_check": False,
+                                    "placement_check": False,
+                                }
+                            )
+                        }
+                    }
+                ]
+            }
+
+        original_ensure = validator_module.paper_memory.ensure_markers_intact
+        original_generate = validator_module.api_client_manager.generate_completion
+        try:
+            validator_module.paper_memory.ensure_markers_intact = fake_ensure_markers_intact
+            validator_module.api_client_manager.generate_completion = fake_generate_completion
+
+            result = await validator.validate_submission(
+                submission,
+                current_paper="Anchor paragraph.\n",
+                current_outline="I. Outline",
+            )
+        finally:
+            validator_module.paper_memory.ensure_markers_intact = original_ensure
+            validator_module.api_client_manager.generate_completion = original_generate
+
+        self.assertEqual(result.decision, "reject")
+        self.assertTrue(result.rigor_check)
+        self.assertFalse(result.placement_check)
+        self.assertIn("Lean 4 Verified Theorem Placement", captured_prompt["text"])
+        self.assertIn("MUST NOT re-evaluate", captured_prompt["text"])
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_wolfram_tool_loop.py b/tests/test_wolfram_tool_loop.py
new file mode 100644
index 0000000..e253cc9
--- /dev/null
+++ b/tests/test_wolfram_tool_loop.py
@@ -0,0 +1,122 @@
+import json
+import unittest
+
+from backend.compiler.agents import high_context_submitter as submitter_module
+from backend.compiler.agents.high_context_submitter import HighContextSubmitter
+from backend.shared import wolfram_alpha_client as wolfram_module
+
+
+class FakeWolframClient:
+    def __init__(self) -> None:
+        self.queries: list[str] = []
+
+    async def query(self, query: str) -> str:
+        self.queries.append(query)
+        return f"result for {query}"
+
+
+def _tool_call(call_id: str, query: str) -> dict:
+    return {
+        "id": call_id,
+        "type": "function",
+        "function": {
+            "name": "wolfram_alpha_query",
+            "arguments": json.dumps({"query": query, "purpose": "test"}),
+        },
+    }
+
+
+class WolframToolLoopTests(unittest.IsolatedAsyncioTestCase):
+    async def test_tool_loop_executes_query_and_returns_final_json(self) -> None:
+        submitter = HighContextSubmitter(model_name="test-model", user_prompt="Write.")
+        fake_client = FakeWolframClient()
+        broadcasts = []
+
+        async def broadcaster(event: str, data: dict) -> None:
+            broadcasts.append((event, data))
+
+        submitter.websocket_broadcaster = broadcaster
+        responses = [
+            {"choices": [{"message": {"content": "", "tool_calls": [_tool_call("call-1", "2+2")]}}]},
+            {"choices": [{"message": {"content": '{"needs_construction": false}'}}]},
+        ]
+        calls = []
+
+        async def fake_generate_completion(**kwargs):
+            calls.append(kwargs)
+            return responses.pop(0)
+
+        original_available = submitter_module._wolfram_tool_available
+        original_get_client = wolfram_module.get_wolfram_client
+        original_generate = submitter_module.api_client_manager.generate_completion
+        try:
+            submitter_module._wolfram_tool_available = lambda: True
+            wolfram_module.get_wolfram_client = lambda: fake_client
+            submitter_module.api_client_manager.generate_completion = fake_generate_completion
+
+            content, wolfram_calls, _message = await submitter._generate_completion_with_wolfram_tool(
+                task_id="task-1",
+                initial_prompt="prompt",
+            )
+        finally:
+            submitter_module._wolfram_tool_available = original_available
+            wolfram_module.get_wolfram_client = original_get_client
+            submitter_module.api_client_manager.generate_completion = original_generate
+
+        self.assertEqual(content, '{"needs_construction": false}')
+        self.assertEqual(fake_client.queries, ["2+2"])
+        self.assertEqual(wolfram_calls[0]["query"], "2+2")
+        self.assertIsNotNone(calls[0]["tools"])
+        self.assertEqual(calls[1]["messages"][-1]["role"], "tool")
+        self.assertEqual(broadcasts[0][0], "compiler_wolfram_call")
+
+    async def test_single_turn_multiple_tool_calls_cannot_exceed_budget(self) -> None:
+        submitter = HighContextSubmitter(model_name="test-model", user_prompt="Write.")
+        fake_client = FakeWolframClient()
+        responses = [
+            {
+                "choices": [
+                    {
+                        "message": {
+                            "content": "",
+                            "tool_calls": [
+                                _tool_call("call-1", "1+1"),
+                                _tool_call("call-2", "2+2"),
+                                _tool_call("call-3", "3+3"),
+                            ],
+                        }
+                    }
+                ]
+            },
+            {"choices": [{"message": {"content": '{"needs_construction": false}'}}]},
+        ]
+
+        async def fake_generate_completion(**kwargs):
+            return responses.pop(0)
+
+        original_available = submitter_module._wolfram_tool_available
+        original_get_client = wolfram_module.get_wolfram_client
+        original_generate = submitter_module.api_client_manager.generate_completion
+        original_budget = submitter_module.WOLFRAM_MAX_CALLS_PER_SUBMISSION
+        try:
+            submitter_module._wolfram_tool_available = lambda: True
+            wolfram_module.get_wolfram_client = lambda: fake_client
+            submitter_module.api_client_manager.generate_completion = fake_generate_completion
+            submitter_module.WOLFRAM_MAX_CALLS_PER_SUBMISSION = 2
+
+            _content, wolfram_calls, _message = await submitter._generate_completion_with_wolfram_tool(
+                task_id="task-2",
+                initial_prompt="prompt",
+            )
+        finally:
+            submitter_module._wolfram_tool_available = original_available
+            wolfram_module.get_wolfram_client = original_get_client
+            submitter_module.api_client_manager.generate_completion = original_generate
+            submitter_module.WOLFRAM_MAX_CALLS_PER_SUBMISSION = original_budget
+
+        self.assertEqual(fake_client.queries, ["1+1", "2+2"])
+        self.assertEqual(len(wolfram_calls), 2)
+
+
+if __name__ == "__main__":
+    unittest.main()

From 2d0d964d88fab168ed683235f5ff32d02867bb55 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Thu, 30 Apr 2026 18:41:42 -0500
Subject: [PATCH 08/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed the LM Studio "offline" status bug in the GUI, which showed LM Studio as offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UIX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 README.md | 21 +++++++++++----------
 1 file changed, 11 insertions(+), 10 deletions(-)

diff --git a/README.md b/README.md
index f53fc18..1dcea78 100644
--- a/README.md
+++ b/README.md
@@ -6,7 +6,7 @@
 [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
 [![Node.js 16+](https://img.shields.io/badge/node-16+-green.svg)](https://nodejs.org/)
 
-**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assists in decyphering how we explore AI weights, a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. This exact versin of MOTO is customized to be useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
+**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers — and the machine-checked theorem proving programming language Lean 4 proofs alongside them for definitive mathematical confirmation of correctness. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assists in deciphering how we explore AI weights, a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. Additionally, MOTO ships an optional automated theorem generation pipeline that formalizes candidate theorems and lemmas in Lean 4 (with optional Z3/SMT hinting and Mathlib lemma search) and only stores proofs that Lean 4 accepts as genuinely verified. This exact version of MOTO is customized to be useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
 
 ### The Core Discovery: Top-P Exploration 
 
@@ -18,9 +18,9 @@ The brainstorming phase runs **multiple submitters in parallel**, each independe
 
 Once a brainstorm is sufficiently explored, MOTO writes a research paper from it. This step then repeats — papers become a new "Tier 2" brainstorm. Previous papers are referenced in future brainstorms and future papers. This set of Tier 2 papers is another higher-order brainstorm-like database, which also self-prunes newly discovered incorrect or redundant papers just like the Tier 1 short-hand idea brainstorm does. A third tier generates the final answer, capable of producing book-length volumes.
 
-MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its long-form synthesis mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models over 131,000 token context limits, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is a research prototype; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
+MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its long-form synthesis mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models that have context limits over 131,000 tokens, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is a research prototype; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
 
-Give the program a try, MOTO is as cool as it sounds - Windows has a one-click launcher and Ubuntu 24.04 now has a repo-root launcher too. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green "< > Code" drop-down menu on the top right of this GitHub page and download the zip file. On Windows, extract it to your desktop and double-click `Click To Launch MOTO.bat`. On Ubuntu 24.04, extract it and run `bash "Launch MOTO.sh"`. Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), select your agents in the settings profile - if desired and you are unsure you may use the preselected "fastest" profile.
+Give the program a try — MOTO is as cool as it sounds. Windows has a one-click launcher and Ubuntu 24.04 now has a repo-root launcher too. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green "< > Code" drop-down menu on the top right of this GitHub page and download the zip file. On Windows, extract it to your desktop and double-click `Click To Launch MOTO.bat`. On Ubuntu 24.04, extract it and run `bash "Launch MOTO.sh"`. Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), select your agents in the settings profile - if desired and you are unsure you may use the preselected "fastest" profile.
 
 ***Now you are set up and every time you press launch your home lab is ready for your prompt!*** **Give MOTO the toughest question you can think of and press start to begin YOUR creations!**
 
@@ -30,12 +30,12 @@ Give the program a try, MOTO is as cool as it sounds - Windows has a one-click l
 
 ## Outline of "MOTO - S.T.E.M. Mathematics Variant"
 
-MOTO (Multi-Output Token Orchestrator) is a high-risk high-reward (novelty seeking AI) mathematics researcher designed to run for days at a time after pressing start without user interaction. This program can support multiple simultaneous models working in parallel from either local host LM Studio, OpenRouter API key, or both.
+MOTO (Multi-Output Token Orchestrator) is a high-risk high-reward (novelty seeking AI) mathematics researcher designed to run for days at a time after you press start, without user interaction. This program can support multiple simultaneous models working in parallel from either local host LM Studio, OpenRouter API key, or both.
 
 ### Key Features
 
 - 🤖 **Autonomous Topic Selection, Brainstorming, and Paper Generation**: AI chooses research avenues based on high-level goals and produces you a final answer with ZERO extra user input. Let MOTO run for days using the best models without touching it, or for a few hours using a faster draft model. How deep you research and how long it takes is left up to you, the user.
-- **OpenRouter Integration**: Supports both local (LM Studio) and cloud (OpenRouter) models. Use your local LM Studio models run offline from your computer or add your OpenRouter API key to compete and team up 3rd party models from the largest closed source LLMs like ChatGPT, Claude, DeepSeek, Gemini and Perplexity
+- **OpenRouter Integration**: Supports both local (LM Studio) and cloud (OpenRouter) models. Run your local LM Studio models offline from your computer, or add your OpenRouter API key to compete and team up with 3rd-party models from the largest closed-source LLMs like ChatGPT, Claude, DeepSeek, Gemini, and Perplexity.
 
 ---
 
@@ -49,8 +49,8 @@ Before installation, you need:
    - ⚠️ **IMPORTANT**: Check "Add Python to PATH" during installation
 2. **Node.js 16+** - [Download here](https://nodejs.org/)
 3. **LM Studio** (optional but HIGHLY recommended - otherwise your system will need to pay OpenRouter for RAG embedding calls, which is very slow compared to LM Studio's local embeddings) - [Download here](https://lmstudio.ai/)
-   - If using OpenRouter, then download and load at least one model (e.g., DeepSeek, Llama, Qwen - older models and some models below 12 billion parameters may struggle, however it is always worth a try!)
-   - **Load the LM Studio RAG agent [optional but HIGHLY recommended for much faster outputs/answers]**: Load the embedding model `nomic-ai/nomic-embed-text-v1.5` in your LM Studio "Developer" tab (server tab) (search for "nomic-ai/nomic-embed-text-v1.5" to download it in the LM Studio downloads center). Please note: you may need to enable "Power User" or "Developer" to see this developer tab - this server will let you load the amount and capacity of simultaneous models that your PC will support. In this developer tab is where you load both your nomic-ai embedding agent and any optional local hosted agents you want to use in the program (I.e. GPT OSS 20b, DeepSeek 32B, etc). **If you do not download LM Studio and enable the Nomic agent the system will run much slower and cost slightly more due to having to use the paid service OpenRouter for RAG calls.**
+   - If using OpenRouter, then download and load at least one model (e.g., DeepSeek, Llama, Qwen - older models and some models below 12 billion parameters may struggle; however, it is always worth a try!)
+   - **Load the LM Studio RAG agent [optional but HIGHLY recommended for much faster outputs/answers]**: Load the embedding model `nomic-ai/nomic-embed-text-v1.5` in your LM Studio "Developer" tab (server tab) (search for "nomic-ai/nomic-embed-text-v1.5" to download it in the LM Studio downloads center). Please note: you may need to enable "Power User" or "Developer" to see this developer tab - this server will let you load the amount and capacity of simultaneous models that your PC will support. In this developer tab is where you load both your nomic-ai embedding agent and any optional local hosted agents you want to use in the program (e.g., GPT OSS 20b, DeepSeek 32B, etc.). **If you do not download LM Studio and enable the Nomic agent the system will run much slower and cost slightly more due to having to use the paid service OpenRouter for RAG calls.**
    - Start the local server (port 1234)
 4. **If using cloud AI - Get an OpenRouter API key**: Sign up at OpenRouter.ai and get a paid or free API key to use the most powerful cloud models available from your favorite providers. OpenRouter may also offer a certain amount of free API calls per day with your account key. When you download the MOTO deep research harness, you can see which models are free by checking the "show only free models" check box(es) in the MOTO app settings.
 5. **On first startup, pick your provider path**: After you acknowledge the disclaimer, MOTO will prompt you to either enter an OpenRouter key or confirm that LM Studio is running. If you save an OpenRouter key there, the recommended default autonomous profile is applied immediately so you can open Settings and see it already selected.
@@ -271,7 +271,7 @@ All configurable per role:
 - Review validator reasoning in logs
 - Ensure prompt is clear and specific
 - Use larger models for better results
-- View the learning curve analysis on the Intrafere.com website and ensure you are not just at a learning curve wall - 100s of rejections in a row before the first acceptance in the brainstorming session can be common.
+- View the learning curve analysis on the Intrafere.com website and ensure you are not just at a learning curve wall - hundreds of rejections in a row before the first acceptance in the brainstorming session can be common.
 
 **System running slow**
 - Use faster/smaller models
@@ -291,10 +291,11 @@ All configurable per role:
 - Check logs for detailed token usage
 
 **JSON and output errors**
-- Monitor your model(s) output(s) occasionally to see if it's stuck in output loops and is repeatedly utilizing its entire output token budget - this is a sign the model runtime instance from either LM Studio or OpenRouter has corrupted. If this is the case you will either need to switch OpenRouter hosts for that model, switch models, or if using LM Studio you must unload and reload the model. However if this happens once, it is likely to happen again so you should either try to switch hosts (if using OpenRouter), switch runtime engines (if using LM Studio), or switch models entirely as some models may be more vulnerable to this than others. This issue does not appear to be related to the MOTO harness and the MOTO developers have no control over this deterministic model-loop corruption state. The repetitive nature of the harness appears to stress certain engines, for example when using AMD compatible engines, ROCm *may* have more instabilities than Vulkan as of 1/11/2026. This is an odd bug and it is unclear if this is related to the 3rd party runtime engine's K/V caching mechanism or some other feature of the code. If you find any information on this bug please submit it to GitHub.
+- Monitor your model(s) output(s) occasionally to see if it's stuck in output loops and is repeatedly utilizing its entire output token budget - this is a sign the model runtime instance from either LM Studio or OpenRouter has corrupted. If this is the case, you will either need to switch OpenRouter hosts for that model, switch models, or (if using LM Studio) unload and reload the model. However, if this happens once, it is likely to happen again, so you should either try to switch hosts (if using OpenRouter), switch runtime engines (if using LM Studio), or switch models entirely, as some models may be more vulnerable to this than others. This issue does not appear to be related to the MOTO harness, and the MOTO developers have no control over this deterministic model-loop corruption state. The repetitive nature of the harness appears to stress certain engines; for example, when using AMD-compatible engines, ROCm *may* have more instabilities than Vulkan as of 1/11/2026. This is an odd bug, and it is unclear whether it is related to the 3rd-party runtime engine's KV caching mechanism or some other feature of the code. If you find any information on this bug, please submit it to GitHub.
 
 **JSON truncation errors**
-- Ensure you are not experiencing the output error looping mentioned above that some LLM runtime engines seem to experience. If your JSON truncation is not a result of looping then you should try increasing your model's max output tokens. It is highly likely that your model was truncated because you did not set enough output tokens (20% or more of your token budget being allotted for token output is standard practice, longer thinking models like DeepSeek V3.2 Speciale may require much larger splits such as (164K total tokens, 64K reserved for output tokens), however most models function great closer to the 20% output budget mark.
+- Ensure you are not experiencing the output error looping mentioned above that some LLM runtime engines seem to experience. If your JSON truncation is not a result of looping, then you should try increasing your model's max output tokens. It is highly likely that your model was truncated because you did not set enough output tokens. Allotting 20% or more of your token budget for token output is standard practice. Longer-thinking models like DeepSeek V3.2 Speciale may require much larger splits, such as 164K total tokens with 64K reserved for output tokens; however, most models function great closer to the 20% output budget mark.
+
 ---
 
 ## 📚 Documentation

From 023170095e570078962be335ed34f8eed04e9124 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Thu, 30 Apr 2026 19:33:04 -0500
Subject: [PATCH 09/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed the LM Studio "offline" status bug in the GUI, which showed LM Studio as offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 README.md           | 14 ++++++++++++++
 backend/api/main.py | 14 ++++++++++----
 2 files changed, 24 insertions(+), 4 deletions(-)

diff --git a/README.md b/README.md
index 1dcea78..dd9d7de 100644
--- a/README.md
+++ b/README.md
@@ -20,6 +20,19 @@ Once a brainstorm is sufficiently explored, MOTO writes a research paper from it
 
 MOTO may produce many brilliant papers as it runs; these intermediate papers are answers that rival traditional paid cloud deep research. As the user, observe MOTO as often or as little as you'd like — skip its autonomy and force it into final answer generation, or stop it early and select one of its highly creative pre-final answer papers. If the operator allows, let MOTO run for many hours and produce a final answer from its long-form synthesis mode. MOTO autonomously decides whether to output a short-form answer or collect existing papers into a long-form academic volume. With models that have context limits over 131,000 tokens, the harness easily produces final volumes exceeding 40,000 words autonomously. The built-in "critique" feature allows the user to direct-inject the full volume into nearly any AI model of their choice for evaluation. MOTO writes papers in reverse order — body first, conclusion second, introduction last — to avoid constraining the creative process with premature structural commitments. MOTO is a research prototype; the AI(s) are producing this content partially unguided and all papers should be judged with extreme scrutiny.
 
+### Secondary Feature: Automated Theorem Generation with Lean 4 Verification
+
+Paired with Top-P Exploration — and secondary to it — MOTO ships an **optional automated theorem generation pipeline** that turns the autonomous brainstorm and paper stream into **machine-checked Lean 4 proofs**. When `lean4_enabled` is on, the coordinator first runs a one-shot *proof-framing gate* to decide whether the user's prompt is proof-amenable; if it is, every subsequent brainstorm and paper becomes a candidate source for formalization. After each completed brainstorm (Tier 1) and each completed paper (Tier 2 / Tier 3 chapter), a dedicated proof stage runs:
+
+1. **Candidate identification** — an LLM agent extracts theorem/lemma candidates from the brainstorm or paper.
+2. **Mathlib lemma search** — a second agent surfaces relevant existing Mathlib lemmas and threads them into the formalization prompt.
+3. **Optional Z3/SMT early-exit** — when `smt_enabled`, an external Z3 binary classifies candidates conservatively; successful SMT results become Lean tactic hints (`nativeDecide` / `omega` / `decide`-style) — **never** standalone proofs.
+4. **Lean 4 formalization** — a two-phase retry loop (up to 3 full-proof attempts + 2 multi-tactic script attempts, 5 total per candidate), with prior failure hints direct-injected on each retry. Per-candidate work runs concurrently bounded by `proof_max_parallel_candidates`.
+5. **Novelty check** — verified proofs are compared against the existing proof library and classified as novel or known.
+6. **Storage + feedback** — `proof_database` persists every verified proof as a session-aware record (`proofs_index.json`, `proof_<id>.json`, `proof_<id>_lean.lean`) with extracted `ProofDependency` records and a reverse Mathlib usage index. Verified proofs are appended as a "Verified Proofs" section at the bottom of the source brainstorm/paper, and **novel proofs become the highest-priority direct-injection context for subsequent brainstorm and paper submitters** — so formal verification feeds directly back into Top-P exploration.
+
+**Lean 4 is authoritative.** SMT results are hints only — they never substitute for Lean verification, and any proof that would compile only because of a `sorry` or `admit` is rejected. The pipeline is entirely silent and skipped when `lean4_enabled=False`, so it never blocks brainstorm or paper completion; the default hosted image stays Lean-free and Z3-free. A manual-check endpoint (`POST /api/proofs/check`) also lets you re-run the pipeline on any stored brainstorm or paper after the fact, and the compiler's "rigor mode" reuses the same Lean 4 checker to upgrade lemmas inside a paper as it's being written.
+
 Give the program a try — MOTO is as cool as it sounds. Windows has a one-click launcher and Ubuntu 24.04 now has a repo-root launcher too. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green "< > Code" drop-down menu on the top right of this GitHub page and download the zip file. On Windows, extract it to your desktop and double-click `Click To Launch MOTO.bat`. On Ubuntu 24.04, extract it and run `bash "Launch MOTO.sh"`. Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), select your agents in the settings profile - if desired and you are unsure you may use the preselected "fastest" profile.
 
 ***Now you are set up and every time you press launch your home lab is ready for your prompt!*** **Give MOTO the toughest question you can think of and press start to begin YOUR creations!**
@@ -36,6 +49,7 @@ MOTO (Multi-Output Token Orchestrator) is a high-risk high-reward (novelty seeki
 
 - 🤖 **Autonomous Topic Selection, Brainstorming, and Paper Generation**: AI chooses research avenues based on high-level goals and produces you a final answer with ZERO extra user input. Let MOTO run for days using the best models without touching it, or for a few hours using a faster draft model. How deep you research and how long it takes is left up to you, the user.
 - **OpenRouter Integration**: Supports both local (LM Studio) and cloud (OpenRouter) models. Run your local LM Studio models offline from your computer, or add your OpenRouter API key to compete and team up with 3rd-party models from the largest closed-source LLMs like ChatGPT, Claude, DeepSeek, Gemini, and Perplexity.
+- **Optional Automated Theorem Generation (Lean 4)**: When enabled, every brainstorm and paper is run through a parallel proof pipeline that identifies theorem/lemma candidates, searches Mathlib for relevant lemmas, optionally runs Z3/SMT for conservative early-exit hints, then attempts Lean 4 formalization (up to 5 retries per candidate with failure-hint direct injection). Only Lean 4-verified proofs are stored, and novel proofs are fed back into subsequent brainstorming as highest-priority context. Secondary to Top-P Exploration and silent when disabled.
 
 ---
 
diff --git a/backend/api/main.py b/backend/api/main.py
index b7f41bf..9a04f47 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -97,16 +97,22 @@ def _restore_desktop_provider_credentials(api_client_manager) -> None:
     """Restore persisted desktop credentials from the OS-backed keyring."""
     from backend.shared.secret_store import (
         SecretStoreError,
-        get_active_service_name,
         load_openrouter_api_key,
         load_wolfram_api_key,
     )
     from backend.shared.wolfram_alpha_client import initialize_wolfram_client
 
+    # NOTE: We intentionally do NOT log `get_active_service_name()` or
+    # `system_config.secret_namespace` here. Both values are purely diagnostic
+    # identifiers (they contain no credential material), but CodeQL's
+    # "clear-text logging of sensitive information" query treats any field
+    # whose name starts with `secret_` as tainted, and any string derived
+    # from it — including the OS-keyring service name — as sensitive. Logging
+    # a boolean flag instead gives operators the diagnostic signal they need
+    # (namespaced vs. default instance) without tripping the static analyzer.
     logger.info(
-        "Secret store active: service_name='%s', namespace=%s",
-        get_active_service_name(),
-        system_config.secret_namespace or "<default>",
+        "Secret store active: namespaced_instance=%s",
+        bool(system_config.secret_namespace),
     )
 
     try:

From f3e664d5b6254e95af49538e79e3f719517ec53b Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Fri, 1 May 2026 19:54:36 -0500
Subject: [PATCH 10/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed the LM Studio "offline" status bug in the GUI, which showed LM Studio as offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 .cursor/rules/json-prompt-design.mdc          | 187 ++++
 .../rules/part-3-autonomous-research-mode.mdc |  14 +-
 ...program-directory-and-file-definitions.mdc |  18 +-
 backend/api/routes/proofs.py                  | 142 +++
 .../agents/proof_formalization_agent.py       | 154 ++-
 .../autonomous/core/autonomous_coordinator.py |  69 +-
 .../autonomous/core/autonomous_rag_manager.py |   4 +-
 .../core/proof_verification_stage.py          |  28 +-
 .../autonomous/memory/brainstorm_memory.py    |  26 +-
 backend/autonomous/memory/paper_library.py    |  25 +-
 backend/autonomous/memory/proof_database.py   | 176 ++++
 backend/autonomous/prompts/proof_prompts.py   | 107 ++-
 backend/compiler/core/compiler_coordinator.py |  62 +-
 backend/shared/lean4_client.py                | 341 +++++--
 backend/shared/models.py                      |   1 +
 backend/shared/openrouter_client.py           |  83 +-
 frontend/src/App.jsx                          |  80 +-
 frontend/src/components/BoostControlModal.jsx |  51 +-
 .../aggregator/AggregatorSettings.jsx         |  49 +-
 .../autonomous/AutonomousResearch.css         |  63 +-
 .../autonomous/AutonomousResearchSettings.jsx |  92 +-
 .../autonomous/MathematicalProofs.jsx         |  14 +-
 .../components/autonomous/ProofLibrary.css    | 135 +++
 .../components/autonomous/ProofLibrary.jsx    | 419 ++++++++
 .../autonomous/ProofNotificationStack.jsx     |   2 +-
 frontend/src/components/autonomous/index.js   |   1 +
 .../components/compiler/CompilerSettings.jsx  |  39 +-
 frontend/src/components/settings-common.css   |   2 +-
 frontend/src/index.css                        |  73 ++
 frontend/src/services/api.js                  |  12 +
 frontend/src/utils/openRouterSelection.js     | 162 +++-
 moto_launcher.py                              | 117 ++-
 randomlog.txt                                 | 904 ++++++++++++++++++
 33 files changed, 3316 insertions(+), 336 deletions(-)
 create mode 100644 frontend/src/components/autonomous/ProofLibrary.css
 create mode 100644 frontend/src/components/autonomous/ProofLibrary.jsx
 create mode 100644 randomlog.txt

diff --git a/.cursor/rules/json-prompt-design.mdc b/.cursor/rules/json-prompt-design.mdc
index 5fdd74a..5715730 100644
--- a/.cursor/rules/json-prompt-design.mdc
+++ b/.cursor/rules/json-prompt-design.mdc
@@ -2739,6 +2739,193 @@ LaTeX notation IS ALLOWED and EXPECTED - you must escape it properly in JSON:
 - `backend/autonomous/prompts/paper_reference_prompts.py`
 - `backend/autonomous/prompts/paper_title_prompts.py`
 - `backend/autonomous/prompts/paper_redundancy_prompts.py`
+- `backend/autonomous/prompts/proof_prompts.py`
+
+---
+
+### 10. PROOF PROMPTS (Lean 4 Formal Verification)
+
+**File:** `backend/autonomous/prompts/proof_prompts.py`
+
+All proof prompts use `_json_only_footer(example)` which appends:
+`"Respond with ONLY valid JSON. Do not use markdown fences. Escape backslashes correctly for JSON."`
+All proof prompts pass `temperature=0.0`.
+
+---
+
+#### 10a. PROOF FRAMING GATE
+
+**Function:** `build_proof_framing_gate_prompt(user_prompt)`
+
+**Purpose:** One-shot decision at autonomous start — decides whether the research program should activate the full proof pipeline. Errs on the side of `true` whenever there is meaningful mathematical substance.
+
+```json
+{
+  "is_proof_amenable": true,
+  "reasoning": "brief explanation"
+}
+```
+
+**Field requirements:**
+- `is_proof_amenable`: Boolean. `true` enables `PROOF_FRAMING_CONTEXT` injection into all subsequent submitter prompts and activates the `ProofVerificationStage` after each brainstorm/paper. `false` disables the proof pipeline for this session.
+- `reasoning`: Always required.
+
+---
+
+#### 10b. PROOF IDENTIFICATION (Theorem Discovery)
+
+**Function:** `build_proof_identification_prompt(user_prompt, source_type, source_id, source_content)`
+
+**Purpose:** Novelty-seeking gate that extracts the most promising non-trivial theorem candidates from a brainstorm or paper. Rejects trivial identities and textbook restatements. Returns at most 5 candidates ranked by novelty potential.
+
+```json
+{
+  "has_provable_theorems": true,
+  "theorems": [
+    {
+      "theorem_id": "thm_1",
+      "statement": "natural-language theorem statement",
+      "formal_sketch": "optional note about assumptions, notation, or likely Lean formalization strategy",
+      "novelty_rationale": "why this theorem is non-trivial and worth formalizing"
+    }
+  ]
+}
+```
+
+**Field requirements:**
+- `has_provable_theorems`: Boolean. `true` when at least one non-trivial novel-potential theorem is present.
+- `theorems`: Array of candidates, ranked by novelty potential. **Maximum 5 entries.** Empty array when `has_provable_theorems` is `false`.
+- `theorem_id`: Stable string identifier such as `"thm_1"`, `"thm_2"`, etc.
+- `statement`: Natural-language theorem statement. Required.
+- `formal_sketch`: Optional Lean formalization hints, assumptions, or notation notes.
+- `novelty_rationale`: Brief explanation of why this theorem is non-trivial and worth the cost of Lean verification. Required for each candidate.
+
+**What to extract:** Novel theorems, bold conjectures that can be sharpened, non-obvious connections/bounds/structural results, ambitious claims (the formalization agent narrows if needed).
+
+**What to reject:** Trivial identities (e.g. `n + 0 = n`), standard Mathlib restatements, results closable by a single tactic (`simp`, `omega`, `norm_num`, `decide`, `rfl`), tautologies, definitional equalities.
+
+---
+
+#### 10c. MATHLIB LEMMA SEARCH
+
+**Function:** `build_lemma_search_prompt(user_prompt, source_type, theorem_statement, formal_sketch, source_excerpt)`
+
+**Purpose:** Suggests existing Mathlib declaration names likely useful for proving the target theorem. Output is injected into the formalization prompt as `RELEVANT MATHLIB LEMMAS`.
+
+```json
+{
+  "lemma_names": [
+    "Nat.add_comm",
+    "Nat.add_assoc"
+  ],
+  "reasoning": "brief explanation"
+}
+```
+
+**Field requirements:**
+- `lemma_names`: Array of 5–10 Mathlib declaration name strings when possible. Empty array if none are evident or theorem is too vague.
+- `reasoning`: Always required.
+
+---
+
+#### 10d. SMT TRANSLATION
+
+**Function:** `build_smt_translation_prompt(user_prompt, source_type, theorem_statement, formal_sketch, source_excerpt)`
+
+**Purpose:** Translates an arithmetic/SMT-amenable theorem into SMT-LIB v2 for Z3 pre-check. Only called when `smt_enabled` and the candidate passes the SMT-amenability heuristic. Result feeds tactic hints into Lean 4 formalization — never substitutes for Lean verification.
+
+```json
+{
+  "smtlib": "(set-logic QF_LIA)\n(declare-const n Int)\n(assert (not (= (+ n 0) n)))\n(check-sat)",
+  "reasoning": "Negate the target theorem so unsat means the theorem is valid."
+}
+```
+
+**Field requirements:**
+- `smtlib`: SMT-LIB v2 text encoding the **negation** of the theorem (so `unsat` = theorem is valid). Empty string `""` if a faithful SMT translation cannot be produced.
+- `reasoning`: Always required.
+
+**Constraints:** Quantifier-free arithmetic fragments preferred. Do not invent assumptions not strongly implied by the theorem statement.
+
+---
+
+#### 10e. PROOF FORMALIZATION (Full Script)
+
+**Function:** `build_proof_formalization_prompt(user_prompt, source_type, theorem_statement, formal_sketch, source_excerpt, prior_attempts, relevant_lemmas, smt_hint)`
+
+**Purpose:** Primary formalization path — generates complete Lean 4 source ready to compile. Up to 3 attempts per candidate, with the full error-feedback chain from prior attempts injected on each retry. Preserves the theorem's non-trivial content; never weakens the statement just to compile.
+
+```json
+{
+  "theorem_name": "optional_lean_identifier",
+  "lean_code": "import Mathlib\n\n theorem ... := by ...",
+  "reasoning": "brief note about the formalization strategy"
+}
+```
+
+**Field requirements:**
+- `theorem_name`: Optional Lean identifier string (e.g. `"myTheorem"`). Can be empty.
+- `lean_code`: Complete, runnable Lean 4 source including all needed imports. Must close every goal without `sorry` or `admit`. Required.
+- `reasoning`: Brief note on formalization strategy. Always required.
+
+**Critical constraints:**
+- `sorry` / `admit` anywhere → proof rejected, counts as a failed attempt.
+- Axiomatizing the theorem's own concepts to make the goal trivial → rejected.
+- If the full claim cannot be proved, return a narrower concrete lemma rather than a `sorry`-closed stub.
+- PRESERVE the theorem's non-trivial content — do not simplify into a trivial identity to make it compile.
+
+---
+
+#### 10f. PROOF FORMALIZATION (Tactic Script)
+
+**Function:** `build_proof_tactic_script_prompt(user_prompt, source_type, theorem_statement, formal_sketch, source_excerpt, prior_attempts, relevant_lemmas, smt_hint)`
+
+**Purpose:** Fallback formalization path after full-script attempts fail — returns a theorem header plus a decomposed tactic list. Up to 2 attempts. Prior attempts from the full-script phase are passed in so the tactic path sees the full failure history.
+
+```json
+{
+  "theorem_name": "optional_lean_identifier",
+  "theorem_header": "theorem optional_lean_identifier (n : Nat) : n + 0 = n",
+  "tactics": [
+    {
+      "tactic": "simpa using Nat.add_zero n",
+      "reasoning": "Close the goal with the standard right-identity lemma."
+    }
+  ],
+  "reasoning": "brief note about the tactic strategy"
+}
+```
+
+**Field requirements:**
+- `theorem_name`: Optional Lean identifier. Can be empty.
+- `theorem_header`: Lean 4 theorem signature without proof body (no `:= by`). Required.
+- `tactics`: Ordered array of tactic objects. Each entry must include `tactic` (Lean tactic string) and `reasoning` (short note). `sorry` / `admit` never allowed.
+- `reasoning`: Overall strategy note. Always required.
+
+**Fallback behavior:** If the model returns a malformed tactic response (missing header or empty tactics), the agent falls back to one additional `_run_full_script_attempt` call.
+
+---
+
+#### 10g. PROOF NOVELTY ASSESSMENT
+
+**Function:** `build_proof_novelty_prompt(user_prompt, theorem_statement, lean_code, existing_novel_proofs)`
+
+**Purpose:** Post-verification novelty gate — classifies a Lean-4-verified theorem as novel or known. Does NOT re-check validity. Errs on the side of recognizing novelty for results that required multi-step reasoning or non-trivial formalization work.
+
+```json
+{
+  "is_novel": true,
+  "reasoning": "brief explanation"
+}
+```
+
+**Field requirements:**
+- `is_novel`: Boolean. `true` → proof enters the highest-priority direct-injection block for all subsequent brainstorm/paper submitters via `proof_database.get_novel_proofs_for_injection()`. `false` → stored in the database but not injected.
+- `reasoning`: Always required.
+
+**Novel criteria (any one sufficient):** Result not in Mathlib or standard textbooks; new connection/bound/structural insight; formalizes a previously unverified conjecture; non-trivial composition of known results yielding something new; original relative to the existing stored proofs.
+
+**Not novel:** Direct Mathlib restatement; trivial identity or tautology; closable by a single standard tactic (`simp`, `omega`, `norm_num`, `decide`, `rfl`); duplicates an already-stored novel proof.
 
 ---
 
diff --git a/.cursor/rules/part-3-autonomous-research-mode.mdc b/.cursor/rules/part-3-autonomous-research-mode.mdc
index ba58356..571ad39 100644
--- a/.cursor/rules/part-3-autonomous-research-mode.mdc
+++ b/.cursor/rules/part-3-autonomous-research-mode.mdc
@@ -1245,17 +1245,17 @@ Main component for displaying Tier 3 status and content:
 
 Runs automatically after every completed brainstorm (Tier 1) and every completed paper (Tier 2 / Tier 3 chapter), gated on `system_config.lean4_enabled`. Silent no-op when disabled.
 
-**Proof Framing Gate (one-shot, at autonomous start)**: When `lean4_enabled`, the coordinator runs `_run_proof_framing_gate()` before research begins. A single LLM call on the user prompt decides `is_proof_amenable` (`build_proof_framing_gate_prompt` → `autonomous_proof_framing_gate` role). If true, `PROOF_FRAMING_CONTEXT` is appended to every subsequent submitter prompt via `_append_proof_framing()` and persisted to workflow state for crash recovery. Decision is broadcast via `proof_framing_decided`. Silent no-op when disabled or when the prompt is not proof-amenable.
+**Proof Framing Gate (one-shot, at autonomous start)**: When `lean4_enabled`, the coordinator runs `_run_proof_framing_gate()` before research begins. A single LLM call on the user prompt decides `is_proof_amenable` (`build_proof_framing_gate_prompt` → `autonomous_proof_framing_gate` role). The gate errs on the side of `true` — it returns `false` only when the prompt is purely empirical, engineering-focused, or has no meaningful mathematical content. If `true`, `PROOF_FRAMING_CONTEXT` (which directs submissions to pursue **novel, non-trivial** theorems and explicitly discourages standard identities and Mathlib restatements) is appended to every subsequent submitter prompt via `_append_proof_framing()` and persisted to workflow state for crash recovery. Decision is broadcast via `proof_framing_decided`. Silent no-op when disabled or when the prompt is not proof-amenable.
 
 **Pipeline** (`backend/autonomous/core/proof_verification_stage.py`):
-1. **Candidate identification** — `ProofIdentificationAgent` extracts theorem/lemma candidates from brainstorm or paper content
+1. **Candidate identification** — `ProofIdentificationAgent` (`build_proof_identification_prompt`) extracts up to 5 novel, non-trivial theorem candidates from brainstorm or paper content, ranked by novelty potential. Trivial identities, textbook restatements, and single-tactic-closable results are filtered out at this stage before any Lean 4 cost is incurred.
 2. **Optional Mathlib lemma search** — `MathlibLemmaSearchAgent` surfaces relevant existing lemmas into the formalization prompt
 3. **Optional SMT early-exit** — when `smt_enabled`, `SmtClient` classifies candidates conservatively; successful SMT results become Lean tactic hints (nativeDecide / omega / decide style), never stored as standalone proofs
 4. **Lean 4 formalization attempts** — two-phase retry: up to 3 full-proof attempts via `ProofFormalizationAgent.prove_candidate`, then up to 2 multi-tactic script attempts via `prove_candidate_tactic_script` (5 total per candidate). Prior `FailedProofCandidate` failure hints from `proof_database.inject_failure_hints_into_prompt()` thread into each retry.
 5. **Novelty check** — `autonomous_proof_novelty` role compares verified proof against existing proof library
-6. **Storage** — `proof_database.add_proof()` persists novel and known proofs as session-aware records (`proofs_index.json`, `proof_<id>.json`, `proof_<id>_lean.lean`) with extracted `ProofDependency` records and reverse Mathlib usage index. Verified proofs are also appended as a "Verified Proofs" section at the bottom of the source brainstorm DB and/or paper file via `append_proofs_section()`.
+6. **Storage** — `proof_database.add_proof()` persists novel and known proofs as session-aware records (`proofs_index.json`, `proof_<id>.json`, `proof_<id>_lean.lean`) with extracted `ProofDependency` records and reverse Mathlib usage index. Verified proofs are also appended as a "Verified Proofs" section at the bottom of the source brainstorm DB and/or paper file via `append_proofs_section()`. Cross-session read access is provided by `proof_database.list_proof_library()` (all sessions, novelty-filtered) and `proof_database.get_library_proof(session_id, proof_id)`, consumed by the `ProofLibrary` UI component and `/api/proofs/library` endpoints.
 
-**Parallelism (two-phase execution per stage run)**: Steps 2–4 above (the per-candidate "Phase A" Lean pipeline: lemma search → optional SMT hint → `prove_candidate` → `prove_candidate_tactic_script` → `proof_attempts_exhausted` broadcast on failure) run concurrently across *all* identified candidates inside a single `ProofVerificationStage.run()` invocation, bounded by `system_config.proof_max_parallel_candidates` (default 6, env: `MOTO_PROOF_MAX_PARALLEL_CANDIDATES` / `PROOF_MAX_PARALLEL_CANDIDATES`) via an `asyncio.Semaphore`. Completed candidates are consumed by the driver loop through `asyncio.as_completed`, and steps 5–6 (the "Phase B" post-processing: novelty assessment, `add_proof`, dependency extraction via `ProofDependencyExtractor`, `append_proofs_section`, `novel_proof_discovered` / `known_proof_verified` broadcast, `record_failed_candidate` for brainstorm failures) are performed strictly **one-at-a-time** in Phase-A completion order inside that driver loop so later candidates can observe earlier stored proofs as MOTO dependencies. Every identified candidate is attempted — no cutoff. Each Phase-A task instantiates its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` so the per-agent `task_sequence` counter cannot collide across concurrent candidates. If any Phase-A task raises `FreeModelExhaustedError` (or any other exception), the driver cancels all still-running sibling tasks and re-raises so the coordinator's recovery path runs with no orphaned background API calls. `should_stop` is plumbed into each Phase-A pipeline and checked before each Phase-B pass, so a stop-request short-circuits cleanly without leaking tasks.
+**Parallelism (two-phase execution per stage run)**: Steps 2–4 above (the per-candidate "Phase A" pipeline: lemma search → optional SMT hint → `prove_candidate` → `prove_candidate_tactic_script` → `proof_attempts_exhausted` broadcast on failure) run concurrently across *all* identified candidates inside a single `ProofVerificationStage.run()` invocation, bounded by `system_config.proof_max_parallel_candidates` (default 6, env: `MOTO_PROOF_MAX_PARALLEL_CANDIDATES` / `PROOF_MAX_PARALLEL_CANDIDATES`) via an `asyncio.Semaphore`. Phase A parallelizes agent/model work, but actual Lean 4 subprocess verification is serialized by `Lean4Client` behind a shared execution lock so all candidates queue one-at-a-time against the shared Mathlib workspace; LSP mode remains independently serialized by its operation lock and subprocess fallback uses the same shared queue. The identification stage (step 1) caps candidates at 5 and filters trivial/well-known results before Phase A begins, so Phase A only processes genuinely novel-potential theorems. Completed candidates are consumed by the driver loop through `asyncio.as_completed`, and steps 5–6 (the "Phase B" post-processing: novelty assessment, `add_proof`, dependency extraction via `ProofDependencyExtractor`, `append_proofs_section`, `novel_proof_discovered` / `known_proof_verified` broadcast, `record_failed_candidate` for brainstorm failures) are performed strictly **one-at-a-time** in Phase-A completion order inside that driver loop so later candidates can observe earlier stored proofs as MOTO dependencies. Each Phase-A task instantiates its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` so the per-agent `task_sequence` counter cannot collide across concurrent candidates. If any Phase-A task raises `FreeModelExhaustedError` (or any other exception), the driver cancels all still-running sibling tasks and re-raises so the coordinator's recovery path runs with no orphaned background API calls. `should_stop` is plumbed into each Phase-A pipeline and checked before each Phase-B pass, so a stop-request short-circuits cleanly without leaking tasks.
 
 **Rigor mode is NOT parallelized** (compiler Part 2): `submit_rigor_lean_theorem()` runs one candidate per rigor cycle by design (discovery → 5 Lean attempts → novelty → placement) and the outer `_rigor_loop` drives cycles serially so each proven theorem can land in the paper before the next discovery sees updated context. The parallel candidate pipeline lives only in `ProofVerificationStage`.
 
@@ -1263,7 +1263,7 @@ Runs automatically after every completed brainstorm (Tier 1) and every completed
 
 **Lean 4 is authoritative**: SMT results never substitute for Lean verification. The `Lean4Result` contract is the only path to a stored proof. SMT contributes hints only.
 
-**Subprocess vs LSP**: `lean4_client` runs Lean via subprocess by default. When `lean4_lsp_enabled`, a persistent LSP-style process reduces cold-start overhead; the subprocess path remains the fallback and must keep working when LSP is disabled.
+**Subprocess vs LSP**: `lean4_client` runs Lean via subprocess by default. When `lean4_lsp_enabled`, a persistent LSP-style process reduces cold-start overhead; the subprocess path remains the fallback and must keep working when LSP is disabled. Missing/corrupt Mathlib `.olean` diagnostics are infrastructure failures, not proof failures: the client must re-check workspace readiness inside the serialized Lean execution queue, invalidate readiness when the cache is bad, refetch the Mathlib cache, retry the same Lean check once, and return a distinct `LEAN 4 WORKSPACE ERROR` if repair still fails. Future checks may attempt repair again after external fixes or transient failures clear, but the current failed check must not burn proof attempts as ordinary Lean feedback.
 
 **Manual proof checks** (Build 5): `POST /api/proofs/check` reuses `ProofVerificationStage.run_manual()` with the stored `ProofRuntimeConfigSnapshot` (brainstorm / paper / validator role configs captured during autonomous startup). Readiness is surfaced via `/api/proofs/status.manual_check_ready` + `manual_check_message`. Required state: `lean4_enabled=True` AND a runtime snapshot must exist (start autonomous research once to seed it).
 
@@ -1282,14 +1282,14 @@ Runs automatically after every completed brainstorm (Tier 1) and every completed
 **Proof Stage Critical Invariants**:
 1. Proof stage is silent and skipped when `lean4_enabled=False` — never blocks brainstorm or paper completion
 2. Lean 4 is authoritative — SMT results are hints only, never stored as standalone proofs, `Lean4Result` contract is unchanged by SMT
-3. Subprocess checker must continue to work when `lean4_lsp_enabled=False`; LSP path must not regress subprocess behavior when enabled
+3. Subprocess checker must continue to work when `lean4_lsp_enabled=False`; LSP path must not regress subprocess behavior when enabled. Missing/corrupt `.olean` cache errors must trigger one workspace repair/retry, then fail the current check with `LEAN 4 WORKSPACE ERROR` if repair fails; these infrastructure failures must not fall through into tactic mode, emit `proof_attempts_exhausted`, or burn all proof attempts as ordinary Lean feedback
 4. Proof storage is session-aware (`session_manager` → `get_proofs_dir()`) and falls back to the legacy `backend/data/proofs/` layout when no session is active
 5. Per-source reservation lock prevents concurrent proof checks on the same `{source_type}:{source_id}` (autonomous vs manual interleaving)
 6. Novel proofs become highest-priority direct-injection context for subsequent brainstorm/paper submitters (via `proof_database.inject_failure_hints_into_prompt()` and stored `ProofRecord` summaries)
 7. Proof certificates stay text-based (`.lean` source + JSON metadata) — no binary artifacts
 8. Hosted/generic mode keeps `lean4_enabled` and `smt_enabled` default false and the hosted image stays Lean-free and Z3-free (no proof binaries in the `python:3.12-slim` runtime)
 9. Proof framing gate runs once per autonomous start and only when `lean4_enabled`; the resulting `proof_framing_active` flag and `PROOF_FRAMING_CONTEXT` are persisted in workflow state for crash recovery
-10. Every identified theorem candidate must be attempted — Phase A is bounded by `proof_max_parallel_candidates` but never truncates the candidate list; Phase A runs concurrently across candidates while Phase B (novelty / `add_proof` / dependency extraction / brainstorm+paper `append_proofs_section` / novel/known broadcasts / `record_failed_candidate`) remains strictly serialized in Phase-A completion order so intra-batch MOTO dependencies and per-source proof appending stay coherent
+10. Candidate identification (`build_proof_identification_prompt`) is a novelty-seeking gate — it rejects trivial identities, textbook restatements, and single-tactic-closable results, and returns **at most 5** candidates ranked by novelty potential. Every candidate that passes this gate is attempted — Phase A is bounded by `proof_max_parallel_candidates` but never truncates the post-identification candidate list; Phase A agent/model work runs concurrently across candidates while actual Lean 4 subprocess verification queues one-at-a-time through `Lean4Client`, and Phase B (novelty / `add_proof` / dependency extraction / brainstorm+paper `append_proofs_section` / novel/known broadcasts / `record_failed_candidate`) remains strictly serialized in Phase-A completion order so intra-batch MOTO dependencies and per-source proof appending stay coherent
 11. Each Phase-A task owns its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` instance to keep per-agent `task_sequence` counters collision-free; any Phase-A exception (including `FreeModelExhaustedError`) must cancel all sibling tasks and re-raise so the coordinator's recovery path runs without orphaned background API calls
 12. `should_stop` propagates into Phase A and is re-checked before each Phase-B pass so stop-requests short-circuit without leaking tasks or partially-applied Phase-B writes
 13. Compiler rigor mode (`submit_rigor_lean_theorem`, `_rigor_loop`) is NOT parallelized — rigor cycles discover, verify, and place one theorem per cycle so each verified theorem lands in the paper before the next discovery; the parallel candidate pipeline lives only in `ProofVerificationStage`
diff --git a/.cursor/rules/program-directory-and-file-definitions.mdc b/.cursor/rules/program-directory-and-file-definitions.mdc
index dd67a34..13eab9e 100644
--- a/.cursor/rules/program-directory-and-file-definitions.mdc
+++ b/.cursor/rules/program-directory-and-file-definitions.mdc
@@ -156,7 +156,7 @@ project-root/
 │   │       ├── topic_exploration_memory.py # In-memory candidate DB for topic exploration phase
 │   │       ├── paper_model_tracker.py   # Per-paper model usage tracking and author attribution
 │   │       ├── autonomous_api_logger.py # Autonomous API call logger singleton
-│   │       ├── proof_database.py        # Session-aware Lean 4 verified-proof storage (records, Lean sources, novelty index, reverse Mathlib index)
+│   │       ├── proof_database.py        # Session-aware Lean 4 verified-proof storage (records, Lean sources, novelty index, reverse Mathlib index); cross-session library access via `list_proof_library()` and `get_library_proof()`
 │   │       ├── final_answer_memory.py   # TIER 3 - Final answer state & volume management
 │   │       └── session_manager.py       # Prompt-based session folder organization
 │   │
@@ -261,12 +261,14 @@ project-root/
 │   │   │       ├── FinalAnswerLibrary.css   # Final answer library styles
 │   │   │       ├── ArchiveViewerModal.jsx   # Research lineage archive viewer (papers + brainstorms)
 │   │   │       ├── ArchiveViewerModal.css   # Archive viewer styles
-│   │   │       ├── MathematicalProofs.jsx   # Proof library tab (lists verified novel/non-novel proofs from `/api/proofs`)
+│   │   │       ├── MathematicalProofs.jsx   # Live-session proof tab (lists verified novel/non-novel proofs from current session via `/api/proofs`)
 │   │   │       ├── MathematicalProofs.css   # Proof library styles
 │   │   │       ├── ProofGraph.jsx           # Proof dependency graph view (hand-rolled SVG; Build 4, may escalate to reactflow in Build 5 if needed)
 │   │   │       ├── ProofGraph.css           # Proof graph styles
 │   │   │       ├── ProofNotificationStack.jsx # Persistent popup notifications for novel proof discoveries
-│   │   │       ├── Stage2PaperHistory.jsx   # Tier 2 paper history list (grouped per research run; used inside FinalAnswerLibrary)
+│   │   │       ├── ProofLibrary.jsx         # Cross-session novel proof library viewer (all sessions, grouped by research run; sub-tab inside CompletedWorksLibrary; fetches via `/api/proofs/library`)
+│   │   │       ├── ProofLibrary.css         # Proof library viewer styles
+│   │   │       ├── Stage2PaperHistory.jsx   # Tier 2 paper history list (grouped per research run; sub-tab inside CompletedWorksLibrary)
 │   │   │       └── Stage2PaperHistory.css   # Tier 2 paper history styles
 │   │   │
 │   │   ├── StartupProviderSetupModal.jsx # Post-disclaimer startup chooser for OpenRouter vs LM Studio setup (OpenRouter-only in generic mode)
@@ -287,7 +289,7 @@ project-root/
 │   │   ├── critique-modal.css           # Paper critique modal styles
 │   │   │
 │   │   ├── services/
-│   │   │   ├── api.js                   # Backend API calls (includes openRouterAPI, `/api/features` capability bootstrap helper, and proof routes under `/api/proofs/*`)
+│   │   │   ├── api.js                   # Backend API calls (includes openRouterAPI, `/api/features` capability bootstrap helper, proof routes under `/api/proofs/*`, and cross-session proof library routes `getProofLibrary` / `getLibraryProof` under `/api/proofs/library`)
 │   │   │   └── websocket.js             # WebSocket connection 
 │   │   │
 │   │   ├── hooks/
@@ -385,20 +387,20 @@ project-root/
 - Tier 3 Agents: `certainty_assessor.py`, `answer_format_selector.py`, `volume_organizer.py`
 - `paper_redundancy_checker.py`: Library quality maintenance (every 3 papers)
 - Prompts: `topic_prompts.py`, `topic_exploration_prompts.py`, `completion_prompts.py`, `paper_reference_prompts.py`, `paper_title_exploration_prompts.py`, `paper_title_prompts.py`, `paper_redundancy_prompts.py`, `paper_continuation_prompts.py`, `proof_prompts.py`, `final_answer_prompts.py`
-- Memory: `brainstorm_memory.py`, `paper_library.py`, `research_metadata.py` (also stores the proof runtime config snapshot), `session_manager.py`, `autonomous_rejection_logs.py`, `topic_exploration_memory.py` (in-memory candidate DB), `paper_model_tracker.py` (per-paper model usage tracking and author attribution), `autonomous_api_logger.py` (API call logging singleton), `proof_database.py` (session-aware Lean 4 proof storage + novelty index + reverse Mathlib index), `final_answer_memory.py` (model tracking, archival)
+- Memory: `brainstorm_memory.py`, `paper_library.py`, `research_metadata.py` (also stores the proof runtime config snapshot), `session_manager.py`, `autonomous_rejection_logs.py`, `topic_exploration_memory.py` (in-memory candidate DB), `paper_model_tracker.py` (per-paper model usage tracking and author attribution), `autonomous_api_logger.py` (API call logging singleton), `proof_database.py` (session-aware Lean 4 proof storage + novelty index + reverse Mathlib index + cross-session library access), `final_answer_memory.py` (model tracking, archival)
 
 ### API Routes
 
 - `compiler.py`: Compiler control (start/stop/status), paper/outline access, critique management
 - `autonomous.py`: Autonomous research control (start/stop/clear/status), brainstorm/paper access, Tier 3 endpoints
-- `proofs.py`: Proof database listing, `/status` runtime readiness, `POST /settings` runtime flag updates, `POST /check` manual proof check, `/{id}/certificate[.lean]` certificate export, `/{id}/dependencies` + `/graph` + `/mathlib/{lemma}/dependents` graph/lineage queries. All routes gated on `lean4_enabled`.
+- `proofs.py`: Proof database listing, `/status` runtime readiness, `POST /settings` runtime flag updates, `POST /check` manual proof check, `/{id}/certificate[.lean]` certificate export, `/{id}/dependencies` + `/graph` + `/mathlib/{lemma}/dependents` graph/lineage queries (all above gated on `lean4_enabled`); `GET /library` + `GET /library/{session_id}/{proof_id}` cross-session proof library endpoints (NOT gated — read-only file access, always available).
 
 ### Frontend Components
 
-- `App.jsx`: Top-level GUI shell. Default mode is `Autonomous ASI S.T.E.M.` for Part 3 screens; `Advanced Manual ASI S.T.E.M.` contains the manual Part 1 Aggregator + Part 2 Compiler workspace. Shared utility controls (Boost, OpenRouter, WorkflowPanel) remain global, and Build 3C bootstraps `/api/features` here so hosted mode can hide LM Studio-only UI and copy.
+- `App.jsx`: Top-level GUI shell. Default mode is `Autonomous ASI S.T.E.M.` for Part 3 screens; `Advanced Manual ASI S.T.E.M.` contains the manual Part 1 Aggregator + Part 2 Compiler workspace. Shared utility controls (Boost, OpenRouter, WorkflowPanel) remain global, and Build 3C bootstraps `/api/features` here so hosted mode can hide LM Studio-only UI and copy. **Tab persistence**: `autonomousActiveTab` → `localStorage['autonomousActiveTab']`; `completedWorksSubTab` → `localStorage['completedWorksSubTab']`; `manualActiveTab` → `localStorage['manualActiveTab']`. **Autonomous tab groups**: main tabs (interface, brainstorms, papers, proofs, optional final-answer) + settings group (Your Completed Works Library, API Call Logs, Settings). The "Your Completed Works Library" tab hosts three sub-tabs rendered inside its content area: Stage 2 Papers History, Stage 3 Final Answers History, and Proof Library.
 - **Aggregator**: `AggregatorInterface.jsx`, `AggregatorSettings.jsx`, `AggregatorLogs.jsx`, `LiveResults.jsx`
 - **Compiler**: `CompilerInterface.jsx`, `CompilerSettings.jsx`, `CompilerLogs.jsx`, `LivePaper.jsx`
-- **Autonomous**: `AutonomousResearchInterface.jsx`, `BrainstormList.jsx`, `PaperLibrary.jsx`, `AutonomousResearchSettings.jsx`, `AutonomousResearchLogs.jsx`, `LivePaperProgress.jsx`, `LiveTier3Progress.jsx`, `FinalAnswerView.jsx`, `FinalAnswerLibrary.jsx`, `ArchiveViewerModal.jsx`, `MathematicalProofs.jsx` (proof library), `ProofGraph.jsx` (dependency graph), `ProofNotificationStack.jsx` (novel-proof popups)
+- **Autonomous**: `AutonomousResearchInterface.jsx`, `BrainstormList.jsx`, `PaperLibrary.jsx`, `AutonomousResearchSettings.jsx`, `AutonomousResearchLogs.jsx`, `LivePaperProgress.jsx`, `LiveTier3Progress.jsx`, `FinalAnswerView.jsx`, `FinalAnswerLibrary.jsx` (Stage 3 history sub-tab), `ArchiveViewerModal.jsx`, `MathematicalProofs.jsx` (live-session proof tab), `ProofGraph.jsx` (dependency graph), `ProofNotificationStack.jsx` (novel-proof popups), `ProofLibrary.jsx` (cross-session proof library sub-tab), `Stage2PaperHistory.jsx` (Stage 2 history sub-tab)
 - **Shared**: `StartupProviderSetupModal.jsx`, `OpenRouterApiKeyModal.jsx`, `PaperCritiqueModal.jsx`, `CritiqueNotificationStack.jsx`, `CreditExhaustionNotificationStack.jsx`, `HungConnectionNotificationStack.jsx`, `BoostControlModal.jsx`, `WorkflowPanel.jsx`, `TextFileUploader.jsx`, `OpenRouterPrivacyWarningModal.jsx`, `LatexRenderer.jsx` (dual view, KaTeX, theorem parsing), `LatexRenderer.css`
 - **Hooks**: `useProofCheckRuntime.js` (reads `/api/proofs/status` + runtime config so UI can enable/disable manual proof-check controls)
 - **Utils**: `downloadHelpers.js` (PDF/raw download), `modelCache.js` (display_name → api_id lookup), `openRouterSelection.js` (shared OpenRouter selector auto-fill helpers using model context and provider endpoint caps), `autonomousProfiles.js` (shared recommended-profile definitions + persistence helpers; when editing a preset, anchor to the exact profile block and exact nested role such as `validator` or `highContext`, never to a shared literal alone, then verify the diff only touched that intended profile/role), `disclaimerHelper.js` (frontend-only disclaimer injection), `api.js`, `websocket.js`
diff --git a/backend/api/routes/proofs.py b/backend/api/routes/proofs.py
index c5615aa..5ec114a 100644
--- a/backend/api/routes/proofs.py
+++ b/backend/api/routes/proofs.py
@@ -181,6 +181,124 @@ async def list_novel_proofs():
     }
 
 
+@router.get("/known")
+async def list_known_proofs():
+    """Return only known (non-novel) verified proofs, alongside the database-wide counts."""
+    proofs = await proof_database.get_all_proofs(novel_only=False)  # presumably novel + known; filtered below
+    return {
+        "proofs": [proof.model_dump(mode="json") for proof in proofs if not getattr(proof, "novel", False)],
+        "counts": proof_database.count_proofs(),
+    }
+
+
+async def _strip_known_proofs_from_files() -> dict:
+    """Strip non-novel proof entries from brainstorm and paper files on disk.
+
+    Scans ``brainstorm_*.txt`` / ``paper_*.txt`` under each store's ``_base_dir`` and
+    drops every ``Proof N:`` block containing ``Status: Verified (Known)``; all other
+    blocks are kept.  Returns a summary dict (files checked, files modified, entries
+    removed, message).  A store without a ``_base_dir`` attribute is skipped.
+
+    ProofDatabase is never touched here; only the .txt files are rewritten.
+    NOTE(review): the read-modify-write is not locked — confirm mid-session safety.
+    """
+    import re as _re
+    # Plain blocking pathlib I/O is used below, so no asyncio helpers are needed here.
+
+    files_checked = 0
+    files_modified = 0
+    entries_removed = 0
+
+    def _clean_content(content: str, proof_header: str) -> tuple[str, int]:
+        """Return (cleaned_content, removed_count).  Removes Known entries only."""
+        if proof_header not in content:
+            return content, 0
+
+        before, _, after = content.partition(proof_header)
+        # Split the proof section into individual proof blocks
+        # Each block starts with "Proof N:" and ends before the next "Proof N:" or EOF
+        block_pattern = _re.compile(r'(?=^Proof \d+:)', _re.MULTILINE)
+        blocks = block_pattern.split(after)
+
+        kept = []
+        removed = 0
+        for block in blocks:
+            stripped = block.strip()
+            if not stripped:
+                continue
+            # Remove blocks that are explicitly marked as Known
+            if 'Status: Verified (Known)' in block:
+                removed += 1
+            else:
+                kept.append(block)
+
+        if removed == 0:
+            return content, 0
+
+        if kept:
+            new_after = "\n".join(kept)
+            new_content = before + proof_header + "\n\n" + new_after
+        else:
+            # All proofs in this section were Known — remove the header too
+            new_content = before.rstrip()
+
+        return new_content, removed
+
+    # Clean brainstorm files
+    brainstorm_paths = list(brainstorm_memory._base_dir.rglob("brainstorm_*.txt")) if hasattr(brainstorm_memory, '_base_dir') else []
+    for path in brainstorm_paths:
+        try:
+            files_checked += 1
+            text = path.read_text(encoding="utf-8")
+            cleaned, removed = _clean_content(text, "=== PROOFS GENERATED FROM THIS BRAINSTORM (Lean 4 Verified) ===")
+            if removed > 0:
+                path.write_text(cleaned, encoding="utf-8")
+                files_modified += 1
+                entries_removed += removed
+                logger.info(f"Stripped {removed} known proof(s) from brainstorm file: {path.name}")
+        except Exception as exc:
+            logger.warning(f"Skipped brainstorm file {path}: {exc}")
+
+    # Clean paper files
+    paper_paths = list(paper_library._base_dir.rglob("paper_*.txt")) if hasattr(paper_library, '_base_dir') else []
+    for path in paper_paths:
+        try:
+            files_checked += 1
+            text = path.read_text(encoding="utf-8")
+            cleaned, removed = _clean_content(text, "=== PROOFS GENERATED FROM THIS PAPER (Lean 4 Verified) ===")
+            if removed > 0:
+                path.write_text(cleaned, encoding="utf-8")
+                files_modified += 1
+                entries_removed += removed
+                logger.info(f"Stripped {removed} known proof(s) from paper file: {path.name}")
+        except Exception as exc:
+            logger.warning(f"Skipped paper file {path}: {exc}")
+
+    return {
+        "files_checked": files_checked,
+        "files_modified": files_modified,
+        "entries_removed": entries_removed,
+        "message": (
+            f"Removed {entries_removed} non-novel proof entries from {files_modified} file(s). "
+            "Proof data is retained in ProofDatabase."
+        ),
+    }
+
+
+@router.post("/cleanup-known-from-files")
+async def cleanup_known_proofs_from_files():
+    """One-time cleanup: strip non-novel proof entries from brainstorm/paper files.
+
+    Non-novel proofs are stored in ProofDatabase (no data loss).  This endpoint
+    removes their raw Lean 4 code from brainstorm and paper .txt files so that
+    compiler and RAG context is no longer polluted by standard known results.
+
+    Safe to call on a running session.  Novel proof entries are preserved.
+    """
+    # Delegate to the shared helper; its summary dict is returned unchanged as the response body.
+    return await _strip_known_proofs_from_files()
+
+
 @router.get("/status")
 async def get_proofs_status():
     """Return Lean 4 availability and proof-database status."""
@@ -322,6 +440,30 @@ async def run_manual_proof_check(request: ProofCheckRequest, background_tasks: B
     }
 
 
+@router.get("/library")
+async def get_proof_library(novel_only: bool = True):
+    """Return proofs across all sessions for the proof library browser (novel-only by default)."""
+    entries = await proof_database.list_proof_library(novel_only=novel_only)
+    listed = len(entries)
+    novel_total = sum(1 for entry in entries if entry.get("novel"))
+    # "total" is only meaningful for an unfiltered listing; it is None when novel_only is set.
+    counts = {
+        "total": None if novel_only else listed,
+        "listed": listed,
+        "novel": novel_total,
+    }
+    return {"proofs": entries, "counts": counts}
+
+
+@router.get("/library/{session_id}/{proof_id}")
+async def get_library_proof(session_id: str, proof_id: str):
+    """Return a single proof from a specific session with full Lean code (404 when the lookup yields None)."""
+    record = await proof_database.get_library_proof(session_id, proof_id)
+    if record is not None:
+        return record
+    raise HTTPException(status_code=404, detail="Proof not found")
+
+
 @router.get("/{proof_id}/certificate")
 async def get_proof_certificate(proof_id: str):
     """Return a machine-readable proof certificate JSON payload."""
diff --git a/backend/autonomous/agents/proof_formalization_agent.py b/backend/autonomous/agents/proof_formalization_agent.py
index 857c758..aa589e3 100644
--- a/backend/autonomous/agents/proof_formalization_agent.py
+++ b/backend/autonomous/agents/proof_formalization_agent.py
@@ -3,6 +3,7 @@
 """
 from __future__ import annotations
 
+import json
 import logging
 from typing import Awaitable, Callable, List, Optional, Tuple
 
@@ -24,6 +25,28 @@
 AttemptStartCallback = Callable[[int, str], Awaitable[None]]
 ShouldStopFn = Optional[Callable[[], bool]]
 
+_JSON_PARSE_ERROR_MARKERS = (  # lowercase substrings searched for in str(exc).lower() by _is_json_parse_error
+    "empty or whitespace-only response",
+    "empty response from formalization model",
+    "empty response from tactic formalization model",
+    "expecting property name",
+    "expecting value",
+    "extra data",
+    "invalid control character",
+    "json response truncated",
+    "no content in formalization model response",
+    "no content in tactic formalization model response",
+    "no json found",
+    "openrouter connection failed",  # NOTE: transport-level markers are listed too, not only JSON syntax errors
+    "openrouter response missing 'choices'",
+    "openrouter returned non-json body",
+    "response too short",
+    "unterminated string",
+    "upstream provider timeout",
+)
+_MALFORMED_MODEL_OUTPUT_REASON = "Model returned malformed output (not valid JSON); retrying with clean context."  # sentinel: compared by equality in _is_malformed_model_output_feedback
+_LEAN_WORKSPACE_ERROR_PREFIX = "LEAN 4 WORKSPACE ERROR"  # same literal as LEAN_WORKSPACE_ERROR_PREFIX in proof_verification_stage.py
+
 
 def _is_stop_requested(should_stop: ShouldStopFn) -> bool:
     if should_stop is None:
@@ -34,6 +57,32 @@ def _is_stop_requested(should_stop: ShouldStopFn) -> bool:
         return False
 
 
+def _is_json_parse_error(exc: Exception) -> bool:
+    """Return True for a JSONDecodeError, or a ValueError whose text contains a known marker."""
+    if isinstance(exc, json.JSONDecodeError):
+        return True
+    # Only ValueError messages are inspected; any other exception type is never a parse error.
+    lowered = str(exc).lower() if isinstance(exc, ValueError) else None
+    return lowered is not None and any(marker in lowered for marker in _JSON_PARSE_ERROR_MARKERS)
+
+
+def _is_malformed_model_output_feedback(feedback: ProofAttemptFeedback) -> bool:
+    """Return True when *feedback* is the record written for unparseable model output."""
+    # Such a record is a failure carrying neither Lean code nor error text, and its
+    # reasoning equals the module's malformed-output sentinel message.
+    if feedback.success or feedback.lean_code or feedback.error_output:
+        return False
+    return feedback.reasoning == _MALFORMED_MODEL_OUTPUT_REASON
+
+
+def _is_lean_workspace_error_feedback(feedback: ProofAttemptFeedback) -> bool:
+    """Return True when a failed attempt's error output starts with the workspace-error prefix."""
+    error_text = feedback.error_output or ""
+    if feedback.success:
+        return False
+    return error_text.startswith(_LEAN_WORKSPACE_ERROR_PREFIX)
+
+
 class ProofFormalizationAgent:
     """Turn theorem candidates into Lean 4 code and retry with feedback."""
 
@@ -217,12 +266,17 @@ async def _run_full_script_attempt(
         except FreeModelExhaustedError:
             raise
         except Exception as exc:
+            is_parse_error = _is_json_parse_error(exc)
             feedback = ProofAttemptFeedback(
                 attempt=attempt_number,
                 theorem_id=theorem_candidate.theorem_id,
-                reasoning="Formalization attempt failed before Lean 4 verification.",
+                reasoning=(
+                    _MALFORMED_MODEL_OUTPUT_REASON
+                    if is_parse_error
+                    else "Formalization attempt failed before Lean 4 verification."
+                ),
                 lean_code="",
-                error_output=str(exc),
+                error_output="" if is_parse_error else str(exc),
                 goal_states="",
                 strategy="full_script",
                 success=False,
@@ -264,7 +318,11 @@ async def prove_candidate(
             else (attempts[-1].attempt + 1 if attempts else 1)
         )
 
-        for attempt_offset in range(max_attempts):
+        attempt_offset = 0
+        malformed_output_retries = 0
+        max_malformed_output_retries = max(1, max_attempts)
+
+        while attempt_offset < max_attempts:
             if _is_stop_requested(should_stop):
                 logger.info(
                     "ProofFormalizationAgent.prove_candidate: stop requested, aborting before attempt %s for %s.",
@@ -273,7 +331,7 @@ async def prove_candidate(
                 )
                 break
             attempt_number = next_attempt_number + attempt_offset
-            if attempt_start_callback:
+            if attempt_start_callback and malformed_output_retries == 0:
                 await attempt_start_callback(attempt_number, "full_script")
 
             current_theorem_name, source_excerpt, feedback = await self._run_full_script_attempt(
@@ -285,6 +343,22 @@ async def prove_candidate(
                 attempt_number=attempt_number,
                 smt_hint=smt_hint,
             )
+
+            terminal_malformed_output = False
+            if _is_malformed_model_output_feedback(feedback):
+                malformed_output_retries += 1
+                logger.warning(
+                    "ProofFormalizationAgent full-script attempt %s for %s produced malformed model output; retrying without consuming Lean attempt budget (%s/%s).",
+                    attempt_number,
+                    theorem_candidate.theorem_id,
+                    malformed_output_retries,
+                    max_malformed_output_retries,
+                )
+                if malformed_output_retries < max_malformed_output_retries:
+                    continue
+                terminal_malformed_output = True
+            else:
+                malformed_output_retries = 0
             if current_theorem_name:
                 theorem_name = current_theorem_name
 
@@ -294,6 +368,11 @@ async def prove_candidate(
 
             if feedback.success:
                 return True, theorem_name, feedback.lean_code, attempts
+            if _is_lean_workspace_error_feedback(feedback):
+                break
+            if terminal_malformed_output:
+                break
+            attempt_offset += 1
 
         final_code = attempts[-1].lean_code if attempts else ""
         return False, theorem_name, final_code, attempts
@@ -327,7 +406,11 @@ async def prove_candidate_tactic_script(
             else (attempts[-1].attempt + 1 if attempts else 1)
         )
 
-        for attempt_offset in range(max_attempts):
+        attempt_offset = 0
+        malformed_output_retries = 0
+        max_malformed_output_retries = max(1, max_attempts)
+
+        while attempt_offset < max_attempts:
             if _is_stop_requested(should_stop):
                 logger.info(
                     "ProofFormalizationAgent.prove_candidate_tactic_script: stop requested, aborting before attempt %s for %s.",
@@ -336,7 +419,7 @@ async def prove_candidate_tactic_script(
                 )
                 break
             attempt_number = next_attempt_number + attempt_offset
-            if attempt_start_callback:
+            if attempt_start_callback and malformed_output_retries == 0:
                 await attempt_start_callback(attempt_number, "tactic_script")
 
             prompt, source_excerpt, max_input_tokens, prompt_tokens = self._fit_prompt_to_context(
@@ -353,6 +436,7 @@ async def prove_candidate_tactic_script(
             )
 
             if prompt_tokens > max_input_tokens:
+                malformed_output_retries = 0
                 feedback = ProofAttemptFeedback(
                     attempt=attempt_number,
                     theorem_id=theorem_candidate.theorem_id,
@@ -364,6 +448,7 @@ async def prove_candidate_tactic_script(
                 attempts.append(feedback)
                 if attempt_callback:
                     await attempt_callback(feedback)
+                attempt_offset += 1
                 continue
 
             task_id = self.get_current_task_id()
@@ -416,11 +501,31 @@ async def prove_candidate_tactic_script(
                     )
                     if current_theorem_name:
                         theorem_name = current_theorem_name
+                    terminal_malformed_output = False
+                    if _is_malformed_model_output_feedback(feedback):
+                        malformed_output_retries += 1
+                        logger.warning(
+                            "ProofFormalizationAgent fallback full-script attempt %s for %s produced malformed model output; retrying without consuming Lean attempt budget (%s/%s).",
+                            attempt_number,
+                            theorem_candidate.theorem_id,
+                            malformed_output_retries,
+                            max_malformed_output_retries,
+                        )
+                        if malformed_output_retries < max_malformed_output_retries:
+                            continue
+                        terminal_malformed_output = True
+                    else:
+                        malformed_output_retries = 0
                     attempts.append(feedback)
                     if attempt_callback:
                         await attempt_callback(feedback)
                     if feedback.success:
                         return True, theorem_name, feedback.lean_code, attempts
+                    if _is_lean_workspace_error_feedback(feedback):
+                        break
+                    if terminal_malformed_output:
+                        break
+                    attempt_offset += 1
                     continue
 
                 lean_code = self._compose_tactic_script_code(theorem_header, tactic_commands)
@@ -440,34 +545,61 @@ async def prove_candidate_tactic_script(
                     tactic_trace=tactic_trace,
                     success=lean_result.success,
                 )
+                malformed_output_retries = 0
                 attempts.append(feedback)
                 if attempt_callback:
                     await attempt_callback(feedback)
 
                 if lean_result.success:
                     return True, theorem_name, lean_code, attempts
+                if _is_lean_workspace_error_feedback(feedback):
+                    break
+                attempt_offset += 1
             except FreeModelExhaustedError:
                 raise
             except Exception as exc:
+                is_parse_error = _is_json_parse_error(exc)
                 feedback = ProofAttemptFeedback(
                     attempt=attempt_number,
                     theorem_id=theorem_candidate.theorem_id,
-                    reasoning="Tactic-script formalization attempt failed before Lean 4 verification.",
+                    reasoning=(
+                        _MALFORMED_MODEL_OUTPUT_REASON
+                        if is_parse_error
+                        else "Tactic-script formalization attempt failed before Lean 4 verification."
+                    ),
                     lean_code="",
-                    error_output=str(exc),
+                    error_output="" if is_parse_error else str(exc),
                     goal_states="",
                     strategy="tactic_script",
                     success=False,
                 )
-                attempts.append(feedback)
-                if attempt_callback:
-                    await attempt_callback(feedback)
                 logger.warning(
                     "ProofFormalizationAgent tactic-script attempt %s failed for %s: %s",
                     attempt_number,
                     theorem_candidate.theorem_id,
                     exc,
                 )
+                terminal_malformed_output = False
+                if _is_malformed_model_output_feedback(feedback):
+                    malformed_output_retries += 1
+                    logger.warning(
+                        "ProofFormalizationAgent tactic-script attempt %s for %s produced malformed model output; retrying without consuming Lean attempt budget (%s/%s).",
+                        attempt_number,
+                        theorem_candidate.theorem_id,
+                        malformed_output_retries,
+                        max_malformed_output_retries,
+                    )
+                    if malformed_output_retries < max_malformed_output_retries:
+                        continue
+                    terminal_malformed_output = True
+                else:
+                    malformed_output_retries = 0
+                attempts.append(feedback)
+                if attempt_callback:
+                    await attempt_callback(feedback)
+                if terminal_malformed_output:
+                    break
+                attempt_offset += 1
 
         final_code = attempts[-1].lean_code if attempts else ""
         return False, theorem_name, final_code, attempts
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index 87b3980..38f51ac 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -207,10 +207,22 @@ def _get_effective_user_research_prompt(self) -> str:
     async def _get_effective_brainstorm_prompt(self, topic_prompt: str) -> str:
         """Return the brainstorm prompt with proof context applied."""
         effective_prompt = self._apply_proof_context(topic_prompt)
-        return await proof_database.inject_failure_hints_into_prompt(
+        effective_prompt = await proof_database.inject_failure_hints_into_prompt(
             effective_prompt,
             self._current_topic_id or "",
         )
+        # Append a compact summary of known (non-novel) proofs scoped to this
+        # brainstorm topic so the system can avoid re-proving standard results.
+        # Theorem statements only — no Lean code — to keep token cost low.
+        counts = proof_database.count_proofs()  # cheap guard; called without a topic, so not topic-scoped
+        if counts["known"] > 0:
+            known_summary = proof_database.get_known_proofs_summary_for_browsing(
+                source_id=self._current_topic_id or None,
+                limit=15,
+            )
+            if known_summary:  # the scoped summary can still be empty even though the guard passed
+                effective_prompt = f"{effective_prompt}\n\n{known_summary}"
+        return effective_prompt
 
     def _get_effective_compiler_prompt(self, paper_title: str) -> str:
         """Return the compiler prompt with proof context applied."""
@@ -4064,16 +4076,25 @@ async def _compile_paper(
             
             # Load brainstorm database into compiler RAG
             # This is now the ONLY aggregator content loaded (no Part 1 pollution)
-            # IMPORTANT: Use brainstorm_memory.get_database_path() for session-aware path resolution
+            # Proof sections (both novel and non-novel) are stripped before indexing
+            # so that RAG chunks contain only mathematical submission content.
+            # Novel proofs reach the compiler via proof_database.inject_into_prompt().
             brainstorm_db_path = brainstorm_memory.get_database_path(self._current_topic_id)
             if os.path.exists(brainstorm_db_path):
                 logger.info(f"Loading brainstorm database into compiler RAG: {brainstorm_db_path}")
-                await rag_manager.add_document(
-                    brainstorm_db_path,
-                    chunk_sizes=[512],  # Use standard chunk size for brainstorm
-                    is_user_file=True  # High priority, permanent
+                brainstorm_content_for_rag = await brainstorm_memory.get_database_content(
+                    self._current_topic_id, strip_proofs=True
                 )
-                logger.info("Brainstorm database loaded into compiler RAG")
+                if brainstorm_content_for_rag:
+                    await rag_manager.add_text(
+                        brainstorm_content_for_rag,
+                        f"brainstorm_{self._current_topic_id}.txt",
+                        chunk_sizes=[512],
+                        is_permanent=True
+                    )
+                    logger.info("Brainstorm database loaded into compiler RAG (proof sections stripped)")
+                else:
+                    logger.warning("Brainstorm database was empty after proof stripping")
             else:
                 logger.warning(f"Brainstorm database not found: {brainstorm_db_path}")
             
@@ -4084,12 +4105,17 @@ async def _compile_paper(
                     # IMPORTANT: Use paper_library.get_paper_path() for session-aware path resolution
                     paper_path = paper_library.get_paper_path(ref_paper_id)
                     if os.path.exists(paper_path):
-                        await rag_manager.add_document(
-                            paper_path,
-                            chunk_sizes=[512],
-                            is_user_file=False  # Lower priority than brainstorm
-                        )
-                        logger.info(f"Reference paper loaded: {ref_paper_id}")
+                        ref_content = await paper_library.get_paper_content(ref_paper_id, strip_proofs=True)
+                        if ref_content:
+                            await rag_manager.add_text(
+                                ref_content,
+                                f"reference_paper_{ref_paper_id}.txt",
+                                chunk_sizes=[512],
+                                is_permanent=False
+                            )
+                            logger.info(f"Reference paper loaded: {ref_paper_id}")
+                        else:
+                            logger.warning(f"Reference paper was empty after proof stripping: {ref_paper_id}")
                     else:
                         logger.warning(f"Reference paper not found: {paper_path}")
                 logger.info("All reference papers loaded into compiler RAG")
@@ -4100,12 +4126,17 @@ async def _compile_paper(
                 for bp_id in self._current_brainstorm_paper_ids:
                     bp_path = paper_library.get_paper_path(bp_id)
                     if os.path.exists(bp_path):
-                        await rag_manager.add_document(
-                            bp_path,
-                            chunk_sizes=[512],
-                            is_user_file=True
-                        )
-                        logger.info(f"Prior brainstorm paper loaded as auto-reference: {bp_id}")
+                        bp_content = await paper_library.get_paper_content(bp_id, strip_proofs=True)
+                        if bp_content:
+                            await rag_manager.add_text(
+                                bp_content,
+                                f"prior_paper_{bp_id}.txt",
+                                chunk_sizes=[512],
+                                is_permanent=True
+                            )
+                            logger.info(f"Prior brainstorm paper loaded as auto-reference: {bp_id}")
+                        else:
+                            logger.warning(f"Prior brainstorm paper was empty after proof stripping: {bp_id}")
                     else:
                         logger.warning(f"Prior brainstorm paper not found: {bp_path}")
             
diff --git a/backend/autonomous/core/autonomous_rag_manager.py b/backend/autonomous/core/autonomous_rag_manager.py
index 546018a..dfabcb6 100644
--- a/backend/autonomous/core/autonomous_rag_manager.py
+++ b/backend/autonomous/core/autonomous_rag_manager.py
@@ -88,7 +88,7 @@ async def get_brainstorm_context(
         Returns:
             Tuple of (content string, used_rag boolean)
         """
-        content = await brainstorm_memory.get_database_content(topic_id)
+        content = await brainstorm_memory.get_database_content(topic_id, strip_proofs=True)
         
         if not content:
             return "", False
@@ -220,7 +220,7 @@ async def get_reference_papers_context(
         total_tokens = 0
         
         for paper_id in paper_ids:
-            content = await paper_library.get_paper_content(paper_id)
+            content = await paper_library.get_paper_content(paper_id, strip_proofs=True)
             metadata = await paper_library.get_metadata(paper_id)
             
             if content and metadata:
diff --git a/backend/autonomous/core/proof_verification_stage.py b/backend/autonomous/core/proof_verification_stage.py
index 5c9f90c..58251a0 100644
--- a/backend/autonomous/core/proof_verification_stage.py
+++ b/backend/autonomous/core/proof_verification_stage.py
@@ -25,6 +25,7 @@
 
 BroadcastFn = Optional[Callable[[str, dict[str, Any]], Awaitable[None]]]
 ShouldStopFn = Optional[Callable[[], bool]]
+LEAN_WORKSPACE_ERROR_PREFIX = "LEAN 4 WORKSPACE ERROR"
 
 
 @dataclass
@@ -279,10 +280,12 @@ async def _run_smt_check(
             )
             result_name = smt_result.result if smt_result.result in {"sat", "unsat", "unknown"} else "unknown"
             suggestions = self._build_smt_tactic_suggestions(candidate) if result_name == "unsat" else []
+            z3_raw = "\n".join(part for part in [smt_result.stdout.strip(), smt_result.stderr.strip()] if part).strip()
             return SmtHint(
                 result=result_name,
                 suggested_tactics=suggestions,
                 smtlib=smtlib,
+                z3_output=z3_raw[:2000],
             )
         except Exception as exc:
             logger.debug("SMT check failed for theorem %s in %s %s: %s", candidate.theorem_id, source_type, source_id, exc)
@@ -704,6 +707,14 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
 
                     if is_novel:
                         result.novel_count += 1
+                        # Novel proofs are appended to their source document so the
+                        # paper/brainstorm they came from retains a record of them.
+                        # They are also stored in ProofDatabase and direct-injected
+                        # into all prompts via inject_into_prompt().
+                        if source_type == "brainstorm":
+                            await brainstorm_memory.append_proofs_section(source_id, stored_record)
+                        elif ":" not in source_id:
+                            await paper_library.append_proofs_section(source_id, stored_record)
                         await self._broadcast(
                             broadcast_fn,
                             "novel_proof_discovered",
@@ -716,11 +727,10 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                             },
                         )
                     else:
-                        if source_type == "brainstorm":
-                            await brainstorm_memory.append_proofs_section(source_id, stored_record)
-                        elif ":" not in source_id:
-                            await paper_library.append_proofs_section(source_id, stored_record)
-
+                        # Non-novel (known) proofs are stored in ProofDatabase only.
+                        # They are NOT appended to brainstorm/paper files to avoid
+                        # polluting compiler and RAG context with standard Lean 4 code.
+                        # They remain browsable via proof_database.get_known_proofs_summary_for_browsing().
                         await self._broadcast(
                             broadcast_fn,
                             "known_proof_verified",
@@ -918,7 +928,11 @@ async def on_attempt_feedback(feedback, current_candidate=candidate) -> None:
             smt_hint=candidate.smt_hint,
             should_stop=should_stop,
         )
-        if not success and not (should_stop and should_stop()):
+        workspace_error = bool(
+            attempts
+            and (attempts[-1].error_output or "").startswith(LEAN_WORKSPACE_ERROR_PREFIX)
+        )
+        if not success and not workspace_error and not (should_stop and should_stop()):
             tactic_success, tactic_theorem_name, lean_code, attempts = await formalization_agent.prove_candidate_tactic_script(
                 user_research_prompt=user_prompt,
                 source_type=source_type,
@@ -936,7 +950,7 @@ async def on_attempt_feedback(feedback, current_candidate=candidate) -> None:
                 theorem_name = tactic_theorem_name
             success = tactic_success
 
-        if not success and not (should_stop and should_stop()):
+        if not success and not workspace_error and not (should_stop and should_stop()):
             await self._broadcast(
                 broadcast_fn,
                 "proof_attempts_exhausted",
diff --git a/backend/autonomous/memory/brainstorm_memory.py b/backend/autonomous/memory/brainstorm_memory.py
index 0ad3cf1..a43fd76 100644
--- a/backend/autonomous/memory/brainstorm_memory.py
+++ b/backend/autonomous/memory/brainstorm_memory.py
@@ -247,16 +247,32 @@ async def add_submission(self, topic_id: str, content: str, submission_number: i
                 logger.error(f"Failed to add submission to brainstorm {topic_id}: {e}")
                 return False
     
-    async def get_database_content(self, topic_id: str) -> str:
-        """Get all content from a brainstorm database."""
+    async def get_database_content(self, topic_id: str, *, strip_proofs: bool = False) -> str:
+        """Get all content from a brainstorm database.
+
+        Args:
+            topic_id: The brainstorm topic ID.
+            strip_proofs: When True, truncate content at the proof section header.
+                Use this for compiler and RAG paths so that appended proof blocks
+                (both novel and non-novel) do not pollute LLM context.  Novel
+                proofs are available via proof_database.inject_into_prompt();
+                non-novel proofs are browsable via
+                proof_database.get_known_proofs_summary_for_browsing().
+        """
         db_path = self._get_database_path(topic_id)
-        
+
         if not db_path.exists():
             return ""
-        
+
         try:
             async with aiofiles.open(db_path, 'r', encoding='utf-8') as f:
-                return await f.read()
+                content = await f.read()
+            if strip_proofs and content:
+                marker = "=== PROOFS GENERATED FROM THIS BRAINSTORM"
+                idx = content.find(marker)
+                if idx != -1:  # find() returns -1 when absent; offset 0 is a real hit (proofs-only file)
+                    content = content[:idx].rstrip()
+            return content
         except Exception as e:
             logger.error(f"Failed to read brainstorm database {topic_id}: {e}")
             return ""
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index e9a11be..f38ccc3 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -566,16 +566,31 @@ async def save_paper(
             logger.info(f"Saved paper {paper_id}: '{title}' ({word_count} words, {model_count} models tracked)")
             return metadata
     
-    async def get_paper_content(self, paper_id: str) -> str:
-        """Get full paper content."""
+    async def get_paper_content(self, paper_id: str, *, strip_proofs: bool = False) -> str:
+        """Return the full text of a paper ("" if the file is missing or unreadable).
+
+        Args:
+            paper_id: The paper ID.
+            strip_proofs: When True, truncate content at the proof section header,
+                including when that header is the first text in the file.  Use for
+                compiler and RAG paths so appended proof blocks do not pollute LLM
+                context.  Novel proofs: proof_database.inject_into_prompt(); non-novel
+                proofs: proof_database.get_known_proofs_summary_for_browsing().
+        """
         paper_path = self._get_paper_path(paper_id)
-        
+
         if not paper_path.exists():
             return ""
-        
+
         try:
             async with aiofiles.open(paper_path, 'r', encoding='utf-8') as f:
-                return await f.read()
+                content = await f.read()
+            if strip_proofs and content:
+                marker = "=== PROOFS GENERATED FROM THIS PAPER"
+                idx = content.find(marker)
+                if idx != -1:  # find() returns -1 when absent; index 0 is a real match
+                    content = content[:idx].rstrip()
+            return content
         except Exception as e:
             logger.error(f"Failed to read paper {paper_id}: {e}")
             return ""
diff --git a/backend/autonomous/memory/proof_database.py b/backend/autonomous/memory/proof_database.py
index 400ec1c..2e1e227 100644
--- a/backend/autonomous/memory/proof_database.py
+++ b/backend/autonomous/memory/proof_database.py
@@ -560,6 +560,60 @@ def count_proofs(self) -> Dict[str, int]:
             "known": len(proofs) - novel_count,
         }
 
+    def get_known_proofs_summary_for_browsing(
+        self,
+        source_id: Optional[str] = None,
+        limit: int = 15,
+    ) -> str:
+        """Return a compact summary of known (non-novel) proofs for optional prompt injection.
+
+        Unlike novel proof injection this is NOT automatically prepended to prompts.
+        It is called on-demand so the system can review what standard results have
+        already been Lean 4-verified before brainstorming, avoiding redundant work.
+
+        Args:
+            source_id: When provided, only proofs whose source_id matches are
+                included (e.g. a brainstorm topic ID or paper ID).  Pass None to
+                include all known proofs across the session.
+            limit: Maximum number of proof entries to include, taken from the
+                front of the index; zero or negative values list no entries.
+                Lean 4 code is intentionally omitted to keep the block compact.
+
+        Returns:
+            A formatted string block, or an empty string when no known proofs exist.
+        """
+        self._ensure_index_loaded_sync()
+        proofs = self._index_data.get("proofs", []) if self._index_data else []
+        known_proofs = [p for p in proofs if not p.get("novel")]
+
+        if source_id:
+            known_proofs = [p for p in known_proofs if p.get("source_id") == source_id]
+
+        if not known_proofs:
+            return ""
+
+        total = len(known_proofs)
+        # Front of the index first; NOTE(review): assumes add_proof keeps it newest-first.
+        shown = known_proofs[:max(limit, 0)]
+
+        lines = [
+            f"=== KNOWN VERIFIED PROOFS ({len(shown)} of {total} shown, Lean 4 Verified) ===",
+            "[Standard/known results already formally verified. For reference to avoid re-proving.]",
+            "",
+        ]
+        for index, proof in enumerate(shown, start=1):
+            statement = str(proof.get("theorem_statement") or "").strip()
+            src_type = proof.get("source_type") or ""
+            src_id = proof.get("source_id") or ""
+            proof_id = proof.get("proof_id") or ""
+            lines.append(
+                f"KNOWN {index}: {statement}"
+                f"  (source: {src_type} {src_id}, id: {proof_id})"
+            )
+        lines.append("")
+        lines.append("=== END KNOWN PROOFS ===")
+        return "\n".join(lines)
+
     def get_novel_proofs_for_injection(self) -> str:
         """Format the novel proofs block for highest-priority prompt injection."""
         self._ensure_index_loaded_sync()
@@ -619,6 +673,128 @@ async def inject_failure_hints_into_prompt(
             return hints_block
         return f"{hints_block}\n\n{prompt}"
 
+    async def list_proof_library(self, novel_only: bool = True) -> List[Dict[str, Any]]:
+        """Collect proof-library entries from the legacy store and every session directory.
+
+        Scans ``<data_dir>/proofs`` (labelled "legacy") and then each
+        ``<auto_sessions_base_dir>/<session>/proofs`` (labelled with the directory
+        name). The result is sorted by ``created_at`` in descending order.
+        ``novel_only`` is passed through to ``_list_proofs_from_directory``.
+        """
+        # (directory, label) pairs in scan order: legacy first, then sessions by name, descending.
+        sources = [(Path(system_config.data_dir) / "proofs", "legacy")]
+
+        sessions_root = Path(system_config.auto_sessions_base_dir)
+        if sessions_root.exists():
+            session_dirs = [entry for entry in sessions_root.iterdir() if entry.is_dir()]
+            session_dirs.sort(reverse=True)
+            sources += [(entry / "proofs", entry.name) for entry in session_dirs]
+
+        collected: List[Dict[str, Any]] = []
+        for directory, label in sources:
+            if not directory.exists():
+                continue
+            collected.extend(
+                await self._list_proofs_from_directory(directory, label, novel_only)
+            )
+
+        collected.sort(key=lambda entry: entry.get("created_at") or "", reverse=True)
+        return collected
+
+    async def _list_proofs_from_directory(
+        self, proofs_dir: Path, session_id: str, novel_only: bool
+    ) -> List[Dict[str, Any]]:
+        """Return library entries from ``proofs_dir``'s proofs_index.json ([] if missing or unreadable)."""
+        index_path = proofs_dir / "proofs_index.json"
+        if not index_path.exists():
+            return []
+
+        try:
+            async with aiofiles.open(index_path, "r", encoding="utf-8") as handle:
+                entries = json.loads(await handle.read()).get("proofs") or []
+        except Exception as exc:  # I/O error, bad JSON, or an index that is not a JSON object
+            logger.warning("Failed to read proofs index at %s: %s", index_path, exc)
+            return []
+
+        session_metadata_path = proofs_dir.parent / "session_metadata.json"
+        user_prompt = ""
+        if session_metadata_path.exists():
+            try:
+                async with aiofiles.open(session_metadata_path, "r", encoding="utf-8") as handle:
+                    meta = json.loads(await handle.read())
+                    user_prompt = meta.get("user_prompt", "")
+            except Exception as exc:  # metadata is optional; fall back to the empty prompt
+                logger.debug("Failed to read session metadata at %s: %s", session_metadata_path, exc)
+
+        results: List[Dict[str, Any]] = []
+        for proof_data in entries:
+            is_novel = proof_data.get("novel", False)
+            if novel_only and not is_novel:
+                continue
+
+            results.append({
+                "library_id": f"{session_id}:{proof_data.get('proof_id', '')}",
+                "session_id": session_id,
+                "proof_id": proof_data.get("proof_id", ""),
+                "theorem_name": proof_data.get("theorem_name", ""),
+                "theorem_statement": proof_data.get("theorem_statement", ""),
+                "formal_sketch": proof_data.get("formal_sketch", ""),
+                "source_type": proof_data.get("source_type", ""),
+                "source_id": proof_data.get("source_id", ""),
+                "source_title": proof_data.get("source_title", ""),
+                "solver": proof_data.get("solver", "Lean 4"),
+                "novel": is_novel,
+                "novelty_reasoning": proof_data.get("novelty_reasoning", ""),
+                "verification_notes": proof_data.get("verification_notes", ""),
+                "attempt_count": proof_data.get("attempt_count", 0),
+                "created_at": proof_data.get("created_at", ""),
+                "user_prompt": user_prompt,
+                "dependencies": proof_data.get("dependencies", []),
+            })
+
+        return results
+
+    async def get_library_proof(self, session_id: str, proof_id: str) -> Optional[Dict[str, Any]]:
+        """Load one stored proof record, with its Lean source, for the proof library viewer.
+
+        Returns None when the proofs directory or the record file does not exist, or
+        when the record cannot be read. ``lean_code`` is taken from the ``.lean`` file
+        when it can be read, otherwise from the record's own ``lean_code`` field.
+        """
+        if session_id == "legacy":
+            base_dir = Path(system_config.data_dir)
+        else:
+            base_dir = Path(system_config.auto_sessions_base_dir) / validate_single_path_component(session_id, "session ID")
+        proofs_dir = base_dir / "proofs"
+        if not proofs_dir.exists():
+            return None
+
+        safe_id = validate_single_path_component(proof_id, "proof ID")
+        record_path = proofs_dir / f"proof_{safe_id}.json"
+        if not record_path.exists():
+            return None
+
+        try:
+            async with aiofiles.open(record_path, "r", encoding="utf-8") as handle:
+                proof_data = json.loads(await handle.read())
+        except Exception as exc:
+            logger.error("Failed to read proof %s from session %s: %s", proof_id, session_id, exc)
+            return None
+
+        lean_source = None
+        lean_path = proofs_dir / f"proof_{safe_id}_lean.lean"
+        if lean_path.exists():
+            try:
+                async with aiofiles.open(lean_path, "r", encoding="utf-8") as handle:
+                    lean_source = await handle.read()
+            except Exception:
+                lean_source = None
+        if lean_source is None:  # no .lean file, or it could not be read
+            lean_source = str(proof_data.get("lean_code", "") or "")
+
+        header = {"library_id": f"{session_id}:{proof_id}", "session_id": session_id}
+        return {**header, **proof_data, "lean_code": lean_source}
+
     async def clear_all(self) -> None:
         """Remove all proof files and reset the index."""
         async with self._lock:
diff --git a/backend/autonomous/prompts/proof_prompts.py b/backend/autonomous/prompts/proof_prompts.py
index bc57009..4726504 100644
--- a/backend/autonomous/prompts/proof_prompts.py
+++ b/backend/autonomous/prompts/proof_prompts.py
@@ -8,11 +8,12 @@
 from backend.shared.models import MathlibLemmaHint, ProofAttemptFeedback, SmtHint
 
 
-PROOF_FRAMING_CONTEXT = """[PROOF FRAMING CONTEXT -- This research prompt is amenable to formal mathematical proof.
-All submissions should work toward producing formally testable theorems where possible.
-The validator should additionally assess whether submissions contribute toward results
-that can be verified by the Lean 4 proof assistant. This framing does not exclude
-non-proof explorations but provides a directional objective.]"""
+PROOF_FRAMING_CONTEXT = """[PROOF FRAMING CONTEXT -- This research prompt targets formal mathematical proof.
+Submissions should aggressively pursue NOVEL, NON-TRIVIAL theorems that push the
+boundaries of what is known. The Lean 4 proof assistant is available for formal
+verification. Prioritize ambitious conjectures, original results, and theorems that
+would represent genuine mathematical contributions over safe restatements of textbook
+facts. Standard identities and well-known Mathlib lemmas are NOT valuable targets.]"""
 
 
 def _json_only_footer(example: str) -> str:
@@ -30,6 +31,12 @@ def _format_attempt_history(prior_attempts: Iterable[ProofAttemptFeedback]) -> s
 
     lines = []
     for attempt in attempts:
+        if (
+            not attempt.lean_code
+            and not attempt.error_output
+            and "malformed output" in (attempt.reasoning or "").lower()
+        ):
+            continue
         tactic_trace = "\n".join(
             f"  - {step}"
             for step in (attempt.tactic_trace or [])
@@ -59,6 +66,8 @@ def _format_attempt_history(prior_attempts: Iterable[ProofAttemptFeedback]) -> s
             block.append(rejection_banner)
         block.append("---")
         lines.extend(block)
+    if not lines:
+        return "No prior Lean-checked attempts."
     return "\n".join(lines)
 
 
@@ -90,12 +99,15 @@ def _format_smt_hint(smt_hint: SmtHint | None) -> str:
         return "[No SMT guidance available.]"
 
     tactics = ", ".join(smt_hint.suggested_tactics or []) or "[none]"
-    return "\n".join(
-        [
-            f"SMT result: {smt_hint.result}",
-            f"Suggested Lean tactics: {tactics}",
-        ]
-    )
+    sections = [
+        f"SMT result: {smt_hint.result}",
+        f"Suggested Lean tactics: {tactics}",
+    ]
+    if smt_hint.smtlib.strip():
+        sections.append(f"SMT-LIB encoding sent to Z3:\n{_truncate_text(smt_hint.smtlib, 1500)}")
+    if smt_hint.z3_output.strip():
+        sections.append(f"Z3 solver output:\n{_truncate_text(smt_hint.z3_output, 1000)}")
+    return "\n".join(sections)
 
 
 LEAN4_COMMON_PITFALLS = """COMMON LEAN 4 PITFALLS TO AVOID:
@@ -194,18 +206,20 @@ def format_failure_hints_for_injection(failure_hints: Iterable[Any]) -> str:
 
 def build_proof_framing_gate_prompt(user_prompt: str) -> str:
     """Ask whether the research goal should be framed toward formal proof."""
-    return f"""You are deciding whether a research program should be explicitly framed toward formal mathematical proof.
+    return f"""You are deciding whether a research program should be explicitly framed toward formal mathematical proof and novel theorem discovery.
 
 USER RESEARCH PROMPT:
 {user_prompt}
 
-Return TRUE only if the prompt is meaningfully served by working toward formally provable theorems in a proof assistant such as Lean 4.
-Return FALSE if the prompt is primarily empirical, engineering-focused, descriptive, or only tangentially mathematical.
+Return TRUE if the prompt would benefit from working toward formally provable theorems in Lean 4, especially novel or non-trivial ones.
+Return FALSE only if the prompt is purely empirical, engineering-focused, descriptive, or has no meaningful mathematical content.
 
 Consider:
-- Is the core task mathematical rather than experimental?
-- Are theorem statements or proof obligations likely to be central?
-- Would proof-oriented framing materially improve the research direction?
+- Does the research involve mathematical structures, proofs, bounds, or formal reasoning?
+- Could novel theorems or formalizations emerge from this research direction?
+- Would formal verification add rigor or uncover new results?
+
+Err on the side of TRUE -- if there is any mathematical substance worth formalizing, enable the proof pipeline.
 
 {_json_only_footer('{"is_proof_amenable": true, "reasoning": "brief explanation"}')}
 """
@@ -217,26 +231,42 @@ def build_proof_identification_prompt(
     source_id: str,
     source_content: str,
 ) -> str:
-    """Identify complete, testable theorem candidates from a brainstorm or paper."""
+    """Identify novel, non-trivial theorem candidates from a brainstorm or paper."""
     example_json = """{
   "has_provable_theorems": true,
   "theorems": [
     {
       "theorem_id": "thm_1",
       "statement": "natural-language theorem statement",
-      "formal_sketch": "optional note about assumptions, notation, or likely Lean formalization strategy"
+      "formal_sketch": "optional note about assumptions, notation, or likely Lean formalization strategy",
+      "novelty_rationale": "why this theorem is non-trivial and worth formalizing"
     }
   ]
 }"""
-    return f"""You are a theorem-identification agent for MOTO. Lean 4 is available as an external proof checker.
+    return f"""You are a theorem-discovery agent for MOTO. Your mission is to find NOVEL, NON-TRIVIAL mathematical claims in the source below that deserve formal verification in Lean 4.
 
-Your job is NOT to prove anything yet. Your job is only to decide whether the source below contains any COMPLETE, TESTABLE mathematical theorem statements that should be submitted to Lean 4.
+MOTO's goal is to push the frontier of mathematical knowledge. You are the gatekeeper that decides which theorems are worth the cost of formal verification. Be ambitious -- seek out the most original, surprising, or substantive results the source offers.
+
+WHAT TO EXTRACT (prioritize these):
+- Novel theorems, lemmas, or propositions that represent genuine mathematical insight
+- Bold conjectures that can be sharpened into provable statements
+- Non-obvious connections, bounds, inequalities, or structural results
+- Original formalizations of results not yet in Mathlib
+- Ambitious claims even if they need narrowing -- the formalization agent can refine them
+
+WHAT TO REJECT (never extract these):
+- Trivial identities (e.g. n + 0 = n, a * 1 = a, commutativity of addition)
+- Direct restatements of well-known Mathlib lemmas or standard textbook results
+- Results closable by a single tactic like `simp`, `omega`, `norm_num`, `decide`, or `rfl`
+- Tautologies, definitional equalities, or purely notational rewrites
+- Routine algebraic manipulations with no conceptual content
 
 Rules:
-- Return FALSE if the content only contains conjectures, loose ideas, heuristics, empirical claims, or incomplete proof sketches.
-- Return TRUE only for theorem candidates that are stated clearly enough to attempt formalization now.
-- Include ALL viable candidate theorems, not just the best one.
-- Prefer exact theorem statements over vague summaries.
+- Return TRUE when at least one non-trivial, novel-potential theorem is found.
+- Return FALSE only if the source genuinely contains nothing beyond trivial or well-known results.
+- Rank candidates by novelty potential. Return at most 5 of the most promising theorems.
+- For each candidate, include a brief novelty_rationale explaining why it is worth formalizing.
+- Welcome bold or speculative claims -- if the source proposes something ambitious that might be provable with the right formalization, extract it. The downstream formalization agent will handle narrowing if needed.
 - Use theorem IDs that are stable strings such as "thm_1", "thm_2", etc.
 
 USER RESEARCH PROMPT:
@@ -367,6 +397,9 @@ def build_proof_formalization_prompt(
 - Include needed imports.
 - State assumptions explicitly.
 - Prefer correct, minimal, compilable code over stylistic elegance.
+- PRESERVE the theorem's non-trivial content. Do not simplify or weaken the
+  statement into a trivial identity just to make it compile. The goal is to
+  formalize the ACTUAL claim, not a watered-down version of it.
 - Your proof MUST close every goal without `sorry` or `admit`. Vacuous
   proofs (e.g. axiomatizing the theorem's own concepts and then closing
   with `sorry`) will be rejected even if Lean compiles them with only a
@@ -441,6 +474,8 @@ def build_proof_tactic_script_prompt(
 - Return a short, ordered list of tactics that can be appended under a `by` block.
 - Each tactic entry must include the Lean tactic string and one short reasoning note.
 - Prefer small, composable tactics over a single opaque script.
+- PRESERVE the theorem's non-trivial content. Do not simplify or weaken the
+  statement into a trivial identity just to make it compile.
 - NEVER include `sorry` or `admit` in the tactic list. A script that uses
   `sorry`/`admit` will be rejected even if Lean compiles it.
 - Include needed assumptions in the theorem header. Do NOT axiomatize the
@@ -491,13 +526,25 @@ def build_proof_novelty_prompt(
     existing_proofs_block = existing_novel_proofs or "[No previously stored novel proofs.]"
     return f"""This proof has been FORMALLY VERIFIED by Lean 4. It is mathematically valid.
 
-Your ONLY task: decide whether the verified result appears NOVEL in the context of this research program.
+Your ONLY task: decide whether the verified result is NOVEL in the context of this research program.
+
+A proof is NOVEL if it meets ANY of these criteria:
+- It proves a result not already present in Mathlib or standard textbooks
+- It establishes a new connection, bound, or structural insight
+- It formalizes a conjecture or claim that was previously unverified
+- It is a non-trivial composition of known results yielding something new
+- It represents original work relative to the existing stored proofs below
+
+A proof is NOT novel if:
+- It is a direct restatement of a well-known Mathlib lemma or textbook theorem
+- It is a trivial identity, tautology, or definitional equality
+- It is closable by a single standard tactic (simp, omega, norm_num, decide, rfl)
+- It duplicates a result already in the stored novel proofs below
 
 Rules:
 - Do NOT re-check validity. Lean 4 already verified it.
-- Focus only on novelty/originality relative to known mathematics and the currently stored novel proofs.
-- If the theorem appears standard, classical, or already well known, mark it as not novel.
-- If you are uncertain, prefer FALSE unless there is a strong reason to believe the result is genuinely new.
+- When uncertain, consider the research prompt context -- a result that is textbook-standard in one field may be a novel formalization contribution in the context of this specific research program.
+- Err on the side of recognizing novelty for results that required multi-step reasoning or non-trivial formalization work.
 
 USER RESEARCH PROMPT:
 {user_prompt}
@@ -511,5 +558,5 @@ def build_proof_novelty_prompt(
 EXISTING STORED NOVEL PROOFS:
 {existing_proofs_block}
 
-{_json_only_footer('{"is_novel": false, "reasoning": "brief explanation"}')}
+{_json_only_footer('{"is_novel": true, "reasoning": "brief explanation"}')}
 """
diff --git a/backend/compiler/core/compiler_coordinator.py b/backend/compiler/core/compiler_coordinator.py
index ba2b5ef..7225e9c 100644
--- a/backend/compiler/core/compiler_coordinator.py
+++ b/backend/compiler/core/compiler_coordinator.py
@@ -16,7 +16,7 @@
 from backend.shared.models import CompilerState, CompilerSubmission, CompilerValidationResult, WorkflowTask, SubmitterConfig, ValidationResult, ModelConfig
 from backend.shared.workflow_predictor import workflow_predictor
 from backend.shared.api_client_manager import api_client_manager
-from backend.shared.openrouter_client import FreeModelExhaustedError
+from backend.shared.openrouter_client import FreeModelExhaustedError, OpenRouterInvalidResponseError
 from backend.shared.free_model_manager import free_model_manager
 from backend.shared.json_parser import parse_json
 from backend.shared.utils import count_tokens
@@ -40,6 +40,37 @@
 logger = logging.getLogger(__name__)
 
 
+def _classify_submitter_error(err: BaseException) -> tuple[str, str]:
+    """
+    Sort an exception from a HighContextSubmitter.submit_* call into a category.
+
+    Checks run in this order, first match wins:
+        1. ``err`` is an OpenRouterInvalidResponseError -> "API transport error"
+        2. message contains "prompt too large" or "tokens > " -> "Context overflow"
+        3. message starts with an OpenRouter API-error, connection-failure or
+           rate-limit prefix -> "API transport error"
+        4. anything else -> "Submitter error"
+    Message matching is case-insensitive.
+
+    Returns:
+        (label, reason_prefix): the short classification used in logs and UI
+        messages, and the leading text for the full reason/reasoning string.
+        Both elements currently carry the same text.
+    """
+    transport_prefixes = ("openrouter api error", "openrouter connection failed", "openrouter rate limit")
+    text = "" if err is None else str(err).lower()
+
+    if isinstance(err, OpenRouterInvalidResponseError):
+        category = "API transport error"
+    elif "prompt too large" in text or "tokens > " in text:
+        category = "Context overflow"
+    elif text.startswith(transport_prefixes):
+        category = "API transport error"
+    else:
+        category = "Submitter error"
+    return (category, category)
+
+
 class CompilerCoordinator:
     """
     Coordinates the compiler system.
@@ -957,7 +988,7 @@ async def _initial_paper_loop(self) -> None:
                 if self.autonomous_mode and self._current_topic_id:
                     try:
                         from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
-                        first_brainstorm_content = await brainstorm_memory.get_database_content(self._current_topic_id)
+                        first_brainstorm_content = await brainstorm_memory.get_database_content(self._current_topic_id, strip_proofs=True)
                         first_brainstorm_source = f"brainstorm_{self._current_topic_id}.txt"
                     except Exception:
                         pass
@@ -988,11 +1019,12 @@ async def _initial_paper_loop(self) -> None:
                     
             except FreeModelExhaustedError:
                 raise
-            except ValueError as e:
-                logger.error(f"Construction context overflow in initial loop (attempt {attempt}): {e}")
+            except (ValueError, OpenRouterInvalidResponseError) as e:
+                label, reason_prefix = _classify_submitter_error(e)
+                logger.error(f"Construction {label.lower()} in initial loop (attempt {attempt}): {e}")
                 await self._broadcast("compiler_rejection", {
                     "mode": "construction",
-                    "reasoning": f"Context overflow: {e}"
+                    "reasoning": f"{reason_prefix}: {e}"
                 })
                 await compiler_rejection_log.add_rejection(
                     CompilerValidationResult(
@@ -1227,7 +1259,7 @@ async def _submit_and_validate_construction(self, rejection_feedback: Optional[s
         if self.autonomous_mode and self._current_topic_id:
             try:
                 from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
-                brainstorm_content_for_submitter = await brainstorm_memory.get_database_content(self._current_topic_id)
+                brainstorm_content_for_submitter = await brainstorm_memory.get_database_content(self._current_topic_id, strip_proofs=True)
                 brainstorm_source_for_submitter = f"brainstorm_{self._current_topic_id}.txt"
                 if brainstorm_content_for_submitter:
                     logger.info(f"Loaded brainstorm content for retroactive corrections: {len(brainstorm_content_for_submitter)} chars")
@@ -1245,10 +1277,11 @@ async def _submit_and_validate_construction(self, rejection_feedback: Optional[s
                 brainstorm_content=brainstorm_content_for_submitter,
                 brainstorm_source_name=brainstorm_source_for_submitter
             )
-        except ValueError as e:
-            logger.error(f"Construction context overflow: {e}")
+        except (ValueError, OpenRouterInvalidResponseError) as e:
+            label, reason_prefix = _classify_submitter_error(e)
+            logger.error(f"Construction {label.lower()}: {e}")
             self.construction_rejections += 1
-            overflow_reason = f"Context overflow: {e}"
+            overflow_reason = f"{reason_prefix}: {e}"
             await compiler_rejection_log.add_rejection(
                 CompilerValidationResult(
                     submission_id=str(uuid.uuid4()),
@@ -1647,7 +1680,7 @@ async def _handle_brainstorm_retroactive_operation(self, brainstorm_op) -> None:
         logger.info(f"Processing retroactive brainstorm {brainstorm_op.action} for topic {topic_id}")
         
         try:
-            brainstorm_content = await brainstorm_memory.get_database_content(topic_id)
+            brainstorm_content = await brainstorm_memory.get_database_content(topic_id, strip_proofs=True)
             if not brainstorm_content:
                 logger.warning(f"Brainstorm {topic_id} is empty, skipping retroactive operation")
                 return
@@ -1820,14 +1853,15 @@ async def _submit_and_validate_review(self, review_focus: str = "general") -> bo
         submission = None
         try:
             submission = await self.high_context_submitter.submit_review(review_focus=review_focus)
-        except ValueError as e:
-            logger.error(f"{review_label.capitalize()} context overflow: {e}")
+        except (ValueError, OpenRouterInvalidResponseError) as e:
+            label, reason_prefix = _classify_submitter_error(e)
+            logger.error(f"{review_label.capitalize()} {label.lower()}: {e}")
             self.review_declines += 1
-            await compiler_rejection_log.add_decline("review", f"Context overflow: {e}")
+            await compiler_rejection_log.add_decline("review", f"{reason_prefix}: {e}")
             await self._broadcast("compiler_decline", {
                 "mode": "review",
                 "review_focus": review_focus,
-                "reasoning": f"Context overflow: {e}"
+                "reasoning": f"{reason_prefix}: {e}"
             })
             return False
         
diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
index ea46270..2c6a2e0 100644
--- a/backend/shared/lean4_client.py
+++ b/backend/shared/lean4_client.py
@@ -94,6 +94,16 @@ def _output_contains_sorry_warning(output: str) -> bool:
 
 _PLACEHOLDER_REJECTION_PREFIX = "PROOF REJECTED: PLACEHOLDER USED"
 _MATHLIB_CACHE_ARCHIVE_RE = re.compile(r"\(([^()\r\n]+?\.ltar)\)")
+_LEAN_WORKSPACE_ERROR_PREFIX = "LEAN 4 WORKSPACE ERROR"
+_OLEAN_OBJECT_FILE_MISSING_RE = re.compile(
+    r"object file ['\"].*?\.olean['\"] of module .*? does not exist",
+    re.IGNORECASE,
+)
+_LEAN_WORKSPACE_ERROR_MARKERS: tuple[str, ...] = (
+    "imports are out of date",
+    "invalid or corrupt .olean",
+    "invalid or corrupt olean",
+)
 
 # Markdown fence markers the LLM occasionally emits inside the `lean_code`
 # JSON field even when instructed to return raw code. Strip them defensively so
@@ -188,12 +198,21 @@ def _format_placeholder_rejection(token_name: str, *, from_lean_diagnostic: bool
 class Lean4Client:
     """Subprocess wrapper around the Lean 4 toolchain."""
 
+    _lean_execution_lock: Optional[asyncio.Lock] = None
+
     def __init__(self, lean_path: str, workspace_dir: str) -> None:
         self.lean_path = str(lean_path or "").strip()
         self.workspace_dir = Path(workspace_dir).resolve()
         self._workspace_ready = False
+        self._workspace_unhealthy_error = ""
         self._workspace_lock = asyncio.Lock()
 
+    @classmethod
+    def _get_lean_execution_lock(cls) -> asyncio.Lock:
+        if Lean4Client._lean_execution_lock is None:  # created on first use
+            Lean4Client._lean_execution_lock = asyncio.Lock()  # stored on Lean4Client itself, not on cls
+        return Lean4Client._lean_execution_lock
+
     def _resolve_executable(self, name: str) -> str:
         if self.lean_path:
             lean_bin = Path(self.lean_path).resolve()
@@ -312,6 +331,83 @@ async def _run_process(
         stderr = stderr_bytes.decode("utf-8", errors="replace")
         return process.returncode, stdout, stderr
 
+    async def _run_lean_file_once(
+        self,
+        *,
+        temp_filename: str,
+        prepared_code: str,
+        timeout: int,
+    ) -> tuple[int, str, str]:
+        """Write the code to a scratch file in the workspace, run `lake env lean` on it, then remove the file."""
+        temp_path = self.workspace_dir / temp_filename
+        try:
+            temp_path.write_text(prepared_code, encoding="utf-8")
+            return await self._run_process(
+                [self.lake_path, "env", self.lean_path or self._resolve_executable("lean"), temp_filename],
+                cwd=self.workspace_dir,
+                timeout=timeout,
+            )
+        finally:
+            try:
+                temp_path.unlink(missing_ok=True)  # cleanup is best-effort; an already-missing file is fine
+            except OSError:
+                logger.debug("Could not remove temporary Lean file %s", temp_path)
+
+    @staticmethod
+    def _combined_process_output(stdout: str, stderr: str) -> str:
+        return "\n".join(part for part in [stdout.strip(), stderr.strip()] if part).strip()
+
+    @staticmethod
+    def _is_workspace_infrastructure_error(output: str) -> bool:
+        text = output or ""
+        lowered = text.lower()
+        return bool(_OLEAN_OBJECT_FILE_MISSING_RE.search(text)) or any(
+            marker in lowered for marker in _LEAN_WORKSPACE_ERROR_MARKERS
+        )
+
+    @staticmethod
+    def _format_workspace_infrastructure_error(output: str) -> str:
+        detail = " ".join((output or "").split())
+        if len(detail) > 2000:
+            detail = detail[:2000] + "..."
+        return (
+            f"{_LEAN_WORKSPACE_ERROR_PREFIX}: Mathlib cache/workspace repair failed. "
+            "This is an infrastructure problem, not a proof error. "
+            "Lean reported missing or invalid compiled Mathlib artifacts. "
+            f"Original diagnostic: {detail or '[none]'}"
+        )
+
+    def _mark_workspace_unhealthy(self, output: str) -> None:
+        self._workspace_ready = False
+        self._workspace_unhealthy_error = self._format_workspace_infrastructure_error(output)
+
+    def _workspace_unavailable_result(self, *, tactic_script: bool = False) -> Lean4Result:
+        error_output = self._workspace_unhealthy_error or (
+            f"{_LEAN_WORKSPACE_ERROR_PREFIX}: Lean 4 workspace is not ready. "
+            "This is an infrastructure problem, not a proof error."
+        )
+        if tactic_script:
+            return Lean4Result(
+                success=False,
+                error_output=error_output,
+                tactic_error_slice=error_output,
+                failing_tactic_index=-1,
+            )
+        return Lean4Result(success=False, error_output=error_output)
+
+    async def _repair_workspace_after_infrastructure_error(self, output: str) -> bool:
+        """Clear the ready/unhealthy state and re-run workspace setup under the workspace lock; return whether it succeeded."""
+        logger.warning(  # log the raw diagnostic: the formatted error text would claim the repair already failed
+            "Lean 4 workspace infrastructure error detected; invalidating workspace cache and refetching Mathlib artifacts. Diagnostic: %s", " ".join((output or "").split())[:2000] or "[none]",
+        )
+        async with self._workspace_lock:
+            self._workspace_unhealthy_error = ""
+            self._workspace_ready = False
+            repaired = await self._ensure_workspace_locked()
+            if not repaired:
+                self._mark_workspace_unhealthy(output)  # record the original diagnostic for later callers
+            return repaired
+
     async def get_version(self) -> str:
         """Return the Lean 4 version string when available."""
         lean_cmd = self.lean_path or self._resolve_executable("lean")
@@ -377,6 +473,7 @@ async def _ensure_workspace_locked(self) -> bool:
                 timeout=max(system_config.lean4_proof_timeout, 120),
             )
             if update_rc != 0:
+                self._mark_workspace_unhealthy(update_stderr or update_stdout)
                 logger.warning(
                     "Lean 4 workspace update failed: %s",
                     (update_stderr or update_stdout).strip(),
@@ -401,6 +498,7 @@ async def _ensure_workspace_locked(self) -> bool:
                     timeout=max(system_config.lean4_proof_timeout, 120),
                 )
                 if update_rc != 0:
+                    self._mark_workspace_unhealthy(update_stderr or update_stdout)
                     logger.warning(
                         "Lean 4 workspace update after toolchain alignment failed: %s",
                         (update_stderr or update_stdout).strip(),
@@ -412,6 +510,7 @@ async def _ensure_workspace_locked(self) -> bool:
                 cwd=self.workspace_dir,
             )
             if cache_rc != 0:
+                self._mark_workspace_unhealthy(cache_stderr or cache_stdout)
                 logger.error(
                     "Lean 4 Mathlib cache fetch failed; proof checking would hit "
                     "'object file' errors. Details: %s",
@@ -420,6 +519,7 @@ async def _ensure_workspace_locked(self) -> bool:
                 return False
 
         self._workspace_ready = True
+        self._workspace_unhealthy_error = ""
         return True
 
     async def _fetch_mathlib_cache(
@@ -732,66 +832,78 @@ async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
 
         workspace_ready = await self.ensure_workspace()
         if not workspace_ready:
-            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+            return self._workspace_unavailable_result()
 
         temp_filename = f"MOTOProofCheck_{uuid.uuid4().hex}.lean"
-        temp_path = self.workspace_dir / temp_filename
-        try:
-            temp_path.write_text(prepared_code, encoding="utf-8")
-            returncode, stdout, stderr = await self._run_process(
-                [self.lake_path, "env", self.lean_path or self._resolve_executable("lean"), temp_filename],
-                cwd=self.workspace_dir,
+        async with self._get_lean_execution_lock():
+            workspace_ready = await self.ensure_workspace()
+            if not workspace_ready:
+                return self._workspace_unavailable_result()
+            returncode, stdout, stderr = await self._run_lean_file_once(
+                temp_filename=temp_filename,
+                prepared_code=prepared_code,
                 timeout=timeout,
             )
+            combined_output = self._combined_process_output(stdout, stderr)
+            if self._is_workspace_infrastructure_error(combined_output):
+                repaired = await self._repair_workspace_after_infrastructure_error(combined_output)
+                if repaired:
+                    returncode, stdout, stderr = await self._run_lean_file_once(
+                        temp_filename=temp_filename,
+                        prepared_code=prepared_code,
+                        timeout=timeout,
+                    )
+                    combined_output = self._combined_process_output(stdout, stderr)
+                if self._is_workspace_infrastructure_error(combined_output):
+                    self._mark_workspace_unhealthy(combined_output)
+                    return Lean4Result(
+                        success=False,
+                        error_output=self._workspace_unhealthy_error,
+                        goal_states=self._extract_goal_states(combined_output),
+                        raw_stderr=stderr.strip(),
+                    )
 
-            combined_output = "\n".join(part for part in [stdout.strip(), stderr.strip()] if part).strip()
-            goal_states = self._extract_goal_states(combined_output)
-
-            # Positive pass: Lean must exit cleanly AND the diagnostics must
-            # not contain an `error:` line AND must not contain Lean's own
-            # "declaration uses 'sorry'" warning. We treat the sorry warning
-            # as a proof-level failure so vacuous proofs cannot slip through.
-            lowered = combined_output.lower()
-            has_error_diagnostic = "error:" in lowered
-            has_sorry_warning = _output_contains_sorry_warning(combined_output)
-            lean_exited_cleanly = returncode == 0
-            positive_pass = (
-                lean_exited_cleanly
-                and not has_error_diagnostic
-                and not has_sorry_warning
-            )
+        goal_states = self._extract_goal_states(combined_output)
 
-            if positive_pass:
-                return Lean4Result(
-                    success=True,
-                    error_output="",
-                    goal_states=goal_states,
-                    raw_stderr=stderr.strip(),
-                )
+        # Positive pass: Lean must exit cleanly AND the diagnostics must
+        # not contain an `error:` line AND must not contain Lean's own
+        # "declaration uses 'sorry'" warning. We treat the sorry warning
+        # as a proof-level failure so vacuous proofs cannot slip through.
+        lowered = combined_output.lower()
+        has_error_diagnostic = "error:" in lowered
+        has_sorry_warning = _output_contains_sorry_warning(combined_output)
+        lean_exited_cleanly = returncode == 0
+        positive_pass = (
+            lean_exited_cleanly
+            and not has_error_diagnostic
+            and not has_sorry_warning
+        )
 
-            if has_sorry_warning and not has_error_diagnostic and lean_exited_cleanly:
-                rejection = _format_placeholder_rejection("sorry", from_lean_diagnostic=True)
-                detail = f"{rejection}\n\nOriginal Lean 4 diagnostics:\n{combined_output}".strip()
-                return Lean4Result(
-                    success=False,
-                    error_output=detail,
-                    goal_states=goal_states,
-                    raw_stderr=stderr.strip(),
-                )
+        if positive_pass:
+            return Lean4Result(
+                success=True,
+                error_output="",
+                goal_states=goal_states,
+                raw_stderr=stderr.strip(),
+            )
 
-            error_output = combined_output or "Lean 4 rejected the proof without additional diagnostics."
+        if has_sorry_warning and not has_error_diagnostic and lean_exited_cleanly:
+            rejection = _format_placeholder_rejection("sorry", from_lean_diagnostic=True)
+            detail = f"{rejection}\n\nOriginal Lean 4 diagnostics:\n{combined_output}".strip()
             return Lean4Result(
                 success=False,
-                error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+                error_output=detail,
                 goal_states=goal_states,
                 raw_stderr=stderr.strip(),
             )
-        finally:
-            try:
-                if temp_path.exists():
-                    temp_path.unlink()
-            except OSError:
-                logger.debug("Could not remove temporary Lean file %s", temp_path)
+
+        error_output = combined_output or "Lean 4 rejected the proof without additional diagnostics."
+        return Lean4Result(
+            success=False,
+            error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+            goal_states=goal_states,
+            raw_stderr=stderr.strip(),
+        )
 
     async def check_tactic_script(
         self,
@@ -876,72 +988,87 @@ async def _run_tactic_script_once(
 
         workspace_ready = await self.ensure_workspace()
         if not workspace_ready:
-            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+            return self._workspace_unavailable_result(tactic_script=True)
 
         temp_filename = f"MOTOProofTacticCheck_{uuid.uuid4().hex}.lean"
-        temp_path = self.workspace_dir / temp_filename
-        try:
-            temp_path.write_text(prepared_code, encoding="utf-8")
-            returncode, stdout, stderr = await self._run_process(
-                [self.lake_path, "env", self.lean_path or self._resolve_executable("lean"), temp_filename],
-                cwd=self.workspace_dir,
+        async with self._get_lean_execution_lock():
+            workspace_ready = await self.ensure_workspace()
+            if not workspace_ready:
+                return self._workspace_unavailable_result(tactic_script=True)
+            returncode, stdout, stderr = await self._run_lean_file_once(
+                temp_filename=temp_filename,
+                prepared_code=prepared_code,
                 timeout=timeout,
             )
+            combined_output = self._combined_process_output(stdout, stderr)
+            if self._is_workspace_infrastructure_error(combined_output):
+                repaired = await self._repair_workspace_after_infrastructure_error(combined_output)
+                if repaired:
+                    returncode, stdout, stderr = await self._run_lean_file_once(
+                        temp_filename=temp_filename,
+                        prepared_code=prepared_code,
+                        timeout=timeout,
+                    )
+                    combined_output = self._combined_process_output(stdout, stderr)
+                if self._is_workspace_infrastructure_error(combined_output):
+                    self._mark_workspace_unhealthy(combined_output)
+                    error_output = self._workspace_unhealthy_error
+                    return Lean4Result(
+                        success=False,
+                        error_output=error_output,
+                        goal_states=self._extract_goal_states(combined_output),
+                        raw_stderr=stderr.strip(),
+                        tactic_error_slice=error_output,
+                        failing_tactic_index=-1,
+                    )
 
-            combined_output = "\n".join(part for part in [stdout.strip(), stderr.strip()] if part).strip()
-            goal_states = self._extract_goal_states(combined_output)
-            lowered = combined_output.lower()
-            has_error_diagnostic = "error:" in lowered
-            has_sorry_warning = _output_contains_sorry_warning(combined_output)
-            lean_exited_cleanly = returncode == 0
-            positive_pass = (
-                lean_exited_cleanly
-                and not has_error_diagnostic
-                and not has_sorry_warning
-            )
-            tactic_error_slice, failing_tactic_index = self._extract_tactic_error_slice(
-                combined_output,
-                temp_filename,
-                tactic_ranges,
-            )
-
-            if positive_pass:
-                return Lean4Result(
-                    success=True,
-                    error_output="",
-                    goal_states=goal_states,
-                    raw_stderr=stderr.strip(),
-                    tactic_error_slice="",
-                    failing_tactic_index=-1,
-                )
+        goal_states = self._extract_goal_states(combined_output)
+        lowered = combined_output.lower()
+        has_error_diagnostic = "error:" in lowered
+        has_sorry_warning = _output_contains_sorry_warning(combined_output)
+        lean_exited_cleanly = returncode == 0
+        positive_pass = (
+            lean_exited_cleanly
+            and not has_error_diagnostic
+            and not has_sorry_warning
+        )
+        tactic_error_slice, failing_tactic_index = self._extract_tactic_error_slice(
+            combined_output,
+            temp_filename,
+            tactic_ranges,
+        )
 
-            if has_sorry_warning and not has_error_diagnostic and lean_exited_cleanly:
-                rejection = _format_placeholder_rejection("sorry", from_lean_diagnostic=True)
-                detail = f"{rejection}\n\nOriginal Lean 4 diagnostics:\n{combined_output}".strip()
-                return Lean4Result(
-                    success=False,
-                    error_output=detail,
-                    goal_states=goal_states,
-                    raw_stderr=stderr.strip(),
-                    tactic_error_slice=rejection,
-                    failing_tactic_index=failing_tactic_index,
-                )
+        if positive_pass:
+            return Lean4Result(
+                success=True,
+                error_output="",
+                goal_states=goal_states,
+                raw_stderr=stderr.strip(),
+                tactic_error_slice="",
+                failing_tactic_index=-1,
+            )
 
-            error_output = tactic_error_slice or combined_output or "Lean 4 rejected the tactic script without additional diagnostics."
+        if has_sorry_warning and not has_error_diagnostic and lean_exited_cleanly:
+            rejection = _format_placeholder_rejection("sorry", from_lean_diagnostic=True)
+            detail = f"{rejection}\n\nOriginal Lean 4 diagnostics:\n{combined_output}".strip()
             return Lean4Result(
                 success=False,
-                error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+                error_output=detail,
                 goal_states=goal_states,
                 raw_stderr=stderr.strip(),
-                tactic_error_slice=self._annotate_no_goals_hint(tactic_error_slice),
+                tactic_error_slice=rejection,
                 failing_tactic_index=failing_tactic_index,
             )
-        finally:
-            try:
-                if temp_path.exists():
-                    temp_path.unlink()
-            except OSError:
-                logger.debug("Could not remove temporary Lean file %s", temp_path)
+
+        error_output = tactic_error_slice or combined_output or "Lean 4 rejected the tactic script without additional diagnostics."
+        return Lean4Result(
+            success=False,
+            error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+            goal_states=goal_states,
+            raw_stderr=stderr.strip(),
+            tactic_error_slice=self._annotate_no_goals_hint(tactic_error_slice),
+            failing_tactic_index=failing_tactic_index,
+        )
 
 
 class Lean4LspClient(Lean4Client):
@@ -1451,7 +1578,7 @@ async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
 
         workspace_ready = await self.ensure_workspace()
         if not workspace_ready:
-            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+            return self._workspace_unavailable_result()
 
         if not self._lsp_healthy:
             return await self._subprocess_fallback.check_proof(lean_code, timeout=timeout)
@@ -1464,6 +1591,9 @@ async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
                     temp_filename=f"MOTOProofCheck_{uuid.uuid4().hex}.lean",
                     timeout=timeout,
                 )
+                if self._is_workspace_infrastructure_error(result.error_output):
+                    await self._mark_unhealthy(result.error_output)
+                    return await self._subprocess_fallback.check_proof(lean_code, timeout=timeout)
                 return result
             except Exception as exc:
                 await self._mark_unhealthy(str(exc))
@@ -1554,7 +1684,7 @@ async def _run_tactic_script_via_lsp_once(
 
         workspace_ready = await self.ensure_workspace()
         if not workspace_ready:
-            return Lean4Result(success=False, error_output="Lean 4 workspace is not ready.")
+            return self._workspace_unavailable_result(tactic_script=True)
 
         if not self._lsp_healthy:
             return await self._subprocess_fallback._run_tactic_script_once(
@@ -1572,6 +1702,13 @@ async def _run_tactic_script_via_lsp_once(
                     timeout=timeout,
                     tactic_ranges=tactic_ranges,
                 )
+                if self._is_workspace_infrastructure_error(result.error_output):
+                    await self._mark_unhealthy(result.error_output)
+                    return await self._subprocess_fallback._run_tactic_script_once(
+                        theorem_header=theorem_header,
+                        tactic_list=tactic_list,
+                        timeout=timeout,
+                    )
                 return result
             except Exception as exc:
                 await self._mark_unhealthy(str(exc))
diff --git a/backend/shared/models.py b/backend/shared/models.py
index 9c10e22..9401a38 100644
--- a/backend/shared/models.py
+++ b/backend/shared/models.py
@@ -485,6 +485,7 @@ class SmtHint(BaseModel):
     result: Literal["sat", "unsat", "unknown"] = "unknown"
     suggested_tactics: List[str] = Field(default_factory=list)
     smtlib: str = ""
+    z3_output: str = ""
 
 
 class ProofCandidate(BaseModel):
diff --git a/backend/shared/openrouter_client.py b/backend/shared/openrouter_client.py
index 50b9c39..6533957 100644
--- a/backend/shared/openrouter_client.py
+++ b/backend/shared/openrouter_client.py
@@ -6,6 +6,7 @@
 """
 import httpx
 import asyncio
+import json
 import logging
 import time
 from typing import List, Dict, Any, Optional
@@ -484,7 +485,35 @@ async def _execute_completion_request(
                     )
                 
                 response.raise_for_status()
-                return response.json()
+                try:
+                    return response.json()
+                except (json.JSONDecodeError, ValueError) as json_err:
+                    # OpenRouter returned 2xx but body is not valid JSON.
+                    # This is typically a gateway/CDN error page, truncated stream,
+                    # or other transport-level failure — NOT a context-size problem.
+                    body_text = ""
+                    try:
+                        body_text = response.text or ""
+                    except Exception:
+                        body_text = ""
+                    body_preview = body_text[:500]
+                    content_type = response.headers.get("content-type", "") if hasattr(response, "headers") else ""
+                    logger.error(
+                        f"OpenRouter returned non-JSON body (status={response.status_code}, "
+                        f"content_type={content_type!r}, body_len={len(body_text)}, "
+                        f"parse_error={json_err}). Body preview: {body_preview!r}"
+                    )
+                    # Retry on transient malformed responses (delay grows linearly with the attempt number)
+                    if attempt < self.MAX_RETRIES - 1:
+                        await asyncio.sleep(self.RETRY_DELAY * (attempt + 1))
+                        continue
+                    raise OpenRouterInvalidResponseError(
+                        f"OpenRouter returned non-JSON body after {self.MAX_RETRIES} attempts "
+                        f"(status={response.status_code}, content_type={content_type!r}): {json_err}",
+                        status_code=response.status_code,
+                        content_type=content_type,
+                        body_preview=body_preview,
+                    ) from json_err  # chain explicitly so the decode failure is reported as the direct cause
                 
             except CreditExhaustionError:
                 # Don't retry credit exhaustion - propagate immediately
@@ -493,6 +522,11 @@ async def _execute_completion_request(
             except OpenRouterPrivacyPolicyError:
                 # Don't retry privacy policy errors - propagate immediately
                 raise
+
+            except OpenRouterInvalidResponseError:
+                # Already handled/retried above; propagate cleanly so callers can
+                # distinguish transport failures from real context overflows.
+                raise
                 
             except httpx.HTTPStatusError as e:
                 error_detail = e.response.text if hasattr(e.response, 'text') else str(e)
@@ -638,7 +672,28 @@ async def get_embeddings(self, texts: List[str], model: str = None) -> List[List
                 raise CreditExhaustionError("OpenRouter credits exhausted for embeddings")
             
             response.raise_for_status()
-            data = response.json()
+            try:
+                data = response.json()
+            except (json.JSONDecodeError, ValueError) as json_err:  # status check passed, yet the body is not JSON
+                body_text = ""
+                try:
+                    body_text = response.text or ""
+                except Exception:
+                    body_text = ""
+                body_preview = body_text[:500]
+                content_type = response.headers.get("content-type", "") if hasattr(response, "headers") else ""
+                logger.error(
+                    f"OpenRouter embeddings returned non-JSON body (status={response.status_code}, "
+                    f"content_type={content_type!r}, body_len={len(body_text)}, "
+                    f"parse_error={json_err}). Body preview: {body_preview!r}"
+                )
+                raise OpenRouterInvalidResponseError(
+                    f"OpenRouter embeddings returned non-JSON body "
+                    f"(status={response.status_code}, content_type={content_type!r}): {json_err}",
+                    status_code=response.status_code,
+                    content_type=content_type,
+                    body_preview=body_preview,
+                ) from json_err  # chain explicitly so the decode failure is reported as the direct cause
             
             # Extract embeddings in order
             embeddings = [
@@ -751,6 +806,30 @@ async def close(self):
             logger.error(f"Error closing OpenRouter client: {e}")
 
 
+class OpenRouterInvalidResponseError(ValueError):
+    """
+    Raised when OpenRouter returns a non-JSON (or otherwise malformed) response body
+    on a 2xx status. This typically indicates an upstream proxy/CDN error page,
+    a truncated stream, or a transient gateway failure rather than a real
+    context-window / prompt-size problem.
+
+    Inherits from ValueError so that existing ``except ValueError`` handlers in
+    the submitter chain continue to propagate transport failures correctly
+    (rather than accidentally swallowing them via a broad ``except Exception:
+    return None`` further up the call stack).
+
+    Attributes:
+        status_code: HTTP status code returned by OpenRouter
+        content_type: Content-Type header (if any)
+        body_preview: First ~500 chars of the response body, for diagnostics
+    """
+    def __init__(self, message: str, status_code: int, content_type: str, body_preview: str):
+        super().__init__(message)
+        self.status_code = status_code
+        self.content_type = content_type
+        self.body_preview = body_preview
+
+
 class CreditExhaustionError(Exception):
     """Raised when OpenRouter credits are exhausted."""
     pass
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index e9a22f6..a61a21c 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -16,7 +16,8 @@ import {
   AutonomousResearchLogs,
   FinalAnswerView,
   FinalAnswerLibrary,
-  MathematicalProofs
+  MathematicalProofs,
+  ProofLibrary
 } from './components/autonomous';
 import WorkflowPanel from './components/WorkflowPanel';
 import BoostControlModal from './components/BoostControlModal';
@@ -44,6 +45,7 @@ import {
 const APP_MODE_STORAGE_KEY = 'appMode';
 const AUTONOMOUS_TAB_STORAGE_KEY = 'autonomousActiveTab';
 const MANUAL_TAB_STORAGE_KEY = 'manualActiveTab';
+const COMPLETED_WORKS_SUB_TAB_STORAGE_KEY = 'completedWorksSubTab';
 const LEGACY_SINGLE_PAPER_WRITER_STORAGE_KEY = 'singlePaperWriterExpanded';
 const EMBEDDING_MODEL_HINTS = ['embed', 'embedding', 'nomic', 'bge', 'e5', 'gte'];
 const AUTONOMOUS_ROLE_PREFIXES = ['validator', 'high_context', 'high_param', 'critique_submitter'];
@@ -170,8 +172,22 @@ function App() {
       return 'autonomous';
     }
   });
-  const [autonomousActiveTab, setAutonomousActiveTab] = useState('auto-interface');
+  const [autonomousActiveTab, setAutonomousActiveTab] = useState(() => {
+    const saved = localStorage.getItem(AUTONOMOUS_TAB_STORAGE_KEY);
+    if (saved === 'auto-stage2-history' || saved === 'auto-final-answer-library') {
+      return 'auto-completed-works';
+    }
+    return saved || 'auto-interface';
+  });
   const [manualActiveTab, setManualActiveTab] = useState('aggregator-interface');
+  const [completedWorksSubTab, setCompletedWorksSubTab] = useState(() => {
+    // Restore only a sub-tab id that is actually rendered; an unknown stored value would leave the pane empty.
+    const savedSubTab = localStorage.getItem(COMPLETED_WORKS_SUB_TAB_STORAGE_KEY);
+    if (['stage2-history', 'stage3-history', 'proof-library'].includes(savedSubTab)) return savedSubTab;
+    // Otherwise migrate from the legacy top-level tab ids; anything else falls back to the Stage 2 history.
+    const savedTab = localStorage.getItem(AUTONOMOUS_TAB_STORAGE_KEY);
+    return savedTab === 'auto-final-answer-library' ? 'stage3-history' : 'stage2-history';
+  });
   const activeTab = appMode === 'manual' ? manualActiveTab : autonomousActiveTab;
   const shimmerAccentsEnabled = (() => {
     const saved = localStorage.getItem('banner_shimmer_enabled');
@@ -236,6 +252,10 @@ function App() {
   useEffect(() => {
     localStorage.setItem(MANUAL_TAB_STORAGE_KEY, manualActiveTab);
   }, [manualActiveTab]);
+
+  useEffect(() => {
+    localStorage.setItem(COMPLETED_WORKS_SUB_TAB_STORAGE_KEY, completedWorksSubTab);
+  }, [completedWorksSubTab]);
   
   // Initialize config from localStorage or use defaults
   // CRITICAL: Read from 'aggregator_settings' (used by AggregatorSettings component)
@@ -1975,8 +1995,7 @@ function App() {
   ];
 
   const autonomousSettingsTabs = [
-    { id: 'auto-stage2-history', label: 'Stage 2 Final Answers History', group: 'autonomous-settings' },
-    { id: 'auto-final-answer-library', label: 'Stage 3 Final Answers History', subtext: '(In Development / Highly Hallucinatory)', group: 'autonomous-settings' },
+    { id: 'auto-completed-works', label: 'Your Completed Works Library', group: 'autonomous-settings' },
     { id: 'auto-logs', label: 'API Call Logs', group: 'autonomous-settings' },
     { id: 'auto-settings', label: 'Autonomous Model Selection & Settings', group: 'autonomous-settings' },
   ];
@@ -2314,15 +2333,50 @@ function App() {
               status={autonomousStatus}
             />
           )}
-          {activeTab === 'auto-stage2-history' && (
-            <Stage2PaperHistory
-              onCurrentSessionDataChanged={async () => {
-                await Promise.all([refreshPapers(), refreshBrainstorms()]);
-              }}
-            />
-          )}
-          {activeTab === 'auto-final-answer-library' && (
-            <FinalAnswerLibrary />
+          {activeTab === 'auto-completed-works' && (
+            <div className="completed-works-library">
+              <div className="completed-works-header">
+                <h2 className="completed-works-title">Your Completed Works Library</h2>
+                <p className="completed-works-subtitle">
+                  Browse all research outputs across every session — papers, final answers, and verified proofs.
+                </p>
+              </div>
+              <div className="completed-works-sub-tabs">
+                <button
+                  className={`completed-works-sub-tab ${completedWorksSubTab === 'stage2-history' ? 'active' : ''}`}
+                  onClick={() => setCompletedWorksSubTab('stage2-history')}
+                >
+                  Stage 2 Papers History
+                </button>
+                <button
+                  className={`completed-works-sub-tab ${completedWorksSubTab === 'stage3-history' ? 'active' : ''}`}
+                  onClick={() => setCompletedWorksSubTab('stage3-history')}
+                >
+                  Stage 3 Final Answers History
+                </button>
+                <button
+                  className={`completed-works-sub-tab ${completedWorksSubTab === 'proof-library' ? 'active' : ''}`}
+                  onClick={() => setCompletedWorksSubTab('proof-library')}
+                >
+                  Proof Library
+                </button>
+              </div>
+              <div className="completed-works-content">
+                {completedWorksSubTab === 'stage2-history' && (
+                  <Stage2PaperHistory
+                    onCurrentSessionDataChanged={async () => {
+                      await Promise.all([refreshPapers(), refreshBrainstorms()]);
+                    }}
+                  />
+                )}
+                {completedWorksSubTab === 'stage3-history' && (
+                  <FinalAnswerLibrary />
+                )}
+                {completedWorksSubTab === 'proof-library' && (
+                  <ProofLibrary />
+                )}
+              </div>
+            </div>
           )}
           {activeTab === 'auto-logs' && (
             <AutonomousResearchLogs
diff --git a/frontend/src/components/BoostControlModal.jsx b/frontend/src/components/BoostControlModal.jsx
index 6d0998b..7aafed3 100644
--- a/frontend/src/components/BoostControlModal.jsx
+++ b/frontend/src/components/BoostControlModal.jsx
@@ -98,11 +98,23 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
   const getAutoSettingsForModel = async (modelId, selectedProvider = null, keyOverride = undefined) => {
     const model = findOpenRouterModel(models, modelId);
     if (!model) {
+      console.debug('[BoostAutoFill] model not in loaded models list, skipping auto-fill', { modelId });
       return null;
     }
 
     const nextProviderData = await fetchProviders(modelId, keyOverride);
-    return computeOpenRouterAutoSettings(model, nextProviderData, selectedProvider);
+    const autoSettings = computeOpenRouterAutoSettings(model, nextProviderData, selectedProvider);
+    if (autoSettings) {
+      console.debug('[BoostAutoFill] computed auto-settings', {
+        modelId,
+        selectedProvider,
+        source: autoSettings.source,
+        contextWindow: autoSettings.contextWindow,
+        maxOutputTokens: autoSettings.maxOutputTokens,
+        warnings: autoSettings.warnings,
+      });
+    }
+    return autoSettings;
   };
 
   const fetchBoostStatus = async (keyOverride = undefined) => {
@@ -152,8 +164,15 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
     if (modelId) {
       const autoSettings = await getAutoSettingsForModel(modelId, null);
       if (autoSettings) {
-        setContextWindow(autoSettings.contextWindow);
-        setMaxOutputTokens(autoSettings.maxOutputTokens);
+        if (autoSettings.contextWindowKnown) {
+          setContextWindow(autoSettings.contextWindow);
+        }
+        if (autoSettings.outputCapKnown) {
+          setMaxOutputTokens(autoSettings.maxOutputTokens);
+        }
+        if (autoSettings.warnings && autoSettings.warnings.length > 0) {
+          console.warn('[BoostAutoFill] auto-settings fallback used:', autoSettings.warnings);
+        }
       }
     } else {
       setProviderData(null);
@@ -456,8 +475,12 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
                   setSelectedProvider(providerName);
                   const autoSettings = await getAutoSettingsForModel(boostModel, providerName || null);
                   if (autoSettings) {
-                    setContextWindow(autoSettings.contextWindow);
-                    setMaxOutputTokens(autoSettings.maxOutputTokens);
+                    if (autoSettings.contextWindowKnown) {
+                      setContextWindow(autoSettings.contextWindow);
+                    }
+                    if (autoSettings.outputCapKnown) {
+                      setMaxOutputTokens(autoSettings.maxOutputTokens);
+                    }
                   }
                 }}
                 disabled={loading || loadingProviders}
@@ -487,9 +510,14 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
               <input
                 type="number"
                 value={contextWindow}
-                onChange={(e) => setContextWindow(parseInt(e.target.value) || 131072)}
+                onChange={(e) => {
+                  const parsed = parseInt(e.target.value, 10);
+                  if (Number.isFinite(parsed) && parsed > 0) {
+                    setContextWindow(parsed);
+                  }
+                }}
                 min="4096"
-                max="999999"
+                max="50000000"
                 step="1024"
                 disabled={loading}
               />
@@ -500,9 +528,14 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
               <input
                 type="number"
                 value={maxOutputTokens}
-                onChange={(e) => setMaxOutputTokens(parseInt(e.target.value) || 25000)}
+                onChange={(e) => {
+                  const parsed = parseInt(e.target.value, 10);
+                  if (Number.isFinite(parsed) && parsed > 0) {
+                    setMaxOutputTokens(parsed);
+                  }
+                }}
                 min="1000"
-                max="100000"
+                max="50000000"
                 step="1000"
                 disabled={loading}
               />
diff --git a/frontend/src/components/aggregator/AggregatorSettings.jsx b/frontend/src/components/aggregator/AggregatorSettings.jsx
index 46d0cf9..a90b700 100644
--- a/frontend/src/components/aggregator/AggregatorSettings.jsx
+++ b/frontend/src/components/aggregator/AggregatorSettings.jsx
@@ -232,11 +232,26 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
   const getAutoSettingsForModel = async (modelId, selectedProvider = null) => {
     const model = findOpenRouterModel(openRouterModels, modelId);
     if (!model) {
+      console.debug('[AggregatorAutoFill] model not in loaded list, skipping auto-fill', { modelId });
       return null;
     }
 
     const providerData = await fetchProvidersForModel(modelId);
-    return computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+    const autoSettings = computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+    if (autoSettings) {
+      console.debug('[AggregatorAutoFill] computed auto-settings', {
+        modelId,
+        selectedProvider,
+        source: autoSettings.source,
+        contextWindow: autoSettings.contextWindow,
+        maxOutputTokens: autoSettings.maxOutputTokens,
+        warnings: autoSettings.warnings,
+      });
+      if (autoSettings.warnings && autoSettings.warnings.length > 0) {
+        console.warn('[AggregatorAutoFill] auto-settings fallback used:', autoSettings.warnings);
+      }
+    }
+    return autoSettings;
   };
 
   const handleSubmitterModelChange = async (submitterId, modelId) => {
@@ -262,8 +277,8 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       c.submitterId === submitterId
         ? {
             ...c,
-            contextWindow: autoSettings.contextWindow,
-            maxOutputTokens: autoSettings.maxOutputTokens,
+            ...(autoSettings.contextWindowKnown ? { contextWindow: autoSettings.contextWindow } : {}),
+            ...(autoSettings.outputCapKnown ? { maxOutputTokens: autoSettings.maxOutputTokens } : {}),
           }
         : c
     );
@@ -294,8 +309,8 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       c.submitterId === submitterId
         ? {
             ...c,
-            contextWindow: autoSettings.contextWindow,
-            maxOutputTokens: autoSettings.maxOutputTokens,
+            ...(autoSettings.contextWindowKnown ? { contextWindow: autoSettings.contextWindow } : {}),
+            ...(autoSettings.outputCapKnown ? { maxOutputTokens: autoSettings.maxOutputTokens } : {}),
           }
         : c
     );
@@ -320,13 +335,15 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       return;
     }
 
-    setValidatorMaxOutput(autoSettings.maxOutputTokens);
+    if (autoSettings.outputCapKnown) {
+      setValidatorMaxOutput(autoSettings.maxOutputTokens);
+    }
     setConfig(prev => ({
       ...prev,
       validatorModel: modelId,
       validatorOpenrouterProvider: null,
-      validatorContextSize: autoSettings.contextWindow,
-      validatorMaxOutput: autoSettings.maxOutputTokens,
+      ...(autoSettings.contextWindowKnown ? { validatorContextSize: autoSettings.contextWindow } : {}),
+      ...(autoSettings.outputCapKnown ? { validatorMaxOutput: autoSettings.maxOutputTokens } : {}),
     }));
   };
 
@@ -346,12 +363,14 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       return;
     }
 
-    setValidatorMaxOutput(autoSettings.maxOutputTokens);
+    if (autoSettings.outputCapKnown) {
+      setValidatorMaxOutput(autoSettings.maxOutputTokens);
+    }
     setConfig(prev => ({
       ...prev,
       validatorOpenrouterProvider: providerName,
-      validatorContextSize: autoSettings.contextWindow,
-      validatorMaxOutput: autoSettings.maxOutputTokens,
+      ...(autoSettings.contextWindowKnown ? { validatorContextSize: autoSettings.contextWindow } : {}),
+      ...(autoSettings.outputCapKnown ? { validatorMaxOutput: autoSettings.maxOutputTokens } : {}),
     }));
   };
 
@@ -700,7 +719,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                       value={cfg.contextWindow}
                       onChange={(e) => updateSubmitterConfig(cfg.submitterId, 'contextWindow', parseInt(e.target.value))}
                       min="4096"
-                      max="999999"
+                      max="50000000"
                       step="1024"
                       className="input--sm"
                     />
@@ -713,7 +732,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                       value={cfg.maxOutputTokens}
                       onChange={(e) => updateSubmitterConfig(cfg.submitterId, 'maxOutputTokens', parseInt(e.target.value))}
                       min="1000"
-                      max="100000"
+                      max="50000000"
                       step="1000"
                       className="input--sm"
                     />
@@ -760,7 +779,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                   setConfig({ ...config, validatorContextSize: isNaN(parsed) ? 131072 : parsed });
                 }}
                 min="4096"
-                max="999999"
+                max="50000000"
                 step="1024"
               />
               <small className="hint-text">
@@ -792,7 +811,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                   setConfig({ ...config, validatorMaxOutput: value });
                 }}
                 min="1000"
-                max="100000"
+                max="50000000"
                 step="1000"
               />
             </div>
diff --git a/frontend/src/components/autonomous/AutonomousResearch.css b/frontend/src/components/autonomous/AutonomousResearch.css
index 061002a..c9ad866 100644
--- a/frontend/src/components/autonomous/AutonomousResearch.css
+++ b/frontend/src/components/autonomous/AutonomousResearch.css
@@ -1013,6 +1013,65 @@
   font-style: italic;
 }
 
+/* Open Source tag */
+.model-item--os {
+  position: relative;
+}
+
+.os-tag {
+  position: absolute; /* corner-pinned when used alone; reset to static inside .os-tag-tooltip-anchor */
+  top: 0.35rem;
+  right: 0.35rem;
+  background: linear-gradient(135deg, #6366f1, #4f46e5);
+  color: #fff;
+  font-size: 0.58rem;
+  font-weight: 700;
+  letter-spacing: 0.05em;
+  padding: 0.15rem 0.35rem;
+  border-radius: 3px;
+  line-height: 1;
+  user-select: none;
+  cursor: default;
+  z-index: 2;
+  box-shadow: 0 1px 4px rgba(79, 70, 229, 0.45);
+  transition: opacity 0.15s; /* NOTE(review): no rule in this hunk changes opacity - confirm this is still needed */
+}
+
+.os-tag-tooltip-anchor {
+  position: absolute;
+  top: 0.35rem;
+  right: 0.35rem;
+  z-index: 2;
+  display: inline-block;
+}
+
+.os-tag-tooltip-anchor .os-tag {
+  position: static;
+}
+
+.os-tag-tooltip {
+  display: none;
+  position: absolute;
+  top: calc(100% + 6px);
+  right: 0;
+  min-width: 210px;
+  background: #1a1a2e;
+  border: 1px solid rgba(99, 102, 241, 0.5);
+  border-radius: 6px;
+  padding: 0.55rem 0.75rem;
+  color: #c4c4ff;
+  font-size: 0.72rem;
+  line-height: 1.45;
+  box-shadow: 0 6px 18px rgba(0, 0, 0, 0.5);
+  pointer-events: none;
+  z-index: 200;
+  white-space: normal;
+}
+
+.os-tag-tooltip-anchor:hover .os-tag-tooltip {
+  display: block;
+}
+
 /* Main settings content area */
 .autonomous-settings {
   flex: 1;
@@ -1044,7 +1103,7 @@
 
 .settings-group {
   background: var(--bg-secondary, #1e1e1e);
-  border: 1px solid #18cc17;
+  border: 1px solid #2a2a2a;
   border-radius: 8px;
   padding: 1rem;
   width: 100%;
@@ -1165,7 +1224,7 @@
 /* Per-submitter config section */
 .submitter-config-section {
   background: var(--bg-tertiary, #252525);
-  border: 1px solid #18cc17;
+  border: 1px solid #2a2a2a;
   border-radius: 6px;
   padding: 1rem;
   margin-bottom: 1rem;
diff --git a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
index 81b72ed..1dcbb38 100644
--- a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
@@ -34,6 +34,15 @@ const DEFAULT_SUBMITTER_CONFIG = {
   maxOutputTokens: 25000
 };
 
+const OsTag = () => ( // "OS" badge for open-source models; the tooltip span is shown on hover by the .os-tag-tooltip-anchor:hover CSS rule
+  <span className="os-tag-tooltip-anchor">
+    <span className="os-tag">OS</span>
+    <span className="os-tag-tooltip">
+      Open source — weights available on Hugging Face for local use with LM Studio.
+    </span>
+  </span>
+);
+
 // ModelSelector component - extracted outside to prevent recreation on every render
 const ModelSelector = ({
   provider,
@@ -214,7 +223,7 @@ const RoleConfig = ({
           onBlur={(e) => handleNumericBlur(`${rolePrefix}_context_window`, e.target.value)}
           disabled={isRunning}
           min={4096}
-          max={999999}
+          max={50000000}
           step={1024}
         />
       </div>
@@ -228,7 +237,7 @@ const RoleConfig = ({
           onBlur={(e) => handleNumericBlur(`${rolePrefix}_max_tokens`, e.target.value)}
           disabled={isRunning}
           min={1000}
-          max={100000}
+          max={50000000}
           step={1000}
         />
       </div>
@@ -719,11 +728,26 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   const getAutoSettingsForModel = async (modelId, selectedProvider = null) => {
     const model = findOpenRouterModel(openRouterModels, modelId);
     if (!model) {
+      console.debug('[AutonomousAutoFill] model not in loaded list, skipping auto-fill', { modelId });
       return null;
     }
 
     const providerData = await fetchProvidersForModel(modelId);
-    return computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+    const autoSettings = computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+    if (autoSettings) {
+      console.debug('[AutonomousAutoFill] computed auto-settings', {
+        modelId,
+        selectedProvider,
+        source: autoSettings.source,
+        contextWindow: autoSettings.contextWindow,
+        maxOutputTokens: autoSettings.maxOutputTokens,
+        warnings: autoSettings.warnings,
+      });
+      if (autoSettings.warnings && autoSettings.warnings.length > 0) {
+        console.warn('[AutonomousAutoFill] auto-settings fallback used:', autoSettings.warnings);
+      }
+    }
+    return autoSettings;
   };
 
   const markProfileAsCustom = () => {
@@ -813,8 +837,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
     const autofilledConfig = {
       ...newConfig,
-      [`${rolePrefix}_context_window`]: autoSettings.contextWindow,
-      [`${rolePrefix}_max_tokens`]: autoSettings.maxOutputTokens,
+      ...(autoSettings.contextWindowKnown ? { [`${rolePrefix}_context_window`]: autoSettings.contextWindow } : {}),
+      ...(autoSettings.outputCapKnown ? { [`${rolePrefix}_max_tokens`]: autoSettings.maxOutputTokens } : {}),
     };
     setLocalConfig(autofilledConfig);
     onConfigChange({ ...autofilledConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
@@ -841,8 +865,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
     const autofilledConfig = {
       ...newConfig,
-      [`${rolePrefix}_context_window`]: autoSettings.contextWindow,
-      [`${rolePrefix}_max_tokens`]: autoSettings.maxOutputTokens,
+      ...(autoSettings.contextWindowKnown ? { [`${rolePrefix}_context_window`]: autoSettings.contextWindow } : {}),
+      ...(autoSettings.outputCapKnown ? { [`${rolePrefix}_max_tokens`]: autoSettings.maxOutputTokens } : {}),
     };
     setLocalConfig(autofilledConfig);
     onConfigChange({ ...autofilledConfig, submitter_configs: submitterConfigs.slice(0, numSubmitters) });
@@ -949,8 +973,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     const autofilledConfigs = [...newConfigs];
     autofilledConfigs[index] = {
       ...autofilledConfigs[index],
-      contextWindow: autoSettings.contextWindow,
-      maxOutputTokens: autoSettings.maxOutputTokens,
+      ...(autoSettings.contextWindowKnown ? { contextWindow: autoSettings.contextWindow } : {}),
+      ...(autoSettings.outputCapKnown ? { maxOutputTokens: autoSettings.maxOutputTokens } : {}),
     };
 
     setSubmitterConfigs(autofilledConfigs);
@@ -981,8 +1005,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     const autofilledConfigs = [...newConfigs];
     autofilledConfigs[index] = {
       ...autofilledConfigs[index],
-      contextWindow: autoSettings.contextWindow,
-      maxOutputTokens: autoSettings.maxOutputTokens,
+      ...(autoSettings.contextWindowKnown ? { contextWindow: autoSettings.contextWindow } : {}),
+      ...(autoSettings.outputCapKnown ? { maxOutputTokens: autoSettings.maxOutputTokens } : {}),
     };
 
     setSubmitterConfigs(autofilledConfigs);
@@ -1271,7 +1295,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             {/* Podium - Top 3 */}
             <div className="models-podium">
               <div className="models-podium-label">Leaderboard</div>
-              <div className="model-item model-item--ranked model-item--gold">
+              <div className="model-item model-item--ranked model-item--gold model-item--os">
+                <OsTag />
                 <div className="flex-row-center">
                   <div className="model-item-name">Kimi K2.6</div>
                   <div className="ranking-badge ranking-badge--gold">👑 KING OF THE HILL</div>
@@ -1308,7 +1333,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 <div className="model-item-badge">Fast validator</div>
               </div>
 
-              <div className="model-item model-item--ranked model-item--bronze">
+              <div className="model-item model-item--ranked model-item--bronze model-item--os">
+                <OsTag />
                 <div className="flex-row-center">
                   <div className="model-item-name">GPT OSS 120B</div>
                   <div className="ranking-badge ranking-badge--bronze">🥉 BRONZE</div>
@@ -1334,7 +1360,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">DeepSeek</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
@@ -1349,17 +1376,20 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">Google's Gemma</div>
               <div className="model-item-badge">Balanced knowledge and speed</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">GLM</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">GLM Turbo</div>
               <div className="model-item-badge">Fast validator</div>
             </div>
@@ -1369,7 +1399,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="model-item-badge">Computer science</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">OpenAI's GPT OSS</div>
               <div className="model-item-badge">Balanced knowledge and speed</div>
             </div>
@@ -1389,12 +1420,14 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="model-item-badge">Rapid knowledge</div>
             </div>
 
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">Nemotron Super</div>
               <div className="model-item-badge">Balanced knowledge and speed</div>
             </div>
 
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">Nous Hermes</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
@@ -1404,7 +1437,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="model-item-badge">Native internet search capability</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">Microsoft's Phi</div>
               <div className="model-item-badge">Balanced knowledge and speed</div>
             </div>
@@ -1414,12 +1448,14 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">Qwen Coder</div>
               <div className="model-item-badge">Computer science</div>
             </div>
             
-            <div className="model-item">
+            <div className="model-item model-item--os">
+              <OsTag />
               <div className="model-item-name">Qwen</div>
               <div className="model-item-badge">Highly knowledgeable</div>
             </div>
@@ -1696,7 +1732,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 onBlur={(e) => handleSubmitterNumericBlur(idx, 'contextWindow', e.target.value)}
                 disabled={isRunning}
                 min={4096}
-                max={999999}
+                max={50000000}
                 step={1024}
               />
             </div>
@@ -1710,7 +1746,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 onBlur={(e) => handleSubmitterNumericBlur(idx, 'maxOutputTokens', e.target.value)}
                 disabled={isRunning}
                 min={1000}
-                max={100000}
+                max={50000000}
                 step={1000}
               />
             </div>
@@ -1776,7 +1812,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           title="High-Parameter Submitter"
           hint="Handles mathematical rigor enhancement."
           rolePrefix="high_param"
-          borderColor="#1eff1c"
+          borderColor="#2a2a2a"
           localConfig={localConfig}
           handleProviderChange={handleProviderChange}
           handleModelChange={handleModelChange}
@@ -1858,9 +1894,9 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                   <div className="settings-row">
                     <label>Lean 4 Status</label>
                     <div>
-                      <strong>{proofStatus?.lean4_enabled ? 'Enabled' : 'Disabled'}</strong>
+                      <strong>{proofStatus ? (proofStatus.lean4_enabled ? 'Enabled' : 'Disabled') : 'Starting…'}</strong>
                       <small className="settings-hint" style={{ display: 'block', marginTop: '0.35rem' }}>
-                        Workspace: {proofStatus?.workspace_ready ? 'Ready' : 'Not ready yet'}
+                        Workspace: {proofStatus ? (proofStatus.workspace_ready ? 'Ready' : 'Not ready yet') : 'Starting…'}
                       </small>
                     </div>
                   </div>
diff --git a/frontend/src/components/autonomous/MathematicalProofs.jsx b/frontend/src/components/autonomous/MathematicalProofs.jsx
index b77cddc..0b6fedc 100644
--- a/frontend/src/components/autonomous/MathematicalProofs.jsx
+++ b/frontend/src/components/autonomous/MathematicalProofs.jsx
@@ -21,10 +21,13 @@ function truncate(text, maxLength = 220) {
 }
 
 function getLeanStatusLabel(status) {
-  if (!status?.lean4_enabled) {
+  if (!status) {
+    return 'Lean 4 Starting';
+  }
+  if (!status.lean4_enabled) {
     return 'Lean 4 Disabled';
   }
-  if (status?.lsp_active) {
+  if (status.lsp_active) {
     return status.workspace_ready ? 'Lean 4 Ready (LSP)' : 'Lean 4 LSP Starting';
   }
   if (status.workspace_ready) {
@@ -363,7 +366,7 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
         </div>
 
         <div className="math-proofs-status-group">
-          <span className={`math-proofs-status ${proofStatus?.workspace_ready ? 'ready' : 'pending'} ${proofStatus?.lean4_enabled ? '' : 'disabled'}`}>
+          <span className={`math-proofs-status ${proofStatus?.workspace_ready ? 'ready' : 'pending'} ${proofStatus && !proofStatus.lean4_enabled ? 'disabled' : ''}`}>
             {getLeanStatusLabel(proofStatus)}
           </span>
           <span className="math-proofs-count">
@@ -490,11 +493,14 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
 
       {!loading && !error && visibleProofs.length > 0 && viewMode === 'graph' && (
         <>
-          {!proofStatus?.lean4_enabled && (
+          {proofStatus && !proofStatus.lean4_enabled && (
             <div className="math-proofs-empty">
               Graph view is unavailable while Lean 4 proof support is disabled.
             </div>
           )}
+          {!proofStatus && (
+            <div className="math-proofs-empty">Loading proof runtime status…</div>
+          )}
           {proofStatus?.lean4_enabled && proofGraphState.loading && (
             <div className="math-proofs-empty">Loading proof dependency graph...</div>
           )}
diff --git a/frontend/src/components/autonomous/ProofLibrary.css b/frontend/src/components/autonomous/ProofLibrary.css
new file mode 100644
index 0000000..7c9d881
--- /dev/null
+++ b/frontend/src/components/autonomous/ProofLibrary.css
@@ -0,0 +1,135 @@
+/* ProofLibrary.css - Proof-specific overrides for the FinalAnswerLibrary layout */
+
+.proof-library .library-header h2 {
+  color: #1eff1c;
+}
+
+.proof-card--novel {
+  border-left: 3px solid #1eff1c;
+}
+
+.proof-card--known {
+  border-left: 3px solid #666;
+}
+
+.proof-badge--novel {
+  background: linear-gradient(135deg, #1eff1c 0%, #7dff6f 100%);
+  color: #000;
+}
+
+.proof-badge--known {
+  background: #555;
+  color: #ccc;
+}
+
+.proof-title {
+  font-family: 'Courier New', monospace;
+  letter-spacing: 0.02em;
+}
+
+.proof-statement {
+  color: #b9b9c6;
+  font-size: 0.92rem;
+  line-height: 1.55;
+  margin-bottom: 8px;
+  font-style: italic;
+}
+
+/* Expanded proof details */
+.proof-expanded-content {
+  display: flex;
+  flex-direction: column;
+  gap: 18px;
+}
+
+.proof-detail-section h4 {
+  color: #1eff1c;
+  font-size: 0.95rem;
+  margin: 0 0 8px 0;
+  text-transform: uppercase;
+  letter-spacing: 0.05em;
+}
+
+.proof-detail-section p {
+  color: #ccc;
+  font-size: 0.93rem;
+  line-height: 1.6;
+  margin: 0;
+}
+
+/* Monospace panel: long lines wrap, and content taller than 500px scrolls inside the box. */
+.proof-code-block {
+  margin: 0;
+  padding: 14px 16px;
+  max-height: 500px;
+  overflow: auto;
+  background: #0d0d0d;
+  border: 1px solid #333;
+  border-radius: 6px;
+  color: #e0e0e0;
+  font-family: 'Courier New', monospace;
+  font-size: 0.88rem;
+  line-height: 1.6;
+  white-space: pre-wrap;
+  overflow-wrap: break-word;
+}
+
+.proof-lean-code {
+  color: #7dff6f;
+}
+
+.proof-dependencies-list {
+  list-style: none;
+  padding: 0;
+  margin: 0;
+  display: flex;
+  flex-direction: column;
+  gap: 6px;
+}
+
+.proof-dependencies-list li {
+  color: #ccc;
+  font-size: 0.9rem;
+  padding: 4px 0;
+}
+
+.proof-dep-kind {
+  display: inline-block;
+  padding: 2px 8px;
+  border-radius: 4px;
+  font-size: 0.75rem;
+  font-weight: 700;
+  text-transform: uppercase;
+  letter-spacing: 0.04em;
+}
+
+.proof-dep-kind--mathlib {
+  background: rgba(46, 134, 222, 0.2);
+  border: 1px solid rgba(46, 134, 222, 0.4);
+  color: #b9ddff;
+}
+
+.proof-dep-kind--moto {
+  background: rgba(30, 255, 28, 0.15);
+  border: 1px solid rgba(30, 255, 28, 0.3);
+  color: #b7ffb6;
+}
+
+/* Code block scrollbar */
+.proof-code-block::-webkit-scrollbar {
+  width: 8px;
+  height: 8px;
+}
+
+.proof-code-block::-webkit-scrollbar-track {
+  background: #111;
+}
+
+.proof-code-block::-webkit-scrollbar-thumb {
+  background: #444;
+  border-radius: 4px;
+}
+
+.proof-code-block::-webkit-scrollbar-thumb:hover {
+  background: #666;
+}
diff --git a/frontend/src/components/autonomous/ProofLibrary.jsx b/frontend/src/components/autonomous/ProofLibrary.jsx
new file mode 100644
index 0000000..49ca273
--- /dev/null
+++ b/frontend/src/components/autonomous/ProofLibrary.jsx
@@ -0,0 +1,419 @@
+import React, { useState, useEffect, useMemo } from 'react';
+import { autonomousAPI } from '../../services/api';
+import { buildResearchRunGroups } from '../../utils/researchRunHistory';
+import { downloadRawText } from '../../utils/downloadHelpers';
+import './FinalAnswerLibrary.css';
+import './ProofLibrary.css';
+
+function formatDate(isoString) {
+  if (!isoString) return 'N/A';
+  // An unparseable string yields an Invalid Date instead of throwing, so the
+  // timestamp is checked explicitly and the raw value is shown as a fallback.
+  const parsed = new Date(isoString);
+  if (Number.isNaN(parsed.getTime())) return isoString;
+  return parsed.toLocaleString();
+}
+
+function truncate(text, maxLength = 220) {
+  if (!text) return '';
+  return text.length > maxLength ? `${text.slice(0, maxLength)}...` : text;
+}
+
+export default function ProofLibrary() {
+  const [proofs, setProofs] = useState([]);
+  const [sessionsResponse, setSessionsResponse] = useState(null);
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState(null);
+  const [expandedId, setExpandedId] = useState(null);
+  const [expandedProof, setExpandedProof] = useState(null);
+  const [loadingContentId, setLoadingContentId] = useState(null);
+  const [searchTerm, setSearchTerm] = useState('');
+  const [filterNovelty, setFilterNovelty] = useState('novel');
+
+  // Loading is driven by the single effect declared after loadProofLibrary
+  // below. Do not register another one here: each extra effect repeats both
+  // network requests on mount and again on every filter change.
+
+  const loadProofLibrary = async () => {
+    try {
+      setLoading(true);
+      setError(null);
+
+      const novelOnly = filterNovelty === 'novel';
+      const [proofsResult, sessionsResult] = await Promise.allSettled([
+        autonomousAPI.getProofLibrary(novelOnly),
+        autonomousAPI.getSessions(),
+      ]);
+
+      if (proofsResult.status !== 'fulfilled') {
+        throw proofsResult.reason;
+      }
+
+      setProofs(proofsResult.value.proofs || []);
+
+      if (sessionsResult.status === 'fulfilled') {
+        setSessionsResponse(sessionsResult.value);
+      } else {
+        setSessionsResponse(null);
+      }
+    } catch (err) {
+      setError(err.message || 'Failed to load proof library');
+    } finally {
+      setLoading(false);
+    }
+  };
+
+  useEffect(() => {
+    loadProofLibrary();
+  }, [filterNovelty]);
+
+  const filteredProofs = useMemo(() => {
+    if (!searchTerm.trim()) return proofs;
+    const lower = searchTerm.toLowerCase();
+    return proofs.filter(
+      (p) =>
+        (p.theorem_name || '').toLowerCase().includes(lower) ||
+        (p.theorem_statement || '').toLowerCase().includes(lower) ||
+        (p.source_title || '').toLowerCase().includes(lower) ||
+        (p.user_prompt || '').toLowerCase().includes(lower) ||
+        (p.novelty_reasoning || '').toLowerCase().includes(lower)
+    );
+  }, [proofs, searchTerm]);
+
+  const runGroups = useMemo(() => {
+    const pseudoPapers = filteredProofs.map((p) => ({
+      session_id: p.session_id,
+      paper_id: p.proof_id,
+      created_at: p.created_at,
+      user_prompt: p.user_prompt,
+    }));
+
+    return buildResearchRunGroups({
+      sessionsResponse,
+      stage2Papers: pseudoPapers,
+      stage3Answers: [],
+    });
+  }, [filteredProofs, sessionsResponse]);
+
+  const proofsBySession = useMemo(() => {
+    const map = new Map();
+    for (const proof of filteredProofs) {
+      const sid = proof.session_id || 'unknown';
+      if (!map.has(sid)) map.set(sid, []);
+      map.get(sid).push(proof);
+    }
+    return map;
+  }, [filteredProofs]);
+
+  // Tracks the most recent expand request so that a slow response for a card
+  // the user has already left cannot overwrite the currently open card.
+  const latestExpandId = React.useRef(null);
+  const handleExpand = async (proof) => {
+    const id = proof.library_id || proof.proof_id;
+    const nextId = expandedId === id ? null : id; // second click collapses
+    latestExpandId.current = nextId;
+    setExpandedId(nextId);
+    setExpandedProof(null);
+    setLoadingContentId(nextId);
+    if (nextId === null) return;
+
+    let details = proof; // fall back to the list summary if the fetch fails
+    try {
+      details = await autonomousAPI.getLibraryProof(proof.session_id, proof.proof_id);
+    } catch { /* keep the summary row as the detail view */ }
+    if (latestExpandId.current !== id) return; // superseded by a newer click
+    setExpandedProof(details);
+    setLoadingContentId(null);
+  };
+
+  const handleDownloadLean = (proof) => {
+    const leanCode = proof.lean_code || '';
+    if (!leanCode) return;
+    const filename = `${proof.theorem_name || proof.proof_id}.lean`;
+    downloadRawText(leanCode, filename);
+  };
+
+  const novelCount = proofs.filter((p) => p.novel).length;
+  const totalCount = proofs.length;
+
+  if (loading) {
+    return (
+      <div className="final-answer-library">
+        <div className="library-loading">
+          <span className="library-loading__icon">&#x21BB;</span>
+          <span className="library-loading__text">Loading proof library...</span>
+        </div>
+      </div>
+    );
+  }
+
+  if (error) {
+    return (
+      <div className="final-answer-library">
+        <div className="error-message">
+          <span>&#x26A0;</span>
+          <p>{error}</p>
+          <button className="retry-button" onClick={loadProofLibrary}>
+            Retry
+          </button>
+        </div>
+      </div>
+    );
+  }
+
+  return (
+    <div className="final-answer-library proof-library">
+      <div className="library-header">
+        <h2>Proof Library</h2>
+        <p>
+          All verified mathematical proofs generated across research sessions.
+        </p>
+        <div className="library-stats">
+          {filterNovelty === 'novel' ? (
+            <span className="stat-badge">{novelCount} Novel Proof{novelCount !== 1 ? 's' : ''}</span>
+          ) : (
+            <>
+              <span className="stat-badge">{totalCount} Total Proof{totalCount !== 1 ? 's' : ''}</span>
+              <span className="stat-badge">{novelCount} Novel</span>
+              <span className="stat-badge">{totalCount - novelCount} Known</span>
+            </>
+          )}
+        </div>
+      </div>
+
+      <div className="library-controls">
+        <input
+          className="search-input"
+          type="text"
+          placeholder="Search by theorem name, statement, source, or research question..."
+          value={searchTerm}
+          onChange={(e) => setSearchTerm(e.target.value)}
+        />
+        <div className="filter-buttons">
+          <button
+            className={filterNovelty === 'novel' ? 'active' : ''}
+            onClick={() => setFilterNovelty('novel')}
+          >
+            Novel Only
+          </button>
+          <button
+            className={filterNovelty === 'all' ? 'active' : ''}
+            onClick={() => setFilterNovelty('all')}
+          >
+            All Proofs
+          </button>
+        </div>
+      </div>
+
+      {filteredProofs.length === 0 ? (
+        <div className="fal-empty-state">
+          <span className="empty-icon">&#x1F9EE;</span>
+          <h3>No Proofs Found</h3>
+          <p>
+            {proofs.length === 0
+              ? 'No verified proofs have been generated yet. Run autonomous research with Lean 4 enabled to generate proofs.'
+              : 'No proofs match your search criteria.'}
+          </p>
+        </div>
+      ) : runGroups.length > 0 ? (
+        <div className="run-history-groups">
+          {runGroups.map((group) => {
+            const sessionProofs = proofsBySession.get(group.sessionId) || [];
+            if (sessionProofs.length === 0) return null;
+
+            return (
+              <div key={group.sessionId} className="run-history-group">
+                <div className="run-history-group-header">
+                  <div className="run-history-group-heading">
+                    <h3 className="run-history-group-title">{group.userPrompt}</h3>
+                    <p className="run-history-group-subtitle">
+                      {sessionProofs.length} proof{sessionProofs.length !== 1 ? 's' : ''}
+                      {group.createdAt && ` \u00B7 ${formatDate(group.createdAt)}`}
+                    </p>
+                  </div>
+                  <div className="run-history-group-badges">
+                    {group.isCurrent && (
+                      <span className="run-history-group-badge run-history-group-badge--current">
+                        Current Session
+                      </span>
+                    )}
+                    {group.isLegacy && (
+                      <span className="run-history-group-badge">Legacy</span>
+                    )}
+                  </div>
+                </div>
+
+                <div className="run-history-group-body">
+                  <div className="answer-list">
+                    {sessionProofs.map((proof) => {
+                      const id = proof.library_id || proof.proof_id;
+                      const isExpanded = expandedId === id;
+
+                      return (
+                        <div
+                          key={id}
+                          className={`answer-card proof-card ${isExpanded ? 'expanded' : ''} ${
+                            proof.novel ? 'proof-card--novel' : 'proof-card--known'
+                          }`}
+                        >
+                          <div
+                            className="answer-header"
+                            onClick={() => handleExpand(proof)}
+                          >
+                            <div className="answer-title-row">
+                              <h4 className="answer-title proof-title">
+                                {proof.theorem_name || proof.proof_id}
+                              </h4>
+                              <button className="expand-button">
+                                {isExpanded ? '\u25B2' : '\u25BC'}
+                              </button>
+                            </div>
+
+                            <div className="answer-metadata">
+                              <span
+                                className={`format-badge ${
+                                  proof.novel ? 'proof-badge--novel' : 'proof-badge--known'
+                                }`}
+                              >
+                                {proof.novel ? 'Novel' : 'Known'}
+                              </span>
+                              <span className="word-count">
+                                {proof.solver || 'Lean 4'}
+                              </span>
+                              <span className="word-count">
+                                {proof.attempt_count || 1} attempt{(proof.attempt_count || 1) !== 1 ? 's' : ''}
+                              </span>
+                              <span className="word-count">
+                                Source: {proof.source_type === 'brainstorm' ? 'Brainstorm' : 'Paper'}
+                              </span>
+                            </div>
+
+                            <p className="proof-statement">
+                              {truncate(proof.theorem_statement, 300)}
+                            </p>
+
+                            {proof.source_title && (
+                              <p className="answer-prompt">
+                                <strong>Source:</strong> {proof.source_title}
+                              </p>
+                            )}
+
+                            <div className="answer-footer-info">
+                              <span className="completion-date">
+                                Verified: {formatDate(proof.created_at)}
+                              </span>
+                            </div>
+                          </div>
+
+                          {isExpanded && (
+                            <div className="answer-content">
+                              {loadingContentId === id ? (
+                                <div className="library-loading" style={{ padding: '20px' }}>
+                                  <span className="library-loading__icon">&#x21BB;</span>
+                                  <span className="library-loading__text">Loading proof details...</span>
+                                </div>
+                              ) : expandedProof ? (
+                                <div className="proof-expanded-content">
+                                  <div className="proof-detail-section">
+                                    <h4>Theorem Statement</h4>
+                                    <pre className="proof-code-block">
+                                      {expandedProof.theorem_statement}
+                                    </pre>
+                                  </div>
+
+                                  {expandedProof.novelty_reasoning && (
+                                    <div className="proof-detail-section">
+                                      <h4>Novelty Assessment</h4>
+                                      <p>{expandedProof.novelty_reasoning}</p>
+                                    </div>
+                                  )}
+
+                                  {expandedProof.verification_notes && (
+                                    <div className="proof-detail-section">
+                                      <h4>Verification Notes</h4>
+                                      <p>{expandedProof.verification_notes}</p>
+                                    </div>
+                                  )}
+
+                                  {expandedProof.formal_sketch && (
+                                    <div className="proof-detail-section">
+                                      <h4>Formal Sketch</h4>
+                                      <pre className="proof-code-block">
+                                        {expandedProof.formal_sketch}
+                                      </pre>
+                                    </div>
+                                  )}
+
+                                  {expandedProof.lean_code && (
+                                    <div className="proof-detail-section">
+                                      <h4>Lean 4 Source Code</h4>
+                                      <pre className="proof-code-block proof-lean-code">
+                                        {expandedProof.lean_code}
+                                      </pre>
+                                    </div>
+                                  )}
+
+                                  {expandedProof.dependencies && expandedProof.dependencies.length > 0 && (
+                                    <div className="proof-detail-section">
+                                      <h4>Dependencies</h4>
+                                      <ul className="proof-dependencies-list">
+                                        {expandedProof.dependencies.map((dep, i) => (
+                                          <li key={i}>
+                                            <span className={`proof-dep-kind proof-dep-kind--${dep.kind}`}>
+                                              {dep.kind}
+                                            </span>
+                                            {' '}
+                                            {dep.name}
+                                            {dep.source_ref ? ` (${dep.source_ref})` : ''}
+                                          </li>
+                                        ))}
+                                      </ul>
+                                    </div>
+                                  )}
+
+                                  <div className="quick-download-buttons">
+                                    {expandedProof.lean_code && (
+                                      <button
+                                        className="quick-download-raw"
+                                        onClick={() => handleDownloadLean(expandedProof)}
+                                      >
+                                        Download .lean
+                                      </button>
+                                    )}
+                                  </div>
+                                </div>
+                              ) : null}
+                            </div>
+                          )}
+                        </div>
+                      );
+                    })}
+                  </div>
+                </div>
+              </div>
+            );
+          })}
+        </div>
+      ) : (
+        <div className="answer-list">
+          {filteredProofs.map((proof) => {
+            const id = proof.library_id || proof.proof_id;
+            return (
+              <div key={id} className="answer-card proof-card">
+                <div className="answer-header" onClick={() => handleExpand(proof)}>
+                  <h4 className="answer-title">{proof.theorem_name || proof.proof_id}</h4>
+                </div>
+              </div>
+            );
+          })}
+        </div>
+      )}
+
+      <div className="library-footer">
+        <button className="refresh-button" onClick={loadProofLibrary}>
+          Refresh Proof Library
+        </button>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/autonomous/ProofNotificationStack.jsx b/frontend/src/components/autonomous/ProofNotificationStack.jsx
index 8ff6b32..54db44c 100644
--- a/frontend/src/components/autonomous/ProofNotificationStack.jsx
+++ b/frontend/src/components/autonomous/ProofNotificationStack.jsx
@@ -76,7 +76,7 @@ export default function ProofNotificationStack({ notifications, onDismiss, onCli
                   fontWeight: 700,
                 }}
               >
-                Congratulations! Novel Mathematical Proof Discovered
+                Congratulations! Novel Proof or Novel Formulation Discovered
               </div>
               <div
                 style={{
diff --git a/frontend/src/components/autonomous/index.js b/frontend/src/components/autonomous/index.js
index 3d03683..518b1cf 100644
--- a/frontend/src/components/autonomous/index.js
+++ b/frontend/src/components/autonomous/index.js
@@ -10,4 +10,5 @@ export { default as AutonomousResearchLogs } from './AutonomousResearchLogs';
 export { default as FinalAnswerView } from './FinalAnswerView';
 export { default as FinalAnswerLibrary } from './FinalAnswerLibrary';
 export { default as MathematicalProofs } from './MathematicalProofs';
+export { default as ProofLibrary } from './ProofLibrary';
 
diff --git a/frontend/src/components/compiler/CompilerSettings.jsx b/frontend/src/components/compiler/CompilerSettings.jsx
index c6c4bba..37de78e 100644
--- a/frontend/src/components/compiler/CompilerSettings.jsx
+++ b/frontend/src/components/compiler/CompilerSettings.jsx
@@ -393,11 +393,26 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   const getAutoSettingsForModel = async (modelId, selectedProvider = null) => {
     const model = findOpenRouterModel(openRouterModels, modelId);
     if (!model) {
+      console.debug('[CompilerAutoFill] model not in loaded list, skipping auto-fill', { modelId });
       return null;
     }
 
     const providerData = await fetchProvidersForModel(modelId);
-    return computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+    const autoSettings = computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+    if (autoSettings) {
+      console.debug('[CompilerAutoFill] computed auto-settings', {
+        modelId,
+        selectedProvider,
+        source: autoSettings.source,
+        contextWindow: autoSettings.contextWindow,
+        maxOutputTokens: autoSettings.maxOutputTokens,
+        warnings: autoSettings.warnings,
+      });
+      if (autoSettings.warnings && autoSettings.warnings.length > 0) {
+        console.warn('[CompilerAutoFill] auto-settings fallback used:', autoSettings.warnings);
+      }
+    }
+    return autoSettings;
   };
 
   // Critique prompt handlers
@@ -585,8 +600,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               if (effectiveProvider === 'openrouter' && m) {
                 const autoSettings = await getAutoSettingsForModel(m, null);
                 if (autoSettings) {
-                  setContextSize(autoSettings.contextWindow);
-                  setMaxOutput(autoSettings.maxOutputTokens);
+                  if (autoSettings.contextWindowKnown) {
+                    setContextSize(autoSettings.contextWindow);
+                  }
+                  if (autoSettings.outputCapKnown) {
+                    setMaxOutput(autoSettings.maxOutputTokens);
+                  }
                 }
               }
             }}
@@ -619,8 +638,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 setOpenrouterProv(providerName);
                 const autoSettings = await getAutoSettingsForModel(model, providerName);
                 if (autoSettings) {
-                  setContextSize(autoSettings.contextWindow);
-                  setMaxOutput(autoSettings.maxOutputTokens);
+                  if (autoSettings.contextWindowKnown) {
+                    setContextSize(autoSettings.contextWindow);
+                  }
+                  if (autoSettings.outputCapKnown) {
+                    setMaxOutput(autoSettings.maxOutputTokens);
+                  }
                 }
               }}
             >
@@ -660,7 +683,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 setContextSize(isNaN(parsed) ? 131072 : parsed);
               }}
               min={4096}
-              max={999999}
+              max={50000000}
               step={1024}
             />
           </div>
@@ -675,7 +698,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 setMaxOutput(isNaN(parsed) ? 25000 : parsed);
               }}
               min={1000}
-              max={100000}
+              max={50000000}
               step={1000}
             />
           </div>
@@ -737,7 +760,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         <RoleConfig
           title="High-Parameter Model"
           description="Rigor enhancement mode: adds citations, strengthens methodology, and clarifies assumptions."
-          borderColor="#1eff1c"
+          borderColor="#2a2a2a"
           provider={highParamProvider} setProvider={setHighParamProvider}
           model={highParamModel} setModel={setHighParamModel}
           openrouterProv={highParamOpenrouterProvider} setOpenrouterProv={setHighParamOpenrouterProvider}
diff --git a/frontend/src/components/settings-common.css b/frontend/src/components/settings-common.css
index 8845e5e..2d62893 100644
--- a/frontend/src/components/settings-common.css
+++ b/frontend/src/components/settings-common.css
@@ -185,7 +185,7 @@
 }
 
 .role-config-card--openrouter {
-  border-color: #18cc17;
+  border-color: #2a2a2a;
   background: rgba(26, 26, 56, 0.8);
 }
 
diff --git a/frontend/src/index.css b/frontend/src/index.css
index 6666081..0b0d539 100644
--- a/frontend/src/index.css
+++ b/frontend/src/index.css
@@ -1543,6 +1543,79 @@ button.danger:hover {
   50% { opacity: 0.7; }
 }
 
+/* ============================================================================
+   Your Completed Works Library - Parent Tab with Sub-Tabs
+   ============================================================================ */
+
+.completed-works-library {
+  min-height: calc(100vh - 160px);
+}
+
+.completed-works-header {
+  text-align: center;
+  margin-bottom: 24px;
+  padding-bottom: 16px;
+  border-bottom: 1px solid rgba(30, 255, 28, 0.12);
+}
+
+.completed-works-title {
+  color: #1eff1c;
+  font-size: 2rem;
+  font-weight: 700;
+  margin: 0 0 8px 0;
+}
+
+.completed-works-subtitle {
+  color: #b9b9c6;
+  font-size: 1rem;
+  margin: 0;
+}
+
+.completed-works-sub-tabs {
+  display: flex;
+  gap: 4px;
+  margin-bottom: 20px;
+  padding: 4px;
+  background: var(--surface-2, #1a1a22);
+  border-radius: 10px;
+  border: 1px solid rgba(255, 255, 255, 0.07);
+}
+
+.completed-works-sub-tab {
+  flex: 1;
+  padding: 12px 20px;
+  background: transparent;
+  border: 2px solid transparent;
+  border-radius: 8px;
+  color: #888;
+  font-size: 0.92rem;
+  font-weight: 600;
+  cursor: pointer;
+  transition: all 0.25s ease;
+  white-space: nowrap;
+}
+
+.completed-works-sub-tab:hover {
+  background: rgba(255, 255, 255, 0.05);
+  color: #ccc;
+}
+
+.completed-works-sub-tab.active {
+  background: linear-gradient(135deg, rgba(30, 255, 28, 0.12) 0%, rgba(30, 255, 28, 0.05) 100%);
+  border-color: rgba(30, 255, 28, 0.35);
+  color: #1eff1c;
+}
+
+.completed-works-content {
+  min-height: 400px;
+}
+
+@media (max-width: 768px) {
+  .completed-works-sub-tabs {
+    flex-direction: column;
+  }
+}
+
 /* Autonomous Research Styles */
 .autonomous-research {
   padding: 1rem;
diff --git a/frontend/src/services/api.js b/frontend/src/services/api.js
index 8280637..8fc17d5 100644
--- a/frontend/src/services/api.js
+++ b/frontend/src/services/api.js
@@ -560,6 +560,18 @@ export const autonomousAPI = {
     return `${API_BASE}/proofs/${encodeURIComponent(proofId)}/certificate.lean`;
   },
 
+  async getProofLibrary(novelOnly = true) {
+    const response = await fetch(`${API_BASE}/proofs/library?novel_only=${novelOnly}`);
+    if (!response.ok) throw new Error('Failed to get proof library');
+    return response.json();
+  },
+
+  async getLibraryProof(sessionId, proofId) {
+    const response = await fetch(`${API_BASE}/proofs/library/${encodeURIComponent(sessionId)}/${encodeURIComponent(proofId)}`);
+    if (!response.ok) throw new Error(`Failed to get library proof ${proofId}`);
+    return response.json();
+  },
+
   // Get current paper progress (in-progress paper during Tier 2)
   async getCurrentPaperProgress() {
     const response = await fetch(`${API_BASE}/auto-research/current-paper-progress`);
diff --git a/frontend/src/utils/openRouterSelection.js b/frontend/src/utils/openRouterSelection.js
index 11eded4..4d08e33 100644
--- a/frontend/src/utils/openRouterSelection.js
+++ b/frontend/src/utils/openRouterSelection.js
@@ -1,5 +1,8 @@
 const DEFAULT_CONTEXT_WINDOW = 131072;
 const CONTEXT_BUFFER_TOKENS = 500;
+const KNOWN_NO_OUTPUT_CAP_DEFAULTS = {
+  'x-ai/grok-4.3': 128000,
+};
 
 function toPositiveInteger(value) {
   const parsed = Number(value);
@@ -9,6 +12,11 @@ function toPositiveInteger(value) {
   return Math.floor(parsed);
 }
 
+function getKnownNoOutputCapDefault(model) {
+  const modelId = typeof model?.id === 'string' ? model.id.toLowerCase() : '';
+  return KNOWN_NO_OUTPUT_CAP_DEFAULTS[modelId] || null;
+}
+
 export function findOpenRouterModel(models, modelId) {
   if (!Array.isArray(models) || !modelId) {
     return null;
@@ -49,30 +57,82 @@ export function getProviderNames(providerData) {
   return normalizeProviderData(providerData).providers;
 }
 
+/**
+ * Compute auto-fill context window + max output tokens for an OpenRouter model.
+ *
+ * Returns a valid object and marks which values are metadata-backed:
+ *   1. Best: full endpoint metadata for the relevant provider(s)
+ *   2. Partial: use explicit `max_completion_tokens` when present
+ *   3. No-cap: use vetted model-specific defaults for known no-cap models
+ *   4. Unknown: fill context only and ask callers not to overwrite output
+ *
+ * The `source` field reports which tier produced the answer, and `warnings`
+ * is a list of human-readable diagnostics for logging.
+ */
 export function computeOpenRouterAutoSettings(model, providerData, selectedProvider = null) {
   const { endpoints } = normalizeProviderData(providerData);
+  const warnings = [];
 
   const relevantEndpoints = selectedProvider
     ? endpoints.filter((endpoint) => endpoint?.provider_name === selectedProvider)
     : endpoints;
 
+  if (selectedProvider && relevantEndpoints.length === 0 && endpoints.length > 0) {
+    warnings.push(
+      `Selected provider "${selectedProvider}" not present in endpoint list; falling back to model-level context.`
+    );
+  }
+
+  const modelContext = toPositiveInteger(model?.context_length);
+  const knownNoOutputCapDefault = getKnownNoOutputCapDefault(model);
+
   if (relevantEndpoints.length === 0) {
-    return null;
+    const contextWindow = modelContext || DEFAULT_CONTEXT_WINDOW;
+    const contextWindowKnown = modelContext !== null;
+    const maxOutputTokens = knownNoOutputCapDefault;
+
+    if (!modelContext) {
+      warnings.push(
+        `No endpoint metadata and no model.context_length; using default ${DEFAULT_CONTEXT_WINDOW}.`
+      );
+    } else {
+      warnings.push(
+        `No endpoint metadata available; falling back to model.context_length=${modelContext}.`
+      );
+    }
+
+    if (maxOutputTokens === null) {
+      warnings.push(
+        'No endpoint metadata exposed max_completion_tokens; preserving the current max output setting.'
+      );
+    } else {
+      warnings.push(
+        `No endpoint metadata exposed max_completion_tokens; using known no-cap default ${maxOutputTokens}.`
+      );
+    }
+
+    return {
+      contextWindow,
+      contextWindowKnown,
+      maxOutputTokens,
+      outputCapKnown: maxOutputTokens !== null,
+      outputCapSource: maxOutputTokens !== null ? 'known-no-cap-default' : 'unknown',
+      smallestEndpointOutputCap: null,
+      smallestEndpointContext: null,
+      smallestEndpointPromptCap: null,
+      fallbackModelContext: modelContext || DEFAULT_CONTEXT_WINDOW,
+      source: modelContext ? 'model-context-length' : 'hardcoded-default',
+      warnings,
+    };
   }
 
-  const hasCompleteEndpointContexts = relevantEndpoints.every(
+  // Filter endpoints to only those that expose a usable context_length.
+  const endpointsWithContext = relevantEndpoints.filter(
     (endpoint) => toPositiveInteger(endpoint?.context_length) !== null
   );
-  const hasCompleteEndpointOutputCaps = relevantEndpoints.every(
-    (endpoint) => toPositiveInteger(endpoint?.max_completion_tokens) !== null
-  );
-
-  if (!hasCompleteEndpointContexts || !hasCompleteEndpointOutputCaps) {
-    return null;
-  }
 
-  const endpointContexts = relevantEndpoints
-    .map((endpoint) => toPositiveInteger(endpoint?.context_length))
+  const endpointContexts = endpointsWithContext
+    .map((endpoint) => toPositiveInteger(endpoint.context_length))
     .filter((value) => value !== null);
 
   const endpointOutputCaps = relevantEndpoints
@@ -83,39 +143,83 @@ export function computeOpenRouterAutoSettings(model, providerData, selectedProvi
     .map((endpoint) => toPositiveInteger(endpoint?.max_prompt_tokens))
     .filter((value) => value !== null);
 
-  const smallestEndpointContext = Math.min(...endpointContexts);
-  const smallestEndpointOutputCap = Math.min(...endpointOutputCaps);
-  const smallestEndpointPromptCap = endpointPromptCaps.length > 0
-    ? Math.min(...endpointPromptCaps)
-    : null;
-
-  let contextWindow = smallestEndpointContext;
-  let twentyPercentOutputCap = Math.max(1, Math.floor(contextWindow * 0.2));
-
-  if (smallestEndpointPromptCap !== null) {
-    const promptLimitedOutputCap = Math.max(
-      1,
-      Math.floor((smallestEndpointPromptCap + CONTEXT_BUFFER_TOKENS) / 4)
+  // Choose a base context: smallest endpoint context, then model context, then default.
+  let contextWindow;
+  let contextWindowKnown = true;
+  if (endpointContexts.length > 0) {
+    contextWindow = Math.min(...endpointContexts);
+    if (endpointContexts.length < relevantEndpoints.length) {
+      warnings.push(
+        `${relevantEndpoints.length - endpointContexts.length}/${relevantEndpoints.length} endpoints missing context_length; using min of remaining.`
+      );
+    }
+  } else if (modelContext) {
+    contextWindow = modelContext;
+    warnings.push(
+      'No endpoints exposed context_length; falling back to model.context_length.'
+    );
+  } else {
+    contextWindow = DEFAULT_CONTEXT_WINDOW;
+    contextWindowKnown = false;
+    warnings.push(
+      `No endpoint or model context_length; using default ${DEFAULT_CONTEXT_WINDOW}.`
     );
-    twentyPercentOutputCap = Math.min(twentyPercentOutputCap, promptLimitedOutputCap);
   }
 
-  const maxOutputTokens = Math.min(smallestEndpointOutputCap, twentyPercentOutputCap);
+  const smallestEndpointContext = endpointContexts.length > 0 ? Math.min(...endpointContexts) : null;
+  const smallestEndpointOutputCap = endpointOutputCaps.length > 0 ? Math.min(...endpointOutputCaps) : null;
+  const smallestEndpointPromptCap = endpointPromptCaps.length > 0 ? Math.min(...endpointPromptCaps) : null;
+
+  // Determine max output tokens.
+  // If at least one endpoint provides max_completion_tokens, honor the smallest.
+  // If none do, use only vetted model-specific defaults; otherwise preserve
+  // the user's current setting instead of guessing from context length.
+  let maxOutputTokens;
+  let outputCapSource;
+  if (smallestEndpointOutputCap !== null) {
+    maxOutputTokens = smallestEndpointOutputCap;
+    outputCapSource = 'endpoint-metadata';
+    if (endpointOutputCaps.length < relevantEndpoints.length) {
+      warnings.push(
+        `${relevantEndpoints.length - endpointOutputCaps.length}/${relevantEndpoints.length} endpoints missing max_completion_tokens; using min of remaining.`
+      );
+    }
+  } else if (knownNoOutputCapDefault !== null) {
+    maxOutputTokens = knownNoOutputCapDefault;
+    outputCapSource = 'known-no-cap-default';
+    warnings.push(
+      `No endpoints exposed max_completion_tokens; using known no-cap default ${maxOutputTokens}.`
+    );
+  } else {
+    maxOutputTokens = null;
+    outputCapSource = 'unknown';
+    warnings.push(
+      'No endpoints exposed max_completion_tokens; preserving the current max output setting.'
+    );
+  }
 
-  if (smallestEndpointPromptCap !== null) {
+  if (smallestEndpointPromptCap !== null && maxOutputTokens !== null) {
     contextWindow = Math.min(
       contextWindow,
       smallestEndpointPromptCap + maxOutputTokens + CONTEXT_BUFFER_TOKENS
     );
   }
 
+  const source = smallestEndpointContext !== null && smallestEndpointOutputCap !== null
+    ? 'endpoint-metadata'
+    : 'partial-endpoint-metadata';
+
   return {
     contextWindow,
+    contextWindowKnown,
     maxOutputTokens,
-    twentyPercentOutputCap,
+    outputCapKnown: maxOutputTokens !== null,
+    outputCapSource,
     smallestEndpointOutputCap,
     smallestEndpointContext,
     smallestEndpointPromptCap,
-    fallbackModelContext: toPositiveInteger(model?.context_length) || DEFAULT_CONTEXT_WINDOW,
+    fallbackModelContext: modelContext || DEFAULT_CONTEXT_WINDOW,
+    source,
+    warnings,
   };
 }
diff --git a/moto_launcher.py b/moto_launcher.py
index 1c6d5e0..b823681 100644
--- a/moto_launcher.py
+++ b/moto_launcher.py
@@ -14,7 +14,7 @@
 import re
 import socket
 import shlex
-from shutil import which
+from shutil import rmtree, which
 import subprocess
 import sys
 import tarfile
@@ -885,15 +885,29 @@ def _write_lean_workspace_files(workspace_dir: Path) -> None:
 
 
 def _download_file(url: str, destination: Path) -> None:
-    """Download a remote file to disk using the standard library."""
+    """Download a remote file to disk using the standard library.
+
+    Streams to a sibling ".tmp" file and renames it over ``destination`` only
+    on success; on failure (including the 120 s socket timeout) the temp file
+    is removed and the exception is re-raised.
+    """
     destination.parent.mkdir(parents=True, exist_ok=True)
-    request = Request(url, headers={"User-Agent": "MOTO Launcher"})
-    with urlopen(request, timeout=120) as response, destination.open("wb") as handle:
-        while True:
-            chunk = response.read(1024 * 1024)
-            if not chunk:
-                break
-            handle.write(chunk)
+    tmp = destination.with_suffix(destination.suffix + ".tmp")
+    try:
+        request = Request(url, headers={"User-Agent": "MOTO Launcher"})
+        with urlopen(request, timeout=120) as response, tmp.open("wb") as handle:
+            while True:
+                chunk = response.read(1024 * 1024)
+                if not chunk:
+                    break
+                handle.write(chunk)
+        tmp.replace(destination)
+    except Exception:
+        try:
+            tmp.unlink(missing_ok=True)
+        except OSError:
+            pass
+        raise
 
 
 def _extract_archive(archive_path: Path, destination: Path) -> None:
@@ -911,6 +925,19 @@ def _extract_archive(archive_path: Path, destination: Path) -> None:
     raise RuntimeError(f"Unsupported archive format: {archive_path.name}")
 
 
+def _is_valid_archive(archive_path: Path) -> bool:
+    """Return True if archive_path looks like a readable .zip/.tar.gz/.tgz; False otherwise."""
+    try:
+        name = archive_path.name.lower()
+        if name.endswith(".zip"):
+            return zipfile.is_zipfile(archive_path)
+        if name.endswith((".tar.gz", ".tgz")):
+            return tarfile.is_tarfile(archive_path)
+        return False
+    except (OSError, EOFError):  # EOFError: truncated gzip stream in a partial download
+        return False
+
+
 def _detect_z3_asset_name() -> tuple[str, tuple[str, ...]]:
     """Return the preferred platform marker and fallback markers for Z3 assets."""
     machine = platform.machine().lower()
@@ -1040,15 +1067,21 @@ def _set_smt_env_flags(
     env["MOTO_SMT_TIMEOUT"] = env.get("MOTO_SMT_TIMEOUT", "").strip() or "30"
 
 
-def install_lean4(runtime: InstanceRuntime, env: dict[str, str]) -> None:
+def install_lean4(
+    runtime: InstanceRuntime,
+    env: dict[str, str],
+    *,
+    _is_repair: bool = False,
+) -> None:
     """
     Ensure Lean 4 / elan is available for proof verification.
 
     This step is intentionally non-fatal: if installation fails, MOTO still
     launches and simply skips automated proof verification.
     """
-    cprint("[4c/8] Checking Lean 4 / elan for proof verification...", YELLOW)
-    print()
+    if not _is_repair:
+        cprint("[4c/8] Checking Lean 4 / elan for proof verification...", YELLOW)
+        print()
 
     elan_bin_dir = Path.home() / ".elan" / "bin"
     lean_cmd = get_lean_command()
@@ -1076,6 +1109,10 @@ def install_lean4(runtime: InstanceRuntime, env: dict[str, str]) -> None:
                 archive_path = managed_root / "downloads" / asset["name"]
                 install_root = managed_root / "current"
 
+                if archive_path.exists() and not _is_valid_archive(archive_path):
+                    cprint("Cached elan archive appears corrupt — re-downloading...", YELLOW)
+                    archive_path.unlink(missing_ok=True)
+
                 if not archive_path.exists():
                     _download_file(asset["browser_download_url"], archive_path)
 
@@ -1127,7 +1164,26 @@ def install_lean4(runtime: InstanceRuntime, env: dict[str, str]) -> None:
     lean_cmd = get_lean_command()
     lake_cmd = get_lake_command()
     if not lean_cmd or not lake_cmd:
-        cprint("WARNING: Lean 4 tooling is incomplete -- proof verification will be skipped.", YELLOW)
+        # Tooling is incomplete (e.g. lake missing after a partial elan update).
+        # Attempt the same wipe-and-retry repair before giving up.
+        cprint("Lean 4 tooling is incomplete (lean or lake not found after install).", YELLOW)
+        if env.get("_MOTO_LEAN4_REPAIR_ATTEMPTED") != "1":
+            cprint("Attempting to repair by wiping elan and reinstalling...", YELLOW)
+            print()
+            try:
+                if elan_bin_dir.parent.exists():
+                    rmtree(str(elan_bin_dir.parent), ignore_errors=True)
+                managed_elan_root = Path(runtime.data_root) / "elan"
+                if managed_elan_root.exists():
+                    rmtree(str(managed_elan_root), ignore_errors=True)
+                env["_MOTO_LEAN4_REPAIR_ATTEMPTED"] = "1"
+                install_lean4(runtime, env, _is_repair=True)
+                return
+            except Exception as repair_exc:
+                cprint("WARNING: Lean 4 repair failed -- proof verification will be skipped.", YELLOW)
+                cprint(str(repair_exc), YELLOW)
+        else:
+            cprint("WARNING: Lean 4 tooling still incomplete after repair -- proof verification will be skipped.", YELLOW)
         _set_lean_env_flags(env, enabled=False)
         print()
         return
@@ -1136,8 +1192,37 @@ def install_lean4(runtime: InstanceRuntime, env: dict[str, str]) -> None:
         lean_version = subprocess.check_output([lean_cmd, "--version"], text=True).strip()
         cprint(f"Lean 4 ready: {lean_version}", GREEN)
     except Exception as exc:
-        cprint("WARNING: Lean 4 verification failed during version check -- proof verification will be skipped.", YELLOW)
+        # The lean binary exists but is broken (corrupted toolchain, bad elan state,
+        # incomplete update, etc.).  Wipe the elan directory and retry installation
+        # once rather than giving up — this is the same non-fatal install path used
+        # when Lean is missing entirely.
+        cprint("Lean 4 version check failed — installation may be corrupt.", YELLOW)
         cprint(str(exc), YELLOW)
+        if env.get("_MOTO_LEAN4_REPAIR_ATTEMPTED") != "1":
+            cprint("Attempting to repair by wiping elan and reinstalling...", YELLOW)
+            print()
+            try:
+                if elan_bin_dir.parent.exists():
+                    rmtree(str(elan_bin_dir.parent), ignore_errors=True)
+                managed_elan_root = Path(runtime.data_root) / "elan"
+                if managed_elan_root.exists():
+                    rmtree(str(managed_elan_root), ignore_errors=True)
+                # Verify the wipe actually removed the binary — on Windows, file
+                # locks from the just-invoked lean process can cause rmtree to
+                # silently skip files when ignore_errors=True.
+                if get_lean_command() is not None:
+                    raise RuntimeError(
+                        "Could not remove corrupt Lean binary (file may be locked). "
+                        "Try closing any running Lean processes and relaunching MOTO."
+                    )
+                env["_MOTO_LEAN4_REPAIR_ATTEMPTED"] = "1"
+                install_lean4(runtime, env, _is_repair=True)
+                return
+            except Exception as repair_exc:
+                cprint("WARNING: Lean 4 repair failed -- proof verification will be skipped.", YELLOW)
+                cprint(str(repair_exc), YELLOW)
+        else:
+            cprint("WARNING: Lean 4 still broken after repair -- proof verification will be skipped.", YELLOW)
         _set_lean_env_flags(env, enabled=False)
         print()
         return
@@ -1195,6 +1280,10 @@ def install_z3(runtime: InstanceRuntime, env: dict[str, str]) -> None:
             archive_path = managed_root / "downloads" / asset["name"]
             install_root = managed_root / "current"
 
+            if archive_path.exists() and not _is_valid_archive(archive_path):
+                cprint("Cached Z3 archive appears corrupt — re-downloading...", YELLOW)
+                archive_path.unlink(missing_ok=True)
+
             if not archive_path.exists():
                 _download_file(asset["browser_download_url"], archive_path)
 
diff --git a/randomlog.txt b/randomlog.txt
new file mode 100644
index 0000000..7818869
--- /dev/null
+++ b/randomlog.txt
@@ -0,0 +1,904 @@
+2026-04-30 19:29:13.331 - backend.api.middleware - INFO - Using default CORS origins: ['http://localhost:5173', 'http://127.0.0.1:5173', 'http://localhost:8000', 'http://127.0.0.1:8000']
+2026-04-30 19:29:13.331 - backend.api.middleware - INFO - Middleware configured
+INFO:     Started server process [51848]
+INFO:     Waiting for application startup.
+2026-04-30 19:29:13.347 - backend.api.main - INFO - Starting ASI Aggregator System instance 'default' (data_dir=C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data, logs_dir=C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\logs)
+2026-04-30 19:29:13.347 - backend.api.main - INFO - Secret store active: namespaced_instance=False
+2026-04-30 19:29:13.760 - backend.shared.api_client_manager - INFO - OpenRouter client initialized
+2026-04-30 19:29:13.760 - backend.api.main - INFO - Restored OpenRouter API key from secure backend storage
+2026-04-30 19:29:14.126 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha client initialized
+2026-04-30 19:29:14.126 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha singleton client initialized
+2026-04-30 19:29:14.126 - backend.api.main - INFO - Restored Wolfram Alpha API key from secure backend storage
+2026-04-30 19:29:14.142 - backend.shared.lm_studio_client - INFO - Successfully connected to LM Studio. Found 36 models.
+2026-04-30 19:29:14.159 - backend.autonomous.memory.session_manager - INFO - Found paused session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34 (last updated: 2026-04-30T17:41:52.645719)
+2026-04-30 19:29:14.159 - backend.api.main - INFO - Found resumable session on startup: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:14.159 - backend.autonomous.memory.session_manager - INFO - Session resumed: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:14.159 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
+2026-04-30 19:29:14.159 - backend.autonomous.memory.paper_library - INFO - Paper library using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
+2026-04-30 19:29:14.159 - backend.autonomous.memory.research_metadata - INFO - Research metadata using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:14.159 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\final_answer
+2026-04-30 19:29:14.159 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\proofs
+2026-04-30 19:29:14.159 - backend.api.main - INFO - Session context restored - brainstorms and papers will load from session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:14.172 - backend.api.main - INFO - ASI Aggregator System ready
+2026-04-30 19:29:14.172 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\lean4_workspace
+INFO:     Application startup complete.
+INFO:     Uvicorn running on http://0.0.0.0:8000 (Press CTRL+C to quit)
+2026-04-30 19:29:26.185 - backend.autonomous.memory.research_metadata - INFO - Workflow state loaded: tier=tier2_paper_writing
+INFO:     127.0.0.1:52471 - "WebSocket /ws" [accepted]
+2026-04-30 19:29:26.465 - backend.api.routes.websocket - INFO - WebSocket connected. Total connections: 1
+INFO:     connection open
+2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 1 (Main Submitter): model=moonshotai/kimi-k2.6, context=262000, max_tokens=40000
+2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 2 : model=openai/gpt-oss-120b, context=131072, max_tokens=25000
+2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 3 : model=deepseek/deepseek-v4-pro, context=1048576, max_tokens=65500
+2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 4 : model=inception/mercury-2, context=128000, max_tokens=25000
+2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Validator: model=x-ai/grok-4.1-fast, context=2000000, max_tokens=30000
+2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous coordinator initializing with 4 submitters
+2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 1 (Main Submitter): model=moonshotai/kimi-k2.6, context=262000
+2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 2 : model=openai/gpt-oss-120b, context=131072
+2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 3 : model=deepseek/deepseek-v4-pro, context=1048576
+2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 4 : model=inception/mercury-2, context=128000
+2026-04-30 19:29:33.301 - backend.autonomous.memory.session_manager - INFO - Found paused session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34 (last updated: 2026-04-30T17:41:52.645719)
+2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO - Found interrupted session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   User prompt: Solve does P = NP or does P DNE NP, or something else. Find the solution of P and NP....
+2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Last updated: 2026-04-30T17:41:52.645719
+2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Tier: tier2_paper_writing
+2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Topic: topic_004
+2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Acceptances: 20
+2026-04-30 19:29:33.301 - backend.autonomous.memory.session_manager - INFO - Session resumed: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO - Session resumed: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:33.301 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
+2026-04-30 19:29:33.301 - backend.autonomous.memory.paper_library - INFO - Paper library using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
+2026-04-30 19:29:33.301 - backend.autonomous.memory.research_metadata - INFO - Research metadata using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
+2026-04-30 19:29:33.301 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\final_answer
+2026-04-30 19:29:33.301 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\proofs
+2026-04-30 19:29:33.301 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
+2026-04-30 19:29:33.301 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
+2026-04-30 19:29:33.316 - backend.autonomous.memory.research_metadata - INFO - Workflow state loaded: tier=tier2_paper_writing
+2026-04-30 19:29:33.317 - backend.autonomous.memory.research_metadata - INFO - Research metadata initialized
+2026-04-30 19:29:33.317 - backend.autonomous.memory.autonomous_rejection_logs - INFO - Autonomous rejection logs initialized
+2026-04-30 19:29:33.317 - backend.autonomous.core.autonomous_coordinator - INFO - Resetting RAG state for fresh autonomous research mode...
+2026-04-30 19:29:33.317 - backend.autonomous.core.autonomous_rag_manager - INFO - Resetting AutonomousRAGManager tracking state...
+2026-04-30 19:29:33.317 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager state reset
+2026-04-30 19:29:33.317 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
+2026-04-30 19:29:33.373 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
+2026-04-30 19:29:33.619 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
+2026-04-30 19:29:33.635 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
+2026-04-30 19:29:33.635 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
+2026-04-30 19:29:33.635 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
+2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
+2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
+2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
+2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
+2026-04-30 19:29:33.652 - backend.autonomous.core.autonomous_coordinator - INFO - RAG state reset and cleared for autonomous mode
+2026-04-30 19:29:33.652 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
+2026-04-30 19:29:33.667 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
+2026-04-30 19:29:33.667 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager initialized
+2026-04-30 19:29:33.668 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\final_answer
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_selector': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_completion_reviewer': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_reference_selector': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_title_selector': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_validator': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_redundancy_checker': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_framing_gate': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_paper': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_paper': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_paper': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_novelty': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_paper': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_paper': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_paper': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_certainty_assessor': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_format_selector': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_volume_organizer': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Configured Tier 3 Final Answer agents with api_client_manager
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Found interrupted workflow state: tier=tier2_paper_writing
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Workflow state restored: topic=topic_004, paper=None, phase=None, acceptances=20, reference_papers=0, tier3_active=False, tier3_phase=None, tier3_format=None
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator initialized
+2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Autonomous API logger callback set
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous API logging enabled
+2026-04-30 19:29:33.669 - backend.shared.token_tracker - INFO - TokenTracker reset
+2026-04-30 19:29:33.669 - backend.shared.token_tracker - INFO - TokenTracker timer started
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator started
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Resuming from interrupted workflow: tier=tier2_paper_writing, topic=topic_004, paper=None
+2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Starting paper compilation for brainstorm topic_004
+2026-04-30 19:29:33.702 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Starting selection (limit=3, total_cap=3, 4 available, 0 already selected)
+2026-04-30 19:29:33.853 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector: Requesting expansion with model moonshotai/kimi-k2.6 (prompt=9729t, task_id=agg_sub1_000)
+2026-04-30 19:31:01.064 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Direct injection for 2 papers (27640 tokens <= 88800 budget)
+2026-04-30 19:31:01.066 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Making final selection with model moonshotai/kimi-k2.6 (prompt=35377t, max=3 papers, task_id=agg_sub1_001)
+2026-04-30 19:31:14.193 - backend.shared.lean4_client - WARNING - Lean 4 workspace update failed: Lean 4 process timed out after 120 seconds.
+2026-04-30 19:31:14.194 - backend.shared.lean4_client - WARNING - Lean 4 LSP warm start skipped because the workspace is not ready.
+2026-04-30 19:31:44.236 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Selected 2 reference papers
+2026-04-30 19:31:44.237 - backend.autonomous.core.autonomous_coordinator - INFO - Additional reference selection: 2 new + 0 existing = 2 total
+2026-04-30 19:31:44.249 - backend.aggregator.memory.shared_training - INFO - Brainstorm database file doesn't exist yet: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms\title_candidates_topic_004.txt
+2026-04-30 19:31:44.249 - backend.autonomous.core.autonomous_coordinator - INFO - Starting paper title exploration phase (target: 5 candidates, resumed: 0)
+2026-04-30 19:31:44.250 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
+2026-04-30 19:31:44.250 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 262000, Validator: 2000000
+2026-04-30 19:31:44.250 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 4 submitters with models ['moonshotai/kimi-k2.6', 'openai/gpt-oss-120b', 'deepseek/deepseek-v4-pro', 'inception/mercury-2'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
+2026-04-30 19:31:44.250 - backend.aggregator.core.coordinator - INFO - Boost mode ACTIVE: Will route selected tasks to openai/gpt-5.5-pro. This does NOT affect parallel execution mode.
+2026-04-30 19:31:44.689 - backend.aggregator.core.coordinator - INFO - Currently loaded models: []
+2026-04-30 19:31:44.689 - backend.aggregator.core.coordinator - INFO - Context window configuration:
+  - Submitter 1: 262000 tokens (model: moonshotai/kimi-k2.6)
+  - Submitter 2: 131072 tokens (model: openai/gpt-oss-120b)
+  - Submitter 3: 1048576 tokens (model: deepseek/deepseek-v4-pro)
+  - Submitter 4: 128000 tokens (model: inception/mercury-2)
+  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
+2026-04-30 19:31:44.691 - backend.aggregator.memory.shared_training - INFO - Created new shared training file
+2026-04-30 19:31:44.692 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
+2026-04-30 19:31:44.797 - backend.aggregator.memory.event_log - INFO - Loaded 11401 events from event log
+2026-04-30 19:31:44.812 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 1
+2026-04-30 19:31:44.812 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model moonshotai/kimi-k2.6
+2026-04-30 19:31:44.812 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:31:44.812 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=moonshotai/kimi-k2.6, provider=openrouter, context=262000
+2026-04-30 19:31:44.820 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 2
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model openai/gpt-oss-120b
+2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=openai/gpt-oss-120b via Groq
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=openai/gpt-oss-120b, provider=openrouter, context=131072
+2026-04-30 19:31:44.820 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 3
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model deepseek/deepseek-v4-pro
+2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=deepseek/deepseek-v4-pro
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=deepseek/deepseek-v4-pro, provider=openrouter, context=1048576
+2026-04-30 19:31:44.820 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 4
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 4 initialized with model inception/mercury-2
+2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_4': provider=openrouter, model=inception/mercury-2
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Submitter 4: model=inception/mercury-2, provider=openrouter, context=128000
+2026-04-30 19:31:44.820 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
+2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 4 submitters
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 4 started
+2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
+2026-04-30 19:31:44.820 - backend.autonomous.core.autonomous_coordinator - INFO - Title exploration aggregator started with parallel submitters
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
+2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
+2026-04-30 19:31:44.837 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
+2026-04-30 19:31:44.837 - backend.aggregator.agents.submitter - INFO - Submitter 4 run loop started - will run continuously until stopped
+2026-04-30 19:31:44.851 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
+2026-04-30 19:31:45.967 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 90ff3b52-2cd0-4836-b84b-c9a8b6f09923 (iteration 1)
+2026-04-30 19:31:46.533 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission a13f37f2-dba1-4954-90e3-c51ed09299df (iteration 1)
+2026-04-30 19:31:46.869 - backend.aggregator.core.coordinator - INFO - Validator iteration 3 - batch validating 2 submissions: ['90ff3b52-2cd0-4836-b84b-c9a8b6f09923', 'a13f37f2-dba1-4954-90e3-c51ed09299df']
+2026-04-30 19:31:46.869 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 2 submissions
+2026-04-30 19:31:46.869 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 2 submissions
+2026-04-30 19:31:49.165 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 108946eb-bded-4310-82e4-6ada17054636 (iteration 2)
+2026-04-30 19:31:50.267 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 142a762f-32c5-4c54-a884-34f04586e893 (iteration 2)
+2026-04-30 19:31:52.092 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 12d94cc1-78a2-44ea-b05f-1046e5f56ef7 (iteration 3)
+2026-04-30 19:31:54.326 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission cee583c3-8a97-4c8c-b922-0fd8bb290de3 (iteration 3)
+2026-04-30 19:31:54.984 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 988c5fc6-6301-466d-8b78-eb991f517bf3 (iteration 4)
+2026-04-30 19:31:57.565 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 9ac811a6-d27f-4fb2-bdf3-8ce6c98ec4f4 (iteration 4)
+2026-04-30 19:31:58.096 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 3a3d3d0e-a5ae-497e-b0bc-3348c65ee135 (iteration 5)
+2026-04-30 19:32:00.958 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 6d18dff1-623f-479e-b972-e109f555d9d9 (iteration 5)
+2026-04-30 19:32:01.082 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 00db103c-1bd8-4282-973c-f77c2f9ec7dc (iteration 6)
+2026-04-30 19:32:04.022 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission c52670ac-49d7-477a-b64c-e581d1130917 (iteration 6)
+2026-04-30 19:32:14.911 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/2 accepted
+2026-04-30 19:32:14.915 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
+2026-04-30 19:32:14.915 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-04-30 19:32:14.915 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission accepted (total: 1)
+2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 4 (total: 1)
+2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
+2026-04-30 19:32:14.917 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 1 total chunks
+2026-04-30 19:32:14.917 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 1)
+2026-04-30 19:32:14.917 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 1)
+2026-04-30 19:32:14.927 - backend.aggregator.core.coordinator - INFO - Queue size (10) >= threshold (10). Pausing submitters.
+2026-04-30 19:32:14.927 - backend.aggregator.core.coordinator - INFO - Validator iteration 4 - batch validating 3 submissions: ['108946eb-bded-4310-82e4-6ada17054636', '142a762f-32c5-4c54-a884-34f04586e893', '12d94cc1-78a2-44ea-b05f-1046e5f56ef7']
+2026-04-30 19:32:14.927 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
+2026-04-30 19:32:14.927 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
+2026-04-30 19:32:14.994 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 1/5 candidates accepted
+2026-04-30 19:32:16.139 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
+2026-04-30 19:32:16.139 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
+2026-04-30 19:32:40.316 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
+2026-04-30 19:32:40.318 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 1)
+2026-04-30 19:32:40.318 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 2)
+2026-04-30 19:32:40.321 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 2)
+2026-04-30 19:32:40.321 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 3)
+2026-04-30 19:32:40.324 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
+2026-04-30 19:32:40.325 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-04-30 19:32:40.325 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission accepted (total: 2)
+2026-04-30 19:32:40.325 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 4 (total: 2)
+2026-04-30 19:32:40.325 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-04-30 19:32:40.326 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-04-30 19:32:40.326 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
+2026-04-30 19:32:40.326 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 1 total chunks
+2026-04-30 19:32:40.330 - backend.aggregator.core.coordinator - INFO - Queue size (7) < threshold (10). Resuming submitters.
+2026-04-30 19:32:40.331 - backend.aggregator.core.coordinator - INFO - Validator iteration 5 - batch validating 3 submissions: ['cee583c3-8a97-4c8c-b922-0fd8bb290de3', '988c5fc6-6301-466d-8b78-eb991f517bf3', '9ac811a6-d27f-4fb2-bdf3-8ce6c98ec4f4']
+2026-04-30 19:32:40.331 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
+2026-04-30 19:32:40.331 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
+2026-04-30 19:32:40.364 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
+2026-04-30 19:32:40.364 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
+2026-04-30 19:32:40.523 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 44116b14-83a3-4e5c-9892-b768941b848c (iteration 1)
+2026-04-30 19:32:41.086 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 2/5 candidates accepted
+2026-04-30 19:32:42.437 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission acbc42c6-e70c-4e5f-a141-4f6b6165214f (iteration 7)
+2026-04-30 19:32:44.108 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission cf198397-5da9-44b7-896b-40905acbd42d (iteration 7)
+2026-04-30 19:32:45.695 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission ffb22bc0-8c59-454b-bb1b-561b7ebecf3e (iteration 8)
+2026-04-30 19:32:47.524 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 2d78831a-7c3e-4354-8d3c-81758b2627d9 (iteration 8)
+2026-04-30 19:32:49.018 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 50605199-ecaa-4ab1-8829-3468e76092f1 (iteration 9)
+2026-04-30 19:32:51.107 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission cd68c0a9-f4c2-4f11-afd6-333af4025879 (iteration 9)
+2026-04-30 19:32:55.641 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
+2026-04-30 19:32:55.644 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
+2026-04-30 19:32:55.644 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-04-30 19:32:55.645 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 1)
+2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 3)
+2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
+2026-04-30 19:32:55.645 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 2 total chunks
+2026-04-30 19:32:55.652 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 1)
+2026-04-30 19:32:55.652 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 4)
+2026-04-30 19:32:55.656 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 1)
+2026-04-30 19:32:55.656 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 5)
+2026-04-30 19:32:55.658 - backend.aggregator.core.coordinator - INFO - Queue size (11) >= threshold (10). Pausing submitters.
+2026-04-30 19:32:55.658 - backend.aggregator.core.coordinator - INFO - Validator iteration 6 - batch validating 3 submissions: ['3a3d3d0e-a5ae-497e-b0bc-3348c65ee135', '6d18dff1-623f-479e-b972-e109f555d9d9', '00db103c-1bd8-4282-973c-f77c2f9ec7dc']
+2026-04-30 19:32:55.659 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
+2026-04-30 19:32:55.659 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
+2026-04-30 19:32:55.704 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
+2026-04-30 19:32:55.704 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
+2026-04-30 19:32:57.100 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 3/5 candidates accepted
+2026-04-30 19:33:31.671 - backend.aggregator.agents.validator - INFO - Batch validation complete: 0/3 accepted
+2026-04-30 19:33:31.671 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 2)
+2026-04-30 19:33:31.671 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 6)
+2026-04-30 19:33:31.687 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 2)
+2026-04-30 19:33:31.687 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 7)
+2026-04-30 19:33:31.687 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 3)
+2026-04-30 19:33:31.687 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 8)
+2026-04-30 19:33:31.703 - backend.aggregator.core.coordinator - INFO - Queue size (8) < threshold (10). Resuming submitters.
+2026-04-30 19:33:31.703 - backend.aggregator.core.coordinator - INFO - Validator iteration 7 - batch validating 3 submissions: ['c52670ac-49d7-477a-b64c-e581d1130917', '44116b14-83a3-4e5c-9892-b768941b848c', 'acbc42c6-e70c-4e5f-a141-4f6b6165214f']
+2026-04-30 19:33:31.703 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
+2026-04-30 19:33:31.703 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
+2026-04-30 19:33:32.226 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission f4e42d31-3e25-4cf7-8cf9-855d0fe72d09 (iteration 1)
+2026-04-30 19:33:34.146 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission d749aa5b-7242-4ed0-8f60-be13c42385b0 (iteration 10)
+2026-04-30 19:33:35.328 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 46c7a011-7b74-4d48-92ff-d990536817c5 (iteration 10)
+2026-04-30 19:33:37.594 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 338945b2-b322-4e41-9c2f-dabe2356ed7a (iteration 11)
+2026-04-30 19:33:38.927 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 2314ec88-7a07-4349-9567-048d64f5df76 (iteration 11)
+2026-04-30 19:33:40.486 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 489c5d4c-89a1-4635-a8ac-1b66bfaf4905 (iteration 12)
+2026-04-30 19:33:47.193 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
+2026-04-30 19:33:47.193 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 3)
+2026-04-30 19:33:47.193 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 9)
+2026-04-30 19:33:47.210 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
+2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-04-30 19:33:47.210 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
+2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 4)
+2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
+2026-04-30 19:33:47.210 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 2 total chunks
+2026-04-30 19:33:47.210 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 4)
+2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 10)
+2026-04-30 19:33:47.221 - backend.aggregator.core.coordinator - INFO - Queue size (11) >= threshold (10). Pausing submitters.
+2026-04-30 19:33:47.223 - backend.aggregator.core.coordinator - INFO - Validator iteration 8 - batch validating 3 submissions: ['cf198397-5da9-44b7-896b-40905acbd42d', 'ffb22bc0-8c59-454b-bb1b-561b7ebecf3e', '2d78831a-7c3e-4354-8d3c-81758b2627d9']
+2026-04-30 19:33:47.223 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
+2026-04-30 19:33:47.223 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
+2026-04-30 19:33:47.266 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
+2026-04-30 19:33:47.266 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
+2026-04-30 19:33:49.233 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 4/5 candidates accepted
+2026-04-30 19:34:14.439 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
+2026-04-30 19:34:14.455 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-04-30 19:34:14.455 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 2)
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 5)
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
+2026-04-30 19:34:14.455 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 1 total chunks
+2026-04-30 19:34:14.455 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 5)
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 11)
+2026-04-30 19:34:14.455 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 1)
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 12)
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Queue size (8) < threshold (10). Resuming submitters.
+2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Validator iteration 9 - batch validating 3 submissions: ['50605199-ecaa-4ab1-8829-3468e76092f1', 'cd68c0a9-f4c2-4f11-afd6-333af4025879', 'f4e42d31-3e25-4cf7-8cf9-855d0fe72d09']
+2026-04-30 19:34:14.455 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
+2026-04-30 19:34:14.455 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
+2026-04-30 19:34:14.486 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
+2026-04-30 19:34:14.486 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
+2026-04-30 19:34:14.728 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission a0422046-e395-42b4-8f4e-39333726c738 (iteration 2)
+2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 5/5 candidates accepted
+2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: Target of 5 candidates reached
+2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
+2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
+2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
+2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
+2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 4 stopped
+2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 9
+2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 9 iterations - is_running=False
+2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
+2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - Paper title exploration complete: 5 candidates accepted
+2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: Restored shared_training_memory state
+2026-04-30 19:34:15.263 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Attempt 1
+2026-04-30 19:34:15.279 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Generating title with model moonshotai/kimi-k2.6 (task_id=agg_sub1_000)
+2026-04-30 19:35:52.374 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Validating with model x-ai/grok-4.1-fast (task_id=agg_sub1_001)
+2026-04-30 19:37:06.565 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Title accepted: 'Verified Proof Complexity in Lean 4: From Polynomial Verifiers to Exponential Lower Bounds'
+2026-04-30 19:37:06.565 - backend.autonomous.core.autonomous_coordinator - INFO - Compiling paper: Verified Proof Complexity in Lean 4: From Polynomial Verifiers to Exponential Lower Bounds
+2026-04-30 19:37:06.565 - backend.autonomous.core.autonomous_coordinator - INFO - Clearing RAG for autonomous paper compilation...
+2026-04-30 19:37:06.565 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
+2026-04-30 19:37:06.580 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
+2026-04-30 19:37:06.580 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
+2026-04-30 19:37:06.596 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
+2026-04-30 19:37:06.596 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
+2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
+2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
+2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
+2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
+2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
+2026-04-30 19:37:06.611 - backend.autonomous.core.autonomous_coordinator - INFO - RAG cleared successfully
+2026-04-30 19:37:06.611 - backend.compiler.core.compiler_coordinator - INFO - Initializing compiler coordinator...
+2026-04-30 19:37:06.611 - backend.compiler.memory.outline_memory - INFO - Outline memory initialized
+2026-04-30 19:37:06.627 - backend.compiler.memory.paper_memory - INFO - Paper memory initialized
+2026-04-30 19:37:06.627 - backend.compiler.memory.compiler_rejection_log - INFO - Compiler rejection/acceptance logs initialized
+2026-04-30 19:37:07.008 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha client initialized
+2026-04-30 19:37:07.015 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha singleton client initialized
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Wolfram Alpha client initialized (available as a construction-mode tool)
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Resetting compiler RAG manager state...
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager state reset
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Initializing compiler RAG manager...
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Updating compiler context window from 131072 to 2000000
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager initialized
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Skipping Part 1 aggregator database load (autonomous mode)
+2026-04-30 19:37:07.015 - backend.compiler.agents.high_context_submitter - INFO - High-context submitter initialized with model: moonshotai/kimi-k2.6
+2026-04-30 19:37:07.015 - backend.compiler.agents.high_context_submitter - INFO - Context budget: 221500 tokens (window: 262000)
+2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_context': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-04-30 19:37:07.015 - backend.compiler.agents.high_param_submitter - INFO - High-param submitter initialized with model: openai/gpt-5.5
+2026-04-30 19:37:07.015 - backend.compiler.agents.high_param_submitter - INFO - Context budget: 921500 tokens (window: 1050000)
+2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_param': provider=openrouter, model=openai/gpt-5.5
+2026-04-30 19:37:07.015 - backend.compiler.validation.compiler_validator - INFO - Compiler validator initialized with model: x-ai/grok-4.1-fast
+2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Configured role 'compiler_validator': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Per-paper model tracking enabled for manual compiler mode
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Compiler coordinator initialized successfully
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Autonomous mode enabled - section order: Body → Conclusion → Intro → Abstract
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Clearing paper and outline...
+2026-04-30 19:37:07.015 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 1, 0 words)
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Paper is empty, skipping re-chunking
+2026-04-30 19:37:07.015 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 1)
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Outline is empty, skipping re-chunking
+2026-04-30 19:37:07.015 - backend.compiler.memory.critique_memory - ERROR - Critique memory not initialized - call initialize() first
+2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique memory
+2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Cleared rejection/acceptance logs
+2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Reset per-paper model tracker
+2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Reset autonomous section phase to body
+2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Reset critique phase state
+2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Paper and outline cleared - system reset to fresh start
+2026-04-30 19:37:07.024 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared previous paper/outline for fresh paper paper_007
+2026-04-30 19:37:07.024 - backend.autonomous.core.autonomous_coordinator - INFO - Loading brainstorm database into compiler RAG: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms\brainstorm_topic_004.txt
+2026-04-30 19:37:07.040 - backend.aggregator.ingestion.pipeline - INFO - Ingested brainstorm_topic_004.txt: 556 total chunks
+2026-04-30 19:37:12.336 - backend.aggregator.core.rag_manager - INFO - Added document: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms\brainstorm_topic_004.txt
+2026-04-30 19:37:12.336 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm database loaded into compiler RAG
+2026-04-30 19:37:12.336 - backend.autonomous.core.autonomous_coordinator - INFO - Loading 2 reference papers into compiler RAG
+2026-04-30 19:37:12.336 - backend.aggregator.ingestion.pipeline - INFO - Ingested paper_paper_006.txt: 234 total chunks
+2026-04-30 19:37:14.214 - backend.aggregator.core.rag_manager - INFO - Added document: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers\paper_paper_006.txt
+2026-04-30 19:37:14.214 - backend.autonomous.core.autonomous_coordinator - INFO - Reference paper loaded: paper_006
+2026-04-30 19:37:14.216 - backend.aggregator.ingestion.pipeline - INFO - Ingested paper_paper_003.txt: 87 total chunks
+2026-04-30 19:37:14.930 - backend.aggregator.core.rag_manager - INFO - Added document: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers\paper_paper_003.txt
+2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - Reference paper loaded: paper_003
+2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - All reference papers loaded into compiler RAG
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Starting compiler...
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Compiler started successfully
+2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - Compiler started for paper paper_007
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Compiler workflow started
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Aggregator monitoring started - will check for new acceptances every 30 seconds
+2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: None → body
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Starting fresh - no existing paper or outline found
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - PHASE 1: ITERATIVE OUTLINE CREATION
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO -
+--- Outline Creation Iteration 1/15 ---
+2026-04-30 19:37:14.930 - backend.compiler.agents.high_context_submitter - INFO - Starting outline creation submission generation...
+2026-04-30 19:37:14.930 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 19:37:14.930 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_create, query_length=14810
+2026-04-30 19:37:40.825 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_create in 25.90s (coverage=0.50, tokens=10764)
+2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 68648 chars retrieved
+2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - Building outline creation prompt...
+2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 102033 chars
+2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_000)...
+2026-04-30 19:40:28.113 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 3617 chars
+2026-04-30 19:40:28.113 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 19:40:28.113 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 19:40:28.116 - backend.compiler.agents.high_context_submitter - INFO - Outline creation submission generated: 126dcdd9-cf47-44f1-b018-a16e8155c8e8, outline_complete=True
+2026-04-30 19:40:28.116 - backend.compiler.validation.compiler_validator - INFO - Validating outline_create submission: 126dcdd9-cf47-44f1-b018-a16e8155c8e8
+2026-04-30 19:40:28.116 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_create, operation=full_content
+2026-04-30 19:40:28.116 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_000)...
+2026-04-30 19:40:37.782 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
+2026-04-30 19:40:37.798 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_create)
+2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - ✓ Iteration 1: Outline ACCEPTED
+2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO -   Validator feedback: The submitted outline fully meets all validation criteria. It includes the optional Abstract, required Introduction ('I. Introduction'), multiple body sections (II through VIII), and Conclusion ('IX. ...
+2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
+2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - OUTLINE MARKED COMPLETE BY SUBMITTER - LOCKING
+2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
+2026-04-30 19:40:37.803 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 2)
+2026-04-30 19:40:37.814 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
+2026-04-30 19:40:37.814 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 7 total chunks
+2026-04-30 19:40:37.935 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
+2026-04-30 19:40:37.937 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
+2026-04-30 19:40:37.937 - backend.compiler.memory.outline_memory - INFO - Outline creation feedback cleared
+2026-04-30 19:40:37.937 - backend.compiler.core.compiler_coordinator - INFO - Outline locked after 1 iterations
+2026-04-30 19:40:37.937 - backend.compiler.core.compiler_coordinator - INFO - Starting initial paper loop...
+2026-04-30 19:40:37.939 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=True, phase=body)
+2026-04-30 19:40:37.939 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 19:40:37.941 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=0 chars
+2026-04-30 19:40:37.941 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 0 chars → 0 chars (markers preserved)
+2026-04-30 19:40:37.973 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=0, brainstorm=74310, overhead=5000, rag_budget=141636
+2026-04-30 19:40:37.973 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 19:40:37.973 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=14810
+2026-04-30 19:40:37.973 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 19:41:11.848 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 19:41:11.848 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 54 chunks from excluded sources (already direct-injected)
+2026-04-30 19:41:11.848 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 33.88s (coverage=0.32, tokens=1810)
+2026-04-30 19:41:11.848 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 14156 chars retrieved
+2026-04-30 19:41:11.848 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 19:41:11.848 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 307904 chars
+2026-04-30 19:41:11.880 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_001)...
+2026-04-30 19:45:54.178 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 9286 chars (0 Wolfram tool call(s))
+2026-04-30 19:45:54.187 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 19:45:54.187 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 19:45:54.187 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: eee4f7ad-46d6-46e7-b078-34784dc32a1d (section_complete=False)
+2026-04-30 19:45:54.187 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: eee4f7ad-46d6-46e7-b078-34784dc32a1d
+2026-04-30 19:45:54.187 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=full_content
+2026-04-30 19:45:54.187 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_001)...
+2026-04-30 19:46:08.525 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
+2026-04-30 19:46:08.540 - backend.compiler.memory.paper_memory - INFO - Paper initialized with placeholders (version 2)
+2026-04-30 19:46:08.540 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
+2026-04-30 19:46:08.540 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 26 total chunks
+2026-04-30 19:46:08.794 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
+2026-04-30 19:46:08.794 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
+2026-04-30 19:46:08.794 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
+2026-04-30 19:46:08.794 - backend.compiler.core.compiler_coordinator - INFO - Initial paper portion accepted with placeholders! (1131 words)
+2026-04-30 19:46:08.794 - backend.compiler.core.compiler_coordinator - INFO - Initial paper loop complete
+2026-04-30 19:46:08.794 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
+2026-04-30 19:46:08.811 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
+2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
+2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=8754 chars
+2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 8754 chars → 8754 chars (markers preserved)
+2026-04-30 19:46:08.825 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=2583, brainstorm=74310, overhead=5000, rag_budget=139053
+2026-04-30 19:46:08.825 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 19:46:08.825 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
+2026-04-30 19:46:08.825 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 19:46:34.389 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 19:46:34.389 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
+2026-04-30 19:46:34.389 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.56s (coverage=0.30, tokens=1739)
+2026-04-30 19:46:34.389 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
+2026-04-30 19:46:34.389 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 19:46:34.389 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 316065 chars
+2026-04-30 19:46:34.420 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_002)...
+2026-04-30 19:52:38.036 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 14015 chars (0 Wolfram tool call(s))
+2026-04-30 19:52:38.036 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 19:52:38.036 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 19:52:38.052 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: f58caf39-ee36-400e-af84-0366b9400553 (section_complete=False)
+2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: f58caf39-ee36-400e-af84-0366b9400553
+2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11972 -> 11868 chars, new_string: 11972 -> 11868 chars)
+2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
+2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and'...
+2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 7951
+2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_002)...
+2026-04-30 19:53:11.368 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=False, rigor=False, placement=False)
+2026-04-30 19:53:11.368 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: construction)
+2026-04-30 19:53:11.368 - backend.compiler.core.compiler_coordinator - INFO - Construction rejected
+2026-04-30 19:53:11.368 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
+2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body, retry with feedback)
+2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=8754 chars
+2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 8754 chars → 8754 chars (markers preserved)
+2026-04-30 19:53:11.398 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=2583, brainstorm=74310, overhead=5000, rag_budget=139053
+2026-04-30 19:53:11.398 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 19:53:11.398 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
+2026-04-30 19:53:11.398 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 19:53:37.017 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 19:53:37.019 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
+2026-04-30 19:53:37.019 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.62s (coverage=0.30, tokens=1739)
+2026-04-30 19:53:37.019 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
+2026-04-30 19:53:37.019 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 19:53:37.019 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 321059 chars
+2026-04-30 19:53:37.047 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_003)...
+2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 11972 chars (0 Wolfram tool call(s))
+2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 30d56c2e-c869-4b79-b1db-090cd0194d17 (section_complete=False)
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 30d56c2e-c869-4b79-b1db-090cd0194d17
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 10228 -> 10226 chars, new_string: 10228 -> 10226 chars)
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial'...
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=570 | double_spaces=1 | first20='Since polynomial bou' | last20='orems in Section~IV.'
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=8754 | double_spaces=21 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Needle FULL:
+Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\pi_{C}|+|\varphi|$ (\texttt{polynomial\_simulation\_transitive}, Proof~7).
+
+This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and Extended Frege.  In particular, once a simulation edge $S \psimulates T$ has been verified, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars repr): 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\\pi_{C}|+|\\varphi|$ (\\texttt{polynomial\\_simulation\\_transitive}, Proof~7).\n\nThis preorder str'
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars repr): 'fied, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.'
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'eorems not placed inline will appear here]\n[HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 7756
+2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial'
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=570 | double_spaces=1 | first20='Since polynomial bou' | last20='orems in Section~IV.'
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=2504 | double_spaces=36 | first20='Abstract\n\nI. Introdu' | last20=' BE ABOVE THIS LINE]'
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Needle FULL:
+Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\pi_{C}|+|\varphi|$ (\texttt{polynomial\_simulation\_transitive}, Proof~7).
+
+This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and Extended Frege.  In particular, once a simulation edge $S \psimulates T$ has been verified, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars repr): 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\\pi_{C}|+|\\varphi|$ (\\texttt{polynomial\\_simulation\\_transitive}, Proof~7).\n\nThis preorder str'
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars repr): 'fied, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.'
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): 'Abstract\n\nI. Introduction\n   A. The Cook-Reckhow program and NP versus coNP\n   B. Verified proof complexity and the role of Lean 4\n   C. Overview of contributions\n   D. Roadmap\n\nII. Preliminaries and '
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'pen formalization targets and future work\n\n[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]\n[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]'
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    NO_MATCH_FOUND: Text does not exist in document, even with whitespace/line-ending normalization
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    This suggests the model is referencing text that was never written or was from a different document version
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Common causes: (1) Model hallucinated content, (2) Model referenced outline text instead of paper text, (3) Content was removed in prior edit
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - Pre-validation failed: old_string not found in document
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - FULL old_string that failed to match:
+Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\pi_{C}|+|\varphi|$ (\texttt{polynomial\_simulation\_transitive}, Proof~7).
+
+This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and Extended Frege.  In particular, once a simulation edge $S \psimulates T$ has been verified, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.
+2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - INFO - Pre-validation rejected: old_string not found in document (pre-validation)
+2026-04-30 20:04:01.742 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: construction)
+2026-04-30 20:04:01.742 - backend.compiler.core.compiler_coordinator - INFO - Construction rejected
+2026-04-30 20:04:01.742 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
+2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body, retry with feedback)
+2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=8754 chars
+2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 8754 chars → 8754 chars (markers preserved)
+2026-04-30 20:04:01.758 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=2583, brainstorm=74310, overhead=5000, rag_budget=139053
+2026-04-30 20:04:01.758 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 20:04:01.758 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
+2026-04-30 20:04:01.758 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:04:27.281 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:04:27.297 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
+2026-04-30 20:04:27.297 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.54s (coverage=0.30, tokens=1739)
+2026-04-30 20:04:27.297 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
+2026-04-30 20:04:27.297 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 20:04:27.297 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 322306 chars
+2026-04-30 20:04:27.312 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_004)...
+2026-04-30 20:15:16.266 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 10878 chars (0 Wolfram tool call(s))
+2026-04-30 20:15:16.266 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 20:15:16.281 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 20:15:16.281 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 6ea8047a-c2c4-4a4f-bfa2-4162c71a2f92 (section_complete=False)
+2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 6ea8047a-c2c4-4a4f-bfa2-4162c71a2f92
+2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 8884 -> 8882 chars, new_string: 8884 -> 8882 chars)
+2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
+2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial'...
+2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 7756
+2026-04-30 20:15:16.291 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_003)...
+2026-04-30 20:15:29.618 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
+2026-04-30 20:15:29.618 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=582, new_string_len=8882
+2026-04-30 20:15:29.618 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 8882 chars (conclusion boundary preserved)
+2026-04-30 20:15:29.618 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 3, 2139 words)
+2026-04-30 20:15:29.665 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
+2026-04-30 20:15:29.665 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 54 total chunks
+2026-04-30 20:15:30.103 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
+2026-04-30 20:15:30.103 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
+2026-04-30 20:15:30.108 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
+2026-04-30 20:15:30.108 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (2139 words)
+2026-04-30 20:15:30.108 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
+2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
+2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=17638 chars
+2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 17638 chars → 17638 chars (markers preserved)
+2026-04-30 20:15:30.139 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=5123, brainstorm=74310, overhead=5000, rag_budget=136513
+2026-04-30 20:15:30.139 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 20:15:30.139 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
+2026-04-30 20:15:30.139 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:15:55.850 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:15:55.853 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
+2026-04-30 20:15:55.853 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.71s (coverage=0.31, tokens=1739)
+2026-04-30 20:15:55.853 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
+2026-04-30 20:15:55.853 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 20:15:55.853 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 330093 chars
+2026-04-30 20:15:55.881 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_005)...
+2026-04-30 20:21:30.392 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\lean4_workspace
+2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 5202 chars (0 Wolfram tool call(s))
+2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 07747a60-615b-43b7-9046-3c705a0315d2 (section_complete=False)
+2026-04-30 20:26:31.793 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 07747a60-615b-43b7-9046-3c705a0315d2
+2026-04-30 20:26:31.793 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 4088 -> 4086 chars, new_string: 4088 -> 4086 chars)
+2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
+2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Polynomial-time checkability follows because $\\operatorname{TseitinFalse}(\\varphi)$ is computable in'...
+2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 16937
+2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_004)...
+2026-04-30 20:26:39.116 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
+2026-04-30 20:26:39.116 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=285, new_string_len=4086
+2026-04-30 20:26:39.116 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 4086 chars (conclusion boundary preserved)
+2026-04-30 20:26:39.116 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 4, 2596 words)
+2026-04-30 20:26:39.166 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
+2026-04-30 20:26:39.166 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 67 total chunks
+2026-04-30 20:26:39.718 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
+2026-04-30 20:26:39.718 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
+2026-04-30 20:26:39.718 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
+2026-04-30 20:26:39.718 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (2596 words)
+2026-04-30 20:26:39.718 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
+2026-04-30 20:26:39.718 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:26:39.729 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
+2026-04-30 20:26:39.729 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
+2026-04-30 20:26:39.729 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 20:26:39.729 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=14810
+2026-04-30 20:26:39.729 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt']
+2026-04-30 20:27:04.956 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt']
+2026-04-30 20:27:04.956 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 7 chunks from excluded sources (already direct-injected)
+2026-04-30 20:27:04.956 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 25.23s (coverage=0.49, tokens=9893)
+2026-04-30 20:27:04.956 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 62832 chars retrieved
+2026-04-30 20:27:04.956 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
+2026-04-30 20:27:04.956 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 120460 chars
+2026-04-30 20:27:04.973 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_006)...
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 971 chars
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Outline update not needed
+2026-04-30 20:28:54.068 - backend.compiler.core.compiler_coordinator - INFO - No outline update needed
+2026-04-30 20:28:54.068 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: outline_update)
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements (focus=general)...
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 54105 chars
+2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_007)...
+2026-04-30 20:30:47.838 - backend.shared.openrouter_client - ERROR - OpenRouter unexpected error: Expecting value: line 523 column 1 (char 2871)
+2026-04-30 20:30:47.971 - backend.shared.api_client_manager - ERROR - OpenRouter error for role 'compiler_high_context': Expecting value: line 523 column 1 (char 2871), and no LM Studio fallback configured
+2026-04-30 20:30:47.971 - backend.compiler.core.compiler_coordinator - ERROR - Review context overflow: Expecting value: line 523 column 1 (char 2871)
+2026-04-30 20:30:47.986 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: review)
+2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements (focus=general)...
+2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
+2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
+2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
+2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 54105 chars
+2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_008)...
+2026-04-30 20:30:54.975 - backend.shared.openrouter_client - ERROR - OpenRouter unexpected error: Expecting value: line 13 column 1 (char 66)
+2026-04-30 20:30:55.110 - backend.shared.api_client_manager - ERROR - OpenRouter error for role 'compiler_high_context': Expecting value: line 13 column 1 (char 66), and no LM Studio fallback configured
+2026-04-30 20:30:55.110 - backend.compiler.core.compiler_coordinator - ERROR - Review context overflow: Expecting value: line 13 column 1 (char 66)
+2026-04-30 20:30:55.127 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: review)
+2026-04-30 20:30:55.127 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
+2026-04-30 20:30:55.127 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
+2026-04-30 20:30:55.127 - backend.compiler.agents.high_param_submitter - INFO - Rigor cycle: Stage 1 - theorem discovery
+2026-04-30 20:30:55.147 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=16311
+2026-04-30 20:30:55.147 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt']
+2026-04-30 20:31:20.483 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt']
+2026-04-30 20:31:20.499 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 7 chunks from excluded sources (already direct-injected)
+2026-04-30 20:31:20.499 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 25.35s (coverage=0.49, tokens=9949)
+2026-04-30 20:31:46.122 - backend.compiler.agents.high_param_submitter - INFO - Rigor cycle: Stage 2 - Lean 4 formalization (up to 5 attempts), retry_failure_id=compiler_rigor_4e20725b82af
+2026-04-30 20:31:46.139 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5141, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:47.136 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:47.136 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5141, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:49.137 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:49.142 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5141, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:49.275 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 1 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
+For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
+2026-04-30 20:31:49.275 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5225, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:50.276 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:50.276 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5225, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:52.272 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:52.272 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5225, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:52.411 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 2 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
+For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
+2026-04-30 20:31:52.411 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5314, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:53.428 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:53.429 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5314, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:55.429 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:55.430 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5314, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:55.564 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 3 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
+For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
+2026-04-30 20:31:55.564 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5403, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:56.564 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:56.564 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5403, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:58.566 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:58.566 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5403, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:58.699 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 4 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
+For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
+2026-04-30 20:31:58.699 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5492, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:31:59.679 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:31:59.679 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5492, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:32:01.684 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
+2026-04-30 20:32:01.684 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5492, messages_count=1, error={
+    "error": {
+        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
+        "type": "invalid_request_error",
+        "param": "model",
+        "code": null
+    }
+}
+2026-04-30 20:32:01.819 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 5 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
+For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
+2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop: no theorem attempted this cycle (decline)
+2026-04-30 20:32:01.819 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: rigor)
+2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (decline: no more theorems or Lean failed)
+2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
+2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
+2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
+2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
+2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
+2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
+2026-04-30 20:32:01.851 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=6205, brainstorm=74310, overhead=5000, rag_budget=135431
+2026-04-30 20:32:01.851 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 20:32:01.851 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
+2026-04-30 20:32:01.851 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:32:27.066 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:32:27.066 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
+2026-04-30 20:32:27.066 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.22s (coverage=0.31, tokens=1739)
+2026-04-30 20:32:27.066 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
+2026-04-30 20:32:27.066 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 20:32:27.066 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 334181 chars
+2026-04-30 20:32:27.091 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_009)...
+2026-04-30 20:45:03.127 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 7064 chars (0 Wolfram tool call(s))
+2026-04-30 20:45:03.127 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 20:45:03.132 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 20:45:03.132 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 209b69f9-8c9c-48d1-818d-fd2fa54623e7 (section_complete=False)
+2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 209b69f9-8c9c-48d1-818d-fd2fa54623e7
+2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 6279 -> 6277 chars, new_string: 6279 -> 6277 chars)
+2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
+2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'This completes the verified infrastructure for propositional proof systems.\n\n'
+2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 21235
+2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_005)...
+2026-04-30 20:45:13.994 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
+2026-04-30 20:45:13.994 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=75, new_string_len=6277
+2026-04-30 20:45:13.994 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 6277 chars (conclusion boundary preserved)
+2026-04-30 20:45:14.003 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 5, 3325 words)
+2026-04-30 20:45:14.055 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
+2026-04-30 20:45:14.055 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 85 total chunks
+2026-04-30 20:45:14.741 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
+2026-04-30 20:45:14.741 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
+2026-04-30 20:45:14.741 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
+2026-04-30 20:45:14.741 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (3325 words)
+2026-04-30 20:45:14.741 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
+2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
+2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=28005 chars
+2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 28005 chars → 28005 chars (markers preserved)
+2026-04-30 20:45:14.775 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=7922, brainstorm=74310, overhead=5000, rag_budget=133714
+2026-04-30 20:45:14.775 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 20:45:14.775 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
+2026-04-30 20:45:14.775 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:45:40.673 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:45:40.675 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 54 chunks from excluded sources (already direct-injected)
+2026-04-30 20:45:40.677 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.90s (coverage=0.30, tokens=1562)
+2026-04-30 20:45:40.677 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 12229 chars retrieved
+2026-04-30 20:45:40.677 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 20:45:40.677 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 339050 chars
+2026-04-30 20:45:40.693 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_010)...
+2026-04-30 20:55:56.846 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 7546 chars (0 Wolfram tool call(s))
+2026-04-30 20:55:56.846 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
+2026-04-30 20:55:56.861 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
+2026-04-30 20:55:56.861 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 254a7f73-ee41-4e48-a517-d664121ea839 (section_complete=False)
+2026-04-30 20:55:56.863 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 254a7f73-ee41-4e48-a517-d664121ea839
+2026-04-30 20:55:56.863 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 6564 -> 6562 chars, new_string: 6564 -> 6562 chars)
+2026-04-30 20:55:56.911 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
+2026-04-30 20:55:56.911 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The Lean theorem \\texttt{quantitative\\_lower\\_bound\\_transfer\\_under\\_simulation} (Proof~6) verifies'...
+2026-04-30 20:55:56.911 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 27464
+2026-04-30 20:55:56.913 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_006)...
+2026-04-30 20:56:05.370 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
+2026-04-30 20:56:05.370 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=125, new_string_len=6562
+2026-04-30 20:56:05.370 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 6562 chars (conclusion boundary preserved)
+2026-04-30 20:56:05.370 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 6, 4110 words)
+2026-04-30 20:56:05.421 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
+2026-04-30 20:56:05.432 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 107 total chunks
+2026-04-30 20:56:06.384 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
+2026-04-30 20:56:06.384 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
+2026-04-30 20:56:06.388 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
+2026-04-30 20:56:06.388 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (4110 words)
+2026-04-30 20:56:06.388 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
+2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
+2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
+2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=34569 chars
+2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 34569 chars → 34569 chars (markers preserved)
+2026-04-30 20:56:06.422 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=9712, brainstorm=74310, overhead=5000, rag_budget=131924
+2026-04-30 20:56:06.422 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
+2026-04-30 20:56:06.422 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
+2026-04-30 20:56:06.422 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:56:32.896 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
+2026-04-30 20:56:32.896 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 54 chunks from excluded sources (already direct-injected)
+2026-04-30 20:56:32.896 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 26.47s (coverage=0.31, tokens=1562)
+2026-04-30 20:56:32.896 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 12229 chars retrieved
+2026-04-30 20:56:32.896 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
+2026-04-30 20:56:32.896 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 345614 chars
+2026-04-30 20:56:32.925 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_011)...

From 2183450af17cb5d9bb4b13ee7d247b56c5f80aaa Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Fri, 1 May 2026 19:55:50 -0500
Subject: [PATCH 11/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT-5.5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed a GUI status bug that showed LM Studio as "offline" when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 .gitignore | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.gitignore b/.gitignore
index 7f4b9d8..50261b8 100644
--- a/.gitignore
+++ b/.gitignore
@@ -122,4 +122,5 @@ htmlcov/
 .moto_instances/
 final_volume.txt
 RANDOM LOG.txt
+randomlog.txt
 commits_pending.txt

From bebc4978de5a983332d93ec7338ebdad55d210a9 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Fri, 1 May 2026 20:00:12 -0500
Subject: [PATCH 12/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT-5.5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed a GUI status bug that showed LM Studio as "offline" when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 README.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index dd9d7de..4d2e857 100644
--- a/README.md
+++ b/README.md
@@ -1,5 +1,5 @@
-# MOTO Autonomous ASI - Novel S.T.E.M. Solution Variant for ASI Automated Theory Generation
-# Autonomous Superintelligence Deep Research Harness
+# MOTO Autonomous ASI - Automated Theory Generation with Lean 4 Mathematics Verification
+# An Autonomous Prototype Superintelligence
 **Version: 1.0.7**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)

From c30193b4395a7ccd86ce8492874497530e901c35 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Fri, 1 May 2026 20:01:14 -0500
Subject: [PATCH 13/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in the respective default profiles using Kimi.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 README.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index 4d2e857..1f0e7ae 100644
--- a/README.md
+++ b/README.md
@@ -1,5 +1,5 @@
-# MOTO Autonomous ASI - Automated Theory Generation with Lean 4 Mathematics Verification
-# An Autonomous Prototype Superintelligence
+# MOTO Autonomous ASI
+## An Autonomous Prototype Superintelligence - Automated Theory Generation with Lean 4 Mathematics Verification
 **Version: 1.0.7**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)

From 76be08d096a62b022867f6fef5df7e7b8d0f991e Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 17:04:55 -0500
Subject: [PATCH 14/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in the respective default profiles using Kimi.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 .../rules/part-3-autonomous-research-mode.mdc |   7 +
 backend/api/routes/autonomous.py              |  30 +-
 .../autonomous/core/autonomous_coordinator.py | 392 +++++++-
 backend/autonomous/core/proof_novelty.py      |  30 +-
 .../core/proof_verification_stage.py          |   9 +-
 backend/autonomous/memory/paper_library.py    | 182 +++-
 backend/autonomous/memory/proof_database.py   |  13 +-
 backend/autonomous/prompts/proof_prompts.py   |  47 +-
 .../compiler/agents/high_param_submitter.py   |  16 +-
 backend/compiler/core/compiler_coordinator.py |   2 +
 backend/shared/models.py                      |   1 +
 frontend/src/App.jsx                          |  18 +
 .../src/components/PaperCritiqueModal.jsx     |  76 +-
 .../AutonomousResearchInterface.jsx           |  13 +-
 .../autonomous/AutonomousResearchSettings.jsx |  24 +-
 .../components/autonomous/BrainstormList.jsx  |  33 +-
 .../autonomous/MathematicalProofs.css         |  45 +
 .../autonomous/MathematicalProofs.jsx         |  67 +-
 .../components/autonomous/PaperLibrary.jsx    |  28 +-
 .../src/components/autonomous/ProofGraph.css  |  12 +
 .../src/components/autonomous/ProofGraph.jsx  |  11 +-
 .../components/autonomous/ProofLibrary.css    |  37 +-
 .../components/autonomous/ProofLibrary.jsx    |  36 +-
 .../autonomous/ProofNotificationStack.jsx     | 210 ++--
 .../autonomous/Stage2PaperHistory.jsx         |  29 +
 randomlog.txt                                 | 904 ------------------
 26 files changed, 1107 insertions(+), 1165 deletions(-)

diff --git a/.cursor/rules/part-3-autonomous-research-mode.mdc b/.cursor/rules/part-3-autonomous-research-mode.mdc
index 571ad39..091a96e 100644
--- a/.cursor/rules/part-3-autonomous-research-mode.mdc
+++ b/.cursor/rules/part-3-autonomous-research-mode.mdc
@@ -163,6 +163,9 @@ When choosing between new / continue / combine:
 - **Continue Existing**: When an incomplete brainstorm has more value to explore before starting something new
 - **Combine Topics**: When multiple existing brainstorms are related and would benefit from unified exploration
 
+### Hard Code Guard: continue_existing on Completed Brainstorms
+The coordinator enforces a **hard code guard** in `_execute_topic_selection`: if the LLM selects `continue_existing` on a brainstorm whose status is `"complete"`, the action is **rejected** and the topic selection loop retries. This prevents runaway re-brainstorming on already-completed topics regardless of LLM judgment. The LLM prompt and validator prompt both instruct against this, but the code guard is the authoritative enforcement.
+
 JSON schema and examples defined in `json-prompt-design.mdc`. Fields: `action` (new_topic/continue_existing/combine_topics), `topic_id`, `topic_ids`, `topic_prompt`, `reasoning`.
 
 ---
@@ -320,6 +323,7 @@ The autonomous brainstorm aggregator inherits batch validation from Part 1 infra
    - Trigger: After each acceptance, check if count >= 30
    - Behavior: Immediately transition to paper writing, skip completion review
    - WebSocket event: `brainstorm_hard_limit_reached`
+   - **TOTAL across all rounds**: When `continue_existing` resumes an incomplete brainstorm, the 30-cap applies to the TOTAL acceptance count (prior + new). The aggregator loop tracks a `resume_acceptance_base` offset so `_acceptance_count` always reflects the true total. If a topic already has >= 30 acceptances on entry, aggregation is skipped entirely and paper writing is forced immediately.
 5. **Rejection Hard Limit**: 10 consecutive rejections (with minimum 5 acceptances) FORCE transition to paper writing
    - Purpose: Prevents infinite rejection loops when brainstorm is exhausted
    - Trigger: After rejection, check if consecutive rejections >= 10 AND acceptances >= 5
@@ -1652,6 +1656,7 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 ### Paper Compilation Failure
 - Paper compilation is retried indefinitely until success or user stops - no skipping allowed
 - A completed brainstorm ALWAYS produces a paper; the system never abandons a brainstorm without writing its paper
+- If the referenced brainstorm database was deleted, clear stale Tier 2 paper-writing state and restart the normal topic exploration → reference selection → brainstorm cycle
 - Title selection retries indefinitely with rejection feedback threaded into each attempt
 
 ---
@@ -1722,6 +1727,8 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 38. **Title exploration uses standard aggregator (cleanup disabled)** — Same parallel submitters, batch validation, queue management. Cleanup/pruning is disabled because the phase is capped at 5 candidates and the temp DB is deleted afterwards.
 39. **Final title selection sees candidate titles** — The 6th selection can choose a candidate, synthesize, or propose new. Must justify divergence from all candidates.
 40. **Proof verification is an optional post-brainstorm and post-paper checkpoint** — Gated on `lean4_enabled`; silent when disabled. Lean 4 is authoritative; SMT (when `smt_enabled`) contributes hints only. See "Proof Verification Stage" section for the full invariant list.
+41. **Hard code guard: continue_existing on completed brainstorms is REJECTED** — `_execute_topic_selection` checks `metadata.status == "complete"` and returns `None`, forcing topic re-selection. LLM prompts instruct against this but the code guard is authoritative.
+42. **30-cap is TOTAL across all brainstorm rounds for a topic** — When `continue_existing` resumes an incomplete brainstorm, the aggregator loop tracks a `resume_acceptance_base` offset. `_acceptance_count` always equals `base + fresh_aggregator_count`. If the topic already has >= 30 acceptances on entry, aggregation is skipped and paper writing is forced immediately.
 
 ---
 
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index 46fdf95..096d87d 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -2,12 +2,11 @@
 Autonomous Research API Routes - REST endpoints for autonomous research mode.
 Includes Tier 1 (Brainstorm), Tier 2 (Paper Writing), and Tier 3 (Final Answer) endpoints.
 """
-import asyncio
 import logging
 from datetime import datetime
 from pathlib import Path
 from typing import Optional, Any, Dict, List
-from fastapi import APIRouter, HTTPException, BackgroundTasks
+from fastapi import APIRouter, HTTPException
 
 from backend.shared.models import AutonomousResearchStartRequest, CritiqueRequest
 from backend.shared.path_safety import (
@@ -242,7 +241,7 @@ async def _get_combined_api_logs(limit: int = 100) -> Dict[str, Any]:
 def _get_start_conflict() -> Optional[str]:
     """Return a user-facing conflict message if another workflow is active."""
     autonomous_state = autonomous_coordinator.get_state()
-    if autonomous_state.is_running:
+    if autonomous_state.is_running or autonomous_coordinator.is_active:
         return "Autonomous research is already running"
 
     if coordinator.is_running:
@@ -607,10 +606,7 @@ async def _delete_autonomous_paper_from_scope(
 
 
 @router.post("/start")
-async def start_autonomous_research(
-    request: AutonomousResearchStartRequest,
-    background_tasks: BackgroundTasks
-):
+async def start_autonomous_research(request: AutonomousResearchStartRequest):
     """Start autonomous research mode."""
     try:
         from backend.shared.config import system_config
@@ -671,8 +667,9 @@ async def start_autonomous_research(
             tier3_enabled=request.tier3_enabled
         )
         
-        # Start in background
-        background_tasks.add_task(autonomous_coordinator.start)
+        # Start in background with a retained task handle so Stop can cancel it.
+        if not autonomous_coordinator.start_in_background():
+            raise HTTPException(status_code=400, detail="Autonomous research is already running")
         
         return {
             "success": True,
@@ -694,7 +691,7 @@ async def stop_autonomous_research():
     """Stop autonomous research mode gracefully."""
     try:
         state = autonomous_coordinator.get_state()
-        if not state.is_running:
+        if not state.is_running and not autonomous_coordinator.is_active:
             return {
                 "success": True,
                 "message": "Autonomous research was not running"
@@ -1443,6 +1440,7 @@ async def save_current_compiler_paper():
         from backend.compiler.memory.outline_memory import outline_memory as compiler_outline_memory
         from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
         from backend.autonomous.memory.research_metadata import research_metadata
+        from backend.autonomous.memory.proof_database import proof_database
         
         # Get current paper from compiler memory
         current_paper = await compiler_paper_memory.get_paper()
@@ -1463,6 +1461,18 @@ async def save_current_compiler_paper():
         brainstorm_content = ""
         if topic_id:
             brainstorm_content = await brainstorm_memory.get_database_content(topic_id)
+
+            novel_source_proofs = [
+                proof
+                for proof in await proof_database.get_all_proofs(novel_only=True)
+                if proof.source_type == "brainstorm" and proof.source_id == topic_id
+            ]
+            if novel_source_proofs:
+                current_paper = paper_library.attach_verified_proofs_to_content(
+                    current_paper,
+                    novel_source_proofs,
+                    f"source brainstorm {topic_id}",
+                )
         
         # Save paper
         metadata = await paper_library.save_paper(
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index 38f51ac..6f960bf 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -96,6 +96,8 @@ def __init__(self):
         self._running = False
         self._state = AutonomousResearchState()
         self._stop_event = asyncio.Event()
+        self._main_task: Optional[asyncio.Task] = None
+        self._stop_broadcast_sent = False
         
         # Configuration (set during initialize)
         self._user_research_prompt: str = ""
@@ -150,6 +152,7 @@ def __init__(self):
         self._last_completion_review_at: int = 0  # Acceptance count at last completion review
         self._manual_paper_writing_triggered: bool = False
         self._resume_paper_phase: Optional[str] = None  # Saved phase for resume (body/conclusion/intro/abstract)
+        self._brainstorm_missing_during_paper: bool = False
         
         # Brainstorm multi-paper continuation tracking
         self._brainstorm_paper_count: int = 0  # Papers written from current brainstorm (max 3)
@@ -1019,33 +1022,52 @@ async def _check_for_incomplete_papers(self) -> None:
         
         In this case, we set up the resume state to continue writing the incomplete paper.
         """
-        incomplete_paper = await paper_library.get_most_recent_incomplete_paper()
-        
-        if incomplete_paper:
+        while True:
+            incomplete_paper = await paper_library.get_most_recent_incomplete_paper()
+            if not incomplete_paper:
+                return
+
             logger.info(f"Found incomplete paper: {incomplete_paper.paper_id} "
                        f"(title: {incomplete_paper.title}, "
                        f"from brainstorm: {incomplete_paper.source_brainstorm_ids})")
-            
+
+            topic_id = incomplete_paper.source_brainstorm_ids[0] if incomplete_paper.source_brainstorm_ids else None
+            if not topic_id:
+                await self._delete_stale_incomplete_paper(
+                    incomplete_paper.paper_id,
+                    topic_id,
+                    "missing source brainstorm id for incomplete paper resume"
+                )
+                continue
+
+            metadata = await brainstorm_memory.get_metadata(topic_id)
+            brainstorm_db_path = brainstorm_memory.get_database_path(topic_id)
+            if metadata is None or not os.path.exists(brainstorm_db_path):
+                await self._delete_stale_incomplete_paper(
+                    incomplete_paper.paper_id,
+                    topic_id,
+                    f"source brainstorm not found at {brainstorm_db_path}"
+                )
+                continue
+
             # Set up resume state for the incomplete paper
             self._current_paper_id = incomplete_paper.paper_id
             self._current_paper_title = incomplete_paper.title
-            
-            # Get source brainstorm (use first one if multiple)
-            if incomplete_paper.source_brainstorm_ids:
-                self._current_topic_id = incomplete_paper.source_brainstorm_ids[0]
-            
+            self._current_topic_id = topic_id
+
             # Restore reference papers
             self._current_reference_papers = incomplete_paper.referenced_papers or []
-            
+
             # Detect which phase the paper needs to resume from based on content
             paper_content = await self._get_paper_content_for_resume(incomplete_paper.paper_id)
             self._resume_paper_phase = self._detect_paper_phase(paper_content)
-            
+
             logger.info(f"Will resume incomplete paper {incomplete_paper.paper_id} "
                        f"from phase: {self._resume_paper_phase}")
-            
+
             # Save workflow state so the resume logic kicks in
             await self._save_workflow_state(tier="tier2_paper_writing", phase=self._resume_paper_phase)
+            return
     
     async def _get_paper_content_for_resume(self, paper_id: str) -> str:
         """Get paper content for detecting resume phase."""
@@ -1202,6 +1224,84 @@ async def _load_saved_paper_to_compiler(self, paper_id: str) -> None:
         except Exception as e:
             logger.error(f"Failed to load saved paper {paper_id} to compiler: {e}")
 
+    async def _delete_stale_incomplete_paper(
+        self,
+        paper_id: Optional[str],
+        topic_id: Optional[str],
+        reason: str
+    ) -> None:
+        """Delete an orphaned incomplete paper so it cannot be resurrected on restart."""
+        if not paper_id:
+            return
+
+        logger.warning(
+            f"Deleting stale incomplete paper {paper_id} for brainstorm {topic_id}: {reason}"
+        )
+
+        paper_metadata = await paper_library.get_metadata(paper_id)
+        if paper_metadata and paper_metadata.status == "complete":
+            logger.warning(
+                f"Skipping stale-paper deletion for {paper_id}: paper is already complete"
+            )
+            return
+
+        await paper_library.delete_paper(paper_id)
+        await research_metadata.delete_paper(paper_id)
+        if topic_id:
+            await brainstorm_memory.remove_paper_reference(topic_id, paper_id)
+
+    async def _clear_stale_paper_writing_state(
+        self,
+        topic_id: Optional[str],
+        reason: str,
+        paper_id: Optional[str] = None,
+        mark_missing: bool = True
+    ) -> None:
+        """Clear a paper-writing resume point when its source brainstorm no longer exists.
+
+        IMPORTANT: We save (not delete) the workflow state so that the session remains
+        visible to find_interrupted_session(). The session finder requires a
+        workflow_state.json with a current_tier + papers_completed_count to detect
+        the session as resumable. Deleting the file hides the session.
+        """
+        logger.warning(
+            f"Clearing stale paper-writing state for brainstorm {topic_id}: {reason}"
+        )
+        stale_paper_id = paper_id if paper_id is not None else self._current_paper_id
+        await self._delete_stale_incomplete_paper(stale_paper_id, topic_id, reason)
+        self._current_topic_id = None
+        self._current_paper_id = None
+        self._current_paper_title = None
+        self._current_reference_papers = []
+        self._resume_paper_phase = None
+        self._brainstorm_paper_count = 0
+        self._current_brainstorm_paper_ids = []
+        self._last_completed_paper_id = None
+        self._brainstorm_missing_during_paper = mark_missing
+        # Save workflow state at tier1 with no topic/paper so the session stays
+        # discoverable for resume while the stale Tier 2 pointer is gone.
+        await self._save_workflow_state(tier="tier1_aggregation")
+
+    async def _current_brainstorm_available_for_paper(self) -> bool:
+        """Return False and clear paper-writing state if the current brainstorm was deleted."""
+        if not self._current_topic_id:
+            await self._clear_stale_paper_writing_state(
+                self._current_topic_id,
+                "no current brainstorm id is set"
+            )
+            return False
+
+        metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
+        brainstorm_db_path = brainstorm_memory.get_database_path(self._current_topic_id)
+        if metadata is None or not os.path.exists(brainstorm_db_path):
+            await self._clear_stale_paper_writing_state(
+                self._current_topic_id,
+                f"brainstorm database not found at {brainstorm_db_path}"
+            )
+            return False
+
+        return True
+
     async def _preserve_failed_paper_state(self, paper_id: str, paper_title: str) -> None:
         """
         Preserve in-progress paper state after a compiler failure so retries resume.
@@ -1295,6 +1395,52 @@ async def _save_workflow_state(self, tier: str = None, phase: str = None) -> Non
         }
         await research_metadata.save_workflow_state(state)
     
+    @property
+    def is_active(self) -> bool:
+        """Return True when autonomous research is running or its task is still alive."""
+        return (
+            self._running
+            or self._state.is_running
+            or (self._main_task is not None and not self._main_task.done())
+        )
+
+    def start_in_background(self) -> bool:
+        """Launch the autonomous loop and retain a task handle for cancellation."""
+        if self._main_task and not self._main_task.done():
+            logger.warning("AutonomousCoordinator task already running")
+            return False
+
+        self._main_task = asyncio.create_task(self.start())
+        self._main_task.add_done_callback(self._on_main_task_done)
+        return True
+
+    def _on_main_task_done(self, task: asyncio.Task) -> None:
+        """Log background task failures and clear the retained task handle."""
+        try:
+            if task.cancelled():
+                logger.info("AutonomousCoordinator background task cancelled")
+            else:
+                exc = task.exception()
+                if exc:
+                    logger.error(
+                        "AutonomousCoordinator background task failed",
+                        exc_info=(type(exc), exc, exc.__traceback__)
+                    )
+        finally:
+            if self._main_task is task:
+                self._main_task = None
+
+    async def _broadcast_stopped_once(self) -> None:
+        """Notify clients once that autonomous research is stopped."""
+        if self._stop_broadcast_sent:
+            return
+
+        self._stop_broadcast_sent = True
+        stats = await research_metadata.get_stats()
+        await self._broadcast("auto_research_stopped", {
+            "final_stats": stats
+        })
+
     async def start(self) -> None:
         """Start the autonomous research loop."""
         if self._running:
@@ -1304,6 +1450,7 @@ async def start(self) -> None:
         self._running = True
         self._stop_event.clear()
         self._state.is_running = True
+        self._stop_broadcast_sent = False
         
         # Reset free model manager state for fresh start
         free_model_manager.reset()
@@ -1378,6 +1525,20 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                         resume_tier = "tier3_final_answer"
                     
                     if resume_tier == "tier2_paper_writing" and resume_topic:
+                        # If the user deleted the brainstorm while a paper was paused,
+                        # the saved paper-writing resume point is no longer valid.
+                        metadata = await brainstorm_memory.get_metadata(resume_topic)
+                        brainstorm_db_path = brainstorm_memory.get_database_path(resume_topic)
+                        if metadata is None or not os.path.exists(brainstorm_db_path):
+                            await self._clear_stale_paper_writing_state(
+                                resume_topic,
+                                "saved Tier 2 resume references a deleted brainstorm",
+                                paper_id=resume_paper,
+                                mark_missing=False
+                            )
+                            resume_state = None
+                            continue
+
                         # Resume paper writing - skip to compilation
                         # CRITICAL: Restore paper_id so compilation workflow knows to resume
                         self._current_topic_id = resume_topic
@@ -1398,6 +1559,12 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                 emit_resume_event=(_resume_paper_attempt == 1)
                             ):
                                 break
+                            if self._brainstorm_missing_during_paper:
+                                break
+
+                        if self._brainstorm_missing_during_paper:
+                            self._brainstorm_missing_during_paper = False
+                            continue
 
                         if not self._stop_event.is_set():
                             self._brainstorm_paper_count += 1
@@ -1419,9 +1586,11 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                 next_ok = False
                                 while not self._stop_event.is_set():
                                     next_ok = await self._paper_compilation_workflow(skip_reference_selection=True)
-                                    if next_ok or self._stop_event.is_set():
+                                    if next_ok or self._stop_event.is_set() or self._brainstorm_missing_during_paper:
                                         break
                                     await asyncio.sleep(5)
+                                if self._brainstorm_missing_during_paper:
+                                    break
                                 if not next_ok or self._stop_event.is_set():
                                     break
                                 self._brainstorm_paper_count += 1
@@ -1429,6 +1598,10 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                     self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
                                 await self._check_paper_redundancy()
                             
+                            if self._brainstorm_missing_during_paper:
+                                self._brainstorm_missing_during_paper = False
+                                continue
+
                             self._brainstorm_paper_count = 0
                             self._current_brainstorm_paper_ids = []
                             self._last_completed_paper_id = None
@@ -1467,10 +1640,16 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                             while not self._stop_event.is_set():
                                 if await self._paper_compilation_workflow():
                                     break
+                                if self._brainstorm_missing_during_paper:
+                                    break
                                 await asyncio.sleep(5)
                             
                             if self._stop_event.is_set():
                                 break
+
+                            if self._brainstorm_missing_during_paper:
+                                self._brainstorm_missing_during_paper = False
+                                continue
                             
                             self._brainstorm_paper_count += 1
                             if self._last_completed_paper_id:
@@ -1489,9 +1668,11 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                 next_ok = False
                                 while not self._stop_event.is_set():
                                     next_ok = await self._paper_compilation_workflow(skip_reference_selection=True)
-                                    if next_ok or self._stop_event.is_set():
+                                    if next_ok or self._stop_event.is_set() or self._brainstorm_missing_during_paper:
                                         break
                                     await asyncio.sleep(5)
+                                if self._brainstorm_missing_during_paper:
+                                    break
                                 if not next_ok or self._stop_event.is_set():
                                     break
                                 self._brainstorm_paper_count += 1
@@ -1499,6 +1680,10 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                     self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
                                 await self._check_paper_redundancy()
                             
+                            if self._brainstorm_missing_during_paper:
+                                self._brainstorm_missing_during_paper = False
+                                continue
+
                             self._brainstorm_paper_count = 0
                             self._current_brainstorm_paper_ids = []
                             self._last_completed_paper_id = None
@@ -1512,7 +1697,8 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                         metadata = await brainstorm_memory.get_metadata(resume_topic)
                         if metadata is None:
                             logger.warning(f"Resume state references missing brainstorm {resume_topic}; clearing resume state")
-                            await research_metadata.clear_workflow_state()
+                            self._current_topic_id = None
+                            await self._save_workflow_state(tier="tier1_aggregation")
                             resume_state = None
                             continue
                         
@@ -1535,10 +1721,16 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                     await asyncio.sleep(5)
                                 if await self._paper_compilation_workflow():
                                     break
+                                if self._brainstorm_missing_during_paper:
+                                    break
 
                             if self._stop_event.is_set():
                                 break
 
+                            if self._brainstorm_missing_during_paper:
+                                self._brainstorm_missing_during_paper = False
+                                continue
+
                             self._brainstorm_paper_count += 1
                             if self._last_completed_paper_id:
                                 self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
@@ -1558,9 +1750,11 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                 next_ok = False
                                 while not self._stop_event.is_set():
                                     next_ok = await self._paper_compilation_workflow(skip_reference_selection=True)
-                                    if next_ok or self._stop_event.is_set():
+                                    if next_ok or self._stop_event.is_set() or self._brainstorm_missing_during_paper:
                                         break
                                     await asyncio.sleep(5)
+                                if self._brainstorm_missing_during_paper:
+                                    break
                                 if not next_ok or self._stop_event.is_set():
                                     break
                                 self._brainstorm_paper_count += 1
@@ -1568,6 +1762,10 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                                     self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
                                 await self._check_paper_redundancy()
                             
+                            if self._brainstorm_missing_during_paper:
+                                self._brainstorm_missing_during_paper = False
+                                continue
+
                             self._brainstorm_paper_count = 0
                             self._current_brainstorm_paper_ids = []
                             self._last_completed_paper_id = None
@@ -1706,12 +1904,16 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
 
                     paper_success = await self._paper_compilation_workflow()
 
-                    if paper_success or self._stop_event.is_set():
+                    if paper_success or self._stop_event.is_set() or self._brainstorm_missing_during_paper:
                         break
 
                 if self._stop_event.is_set():
                     break
 
+                if self._brainstorm_missing_during_paper:
+                    self._brainstorm_missing_during_paper = False
+                    continue
+
                 # Only check redundancy and log completion if paper was successful
                 if paper_success:
                     self._brainstorm_paper_count += 1
@@ -1741,9 +1943,12 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                             next_paper_success = await self._paper_compilation_workflow(
                                 skip_reference_selection=True
                             )
-                            if next_paper_success or self._stop_event.is_set():
+                            if next_paper_success or self._stop_event.is_set() or self._brainstorm_missing_during_paper:
                                 break
                         
+                        if self._brainstorm_missing_during_paper:
+                            break
+
                         if not next_paper_success or self._stop_event.is_set():
                             break
                         
@@ -1752,6 +1957,10 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                             self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
                         await self._check_paper_redundancy()
                     
+                    if self._brainstorm_missing_during_paper:
+                        self._brainstorm_missing_during_paper = False
+                        continue
+
                     if self._brainstorm_paper_count >= 3:
                         logger.info("Brainstorm paper limit reached (3/3)")
                         await self._broadcast("brainstorm_paper_limit_reached", {
@@ -1799,11 +2008,7 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
             self._running = False
             self._state.is_running = False
             token_tracker.stop_timer()
-            
-            stats = await research_metadata.get_stats()
-            await self._broadcast("auto_research_stopped", {
-                "final_stats": stats
-            })
+            await self._broadcast_stopped_once()
             logger.info("AutonomousCoordinator stopped")
     
     async def _get_resume_point(self) -> Optional[Dict[str, Any]]:
@@ -1822,19 +2027,37 @@ async def stop(self) -> None:
         logger.info("Stopping AutonomousCoordinator...")
         self._stop_event.set()
         self._running = False
+        self._state.is_running = False
+        await self._broadcast_stopped_once()
+
+        async def _run_shutdown_step(label: str, awaitable, timeout: float = 5.0) -> bool:  # True = finished within timeout, False = timed out
+            task = asyncio.create_task(awaitable)  # own task so the wait below can be bounded
+            done, _ = await asyncio.wait({task}, timeout=timeout)
+            if task in done:
+                await task  # already finished; re-raises the step's exception, if any, to the caller
+                return True
+            # Timed out: request cancellation and keep going instead of blocking shutdown.
+            task.cancel()
+            task.add_done_callback(  # once the task ends, read its exception unless it was cancelled
+                lambda done_task: None
+                if done_task.cancelled()
+                else done_task.exception()
+            )
+            logger.warning("Timed out stopping %s; continuing shutdown", label)
+            return False
         
         # Stop any running aggregator or compiler to prevent orphan tasks
         if self._brainstorm_aggregator:
             try:
-                await self._brainstorm_aggregator.stop()
-                logger.info("Stopped brainstorm aggregator")
+                if await _run_shutdown_step("brainstorm aggregator", self._brainstorm_aggregator.stop()):
+                    logger.info("Stopped brainstorm aggregator")
             except Exception as e:
                 logger.warning(f"Error stopping aggregator: {e}")
         
         if self._paper_compiler:
             try:
-                await self._paper_compiler.stop()
-                logger.info("Stopped paper compiler")
+                if await _run_shutdown_step("paper compiler", self._paper_compiler.stop()):
+                    logger.info("Stopped paper compiler")
             except Exception as e:
                 logger.warning(f"Error stopping compiler: {e}")
         
@@ -1857,6 +2080,13 @@ async def stop(self) -> None:
             logger.info(f"Workflow state saved for resume (tier={current_tier}, topic={self._current_topic_id})")
         except Exception as e:
             logger.warning(f"Could not save workflow state on stop: {e}")
+
+        main_task = self._main_task
+        if main_task and not main_task.done() and main_task is not asyncio.current_task():
+            main_task.cancel()
+            done, _ = await asyncio.wait({main_task}, timeout=5)
+            if main_task not in done:
+                logger.warning("AutonomousCoordinator background task is still cancelling")
         
         logger.info("Autonomous research stopped - press Start to resume from last state")
     
@@ -2077,12 +2307,16 @@ async def _resume_research_loop_after_tier3(self) -> None:
 
                     paper_success = await self._paper_compilation_workflow()
 
-                    if paper_success or self._stop_event.is_set():
+                    if paper_success or self._stop_event.is_set() or self._brainstorm_missing_during_paper:
                         break
 
                 if self._stop_event.is_set():
                     break
 
+                if self._brainstorm_missing_during_paper:
+                    self._brainstorm_missing_during_paper = False
+                    continue
+
                 # Only check redundancy and log completion if paper was successful
                 if paper_success:
                     self._brainstorm_paper_count += 1
@@ -2112,9 +2346,12 @@ async def _resume_research_loop_after_tier3(self) -> None:
                             next_paper_success = await self._paper_compilation_workflow(
                                 skip_reference_selection=True
                             )
-                            if next_paper_success or self._stop_event.is_set():
+                            if next_paper_success or self._stop_event.is_set() or self._brainstorm_missing_during_paper:
                                 break
                         
+                        if self._brainstorm_missing_during_paper:
+                            break
+
                         if not next_paper_success or self._stop_event.is_set():
                             break
                         
@@ -2123,6 +2360,10 @@ async def _resume_research_loop_after_tier3(self) -> None:
                             self._current_brainstorm_paper_ids.append(self._last_completed_paper_id)
                         await self._check_paper_redundancy()
                     
+                    if self._brainstorm_missing_during_paper:
+                        self._brainstorm_missing_during_paper = False
+                        continue
+
                     if self._brainstorm_paper_count >= 3:
                         logger.info("Brainstorm paper limit reached (3/3)")
                         await self._broadcast("brainstorm_paper_limit_reached", {
@@ -2523,6 +2764,21 @@ async def _execute_topic_selection(
                     logger.error(f"Brainstorm not found: {topic_id}")
                     return None
                 
+                # HARD GUARD: Completed brainstorms cannot be re-opened.
+                # The spec says continue_existing is for INCOMPLETE brainstorms only.
+                # LLMs sometimes ignore the "complete" status in the prompt context.
+                if metadata.status == "complete":
+                    logger.warning(
+                        f"Rejected continue_existing for {topic_id}: brainstorm is already complete "
+                        f"({metadata.submission_count} submissions, papers: {metadata.papers_generated}). "
+                        f"Forcing re-selection."
+                    )
+                    await self._broadcast("topic_selection_rejected", {
+                        "reasoning": f"Cannot continue brainstorm {topic_id} — it is already marked complete. "
+                                     f"Select a new topic or continue an incomplete brainstorm."
+                    })
+                    return None
+                
                 self._current_topic_id = topic_id
                 self._acceptance_count = metadata.submission_count
                 self._consecutive_rejections = 0
@@ -2948,17 +3204,26 @@ async def paper_model_tracking_callback(model_id: str) -> None:
             last_acceptances = status.total_acceptances  # Should be 0 for new brainstorm
             last_rejections = status.total_rejections  # Track rejections for stat increments
             
+            # Base offset for continue_existing: fresh aggregator counts from 0 but topic
+            # already has prior submissions.  The 30-cap must apply to the TOTAL across
+            # all rounds, so we track the offset and add it to every aggregator reading.
+            resume_acceptance_base = 0
+            
             # CRITICAL BUG FIX: Don't reset counters if resuming from workflow state
             # Check if counters were already restored (non-zero means we're resuming)
             is_resuming = self._acceptance_count > 0 or self._rejection_count > 0
             
             if is_resuming:
-                # Resuming: Use the restored counters from workflow state, don't reset
-                logger.info(f"Resuming brainstorm with {self._acceptance_count} acceptances, "
+                # Resuming / continue_existing: The aggregator starts at 0 but the topic
+                # already has self._acceptance_count prior acceptances.  We store that as
+                # the base so every comparison uses total = base + aggregator_count.
+                resume_acceptance_base = self._acceptance_count
+                logger.info(f"Resuming brainstorm with {self._acceptance_count} prior acceptances "
+                           f"(base offset={resume_acceptance_base}), "
                            f"{self._rejection_count} rejections from workflow state")
-                # Set last_* to current values so we can track NEW acceptances/rejections from here
-                last_acceptances = self._acceptance_count
-                last_rejections = self._rejection_count
+                # Reset last_* to 0 so we track the fresh aggregator's output correctly
+                last_acceptances = 0
+                last_rejections = 0
             else:
                 # Fresh brainstorm: Initialize counters from aggregator stats (should be 0)
                 self._acceptance_count = last_acceptances
@@ -2969,6 +3234,20 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                 self._last_completion_review_at = 0  # Reset completion review checkpoint
                 logger.info(f"Starting fresh brainstorm with {last_acceptances} acceptances")
             
+            # Safety check: if topic already at or past hard cap (e.g. resume of
+            # already-complete brainstorm that slipped past the code guard), skip
+            # aggregation entirely and go straight to paper writing.
+            if self._acceptance_count >= 30:
+                logger.info(
+                    f"Topic {self._current_topic_id} already at {self._acceptance_count} "
+                    f"acceptances (>= 30 cap). Skipping aggregation, forcing paper writing."
+                )
+                await brainstorm_memory.mark_complete(self._current_topic_id)
+                await research_metadata.mark_brainstorm_complete(self._current_topic_id)
+                await self._brainstorm_aggregator.stop()
+                await self._run_brainstorm_completion_proofs()
+                return True
+            
             while self._running and not self._stop_event.is_set():
                 # Get current aggregator stats
                 status = await self._brainstorm_aggregator.get_status()
@@ -2988,7 +3267,7 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                 # Track new acceptances/rejections
                 if current_acceptances > last_acceptances:
                     new_acceptances = current_acceptances - last_acceptances
-                    self._acceptance_count = current_acceptances
+                    self._acceptance_count = resume_acceptance_base + current_acceptances
                     self._consecutive_rejections = 0
                     last_acceptances = current_acceptances
                     
@@ -3469,6 +3748,10 @@ async def _paper_compilation_workflow(
         api_client_manager.set_autonomous_phase("paper_compilation")
         
         logger.info(f"Starting paper compilation for brainstorm {self._current_topic_id}")
+
+        if not await self._current_brainstorm_available_for_paper():
+            logger.info("Paper compilation skipped because the source brainstorm is unavailable")
+            return False
         
         # Check if we're resuming an in-progress paper
         # This flag tracks whether we're resuming (for passing to _compile_paper)
@@ -3588,6 +3871,9 @@ async def _paper_compilation_workflow(
         
         if paper_content is None:
             logger.error("Paper compilation failed")
+            if self._brainstorm_missing_during_paper:
+                logger.info("Not preserving failed paper state because the source brainstorm was deleted")
+                return False
             await self._preserve_failed_paper_state(paper_id, paper_title)
             return False
 
@@ -4097,6 +4383,16 @@ async def _compile_paper(
                     logger.warning("Brainstorm database was empty after proof stripping")
             else:
                 logger.warning(f"Brainstorm database not found: {brainstorm_db_path}")
+                logger.error("Aborting paper compilation: brainstorm database is required")
+                try:
+                    await self._paper_compiler.stop()
+                except Exception as stop_exc:
+                    logger.warning(f"Failed to stop compiler after missing brainstorm abort: {stop_exc}")
+                await self._clear_stale_paper_writing_state(
+                    self._current_topic_id,
+                    f"brainstorm database not found at {brainstorm_db_path}"
+                )
+                return None
             
             # Load reference papers into compiler RAG (if any)
             if reference_paper_ids:
@@ -4313,6 +4609,32 @@ async def _handle_paper_completion(
                 final_content = final_content + "\n" + model_credits
             
             logger.info("Added author attribution and model credits to paper")
+
+        if mark_complete and self._current_topic_id:
+            try:
+                novel_source_proofs = [
+                    proof
+                    for proof in await proof_database.get_all_proofs(novel_only=True)
+                    if proof.source_type == "brainstorm"
+                    and proof.source_id == self._current_topic_id
+                ]
+                if novel_source_proofs:
+                    final_content = paper_library.attach_verified_proofs_to_content(
+                        final_content,
+                        novel_source_proofs,
+                        f"source brainstorm {self._current_topic_id}",
+                    )
+                    logger.info(
+                        "Attached %s novel source-brainstorm proof(s) to paper %s",
+                        len(novel_source_proofs),
+                        paper_id,
+                    )
+            except Exception as exc:
+                logger.warning(
+                    "Failed to attach source-brainstorm proofs to paper %s: %s",
+                    paper_id,
+                    exc,
+                )
         
         # Save paper with appropriate status
         paper_metadata = await paper_library.save_paper(
diff --git a/backend/autonomous/core/proof_novelty.py b/backend/autonomous/core/proof_novelty.py
index c4ee9e9..573d538 100644
--- a/backend/autonomous/core/proof_novelty.py
+++ b/backend/autonomous/core/proof_novelty.py
@@ -20,6 +20,11 @@
 logger = logging.getLogger(__name__)
 
 
+VALID_NOVELTY_TIERS = frozenset(  # tier strings accepted from the novelty validator
+    {"not_novel", "novel_formulation", "novel_variant", "mathematical_discovery"}
+)
+
+
 async def assess_proof_novelty(
     *,
     user_prompt: str,
@@ -31,8 +36,8 @@ async def assess_proof_novelty(
     existing_novel_proofs: str,
     task_id: str,
     role_id: str = "autonomous_proof_novelty",
-) -> Tuple[bool, str]:
-    """Classify a Lean-4-verified theorem as novel or known.
+) -> Tuple[str, str]:
+    """Classify a Lean-4-verified theorem into one of four novelty tiers.
 
     Args:
         user_prompt: Top-level research prompt for context.
@@ -49,8 +54,10 @@ async def assess_proof_novelty(
             compiler-specific role for correct logging.
 
     Returns:
-        Tuple of (is_novel, reasoning). Falls back to (False, <message>) when
-        the novelty validator returns no usable response.
+        Tuple of (novelty_tier, reasoning) where novelty_tier is one of:
+        "not_novel", "novel_formulation", "novel_variant", "mathematical_discovery".
+        Falls back to ("not_novel", <message>) when the validator returns no
+        usable response or an unrecognised tier string.
     """
     prompt = build_proof_novelty_prompt(
         user_prompt=user_prompt,
@@ -80,20 +87,27 @@ async def assess_proof_novelty(
         temperature=0.0,
     )
     if not response or not response.get("choices"):
-        return False, "Novelty validator returned no response."
+        return "not_novel", "Novelty validator returned no response."
 
     message = response["choices"][0].get("message", {})
     content = message.get("content") or message.get("reasoning") or ""
     if not content:
-        return False, "Novelty validator returned empty content."
+        return "not_novel", "Novelty validator returned empty content."
 
     try:
         data = parse_json(content)
     except Exception as exc:
         logger.warning("Novelty validator JSON parse failed: %s", exc)
-        return False, f"Novelty validator JSON parse error: {exc}"
+        return "not_novel", f"Novelty validator JSON parse error: {exc}"
 
     if isinstance(data, list):
         data = data[0] if data else {}
 
-    return bool(data.get("is_novel", False)), str(data.get("reasoning", "")).strip()
+    raw_tier = str(data.get("novelty_tier", "not_novel")).strip().lower()
+    if raw_tier not in VALID_NOVELTY_TIERS:
+        logger.warning(
+            "Novelty validator returned unrecognised tier %r; falling back to not_novel", raw_tier
+        )
+        raw_tier = "not_novel"
+
+    return raw_tier, str(data.get("reasoning", "")).strip()
diff --git a/backend/autonomous/core/proof_verification_stage.py b/backend/autonomous/core/proof_verification_stage.py
index 58251a0..9975b52 100644
--- a/backend/autonomous/core/proof_verification_stage.py
+++ b/backend/autonomous/core/proof_verification_stage.py
@@ -314,7 +314,7 @@ async def _assess_novelty(
         validator_context: int,
         validator_max_tokens: int,
         existing_novel_proofs: str,
-    ) -> tuple[bool, str]:
+    ) -> tuple[str, str]:
         from .proof_novelty import assess_proof_novelty
 
         task_id = f"proof_novelty_{self._novelty_task_sequence:03d}"
@@ -616,7 +616,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
 
                     result.verified_count += 1
                     existing_novel_proofs = novel_proofs_db.get_novel_proofs_for_injection()
-                    is_novel, novelty_reasoning = await self._assess_novelty(
+                    novelty_tier, novelty_reasoning = await self._assess_novelty(
                         user_prompt=user_prompt,
                         theorem_statement=candidate.statement,
                         lean_code=lean_code,
@@ -625,6 +625,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                         validator_max_tokens=validator_max_tokens,
                         existing_novel_proofs=existing_novel_proofs,
                     )
+                    is_novel = novelty_tier != "not_novel"
 
                     solver_hints = []
                     if self._first_attempt_used_smt_hint(attempts, candidate.smt_hint):
@@ -642,6 +643,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                         solver="Lean 4",
                         lean_code=lean_code,
                         novel=is_novel,
+                        novelty_tier=novelty_tier,
                         novelty_reasoning=novelty_reasoning,
                         verification_notes="Lean 4 accepted the submitted proof.",
                         attempt_count=len(attempts),
@@ -713,7 +715,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                         # into all prompts via inject_into_prompt().
                         if source_type == "brainstorm":
                             await brainstorm_memory.append_proofs_section(source_id, stored_record)
-                        elif ":" not in source_id:
+                        elif source_type == "paper":
                             await paper_library.append_proofs_section(source_id, stored_record)
                         await self._broadcast(
                             broadcast_fn,
@@ -723,6 +725,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                                 "proof_id": stored_record.proof_id,
                                 "theorem_statement": stored_record.theorem_statement,
                                 "solver": "Lean 4",
+                                "novelty_tier": novelty_tier,
                                 "retry_origin_source_id": candidate.origin_source_id,
                             },
                         )
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index f38ccc3..415d752 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -202,6 +202,132 @@ def _calculate_critique_average(critique: Any) -> Optional[float]:
             1
         )
 
+    @staticmethod
+    def _proof_value(proof: Any, field: str, default: Any = "") -> Any:
+        """Look up ``field`` on a proof that is either a plain dict or an attribute-style record."""
+        if not isinstance(proof, dict):
+            return getattr(proof, field, default)
+        return proof.get(field, default)
+
+    @classmethod
+    def _format_verified_proof_entry(cls, proof: Any, source_context: str = "") -> str:
+        """Render a single Lean 4 verified proof as a plain-text appendix entry.
+
+        A non-empty ``source_context`` is appended to the status line as
+        "; carried in from <source_context>". The source line is omitted when
+        the proof has neither a source type nor a source id.
+        """
+
+        def text(field: str) -> str:
+            # Missing or falsy values collapse to "" before trimming.
+            return str(cls._proof_value(proof, field, "") or "").strip()
+
+        proof_id = text("proof_id")
+        theorem_name = text("theorem_name")
+        is_novel = bool(cls._proof_value(proof, "novel", False))
+
+        # Known tiers get a display name; anything else falls back to the boolean flag.
+        label_by_tier = {
+            "mathematical_discovery": "Mathematical Discovery",
+            "novel_variant": "Novel Reformulation",
+            "novel_formulation": "Novel Formalization",
+        }
+        novelty_label = label_by_tier.get(text("novelty_tier"), "Novel" if is_novel else "Known")
+        carried_from = f"; carried in from {source_context}" if source_context else ""
+
+        entry = [
+            f"Theorem ({proof_id or 'N/A'}) [{novelty_label}] - "
+            f"{theorem_name or proof_id or 'Lean 4 verified theorem'}",
+            f"Status: verified by Lean 4{carried_from}",
+        ]
+        origin = f"Source: {text('source_type')} {text('source_id')}".strip()
+        if origin != "Source:":
+            entry.append(origin)
+        entry += [f"Statement: {text('theorem_statement')}", "Lean 4 proof:"]
+        entry += [text("lean_code") or "[lean code unavailable]", "---"]
+        return "\n".join(entry)
+
+    @classmethod
+    def attach_verified_proofs_to_content(
+        cls,
+        content: str,
+        proofs_data: Any,
+        source_context: str = "",
+    ) -> str:
+        """Attach Lean-verified proof entries to a paper's existing appendix.
+
+        Uses the compiler-managed Theorems Appendix when its markers are present,
+        otherwise a plain-text proof section at the end of the file. A proof is
+        skipped when its ID is already in the content (whole token) or the batch.
+        """
+        existing_content = content or ""
+        proofs = proofs_data if isinstance(proofs_data, list) else [proofs_data]
+
+        entries: List[str] = []
+        seen_ids: set = set()
+        for proof in proofs:
+            proof_id = str(cls._proof_value(proof, "proof_id", "") or "").strip()
+            # Whole-token match: "proof_1" must not count as present because of "proof_10".
+            id_pattern = rf"(?<![A-Za-z0-9_]){re.escape(proof_id)}(?![A-Za-z0-9_])"
+            if proof_id and (proof_id in seen_ids or re.search(id_pattern, existing_content)):
+                continue
+            seen_ids.add(proof_id)
+            entries.append(cls._format_verified_proof_entry(proof, source_context))
+
+        if not entries:
+            return existing_content
+
+        new_entries = "\n\n".join(entries).strip()
+        appendix_start = "[HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]"
+        appendix_end = "[HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]"
+        empty_placeholder = "[Theorems appendix - verified Lean 4 theorems not placed inline will appear here]"
+
+        start_idx = existing_content.find(appendix_start)
+        end_idx = existing_content.find(appendix_end, start_idx if start_idx >= 0 else 0)
+        if start_idx >= 0 and end_idx >= 0:
+            before = existing_content[:start_idx]
+            after = existing_content[end_idx + len(appendix_end):]
+            appendix_body = existing_content[start_idx + len(appendix_start):end_idx]
+            cleaned_body = appendix_body.replace(empty_placeholder, "").strip()
+            combined_body = f"{cleaned_body}\n\n{new_entries}".strip()
+            appendix_block = f"{appendix_start}\n{combined_body}\n{appendix_end}"
+            return before + appendix_block + after
+
+        fallback_header = "=== PROOFS ATTACHED TO THIS PAPER (Lean 4 Verified) ==="
+        if fallback_header in existing_content:
+            return existing_content.rstrip() + "\n\n" + new_entries + "\n"
+        return existing_content.rstrip() + "\n\n" + fallback_header + "\n\n" + new_entries + "\n"
+
+    @staticmethod
+    def strip_verified_proofs_from_content(content: str) -> str:
+        """Return paper text with Lean proof sections removed (for RAG/compiler use).
+
+        The marker-delimited theorems appendix is reset to its empty placeholder,
+        and the text is cut at the earliest plain-text proofs header found past
+        index 0. Trailing whitespace is trimmed.
+        """
+        if not content:
+            return ""
+
+        open_marker = "[HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]"
+        close_marker = "[HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]"
+        placeholder = "[Theorems appendix - verified Lean 4 theorems not placed inline will appear here]"
+
+        text = content
+        open_at = text.find(open_marker)
+        close_at = text.find(close_marker, max(open_at, 0))
+        if open_at >= 0 and close_at >= 0:
+            tail = text[close_at + len(close_marker):]
+            text = f"{text[:open_at]}{open_marker}\n{placeholder}\n{close_marker}{tail}"
+
+        cut_points = []
+        for header in ("=== PROOFS GENERATED FROM THIS PAPER", "=== PROOFS ATTACHED TO THIS PAPER"):
+            position = text.find(header)
+            if position > 0:
+                cut_points.append(position)
+        cut = min(cut_points) if cut_points else len(text)
+        return text[:cut].rstrip()
+
     async def _list_history_papers_from_directory(self, papers_dir: Path, session_id: str) -> List[Dict[str, Any]]:
         """List complete, non-archived papers from one legacy/session papers directory."""
         from backend.shared.critique_memory import get_latest_critique
@@ -586,10 +712,7 @@ async def get_paper_content(self, paper_id: str, *, strip_proofs: bool = False)
             async with aiofiles.open(paper_path, 'r', encoding='utf-8') as f:
                 content = await f.read()
             if strip_proofs and content:
-                marker = "=== PROOFS GENERATED FROM THIS PAPER"
-                idx = content.find(marker)
-                if idx > 0:
-                    content = content[:idx].rstrip()
+                content = self.strip_verified_proofs_from_content(content)
             return content
         except Exception as e:
             logger.error(f"Failed to read paper {paper_id}: {e}")
@@ -597,6 +720,15 @@ async def get_paper_content(self, paper_id: str, *, strip_proofs: bool = False)
 
     async def append_proofs_section(self, paper_id: str, proofs_data: Any) -> bool:
         """Append verified proofs to the bottom of a saved paper."""
+        if ":" in paper_id:
+            session_id, scoped_paper_id = paper_id.split(":", 1)
+            papers_dir = self.get_history_papers_dir(session_id)
+            if papers_dir is None:
+                logger.error(f"History paper directory not found for proof append: {paper_id}")
+                return False
+            scoped_library = self._build_scoped_library(papers_dir)
+            return await scoped_library.append_proofs_section(scoped_paper_id, proofs_data)
+
         async with self._lock:
             paper_path = self._get_paper_path(paper_id)
             if not paper_path.exists():
@@ -604,42 +736,22 @@ async def append_proofs_section(self, paper_id: str, proofs_data: Any) -> bool:
                 return False
 
             proofs = proofs_data if isinstance(proofs_data, list) else [proofs_data]
-            header = "=== PROOFS GENERATED FROM THIS PAPER (Lean 4 Verified) ==="
 
             try:
                 async with aiofiles.open(paper_path, "r", encoding="utf-8") as handle:
                     existing_content = await handle.read()
 
-                after_header = existing_content.split(header, 1)[1] if header in existing_content else ""
-                next_index = len(re.findall(r"(?m)^Proof \d+:", after_header)) + 1
-
-                lines: List[str] = []
-                if header not in existing_content:
-                    lines.extend(["", "", header, ""])
-                elif not existing_content.endswith("\n"):
-                    lines.append("")
-
-                for proof in proofs:
-                    theorem_statement = str(getattr(proof, "theorem_statement", "") or proof.get("theorem_statement", "")).strip()
-                    proof_id = str(getattr(proof, "proof_id", "") or proof.get("proof_id", "")).strip()
-                    novel = bool(getattr(proof, "novel", False) if hasattr(proof, "novel") else proof.get("novel", False))
-                    lean_code = str(getattr(proof, "lean_code", "") or proof.get("lean_code", "")).strip()
-                    status = "Verified (Novel)" if novel else "Verified (Known)"
-
-                    lines.extend(
-                        [
-                            f"Proof {next_index}: {theorem_statement}",
-                            f"Status: {status}",
-                            f"Proof ID: {proof_id or 'N/A'}",
-                            "Lean 4 Code:",
-                            lean_code or "[no Lean 4 code saved]",
-                            "---",
-                        ]
-                    )
-                    next_index += 1
-
-                async with aiofiles.open(paper_path, "a", encoding="utf-8") as handle:
-                    await handle.write("\n".join(lines) + "\n")
+                updated_content = self.attach_verified_proofs_to_content(
+                    existing_content,
+                    proofs,
+                    "this paper",
+                )
+                if updated_content == existing_content:
+                    logger.info("No new proof entries to append to paper %s", paper_id)
+                    return True
+
+                async with aiofiles.open(paper_path, "w", encoding="utf-8") as handle:
+                    await handle.write(updated_content)
 
                 logger.info("Appended %s proof(s) to paper %s", len(proofs), paper_id)
                 return True
diff --git a/backend/autonomous/memory/proof_database.py b/backend/autonomous/memory/proof_database.py
index 2e1e227..817a5e4 100644
--- a/backend/autonomous/memory/proof_database.py
+++ b/backend/autonomous/memory/proof_database.py
@@ -499,6 +499,7 @@ async def get_graph(self) -> Dict[str, Any]:
                 "source_title": proof.source_title,
                 "solver": proof.solver,
                 "is_novel": proof.novel,
+                "novelty_tier": proof.novelty_tier,
                 "created_at": proof.created_at.isoformat() if proof.created_at else None,
             }
             for proof in proofs
@@ -625,13 +626,20 @@ def get_novel_proofs_for_injection(self) -> str:
 
         lines = [
             "=== VERIFIED NOVEL MATHEMATICAL PROOFS (Lean 4 Verified) ===",
-            "[These proofs have been formally verified. They represent proven mathematical truths.]",
+            "[These proofs have been formally verified. They represent proven mathematical truths.",
+            "Novelty tiers: Mathematical Discovery (highest — new result), Novel Reformulation (novel reformulation of known proof), Novel Formalization (first Lean 4 formalization of known result).]",
             "",
         ]
         for index, proof in enumerate(novel_proofs, start=1):
+            tier = proof.get("novelty_tier", "")
+            tier_label = {
+                "mathematical_discovery": "Mathematical Discovery",
+                "novel_variant": "Novel Reformulation",
+                "novel_formulation": "Novel Formalization",
+            }.get(tier, "Novel")
             lines.extend(
                 [
-                    f"PROOF {index}: {proof.get('theorem_statement', '').strip()}",
+                    f"PROOF {index} [{tier_label}]: {proof.get('theorem_statement', '').strip()}",
                     f"Source: {proof.get('source_type', '')} {proof.get('source_id', '')}".strip(),
                     "Lean 4 Code:",
                     proof.get("lean_code", "").strip(),
@@ -744,6 +752,7 @@ async def _list_proofs_from_directory(
                 "source_title": proof_data.get("source_title", ""),
                 "solver": proof_data.get("solver", "Lean 4"),
                 "novel": is_novel,
+                "novelty_tier": proof_data.get("novelty_tier", "not_novel"),
                 "novelty_reasoning": proof_data.get("novelty_reasoning", ""),
                 "verification_notes": proof_data.get("verification_notes", ""),
                 "attempt_count": proof_data.get("attempt_count", 0),
diff --git a/backend/autonomous/prompts/proof_prompts.py b/backend/autonomous/prompts/proof_prompts.py
index 4726504..de9e4a7 100644
--- a/backend/autonomous/prompts/proof_prompts.py
+++ b/backend/autonomous/prompts/proof_prompts.py
@@ -522,29 +522,44 @@ def build_proof_novelty_prompt(
     lean_code: str,
     existing_novel_proofs: str,
 ) -> str:
-    """Ask the validator whether a Lean-verified theorem is novel."""
+    """Ask the validator to classify a Lean-verified theorem into one of four novelty tiers."""
     existing_proofs_block = existing_novel_proofs or "[No previously stored novel proofs.]"
     return f"""This proof has been FORMALLY VERIFIED by Lean 4. It is mathematically valid.
 
-Your ONLY task: decide whether the verified result is NOVEL in the context of this research program.
+Your ONLY task: assign a novelty tier to the verified result based on the criteria below.
 
-A proof is NOVEL if it meets ANY of these criteria:
-- It proves a result not already present in Mathlib or standard textbooks
-- It establishes a new connection, bound, or structural insight
-- It formalizes a conjecture or claim that was previously unverified
-- It is a non-trivial composition of known results yielding something new
-- It represents original work relative to the existing stored proofs below
+NOVELTY TIERS (choose exactly one):
 
-A proof is NOT novel if:
-- It is a direct restatement of a well-known Mathlib lemma or textbook theorem
-- It is a trivial identity, tautology, or definitional equality
-- It is closable by a single standard tactic (simp, omega, norm_num, decide, rfl)
-- It duplicates a result already in the stored novel proofs below
+"not_novel"
+- The result is a direct restatement of a well-known Mathlib lemma or standard textbook theorem.
+- It is a trivial identity, tautology, or definitional equality.
+- It is closable by a single standard tactic (simp, omega, norm_num, decide, rfl).
+- It duplicates a result already present in the stored proofs below.
+- Assign this tier when there is no meaningful original contribution.
+
+"novel_formulation"
+- The underlying mathematical result is historically known (it exists in textbooks or the literature).
+- However, this specific Lean 4 formalization or mechanized proof is the first of its kind for this result in the context of this research program.
+- The formalization itself required non-trivial effort, even though the mathematics is not new.
+- Assign this tier when the contribution is the act of formal verification, not a new mathematical idea.
+
+"novel_variant"
+- The proof idea is rooted in a known theorem or technique, but this proof meaningfully reformulates, restructures, or generalizes it in a non-trivial way.
+- It introduces a different proof strategy, weaker hypotheses, a stronger conclusion, or an original compositional approach that goes beyond a direct restatement.
+- The reformulation has independent mathematical interest beyond simply formalizing an existing result.
+- Assign this tier when the proof is a genuine but incremental advance on known material.
+
+"mathematical_discovery"
+- The result is a new mathematical finding: a new theorem, bound, connection, or structural insight not present in standard references or Mathlib.
+- It formalizes a previously unverified conjecture or establishes a result with independent mathematical value.
+- It constitutes a novel alternative proof of an existing result whose existence changes mathematical understanding (e.g., a constructive proof where only non-constructive proofs were known).
+- Assign this tier when the proof would be a publishable or citable contribution in its own right.
 
 Rules:
 - Do NOT re-check validity. Lean 4 already verified it.
-- When uncertain, consider the research prompt context -- a result that is textbook-standard in one field may be a novel formalization contribution in the context of this specific research program.
-- Err on the side of recognizing novelty for results that required multi-step reasoning or non-trivial formalization work.
+- Choose the single best-fitting tier. When a proof could fit multiple tiers, choose the highest applicable one.
+- Consider the research prompt context. A result textbook-standard in one field may qualify as "novel_formulation" if it is the first mechanized Lean 4 proof of that result for this research program.
+- Err toward recognizing higher tiers for results that required multi-step reasoning, non-trivial formalization work, or original proof strategy.
 
 USER RESEARCH PROMPT:
 {user_prompt}
@@ -558,5 +573,5 @@ def build_proof_novelty_prompt(
 EXISTING STORED NOVEL PROOFS:
 {existing_proofs_block}
 
-{_json_only_footer('{"is_novel": true, "reasoning": "brief explanation"}')}
+{_json_only_footer('{"novelty_tier": "mathematical_discovery", "reasoning": "brief explanation"}')}
 """
diff --git a/backend/compiler/agents/high_param_submitter.py b/backend/compiler/agents/high_param_submitter.py
index 3722798..ec03eda 100644
--- a/backend/compiler/agents/high_param_submitter.py
+++ b/backend/compiler/agents/high_param_submitter.py
@@ -85,6 +85,7 @@ def format_theorem_appendix_entry(
     lean_code: str,
     is_novel: bool,
     theorem_name: str = "",
+    novelty_tier: str = "",
     placement_outcome: str = "appendix_fallback",
 ) -> str:
     """Format a verified-theorem entry for the Theorems Appendix.
@@ -94,7 +95,12 @@ def format_theorem_appendix_entry(
     fallback). Caller selects via `placement_outcome`.
     """
     header_name = theorem_name.strip() or proof_id
-    novelty_label = "Novel" if is_novel else "Known"
+    tier_labels = {
+        "mathematical_discovery": "Mathematical Discovery",
+        "novel_variant": "Novel Reformulation",
+        "novel_formulation": "Novel Formalization",
+    }
+    novelty_label = tier_labels.get(novelty_tier, "Novel" if is_novel else "Known")
     status_suffix = {
         "appendix_fallback": "inline placement rejected; preserved here because Lean 4 verified the math",
         "inline": "also placed inline in the body",
@@ -124,6 +130,7 @@ class RigorTheoremResult:
     theorem_name: str
     lean_code: str
     is_novel: bool
+    novelty_tier: str
     novelty_reasoning: str
     attempts: List[ProofAttemptFeedback]
     source_id: str
@@ -363,6 +370,7 @@ async def submit_rigor_lean_theorem(self) -> Optional[RigorTheoremResult]:
             theorem_name=theorem_name,
             lean_code=lean_code,
             is_novel=is_novel,
+            novelty_tier=novelty_tier,
             novelty_reasoning=novelty_reasoning,
             attempts=attempts,
             source_id=self._compiler_source_id(),
@@ -593,7 +601,7 @@ async def _step_assess_novelty_and_store(
         self.task_sequence += 1
 
         try:
-            is_novel, novelty_reasoning = await assess_proof_novelty(
+            novelty_tier, novelty_reasoning = await assess_proof_novelty(
                 user_prompt=self.raw_user_prompt,
                 theorem_statement=theorem_statement,
                 lean_code=lean_code,
@@ -604,9 +612,10 @@ async def _step_assess_novelty_and_store(
                 task_id=task_id,
                 role_id="compiler_rigor_novelty",
             )
+            is_novel = novelty_tier != "not_novel"
         except Exception as exc:
             logger.warning("Novelty assessment failed (%s); defaulting to non-novel", exc)
-            is_novel, novelty_reasoning = False, f"Novelty assessment error: {exc}"
+            novelty_tier, novelty_reasoning, is_novel = "not_novel", f"Novelty assessment error: {exc}", False
 
         record = ProofRecord(
             proof_id="",  # proof_database assigns proof_XXX on add_proof
@@ -620,6 +629,7 @@ async def _step_assess_novelty_and_store(
             solver="Lean 4",
             lean_code=lean_code,
             novel=is_novel,
+            novelty_tier=novelty_tier,
             novelty_reasoning=novelty_reasoning,
             verification_notes="Produced by compiler rigor loop (HighParamSubmitter).",
             attempt_count=len(attempts),
diff --git a/backend/compiler/core/compiler_coordinator.py b/backend/compiler/core/compiler_coordinator.py
index 7225e9c..1dd5494 100644
--- a/backend/compiler/core/compiler_coordinator.py
+++ b/backend/compiler/core/compiler_coordinator.py
@@ -2184,6 +2184,7 @@ async def _place_or_appendix_fallback(self, lean_result) -> bool:
                     lean_code=lean_result.lean_code,
                     is_novel=lean_result.is_novel,
                     theorem_name=lean_result.theorem_name,
+                    novelty_tier=lean_result.novelty_tier,
                     placement_outcome="inline",
                 )
                 try:
@@ -2260,6 +2261,7 @@ async def _place_or_appendix_fallback(self, lean_result) -> bool:
             lean_code=lean_result.lean_code,
             is_novel=lean_result.is_novel,
             theorem_name=lean_result.theorem_name,
+            novelty_tier=lean_result.novelty_tier,
             placement_outcome="appendix_fallback",
         )
         appended = await paper_memory.append_to_theorems_appendix(appendix_entry)
diff --git a/backend/shared/models.py b/backend/shared/models.py
index 9401a38..2532b4e 100644
--- a/backend/shared/models.py
+++ b/backend/shared/models.py
@@ -574,6 +574,7 @@ class ProofRecord(BaseModel):
     solver: str = "Lean 4"
     lean_code: str
     novel: bool = False
+    novelty_tier: str = "not_novel"
     novelty_reasoning: str = ""
     verification_notes: str = ""
     attempt_count: int = 0
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index a61a21c..4368309 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -346,6 +346,7 @@ function App() {
 
   // Autonomous mode state
   const [autonomousRunning, setAutonomousRunning] = useState(false);
+  const [autonomousStopping, setAutonomousStopping] = useState(false);
   const [autonomousStatus, setAutonomousStatus] = useState(null);
   const [autonomousActivity, setAutonomousActivity] = useState([]);
   const [brainstorms, setBrainstorms] = useState([]);
@@ -1118,6 +1119,7 @@ function App() {
             theorem_statement: data.theorem_statement,
             source_type: data.source_type,
             source_id: data.source_id,
+            novelty_tier: data.novelty_tier || 'mathematical_discovery',
             timestamp: getTimestamp(data),
           }
         ];
@@ -1165,12 +1167,14 @@ function App() {
     unsubscribers.push(websocket.on('auto_research_started', () => {
       setAutonomousActivity([]);
       setAutonomousRunning(true);
+      setAutonomousStopping(false);
     }));
     
     unsubscribers.push(websocket.on('auto_research_resumed', (data) => {
       // Handle resume after crash/restart - sync running state
       console.log('Autonomous research resumed:', data);
       setAutonomousRunning(true);
+      setAutonomousStopping(false);
       if (data?.tier) {
         autonomousTierRef.current = data.tier;
       }
@@ -1188,6 +1192,8 @@ function App() {
     
     unsubscribers.push(websocket.on('auto_research_stopped', () => {
       setAutonomousRunning(false);
+      setAutonomousStopping(false);
+      setAnyWorkflowRunning(false);
       autonomousTierRef.current = null;
       setHungConnectionNotifications([]);
     }));
@@ -1726,6 +1732,7 @@ function App() {
         tier3_enabled: autonomousConfig.tier3_enabled ?? false
       });
       setAutonomousRunning(true);
+      setAutonomousStopping(false);
       setAutonomousActivity([]);
     } catch (error) {
       alert(`Failed to start autonomous research: ${error.details || error.message}`);
@@ -1733,11 +1740,21 @@ function App() {
   };
 
   const handleAutonomousStop = async () => {
+    if (autonomousStopping) {
+      return;
+    }
+    // Flag the in-flight stop so the UI can disable the button and ignore repeat clicks.
+    setAutonomousStopping(true);
     try {
       await autonomousAPI.stop();
       setAutonomousRunning(false);
+      setAnyWorkflowRunning(false);
+      // Status refresh is best-effort: its failure must not be reported as a failed stop.
+      await autonomousAPI.getStatus().then(setAutonomousStatus).catch((e) => console.warn('Status refresh after stop failed:', e));
     } catch (error) {
       alert(`Failed to stop autonomous research: ${error.message}`);
+    } finally {
+      setAutonomousStopping(false);
     }
   };
 
@@ -2287,6 +2304,7 @@ function App() {
           {activeTab === 'auto-interface' && (
             <AutonomousResearchInterface
               isRunning={autonomousRunning}
+              isStopping={autonomousStopping}
               anyWorkflowRunning={anyWorkflowRunning}
               status={autonomousStatus}
               activity={autonomousActivity}
diff --git a/frontend/src/components/PaperCritiqueModal.jsx b/frontend/src/components/PaperCritiqueModal.jsx
index fed01df..a0386f7 100644
--- a/frontend/src/components/PaperCritiqueModal.jsx
+++ b/frontend/src/components/PaperCritiqueModal.jsx
@@ -56,6 +56,59 @@ function getRatingBgColor(rating) {
   return 'critique-bg--red';
 }
 
+const AUTONOMOUS_SETTINGS_STORAGE_KEY = 'autonomous_research_settings';
+const COMPILER_SETTINGS_STORAGE_KEY = 'compiler_settings';
+
+// Build the validator config sent with a manual critique request from the
+// settings persisted in localStorage. Returns null when nothing usable is
+// stored or the stored JSON cannot be parsed.
+function readStoredValidatorConfig(paperType) {
+  const isCompilerPaper = paperType === 'compiler_paper';
+  // Only the actively maintained autonomous settings key is read. A legacy
+  // `autonomousConfig` blob can go stale and silently override the user's
+  // current validator choice during manual critique generation.
+  const storageKey = isCompilerPaper
+    ? COMPILER_SETTINGS_STORAGE_KEY
+    : AUTONOMOUS_SETTINGS_STORAGE_KEY;
+
+  try {
+    const raw = localStorage.getItem(storageKey);
+    if (!raw) {
+      return null;
+    }
+    const parsed = JSON.parse(raw);
+
+    if (isCompilerPaper) {
+      // compiler_settings uses camelCase keys written by CompilerSettings.jsx
+      if (!parsed?.validatorModel) {
+        return null;
+      }
+      return {
+        validator_model: parsed.validatorModel,
+        validator_context_window: parsed.validatorContextSize,
+        validator_max_tokens: parsed.validatorMaxOutput,
+        validator_provider: parsed.validatorProvider,
+        validator_openrouter_provider: parsed.validatorOpenrouterProvider,
+      };
+    }
+
+    const localConfig = parsed?.localConfig;
+    if (!localConfig?.validator_model) {
+      return null;
+    }
+    return {
+      validator_model: localConfig.validator_model,
+      validator_context_window: localConfig.validator_context_window,
+      validator_max_tokens: localConfig.validator_max_tokens,
+      validator_provider: localConfig.validator_provider,
+      validator_openrouter_provider: localConfig.validator_openrouter_provider,
+    };
+  } catch (error) {
+    console.warn('Could not read validator config from localStorage:', error);
+    return null;
+  }
+}
+
 /**
  * Modal for displaying paper critiques from the validator model.
  * 
@@ -123,27 +176,8 @@ export default function PaperCritiqueModal({
         ? 'compiler_critique_custom_prompt'
         : 'autonomous_critique_custom_prompt';
       const customPrompt = localStorage.getItem(storageKey);
-      
-      // Get validator config from localStorage (allows critiques without starting research)
-      let validatorConfig = null;
-      try {
-        const configKey = paperType === 'compiler_paper' ? 'compiler_settings' : 'autonomousConfig';
-        const configStr = localStorage.getItem(configKey);
-        if (configStr) {
-          const config = JSON.parse(configStr);
-          // Extract validator config fields
-          validatorConfig = {
-            validator_model: config.validator_model,
-            validator_context_window: config.validator_context_window,
-            validator_max_tokens: config.validator_max_tokens,
-            validator_provider: config.validator_provider,
-            validator_openrouter_provider: config.validator_openrouter_provider,
-          };
-        }
-      } catch (e) {
-        console.warn('Could not read validator config from localStorage:', e);
-      }
-      
+
+      const validatorConfig = readStoredValidatorConfig(paperType);
       const result = await onGenerateCritique(customPrompt, validatorConfig);
       
       // Reload critiques to get the updated list
diff --git a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
index 6f52ffd..69ae366 100644
--- a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
@@ -10,6 +10,7 @@ import TextFileUploader from '../TextFileUploader';
 
 const AutonomousResearchInterface = ({
   isRunning,
+  isStopping = false,
   anyWorkflowRunning,
   status,
   activity,
@@ -417,7 +418,7 @@ const AutonomousResearchInterface = ({
       <div className="autonomous-header">
         <h2>Autonomous Research</h2>
         <div className="autonomous-controls">
-          {!isRunning ? (
+          {!isRunning && !isStopping ? (
             <button 
               className="btn-start"
               onClick={handleStart}
@@ -434,20 +435,20 @@ const AutonomousResearchInterface = ({
                 className="runtime-indicator"
                 role="status"
                 aria-live="polite"
-                title="Autonomous research is currently running"
+                title={isStopping ? "Autonomous research is stopping" : "Autonomous research is currently running"}
               >
                 <span className="runtime-indicator-dot" aria-hidden="true"></span>
-                <span className="runtime-indicator-label">Running</span>
+                <span className="runtime-indicator-label">{isStopping ? 'Stopping' : 'Running'}</span>
               </span>
-              <button className="btn-stop" onClick={onStop}>
-                Stop Research
+              <button className="btn-stop" onClick={onStop} disabled={isStopping}>
+                {isStopping ? 'Stopping...' : 'Stop Research'}
               </button>
             </>
           )}
           <button 
             className={`btn-clear ${showClearConfirm ? 'btn-confirm' : ''}`}
             onClick={handleClear}
-            disabled={isRunning || isClearing}
+            disabled={isRunning || isStopping || isClearing}
           >
             {isClearing ? 'Clearing...' : (showClearConfirm ? 'Confirm Clear' : 'Clear All')}
           </button>
diff --git a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
index 1dcbb38..f75c92f 100644
--- a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
@@ -1299,19 +1299,17 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 <OsTag />
                 <div className="flex-row-center">
                   <div className="model-item-name">Kimi K2.6</div>
-                  <div className="ranking-badge ranking-badge--gold">👑 KING OF THE HILL</div>
-                  <div className="help-tooltip-anchor" style={{ zIndex: 100 }}>
-                    <button
-                      type="button"
-                      className="help-tooltip-btn"
-                      aria-label="Learn about the King of the Hill ranking"
-                      onMouseEnter={() => setShowKothTooltip(true)}
-                      onMouseLeave={() => setShowKothTooltip(false)}
-                      onFocus={() => setShowKothTooltip(true)}
-                      onBlur={() => setShowKothTooltip(false)}
-                    >
-                      ?
-                    </button>
+                  <div
+                    className="help-tooltip-anchor"
+                    style={{ zIndex: 100 }}
+                    aria-label="Learn about the King of the Hill ranking"
+                    onMouseEnter={() => setShowKothTooltip(true)}
+                    onMouseLeave={() => setShowKothTooltip(false)}
+                    onFocus={() => setShowKothTooltip(true)}
+                    onBlur={() => setShowKothTooltip(false)}
+                    tabIndex={0}
+                  >
+                    <div className="ranking-badge ranking-badge--gold">👑 KING OF THE HILL</div>
                     {showKothTooltip && (
                       <div
                         className="help-tooltip-popup"
diff --git a/frontend/src/components/autonomous/BrainstormList.jsx b/frontend/src/components/autonomous/BrainstormList.jsx
index 5c10613..6633a7c 100644
--- a/frontend/src/components/autonomous/BrainstormList.jsx
+++ b/frontend/src/components/autonomous/BrainstormList.jsx
@@ -58,18 +58,37 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
 
   // Subscribe to WebSocket events for immediate updates
   useEffect(() => {
+    const refreshExpandedBrainstorm = async () => {
+      try {
+        const refreshedData = await api.getBrainstorm(expandedId);
+        setFileContent(refreshedData.content || 'No content yet...');
+      } catch (error) {
+        console.error('Failed to refresh brainstorm content:', error);
+      }
+    };
+
     const handleSubmissionAccepted = async (data) => {
       if (expandedId && data.topic_id === expandedId) {
-        try {
-          const refreshedData = await api.getBrainstorm(expandedId);
-          setFileContent(refreshedData.content || 'No content yet...');
-        } catch (error) {
-          console.error('Failed to refresh submissions:', error);
-        }
+        await refreshExpandedBrainstorm();
       }
     };
 
-    unsubscribeRef.current = websocket.on('brainstorm_submission_accepted', handleSubmissionAccepted);
+    const handleNovelProofDiscovered = async (data) => {
+      if (
+        expandedId &&
+        data.source_type === 'brainstorm' &&
+        data.source_id === expandedId
+      ) {
+        await refreshExpandedBrainstorm();
+      }
+    };
+
+    const unsubscribeSubmission = websocket.on('brainstorm_submission_accepted', handleSubmissionAccepted);
+    const unsubscribeNovelProof = websocket.on('novel_proof_discovered', handleNovelProofDiscovered);
+    unsubscribeRef.current = () => {
+      unsubscribeSubmission();
+      unsubscribeNovelProof();
+    };
     return () => {
       if (unsubscribeRef.current) {
         unsubscribeRef.current();
diff --git a/frontend/src/components/autonomous/MathematicalProofs.css b/frontend/src/components/autonomous/MathematicalProofs.css
index f6ef116..12e8e01 100644
--- a/frontend/src/components/autonomous/MathematicalProofs.css
+++ b/frontend/src/components/autonomous/MathematicalProofs.css
@@ -173,6 +173,21 @@
   color: #86efac;
 }
 
+.math-proofs-filter--gold.active {
+  background: rgba(255, 214, 92, 0.14);
+  color: #ffd65c;
+}
+
+.math-proofs-filter--silver.active {
+  background: rgba(192, 192, 192, 0.14);
+  color: #d8d8d8;
+}
+
+.math-proofs-filter--bronze.active {
+  background: rgba(205, 127, 50, 0.14);
+  color: #e8a060;
+}
+
 .math-proofs-filter:disabled {
   cursor: not-allowed;
   opacity: 0.55;
@@ -214,6 +229,18 @@
   border-color: rgba(96, 165, 250, 0.28);
 }
 
+.math-proof-card.gold {
+  border-color: rgba(255, 214, 92, 0.45);
+}
+
+.math-proof-card.silver {
+  border-color: rgba(192, 192, 192, 0.45);
+}
+
+.math-proof-card.bronze {
+  border-color: rgba(205, 127, 50, 0.45);
+}
+
 .math-proof-card-header {
   display: flex;
   justify-content: space-between;
@@ -249,6 +276,24 @@
   border-color: rgba(96, 165, 250, 0.35);
 }
 
+.math-proof-badge.gold {
+  color: #ffd65c;
+  border-color: rgba(255, 214, 92, 0.5);
+  background: rgba(255, 214, 92, 0.08);
+}
+
+.math-proof-badge.silver {
+  color: #d8d8d8;
+  border-color: rgba(192, 192, 192, 0.45);
+  background: rgba(192, 192, 192, 0.08);
+}
+
+.math-proof-badge.bronze {
+  color: #e8a060;
+  border-color: rgba(205, 127, 50, 0.45);
+  background: rgba(205, 127, 50, 0.08);
+}
+
 .math-proof-source {
   color: var(--text-secondary, #9ca3af);
 }
diff --git a/frontend/src/components/autonomous/MathematicalProofs.jsx b/frontend/src/components/autonomous/MathematicalProofs.jsx
index 0b6fedc..cbf11ed 100644
--- a/frontend/src/components/autonomous/MathematicalProofs.jsx
+++ b/frontend/src/components/autonomous/MathematicalProofs.jsx
@@ -47,6 +47,23 @@ function createEmptyGraphState() {
   };
 }
 
+function getTierBadge(proof) {
+  const tier = proof.novelty_tier;
+  if (tier === 'mathematical_discovery') {
+    return { cardClass: 'gold', badgeClass: 'gold', label: 'Mathematical Discovery' };
+  }
+  if (tier === 'novel_variant') {
+    return { cardClass: 'silver', badgeClass: 'silver', label: 'Novel Reformulation' };
+  }
+  if (tier === 'novel_formulation') {
+    return { cardClass: 'bronze', badgeClass: 'bronze', label: 'Novel Formalization' };
+  }
+  if (proof.novel) {
+    return { cardClass: 'gold', badgeClass: 'gold', label: 'Novel Proof' };
+  }
+  return { cardClass: 'known', badgeClass: 'known', label: 'Known Proof' };
+}
+
 function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, latestDependencyEvent = null }) {
   const [proofs, setProofs] = useState([]);
   const [proofStatus, setProofStatus] = useState(null);
@@ -297,21 +314,35 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
   }, [availableSources, manualSourceId, manualSourceType]);
 
   const counts = useMemo(() => {
-    if (proofStatus?.proof_counts) {
-      return proofStatus.proof_counts;
-    }
     const novel = proofs.filter((proof) => proof.novel).length;
+    const discovery = proofs.filter((proof) => proof.novelty_tier === 'mathematical_discovery').length;
+    const variant = proofs.filter((proof) => proof.novelty_tier === 'novel_variant').length;
+    const formulation = proofs.filter((proof) => proof.novelty_tier === 'novel_formulation').length;
+    const legacyNovel = novel - discovery - variant - formulation;
     return {
       total: proofs.length,
       novel,
       known: proofs.length - novel,
+      discovery,
+      variant,
+      formulation,
+      legacyNovel,
     };
-  }, [proofStatus, proofs]);
+  }, [proofs]);
 
   const visibleProofs = useMemo(() => {
     if (filter === 'novel') {
       return proofs.filter((proof) => proof.novel);
     }
+    if (filter === 'mathematical_discovery') {
+      return proofs.filter((proof) => proof.novelty_tier === 'mathematical_discovery');
+    }
+    if (filter === 'novel_variant') {
+      return proofs.filter((proof) => proof.novelty_tier === 'novel_variant');
+    }
+    if (filter === 'novel_formulation') {
+      return proofs.filter((proof) => proof.novelty_tier === 'novel_formulation');
+    }
     return proofs;
   }, [proofs, filter]);
   const visibleProofIds = useMemo(
@@ -385,13 +416,31 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
               className={`math-proofs-filter ${filter === 'novel' ? 'active' : ''}`}
               onClick={() => setFilter('novel')}
             >
-              Novel Proofs
+              All Novel ({counts.novel || 0})
+            </button>
+            <button
+              className={`math-proofs-filter math-proofs-filter--gold ${filter === 'mathematical_discovery' ? 'active' : ''}`}
+              onClick={() => setFilter('mathematical_discovery')}
+            >
+              Discovery ({counts.discovery || 0})
+            </button>
+            <button
+              className={`math-proofs-filter math-proofs-filter--silver ${filter === 'novel_variant' ? 'active' : ''}`}
+              onClick={() => setFilter('novel_variant')}
+            >
+              Reformulation ({counts.variant || 0})
+            </button>
+            <button
+              className={`math-proofs-filter math-proofs-filter--bronze ${filter === 'novel_formulation' ? 'active' : ''}`}
+              onClick={() => setFilter('novel_formulation')}
+            >
+              Formalization ({counts.formulation || 0})
             </button>
             <button
               className={`math-proofs-filter ${filter === 'all' ? 'active' : ''}`}
               onClick={() => setFilter('all')}
             >
-              All Verified Proofs
+              All Verified ({counts.total || 0})
             </button>
           </div>
 
@@ -535,13 +584,13 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
             return (
               <article
                 key={proof.proof_id}
-                className={`math-proof-card ${proof.novel ? 'novel' : 'known'}`}
+                className={`math-proof-card ${getTierBadge(proof).cardClass}`}
               >
                 <div className="math-proof-card-header">
                   <div>
                     <div className="math-proof-card-topline">
-                      <span className={`math-proof-badge ${proof.novel ? 'novel' : 'known'}`}>
-                        {proof.novel ? 'Novel Proof' : 'Known Proof'}
+                      <span className={`math-proof-badge ${getTierBadge(proof).badgeClass}`}>
+                        {getTierBadge(proof).label}
                       </span>
                       <span className="math-proof-source">
                         {proof.source_type} {proof.source_id}
diff --git a/frontend/src/components/autonomous/PaperLibrary.jsx b/frontend/src/components/autonomous/PaperLibrary.jsx
index c030110..5ea4a56 100644
--- a/frontend/src/components/autonomous/PaperLibrary.jsx
+++ b/frontend/src/components/autonomous/PaperLibrary.jsx
@@ -1,7 +1,7 @@
 /**
  * PaperLibrary - Displays grid of completed papers.
  */
-import React, { useState } from 'react';
+import React, { useEffect, useState } from 'react';
 import './AutonomousResearch.css';
 import LatexRenderer from '../LatexRenderer';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
@@ -9,6 +9,7 @@ import PaperCritiqueModal from '../PaperCritiqueModal';
 import { autonomousAPI } from '../../services/api';
 import { useProofCheckRuntime } from '../../hooks/useProofCheckRuntime';
 import { getRuntimeDataPath } from '../../utils/runtimeConfig';
+import { websocket } from '../../services/websocket';
 
 const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
   const [expandedId, setExpandedId] = useState(null);
@@ -30,6 +31,31 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
     queueManualProofCheck,
   } = useProofCheckRuntime();
 
+  useEffect(() => {
+    const unsubscribeNovelProof = websocket.on('novel_proof_discovered', async (data) => {
+      if (
+        !expandedId ||
+        data.source_type !== 'paper' ||
+        data.source_id !== expandedId
+      ) {
+        return;
+      }
+
+      try {
+        const refreshed = await api.getAutonomousPaper(expandedId);
+        setExpandedContent({
+          content: refreshed.content,
+          outline: refreshed.outline,
+          title: refreshed.title,
+        });
+      } catch (error) {
+        console.error('Failed to refresh paper after proof append:', error);
+      }
+    });
+
+    return () => unsubscribeNovelProof();
+  }, [expandedId, api]);
+
   const handleCardClick = async (paperId) => {
     if (expandedId === paperId) {
       setExpandedId(null);
diff --git a/frontend/src/components/autonomous/ProofGraph.css b/frontend/src/components/autonomous/ProofGraph.css
index cad3c63..f370021 100644
--- a/frontend/src/components/autonomous/ProofGraph.css
+++ b/frontend/src/components/autonomous/ProofGraph.css
@@ -119,6 +119,18 @@
   stroke: rgba(96, 165, 250, 0.32);
 }
 
+.proof-graph-node-group.gold .proof-graph-node-frame {
+  stroke: rgba(255, 214, 92, 0.55);
+}
+
+.proof-graph-node-group.silver .proof-graph-node-frame {
+  stroke: rgba(192, 192, 192, 0.5);
+}
+
+.proof-graph-node-group.bronze .proof-graph-node-frame {
+  stroke: rgba(205, 127, 50, 0.5);
+}
+
 .proof-graph-node-group.selected .proof-graph-node-frame {
   stroke: rgba(250, 204, 21, 0.9);
 }
diff --git a/frontend/src/components/autonomous/ProofGraph.jsx b/frontend/src/components/autonomous/ProofGraph.jsx
index 8406d10..bb27fa9 100644
--- a/frontend/src/components/autonomous/ProofGraph.jsx
+++ b/frontend/src/components/autonomous/ProofGraph.jsx
@@ -1,6 +1,15 @@
 import React, { useMemo, useState } from 'react';
 import './ProofGraph.css';
 
+function getGraphNodeTierClass(node) {
+  const tier = node.novelty_tier;
+  if (tier === 'mathematical_discovery') return 'gold';
+  if (tier === 'novel_variant') return 'silver';
+  if (tier === 'novel_formulation') return 'bronze';
+  if (node.is_novel) return 'novel';
+  return 'known';
+}
+
 const NODE_WIDTH = 236;
 const NODE_HEIGHT = 110;
 const X_GAP = 72;
@@ -308,7 +317,7 @@ function ProofGraph({
             return (
               <g
                 key={node.proof_id}
-                className={`proof-graph-node-group ${node.is_novel ? 'novel' : 'known'} ${isSelected ? 'selected' : ''}`}
+                className={`proof-graph-node-group ${getGraphNodeTierClass(node)} ${isSelected ? 'selected' : ''}`}
                 transform={`translate(${position.x}, ${position.y})`}
                 onClick={handleActivate}
                 onKeyDown={handleKeyDown}
diff --git a/frontend/src/components/autonomous/ProofLibrary.css b/frontend/src/components/autonomous/ProofLibrary.css
index 7c9d881..affd3d4 100644
--- a/frontend/src/components/autonomous/ProofLibrary.css
+++ b/frontend/src/components/autonomous/ProofLibrary.css
@@ -4,17 +4,32 @@
   color: #1eff1c;
 }
 
+/* Legacy fallback — keeps old records styled correctly */
 .proof-card--novel {
-  border-left: 3px solid #1eff1c;
+  border-left: 3px solid #ffd65c;
 }
 
 .proof-card--known {
   border-left: 3px solid #666;
 }
 
+/* Tier-specific card accents */
+.proof-card--gold {
+  border-left: 3px solid #ffd65c;
+}
+
+.proof-card--silver {
+  border-left: 3px solid #c0c0c0;
+}
+
+.proof-card--bronze {
+  border-left: 3px solid #cd7f32;
+}
+
+/* Legacy fallback badge */
 .proof-badge--novel {
-  background: linear-gradient(135deg, #1eff1c 0%, #7dff6f 100%);
-  color: #000;
+  background: linear-gradient(135deg, #ffd65c 0%, #ffe99a 100%);
+  color: #1a1a00;
 }
 
 .proof-badge--known {
@@ -22,6 +37,22 @@
   color: #ccc;
 }
 
+/* Tier-specific badges */
+.proof-badge--gold {
+  background: linear-gradient(135deg, #ffd65c 0%, #ffe99a 100%);
+  color: #1a1a00;
+}
+
+.proof-badge--silver {
+  background: linear-gradient(135deg, #c0c0c0 0%, #e8e8e8 100%);
+  color: #1a1a1a;
+}
+
+.proof-badge--bronze {
+  background: linear-gradient(135deg, #cd7f32 0%, #e8a060 100%);
+  color: #1a0a00;
+}
+
 .proof-title {
   font-family: 'Courier New', monospace;
   letter-spacing: 0.02em;
diff --git a/frontend/src/components/autonomous/ProofLibrary.jsx b/frontend/src/components/autonomous/ProofLibrary.jsx
index 49ca273..324e161 100644
--- a/frontend/src/components/autonomous/ProofLibrary.jsx
+++ b/frontend/src/components/autonomous/ProofLibrary.jsx
@@ -19,6 +19,32 @@ function truncate(text, maxLength = 220) {
   return text.length > maxLength ? `${text.slice(0, maxLength)}...` : text;
 }
 
+function getTierBadge(proof) {
+  const tier = proof.novelty_tier;
+  if (tier === 'mathematical_discovery') {
+    return { cssClass: 'proof-badge--gold', label: 'Mathematical Discovery' };
+  }
+  if (tier === 'novel_variant') {
+    return { cssClass: 'proof-badge--silver', label: 'Novel Reformulation' };
+  }
+  if (tier === 'novel_formulation') {
+    return { cssClass: 'proof-badge--bronze', label: 'Novel Formalization' };
+  }
+  if (proof.novel) {
+    return { cssClass: 'proof-badge--gold', label: 'Novel' };
+  }
+  return { cssClass: 'proof-badge--known', label: 'Known' };
+}
+
+function getCardClass(proof) {
+  const tier = proof.novelty_tier;
+  if (tier === 'mathematical_discovery') return 'proof-card--gold';
+  if (tier === 'novel_variant') return 'proof-card--silver';
+  if (tier === 'novel_formulation') return 'proof-card--bronze';
+  if (proof.novel) return 'proof-card--novel';
+  return 'proof-card--known';
+}
+
 export default function ProofLibrary() {
   const [proofs, setProofs] = useState([]);
   const [sessionsResponse, setSessionsResponse] = useState(null);
@@ -252,9 +278,7 @@ export default function ProofLibrary() {
                       return (
                         <div
                           key={id}
-                          className={`answer-card proof-card ${isExpanded ? 'expanded' : ''} ${
-                            proof.novel ? 'proof-card--novel' : 'proof-card--known'
-                          }`}
+                          className={`answer-card proof-card ${isExpanded ? 'expanded' : ''} ${getCardClass(proof)}`}
                         >
                           <div
                             className="answer-header"
@@ -271,11 +295,9 @@ export default function ProofLibrary() {
 
                             <div className="answer-metadata">
                               <span
-                                className={`format-badge ${
-                                  proof.novel ? 'proof-badge--novel' : 'proof-badge--known'
-                                }`}
+                                className={`format-badge ${getTierBadge(proof).cssClass}`}
                               >
-                                {proof.novel ? 'Novel' : 'Known'}
+                                {getTierBadge(proof).label}
                               </span>
                               <span className="word-count">
                                 {proof.solver || 'Lean 4'}
diff --git a/frontend/src/components/autonomous/ProofNotificationStack.jsx b/frontend/src/components/autonomous/ProofNotificationStack.jsx
index 54db44c..6843f57 100644
--- a/frontend/src/components/autonomous/ProofNotificationStack.jsx
+++ b/frontend/src/components/autonomous/ProofNotificationStack.jsx
@@ -13,6 +13,40 @@ function truncate(text, maxLength = 120) {
   return text.length > maxLength ? `${text.slice(0, maxLength)}...` : text;
 }
 
+const TIER_STYLES = {
+  novel_formulation: {
+    borderColor: '#cd7f32',
+    glowColor: 'rgba(205, 127, 50, 0.35)',
+    glowInset: 'rgba(180, 100, 30, 0.25)',
+    labelColor: '#e8a060',
+    label: 'Novel Formalization Discovered',
+    subLabel:
+      'Your validator has determined this is the first-of-its-kind Lean 4 formalization for this historically known proof.',
+  },
+  novel_variant: {
+    borderColor: '#c0c0c0',
+    glowColor: 'rgba(192, 192, 192, 0.35)',
+    glowInset: 'rgba(160, 160, 160, 0.25)',
+    labelColor: '#d8d8d8',
+    label: 'Novel Reformulation Discovered',
+    subLabel:
+      'Your validator has determined this proof is a novel reformulation of a historically known proof.',
+  },
+  mathematical_discovery: {
+    borderColor: '#ffd65c',
+    glowColor: 'rgba(255, 214, 92, 0.35)',
+    glowInset: 'rgba(255, 194, 57, 0.25)',
+    labelColor: '#ffd65c',
+    label: 'Congratulations!\nMathematical Discovery Found!',
+    subLabel:
+      'Your validator has determined this proof is a mathematical discovery or a novel alternative proof that changes our understanding.',
+  },
+};
+
+function getTierStyle(tier) {
+  return TIER_STYLES[tier] || TIER_STYLES.mathematical_discovery;
+}
+
 export default function ProofNotificationStack({ notifications, onDismiss, onClickNotification }) {
   if (!notifications || notifications.length === 0) {
     return null;
@@ -31,98 +65,112 @@ export default function ProofNotificationStack({ notifications, onDismiss, onCli
         pointerEvents: 'none',
       }}
     >
-      {notifications.map((notification) => (
-        <div
-          key={notification.id}
-          onClick={() => onClickNotification(notification.proof_id)}
-          onKeyDown={(event) => {
-            if (event.key === 'Enter' || event.key === ' ') {
-              event.preventDefault();
-              onClickNotification(notification.proof_id);
-            }
-          }}
-          role="button"
-          tabIndex={0}
-          style={{
-            width: scalePx(320),
-            textAlign: 'left',
-            borderRadius: scalePx(14),
-            border: '1.5px solid #ffd65c',
-            background: 'linear-gradient(135deg, rgba(8, 35, 22, 0.96), rgba(15, 23, 42, 0.96))',
-            boxShadow:
-              '0 16px 36px rgba(0, 0, 0, 0.35), 0 0 12px rgba(255, 214, 92, 0.35), inset 0 0 0 1px rgba(255, 194, 57, 0.25)',
-            padding: `${scalePx(14)} ${scalePx(14)} ${scalePx(12)} ${scalePx(14)}`,
-            color: '#f8fafc',
-            cursor: 'pointer',
-            pointerEvents: 'auto',
-          }}
-        >
+      {notifications.map((notification) => {
+        const tier = getTierStyle(notification.novelty_tier);
+        return (
           <div
+            key={notification.id}
+            onClick={() => onClickNotification(notification.proof_id)}
+            onKeyDown={(event) => {
+              if (event.key === 'Enter' || event.key === ' ') {
+                event.preventDefault();
+                onClickNotification(notification.proof_id);
+              }
+            }}
+            role="button"
+            tabIndex={0}
             style={{
-              display: 'flex',
-              justifyContent: 'space-between',
-              gap: scalePx(12),
-              alignItems: 'flex-start',
+              width: scalePx(320),
+              textAlign: 'left',
+              borderRadius: scalePx(14),
+              border: `1.5px solid ${tier.borderColor}`,
+              background: 'linear-gradient(135deg, rgba(8, 35, 22, 0.96), rgba(15, 23, 42, 0.96))',
+              boxShadow: `0 16px 36px rgba(0, 0, 0, 0.35), 0 0 12px ${tier.glowColor}, inset 0 0 0 1px ${tier.glowInset}`,
+              padding: `${scalePx(14)} ${scalePx(14)} ${scalePx(12)} ${scalePx(14)}`,
+              color: '#f8fafc',
+              cursor: 'pointer',
+              pointerEvents: 'auto',
             }}
           >
-            <div>
-              <div
-                style={{
-                  fontSize: scalePx(10),
-                  letterSpacing: '0.08em',
-                  textTransform: 'uppercase',
-                  color: '#ffd65c',
-                  marginBottom: scalePx(6),
-                  fontWeight: 700,
-                }}
-              >
-                Congratulations! Novel Proof or Novel Formulation Discovered
+            <div
+              style={{
+                display: 'flex',
+                justifyContent: 'space-between',
+                gap: scalePx(12),
+                alignItems: 'flex-start',
+              }}
+            >
+              <div>
+                <div
+                  style={{
+                    fontSize: scalePx(10),
+                    letterSpacing: '0.08em',
+                    textTransform: 'uppercase',
+                    color: tier.labelColor,
+                    marginBottom: scalePx(4),
+                    fontWeight: 700,
+                    whiteSpace: 'pre-line',
+                  }}
+                >
+                  {tier.label}
+                </div>
+                <div
+                  style={{
+                    fontSize: scalePx(10),
+                    lineHeight: 1.4,
+                    color: '#94a3b8',
+                    marginBottom: scalePx(6),
+                    fontStyle: 'italic',
+                  }}
+                >
+                  {tier.subLabel}
+                </div>
+                <div
+                  style={{
+                    fontSize: scalePx(13),
+                    lineHeight: 1.45,
+                    color: '#e2e8f0',
+                    fontWeight: 500,
+                  }}
+                  title={notification.theorem_statement}
+                >
+                  {truncate(notification.theorem_statement)}
+                </div>
+                <div
+                  style={{
+                    marginTop: scalePx(8),
+                    fontSize: scalePx(11),
+                    lineHeight: 1.4,
+                    color: '#1eff1c',
+                    fontWeight: 600,
+                  }}
+                >
+                  Verified by Lean 4. Click to open Mathematical Proofs.
+                </div>
               </div>
-              <div
-                style={{
-                  fontSize: scalePx(13),
-                  lineHeight: 1.45,
-                  color: '#e2e8f0',
-                  fontWeight: 500,
+
+              <button
+                type="button"
+                onClick={(event) => {
+                  event.stopPropagation();
+                  onDismiss(notification.id);
                 }}
-                title={notification.theorem_statement}
-              >
-                {truncate(notification.theorem_statement)}
-              </div>
-              <div
                 style={{
-                  marginTop: scalePx(8),
-                  fontSize: scalePx(11),
-                  lineHeight: 1.4,
-                  color: '#1eff1c',
-                  fontWeight: 600,
+                  border: 'none',
+                  background: 'transparent',
+                  color: '#94a3b8',
+                  cursor: 'pointer',
+                  fontSize: scalePx(16),
+                  lineHeight: 1,
+                  padding: 0,
                 }}
               >
-                Verified by Lean 4. Click to open Mathematical Proofs.
-              </div>
+                x
+              </button>
             </div>
-
-            <button
-              type="button"
-              onClick={(event) => {
-                event.stopPropagation();
-                onDismiss(notification.id);
-              }}
-              style={{
-                border: 'none',
-                background: 'transparent',
-                color: '#94a3b8',
-                cursor: 'pointer',
-                fontSize: scalePx(16),
-                lineHeight: 1,
-                padding: 0,
-              }}
-            >
-              x
-            </button>
           </div>
-        </div>
-      ))}
+        );
+      })}
     </div>
   );
 }
diff --git a/frontend/src/components/autonomous/Stage2PaperHistory.jsx b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
index ab75a71..fd415f6 100644
--- a/frontend/src/components/autonomous/Stage2PaperHistory.jsx
+++ b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
@@ -5,6 +5,7 @@ import { autonomousAPI } from '../../services/api';
 import { downloadRawText, downloadPDFViaBackend, sanitizeFilename } from '../../utils/downloadHelpers';
 import { buildResearchRunGroups } from '../../utils/researchRunHistory';
 import { useProofCheckRuntime } from '../../hooks/useProofCheckRuntime';
+import { websocket } from '../../services/websocket';
 import './FinalAnswerLibrary.css';
 import './AutonomousResearch.css';
 import './Stage2PaperHistory.css';
@@ -54,6 +55,34 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
     loadPaperHistory();
   }, []);
 
+  useEffect(() => {
+    const unsubscribeNovelProof = websocket.on('novel_proof_discovered', async (data) => {
+      if (!expandedContent || data.source_type !== 'paper') {
+        return;
+      }
+
+      const matchesExpandedPaper = (
+        data.source_id === expandedId ||
+        data.source_id === expandedContent.paper_id
+      );
+      if (!matchesExpandedPaper) {
+        return;
+      }
+
+      try {
+        const refreshed = await autonomousAPI.getHistoryPaper(
+          expandedContent.session_id,
+          expandedContent.paper_id,
+        );
+        setExpandedContent(refreshed);
+      } catch (error) {
+        console.error('Failed to refresh history paper after proof append:', error);
+      }
+    });
+
+    return () => unsubscribeNovelProof();
+  }, [expandedId, expandedContent]);
+
   const loadPaperHistory = async () => {
     try {
       setLoading(true);
diff --git a/randomlog.txt b/randomlog.txt
index 7818869..e69de29 100644
--- a/randomlog.txt
+++ b/randomlog.txt
@@ -1,904 +0,0 @@
-2026-04-30 19:29:13.331 - backend.api.middleware - INFO - Using default CORS origins: ['http://localhost:5173', 'http://127.0.0.1:5173', 'http://localhost:8000', 'http://127.0.0.1:8000']
-2026-04-30 19:29:13.331 - backend.api.middleware - INFO - Middleware configured
-INFO:     Started server process [51848]
-INFO:     Waiting for application startup.
-2026-04-30 19:29:13.347 - backend.api.main - INFO - Starting ASI Aggregator System instance 'default' (data_dir=C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data, logs_dir=C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\logs)
-2026-04-30 19:29:13.347 - backend.api.main - INFO - Secret store active: namespaced_instance=False
-2026-04-30 19:29:13.760 - backend.shared.api_client_manager - INFO - OpenRouter client initialized
-2026-04-30 19:29:13.760 - backend.api.main - INFO - Restored OpenRouter API key from secure backend storage
-2026-04-30 19:29:14.126 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha client initialized
-2026-04-30 19:29:14.126 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha singleton client initialized
-2026-04-30 19:29:14.126 - backend.api.main - INFO - Restored Wolfram Alpha API key from secure backend storage
-2026-04-30 19:29:14.142 - backend.shared.lm_studio_client - INFO - Successfully connected to LM Studio. Found 36 models.
-2026-04-30 19:29:14.159 - backend.autonomous.memory.session_manager - INFO - Found paused session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34 (last updated: 2026-04-30T17:41:52.645719)
-2026-04-30 19:29:14.159 - backend.api.main - INFO - Found resumable session on startup: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:14.159 - backend.autonomous.memory.session_manager - INFO - Session resumed: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:14.159 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
-2026-04-30 19:29:14.159 - backend.autonomous.memory.paper_library - INFO - Paper library using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
-2026-04-30 19:29:14.159 - backend.autonomous.memory.research_metadata - INFO - Research metadata using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:14.159 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\final_answer
-2026-04-30 19:29:14.159 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\proofs
-2026-04-30 19:29:14.159 - backend.api.main - INFO - Session context restored - brainstorms and papers will load from session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:14.172 - backend.api.main - INFO - ASI Aggregator System ready
-2026-04-30 19:29:14.172 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\lean4_workspace
-INFO:     Application startup complete.
-INFO:     Uvicorn running on http://0.0.0.0:8000 (Press CTRL+C to quit)
-2026-04-30 19:29:26.185 - backend.autonomous.memory.research_metadata - INFO - Workflow state loaded: tier=tier2_paper_writing
-INFO:     127.0.0.1:52471 - "WebSocket /ws" [accepted]
-2026-04-30 19:29:26.465 - backend.api.routes.websocket - INFO - WebSocket connected. Total connections: 1
-INFO:     connection open
-2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 1 (Main Submitter): model=moonshotai/kimi-k2.6, context=262000, max_tokens=40000
-2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 2 : model=openai/gpt-oss-120b, context=131072, max_tokens=25000
-2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 3 : model=deepseek/deepseek-v4-pro, context=1048576, max_tokens=65500
-2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 4 : model=inception/mercury-2, context=128000, max_tokens=25000
-2026-04-30 19:29:33.283 - backend.api.routes.autonomous - INFO - Validator: model=x-ai/grok-4.1-fast, context=2000000, max_tokens=30000
-2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous coordinator initializing with 4 submitters
-2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 1 (Main Submitter): model=moonshotai/kimi-k2.6, context=262000
-2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 2 : model=openai/gpt-oss-120b, context=131072
-2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 3 : model=deepseek/deepseek-v4-pro, context=1048576
-2026-04-30 19:29:33.283 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 4 : model=inception/mercury-2, context=128000
-2026-04-30 19:29:33.301 - backend.autonomous.memory.session_manager - INFO - Found paused session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34 (last updated: 2026-04-30T17:41:52.645719)
-2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO - Found interrupted session: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   User prompt: Solve does P = NP or does P DNE NP, or something else. Find the solution of P and NP....
-2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Last updated: 2026-04-30T17:41:52.645719
-2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Tier: tier2_paper_writing
-2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Topic: topic_004
-2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO -   Acceptances: 20
-2026-04-30 19:29:33.301 - backend.autonomous.memory.session_manager - INFO - Session resumed: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:33.301 - backend.autonomous.core.autonomous_coordinator - INFO - Session resumed: solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:33.301 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
-2026-04-30 19:29:33.301 - backend.autonomous.memory.paper_library - INFO - Paper library using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
-2026-04-30 19:29:33.301 - backend.autonomous.memory.research_metadata - INFO - Research metadata using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34
-2026-04-30 19:29:33.301 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory using session path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\final_answer
-2026-04-30 19:29:33.301 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\proofs
-2026-04-30 19:29:33.301 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
-2026-04-30 19:29:33.301 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
-2026-04-30 19:29:33.316 - backend.autonomous.memory.research_metadata - INFO - Workflow state loaded: tier=tier2_paper_writing
-2026-04-30 19:29:33.317 - backend.autonomous.memory.research_metadata - INFO - Research metadata initialized
-2026-04-30 19:29:33.317 - backend.autonomous.memory.autonomous_rejection_logs - INFO - Autonomous rejection logs initialized
-2026-04-30 19:29:33.317 - backend.autonomous.core.autonomous_coordinator - INFO - Resetting RAG state for fresh autonomous research mode...
-2026-04-30 19:29:33.317 - backend.autonomous.core.autonomous_rag_manager - INFO - Resetting AutonomousRAGManager tracking state...
-2026-04-30 19:29:33.317 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager state reset
-2026-04-30 19:29:33.317 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-04-30 19:29:33.373 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-04-30 19:29:33.619 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-04-30 19:29:33.635 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-04-30 19:29:33.635 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-04-30 19:29:33.635 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-04-30 19:29:33.652 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-04-30 19:29:33.652 - backend.autonomous.core.autonomous_coordinator - INFO - RAG state reset and cleared for autonomous mode
-2026-04-30 19:29:33.652 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms
-2026-04-30 19:29:33.667 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers
-2026-04-30 19:29:33.667 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager initialized
-2026-04-30 19:29:33.668 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory initialized at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\final_answer
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_selector': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_completion_reviewer': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_reference_selector': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_title_selector': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_validator': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_redundancy_checker': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.668 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_framing_gate': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_paper': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_paper': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_paper': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_novelty': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_brainstorm': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_paper': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_paper': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_paper': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_certainty_assessor': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_format_selector': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_volume_organizer': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Configured Tier 3 Final Answer agents with api_client_manager
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Found interrupted workflow state: tier=tier2_paper_writing
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Workflow state restored: topic=topic_004, paper=None, phase=None, acceptances=20, reference_papers=0, tier3_active=False, tier3_phase=None, tier3_format=None
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator initialized
-2026-04-30 19:29:33.669 - backend.shared.api_client_manager - INFO - Autonomous API logger callback set
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous API logging enabled
-2026-04-30 19:29:33.669 - backend.shared.token_tracker - INFO - TokenTracker reset
-2026-04-30 19:29:33.669 - backend.shared.token_tracker - INFO - TokenTracker timer started
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator started
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Resuming from interrupted workflow: tier=tier2_paper_writing, topic=topic_004, paper=None
-2026-04-30 19:29:33.669 - backend.autonomous.core.autonomous_coordinator - INFO - Starting paper compilation for brainstorm topic_004
-2026-04-30 19:29:33.702 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Starting selection (limit=3, total_cap=3, 4 available, 0 already selected)
-2026-04-30 19:29:33.853 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector: Requesting expansion with model moonshotai/kimi-k2.6 (prompt=9729t, task_id=agg_sub1_000)
-2026-04-30 19:31:01.064 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Direct injection for 2 papers (27640 tokens <= 88800 budget)
-2026-04-30 19:31:01.066 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Making final selection with model moonshotai/kimi-k2.6 (prompt=35377t, max=3 papers, task_id=agg_sub1_001)
-2026-04-30 19:31:14.193 - backend.shared.lean4_client - WARNING - Lean 4 workspace update failed: Lean 4 process timed out after 120 seconds.
-2026-04-30 19:31:14.194 - backend.shared.lean4_client - WARNING - Lean 4 LSP warm start skipped because the workspace is not ready.
-2026-04-30 19:31:44.236 - backend.autonomous.agents.reference_selector - INFO - ReferenceSelector [additional]: Selected 2 reference papers
-2026-04-30 19:31:44.237 - backend.autonomous.core.autonomous_coordinator - INFO - Additional reference selection: 2 new + 0 existing = 2 total
-2026-04-30 19:31:44.249 - backend.aggregator.memory.shared_training - INFO - Brainstorm database file doesn't exist yet: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms\title_candidates_topic_004.txt
-2026-04-30 19:31:44.249 - backend.autonomous.core.autonomous_coordinator - INFO - Starting paper title exploration phase (target: 5 candidates, resumed: 0)
-2026-04-30 19:31:44.250 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
-2026-04-30 19:31:44.250 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 262000, Validator: 2000000
-2026-04-30 19:31:44.250 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 4 submitters with models ['moonshotai/kimi-k2.6', 'openai/gpt-oss-120b', 'deepseek/deepseek-v4-pro', 'inception/mercury-2'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
-2026-04-30 19:31:44.250 - backend.aggregator.core.coordinator - INFO - Boost mode ACTIVE: Will route selected tasks to openai/gpt-5.5-pro. This does NOT affect parallel execution mode.
-2026-04-30 19:31:44.689 - backend.aggregator.core.coordinator - INFO - Currently loaded models: []
-2026-04-30 19:31:44.689 - backend.aggregator.core.coordinator - INFO - Context window configuration:
-  - Submitter 1: 262000 tokens (model: moonshotai/kimi-k2.6)
-  - Submitter 2: 131072 tokens (model: openai/gpt-oss-120b)
-  - Submitter 3: 1048576 tokens (model: deepseek/deepseek-v4-pro)
-  - Submitter 4: 128000 tokens (model: inception/mercury-2)
-  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
-2026-04-30 19:31:44.691 - backend.aggregator.memory.shared_training - INFO - Created new shared training file
-2026-04-30 19:31:44.692 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
-2026-04-30 19:31:44.797 - backend.aggregator.memory.event_log - INFO - Loaded 11401 events from event log
-2026-04-30 19:31:44.812 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 1
-2026-04-30 19:31:44.812 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model moonshotai/kimi-k2.6
-2026-04-30 19:31:44.812 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:31:44.812 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=moonshotai/kimi-k2.6, provider=openrouter, context=262000
-2026-04-30 19:31:44.820 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 2
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model openai/gpt-oss-120b
-2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=openai/gpt-oss-120b via Groq
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=openai/gpt-oss-120b, provider=openrouter, context=131072
-2026-04-30 19:31:44.820 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 3
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model deepseek/deepseek-v4-pro
-2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=deepseek/deepseek-v4-pro
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=deepseek/deepseek-v4-pro, provider=openrouter, context=1048576
-2026-04-30 19:31:44.820 - backend.aggregator.memory.local_training - INFO - Loaded 5 rejections for submitter 4
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 4 initialized with model inception/mercury-2
-2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_4': provider=openrouter, model=inception/mercury-2
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Submitter 4: model=inception/mercury-2, provider=openrouter, context=128000
-2026-04-30 19:31:44.820 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
-2026-04-30 19:31:44.820 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 4 submitters
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 4 started
-2026-04-30 19:31:44.820 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
-2026-04-30 19:31:44.820 - backend.autonomous.core.autonomous_coordinator - INFO - Title exploration aggregator started with parallel submitters
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
-2026-04-30 19:31:44.820 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
-2026-04-30 19:31:44.837 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
-2026-04-30 19:31:44.837 - backend.aggregator.agents.submitter - INFO - Submitter 4 run loop started - will run continuously until stopped
-2026-04-30 19:31:44.851 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
-2026-04-30 19:31:45.967 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 90ff3b52-2cd0-4836-b84b-c9a8b6f09923 (iteration 1)
-2026-04-30 19:31:46.533 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission a13f37f2-dba1-4954-90e3-c51ed09299df (iteration 1)
-2026-04-30 19:31:46.869 - backend.aggregator.core.coordinator - INFO - Validator iteration 3 - batch validating 2 submissions: ['90ff3b52-2cd0-4836-b84b-c9a8b6f09923', 'a13f37f2-dba1-4954-90e3-c51ed09299df']
-2026-04-30 19:31:46.869 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 2 submissions
-2026-04-30 19:31:46.869 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 2 submissions
-2026-04-30 19:31:49.165 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 108946eb-bded-4310-82e4-6ada17054636 (iteration 2)
-2026-04-30 19:31:50.267 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 142a762f-32c5-4c54-a884-34f04586e893 (iteration 2)
-2026-04-30 19:31:52.092 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 12d94cc1-78a2-44ea-b05f-1046e5f56ef7 (iteration 3)
-2026-04-30 19:31:54.326 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission cee583c3-8a97-4c8c-b922-0fd8bb290de3 (iteration 3)
-2026-04-30 19:31:54.984 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 988c5fc6-6301-466d-8b78-eb991f517bf3 (iteration 4)
-2026-04-30 19:31:57.565 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 9ac811a6-d27f-4fb2-bdf3-8ce6c98ec4f4 (iteration 4)
-2026-04-30 19:31:58.096 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 3a3d3d0e-a5ae-497e-b0bc-3348c65ee135 (iteration 5)
-2026-04-30 19:32:00.958 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 6d18dff1-623f-479e-b972-e109f555d9d9 (iteration 5)
-2026-04-30 19:32:01.082 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 00db103c-1bd8-4282-973c-f77c2f9ec7dc (iteration 6)
-2026-04-30 19:32:04.022 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission c52670ac-49d7-477a-b64c-e581d1130917 (iteration 6)
-2026-04-30 19:32:14.911 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/2 accepted
-2026-04-30 19:32:14.915 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
-2026-04-30 19:32:14.915 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-04-30 19:32:14.915 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission accepted (total: 1)
-2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 4 (total: 1)
-2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-04-30 19:32:14.916 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-04-30 19:32:14.917 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 1 total chunks
-2026-04-30 19:32:14.917 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 1)
-2026-04-30 19:32:14.917 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 1)
-2026-04-30 19:32:14.927 - backend.aggregator.core.coordinator - INFO - Queue size (10) >= threshold (10). Pausing submitters.
-2026-04-30 19:32:14.927 - backend.aggregator.core.coordinator - INFO - Validator iteration 4 - batch validating 3 submissions: ['108946eb-bded-4310-82e4-6ada17054636', '142a762f-32c5-4c54-a884-34f04586e893', '12d94cc1-78a2-44ea-b05f-1046e5f56ef7']
-2026-04-30 19:32:14.927 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-04-30 19:32:14.927 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-04-30 19:32:14.994 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 1/5 candidates accepted
-2026-04-30 19:32:16.139 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-04-30 19:32:16.139 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
-2026-04-30 19:32:40.316 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
-2026-04-30 19:32:40.318 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 1)
-2026-04-30 19:32:40.318 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 2)
-2026-04-30 19:32:40.321 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 2)
-2026-04-30 19:32:40.321 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 3)
-2026-04-30 19:32:40.324 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
-2026-04-30 19:32:40.325 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-04-30 19:32:40.325 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission accepted (total: 2)
-2026-04-30 19:32:40.325 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 4 (total: 2)
-2026-04-30 19:32:40.325 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-04-30 19:32:40.326 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-04-30 19:32:40.326 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-04-30 19:32:40.326 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 1 total chunks
-2026-04-30 19:32:40.330 - backend.aggregator.core.coordinator - INFO - Queue size (7) < threshold (10). Resuming submitters.
-2026-04-30 19:32:40.331 - backend.aggregator.core.coordinator - INFO - Validator iteration 5 - batch validating 3 submissions: ['cee583c3-8a97-4c8c-b922-0fd8bb290de3', '988c5fc6-6301-466d-8b78-eb991f517bf3', '9ac811a6-d27f-4fb2-bdf3-8ce6c98ec4f4']
-2026-04-30 19:32:40.331 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-04-30 19:32:40.331 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-04-30 19:32:40.364 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-04-30 19:32:40.364 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-04-30 19:32:40.523 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 44116b14-83a3-4e5c-9892-b768941b848c (iteration 1)
-2026-04-30 19:32:41.086 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 2/5 candidates accepted
-2026-04-30 19:32:42.437 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission acbc42c6-e70c-4e5f-a141-4f6b6165214f (iteration 7)
-2026-04-30 19:32:44.108 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission cf198397-5da9-44b7-896b-40905acbd42d (iteration 7)
-2026-04-30 19:32:45.695 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission ffb22bc0-8c59-454b-bb1b-561b7ebecf3e (iteration 8)
-2026-04-30 19:32:47.524 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 2d78831a-7c3e-4354-8d3c-81758b2627d9 (iteration 8)
-2026-04-30 19:32:49.018 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 50605199-ecaa-4ab1-8829-3468e76092f1 (iteration 9)
-2026-04-30 19:32:51.107 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission cd68c0a9-f4c2-4f11-afd6-333af4025879 (iteration 9)
-2026-04-30 19:32:55.641 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
-2026-04-30 19:32:55.644 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
-2026-04-30 19:32:55.644 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-04-30 19:32:55.645 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 1)
-2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 3)
-2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-04-30 19:32:55.645 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-04-30 19:32:55.645 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 2 total chunks
-2026-04-30 19:32:55.652 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 1)
-2026-04-30 19:32:55.652 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 4)
-2026-04-30 19:32:55.656 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 1)
-2026-04-30 19:32:55.656 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 5)
-2026-04-30 19:32:55.658 - backend.aggregator.core.coordinator - INFO - Queue size (11) >= threshold (10). Pausing submitters.
-2026-04-30 19:32:55.658 - backend.aggregator.core.coordinator - INFO - Validator iteration 6 - batch validating 3 submissions: ['3a3d3d0e-a5ae-497e-b0bc-3348c65ee135', '6d18dff1-623f-479e-b972-e109f555d9d9', '00db103c-1bd8-4282-973c-f77c2f9ec7dc']
-2026-04-30 19:32:55.659 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-04-30 19:32:55.659 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-04-30 19:32:55.704 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-04-30 19:32:55.704 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
-2026-04-30 19:32:57.100 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 3/5 candidates accepted
-2026-04-30 19:33:31.671 - backend.aggregator.agents.validator - INFO - Batch validation complete: 0/3 accepted
-2026-04-30 19:33:31.671 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 2)
-2026-04-30 19:33:31.671 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 6)
-2026-04-30 19:33:31.687 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 2)
-2026-04-30 19:33:31.687 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 7)
-2026-04-30 19:33:31.687 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 3)
-2026-04-30 19:33:31.687 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 8)
-2026-04-30 19:33:31.703 - backend.aggregator.core.coordinator - INFO - Queue size (8) < threshold (10). Resuming submitters.
-2026-04-30 19:33:31.703 - backend.aggregator.core.coordinator - INFO - Validator iteration 7 - batch validating 3 submissions: ['c52670ac-49d7-477a-b64c-e581d1130917', '44116b14-83a3-4e5c-9892-b768941b848c', 'acbc42c6-e70c-4e5f-a141-4f6b6165214f']
-2026-04-30 19:33:31.703 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-04-30 19:33:31.703 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-04-30 19:33:32.226 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission f4e42d31-3e25-4cf7-8cf9-855d0fe72d09 (iteration 1)
-2026-04-30 19:33:34.146 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission d749aa5b-7242-4ed0-8f60-be13c42385b0 (iteration 10)
-2026-04-30 19:33:35.328 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 46c7a011-7b74-4d48-92ff-d990536817c5 (iteration 10)
-2026-04-30 19:33:37.594 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 338945b2-b322-4e41-9c2f-dabe2356ed7a (iteration 11)
-2026-04-30 19:33:38.927 - backend.aggregator.agents.submitter - INFO - Submitter 2 generated submission 2314ec88-7a07-4349-9567-048d64f5df76 (iteration 11)
-2026-04-30 19:33:40.486 - backend.aggregator.agents.submitter - INFO - Submitter 4 generated submission 489c5d4c-89a1-4635-a8ac-1b66bfaf4905 (iteration 12)
-2026-04-30 19:33:47.193 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
-2026-04-30 19:33:47.193 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 3)
-2026-04-30 19:33:47.193 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 9)
-2026-04-30 19:33:47.210 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
-2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-04-30 19:33:47.210 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
-2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 4)
-2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-04-30 19:33:47.210 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 2 total chunks
-2026-04-30 19:33:47.210 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 4)
-2026-04-30 19:33:47.210 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 10)
-2026-04-30 19:33:47.221 - backend.aggregator.core.coordinator - INFO - Queue size (11) >= threshold (10). Pausing submitters.
-2026-04-30 19:33:47.223 - backend.aggregator.core.coordinator - INFO - Validator iteration 8 - batch validating 3 submissions: ['cf198397-5da9-44b7-896b-40905acbd42d', 'ffb22bc0-8c59-454b-bb1b-561b7ebecf3e', '2d78831a-7c3e-4354-8d3c-81758b2627d9']
-2026-04-30 19:33:47.223 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-04-30 19:33:47.223 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-04-30 19:33:47.266 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-04-30 19:33:47.266 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-04-30 19:33:49.233 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 4/5 candidates accepted
-2026-04-30 19:34:14.439 - backend.aggregator.agents.validator - INFO - Batch validation complete: 1/3 accepted
-2026-04-30 19:34:14.455 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-04-30 19:34:14.455 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission accepted (total: 2)
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 2 (total: 5)
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-04-30 19:34:14.455 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 1 total chunks
-2026-04-30 19:34:14.455 - backend.aggregator.agents.submitter - INFO - Submitter 4: Submission rejected (consecutive: 5)
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 4 (total: 11)
-2026-04-30 19:34:14.455 - backend.aggregator.agents.submitter - INFO - Submitter 2: Submission rejected (consecutive: 1)
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 2 (total: 12)
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Queue size (8) < threshold (10). Resuming submitters.
-2026-04-30 19:34:14.455 - backend.aggregator.core.coordinator - INFO - Validator iteration 9 - batch validating 3 submissions: ['50605199-ecaa-4ab1-8829-3468e76092f1', 'cd68c0a9-f4c2-4f11-afd6-333af4025879', 'f4e42d31-3e25-4cf7-8cf9-855d0fe72d09']
-2026-04-30 19:34:14.455 - backend.aggregator.agents.validator - INFO - Batch validation: Processing 3 submissions
-2026-04-30 19:34:14.455 - backend.aggregator.agents.validator - INFO - Batch quality assessment: 3 submissions
-2026-04-30 19:34:14.486 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-04-30 19:34:14.486 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
-2026-04-30 19:34:14.728 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission a0422046-e395-42b4-8f4e-39333726c738 (iteration 2)
-2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: 5/5 candidates accepted
-2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: Target of 5 candidates reached
-2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
-2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
-2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
-2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
-2026-04-30 19:34:15.263 - backend.aggregator.agents.submitter - INFO - Submitter 4 stopped
-2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 9
-2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 9 iterations - is_running=False
-2026-04-30 19:34:15.263 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
-2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - Paper title exploration complete: 5 candidates accepted
-2026-04-30 19:34:15.263 - backend.autonomous.core.autonomous_coordinator - INFO - TitleExploration: Restored shared_training_memory state
-2026-04-30 19:34:15.263 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Attempt 1
-2026-04-30 19:34:15.279 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Generating title with model moonshotai/kimi-k2.6 (task_id=agg_sub1_000)
-2026-04-30 19:35:52.374 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Validating with model x-ai/grok-4.1-fast (task_id=agg_sub1_001)
-2026-04-30 19:37:06.565 - backend.autonomous.agents.paper_title_selector - INFO - PaperTitleSelector: Title accepted: 'Verified Proof Complexity in Lean 4: From Polynomial Verifiers to Exponential Lower Bounds'
-2026-04-30 19:37:06.565 - backend.autonomous.core.autonomous_coordinator - INFO - Compiling paper: Verified Proof Complexity in Lean 4: From Polynomial Verifiers to Exponential Lower Bounds
-2026-04-30 19:37:06.565 - backend.autonomous.core.autonomous_coordinator - INFO - Clearing RAG for autonomous paper compilation...
-2026-04-30 19:37:06.565 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-04-30 19:37:06.580 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-04-30 19:37:06.580 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-04-30 19:37:06.596 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-04-30 19:37:06.596 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-04-30 19:37:06.611 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-04-30 19:37:06.611 - backend.autonomous.core.autonomous_coordinator - INFO - RAG cleared successfully
-2026-04-30 19:37:06.611 - backend.compiler.core.compiler_coordinator - INFO - Initializing compiler coordinator...
-2026-04-30 19:37:06.611 - backend.compiler.memory.outline_memory - INFO - Outline memory initialized
-2026-04-30 19:37:06.627 - backend.compiler.memory.paper_memory - INFO - Paper memory initialized
-2026-04-30 19:37:06.627 - backend.compiler.memory.compiler_rejection_log - INFO - Compiler rejection/acceptance logs initialized
-2026-04-30 19:37:07.008 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha client initialized
-2026-04-30 19:37:07.015 - backend.shared.wolfram_alpha_client - INFO - Wolfram Alpha singleton client initialized
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Wolfram Alpha client initialized (available as a construction-mode tool)
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Resetting compiler RAG manager state...
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager state reset
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Initializing compiler RAG manager...
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Updating compiler context window from 131072 to 2000000
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Compiler RAG manager initialized
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Skipping Part 1 aggregator database load (autonomous mode)
-2026-04-30 19:37:07.015 - backend.compiler.agents.high_context_submitter - INFO - High-context submitter initialized with model: moonshotai/kimi-k2.6
-2026-04-30 19:37:07.015 - backend.compiler.agents.high_context_submitter - INFO - Context budget: 221500 tokens (window: 262000)
-2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_context': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-04-30 19:37:07.015 - backend.compiler.agents.high_param_submitter - INFO - High-param submitter initialized with model: openai/gpt-5.5
-2026-04-30 19:37:07.015 - backend.compiler.agents.high_param_submitter - INFO - Context budget: 921500 tokens (window: 1050000)
-2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Configured role 'compiler_high_param': provider=openrouter, model=openai/gpt-5.5
-2026-04-30 19:37:07.015 - backend.compiler.validation.compiler_validator - INFO - Compiler validator initialized with model: x-ai/grok-4.1-fast
-2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Configured role 'compiler_validator': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-04-30 19:37:07.015 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Per-paper model tracking enabled for manual compiler mode
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Compiler coordinator initialized successfully
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Autonomous mode enabled - section order: Body → Conclusion → Intro → Abstract
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Clearing paper and outline...
-2026-04-30 19:37:07.015 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 1, 0 words)
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Paper is empty, skipping re-chunking
-2026-04-30 19:37:07.015 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 1)
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_rag_manager - INFO - Outline is empty, skipping re-chunking
-2026-04-30 19:37:07.015 - backend.compiler.memory.critique_memory - ERROR - Critique memory not initialized - call initialize() first
-2026-04-30 19:37:07.015 - backend.compiler.core.compiler_coordinator - INFO - Cleared critique memory
-2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Cleared rejection/acceptance logs
-2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Reset per-paper model tracker
-2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Reset autonomous section phase to body
-2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Reset critique phase state
-2026-04-30 19:37:07.024 - backend.compiler.core.compiler_coordinator - INFO - Paper and outline cleared - system reset to fresh start
-2026-04-30 19:37:07.024 - backend.autonomous.core.autonomous_coordinator - INFO - Cleared previous paper/outline for fresh paper paper_007
-2026-04-30 19:37:07.024 - backend.autonomous.core.autonomous_coordinator - INFO - Loading brainstorm database into compiler RAG: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms\brainstorm_topic_004.txt
-2026-04-30 19:37:07.040 - backend.aggregator.ingestion.pipeline - INFO - Ingested brainstorm_topic_004.txt: 556 total chunks
-2026-04-30 19:37:12.336 - backend.aggregator.core.rag_manager - INFO - Added document: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\brainstorms\brainstorm_topic_004.txt
-2026-04-30 19:37:12.336 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm database loaded into compiler RAG
-2026-04-30 19:37:12.336 - backend.autonomous.core.autonomous_coordinator - INFO - Loading 2 reference papers into compiler RAG
-2026-04-30 19:37:12.336 - backend.aggregator.ingestion.pipeline - INFO - Ingested paper_paper_006.txt: 234 total chunks
-2026-04-30 19:37:14.214 - backend.aggregator.core.rag_manager - INFO - Added document: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers\paper_paper_006.txt
-2026-04-30 19:37:14.214 - backend.autonomous.core.autonomous_coordinator - INFO - Reference paper loaded: paper_006
-2026-04-30 19:37:14.216 - backend.aggregator.ingestion.pipeline - INFO - Ingested paper_paper_003.txt: 87 total chunks
-2026-04-30 19:37:14.930 - backend.aggregator.core.rag_manager - INFO - Added document: C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\auto_sessions\solve_does_p_np_or_does_p_dne_np_or_something_e_2026-04-27_15-34\papers\paper_paper_003.txt
-2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - Reference paper loaded: paper_003
-2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - All reference papers loaded into compiler RAG
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Starting compiler...
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Compiler started successfully
-2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - Compiler started for paper paper_007
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Compiler workflow started
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Aggregator monitoring started - will check for new acceptances every 30 seconds
-2026-04-30 19:37:14.930 - backend.autonomous.core.autonomous_coordinator - INFO - Phase updated: None → body
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - Starting fresh - no existing paper or outline found
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - PHASE 1: ITERATIVE OUTLINE CREATION
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_coordinator - INFO -
---- Outline Creation Iteration 1/15 ---
-2026-04-30 19:37:14.930 - backend.compiler.agents.high_context_submitter - INFO - Starting outline creation submission generation...
-2026-04-30 19:37:14.930 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 19:37:14.930 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_create, query_length=14810
-2026-04-30 19:37:40.825 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_create in 25.90s (coverage=0.50, tokens=10764)
-2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 68648 chars retrieved
-2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - Building outline creation prompt...
-2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 102033 chars
-2026-04-30 19:37:40.825 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_000)...
-2026-04-30 19:40:28.113 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 3617 chars
-2026-04-30 19:40:28.113 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 19:40:28.113 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 19:40:28.116 - backend.compiler.agents.high_context_submitter - INFO - Outline creation submission generated: 126dcdd9-cf47-44f1-b018-a16e8155c8e8, outline_complete=True
-2026-04-30 19:40:28.116 - backend.compiler.validation.compiler_validator - INFO - Validating outline_create submission: 126dcdd9-cf47-44f1-b018-a16e8155c8e8
-2026-04-30 19:40:28.116 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=outline_create, operation=full_content
-2026-04-30 19:40:28.116 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_000)...
-2026-04-30 19:40:37.782 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-04-30 19:40:37.798 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: outline_create)
-2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - ✓ Iteration 1: Outline ACCEPTED
-2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO -   Validator feedback: The submitted outline fully meets all validation criteria. It includes the optional Abstract, required Introduction ('I. Introduction'), multiple body sections (II through VIII), and Conclusion ('IX. ...
-2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - OUTLINE MARKED COMPLETE BY SUBMITTER - LOCKING
-2026-04-30 19:40:37.801 - backend.compiler.core.compiler_coordinator - INFO - ============================================================
-2026-04-30 19:40:37.803 - backend.compiler.memory.outline_memory - INFO - Outline updated (version 2)
-2026-04-30 19:40:37.814 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_outline.txt
-2026-04-30 19:40:37.814 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_outline.txt: 7 total chunks
-2026-04-30 19:40:37.935 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_outline.txt
-2026-04-30 19:40:37.937 - backend.compiler.core.compiler_rag_manager - INFO - Outline re-chunked successfully
-2026-04-30 19:40:37.937 - backend.compiler.memory.outline_memory - INFO - Outline creation feedback cleared
-2026-04-30 19:40:37.937 - backend.compiler.core.compiler_coordinator - INFO - Outline locked after 1 iterations
-2026-04-30 19:40:37.937 - backend.compiler.core.compiler_coordinator - INFO - Starting initial paper loop...
-2026-04-30 19:40:37.939 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=True, phase=body)
-2026-04-30 19:40:37.939 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 19:40:37.941 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=0 chars
-2026-04-30 19:40:37.941 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 0 chars → 0 chars (markers preserved)
-2026-04-30 19:40:37.973 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=0, brainstorm=74310, overhead=5000, rag_budget=141636
-2026-04-30 19:40:37.973 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 19:40:37.973 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=14810
-2026-04-30 19:40:37.973 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 19:41:11.848 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 19:41:11.848 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 54 chunks from excluded sources (already direct-injected)
-2026-04-30 19:41:11.848 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 33.88s (coverage=0.32, tokens=1810)
-2026-04-30 19:41:11.848 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 14156 chars retrieved
-2026-04-30 19:41:11.848 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 19:41:11.848 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 307904 chars
-2026-04-30 19:41:11.880 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_001)...
-2026-04-30 19:45:54.178 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 9286 chars (0 Wolfram tool call(s))
-2026-04-30 19:45:54.187 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 19:45:54.187 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 19:45:54.187 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: eee4f7ad-46d6-46e7-b078-34784dc32a1d (section_complete=False)
-2026-04-30 19:45:54.187 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: eee4f7ad-46d6-46e7-b078-34784dc32a1d
-2026-04-30 19:45:54.187 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=full_content
-2026-04-30 19:45:54.187 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_001)...
-2026-04-30 19:46:08.525 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-04-30 19:46:08.540 - backend.compiler.memory.paper_memory - INFO - Paper initialized with placeholders (version 2)
-2026-04-30 19:46:08.540 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-04-30 19:46:08.540 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 26 total chunks
-2026-04-30 19:46:08.794 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-04-30 19:46:08.794 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-04-30 19:46:08.794 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-04-30 19:46:08.794 - backend.compiler.core.compiler_coordinator - INFO - Initial paper portion accepted with placeholders! (1131 words)
-2026-04-30 19:46:08.794 - backend.compiler.core.compiler_coordinator - INFO - Initial paper loop complete
-2026-04-30 19:46:08.794 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-04-30 19:46:08.811 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
-2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=8754 chars
-2026-04-30 19:46:08.811 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 8754 chars → 8754 chars (markers preserved)
-2026-04-30 19:46:08.825 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=2583, brainstorm=74310, overhead=5000, rag_budget=139053
-2026-04-30 19:46:08.825 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 19:46:08.825 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
-2026-04-30 19:46:08.825 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 19:46:34.389 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 19:46:34.389 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
-2026-04-30 19:46:34.389 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.56s (coverage=0.30, tokens=1739)
-2026-04-30 19:46:34.389 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
-2026-04-30 19:46:34.389 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 19:46:34.389 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 316065 chars
-2026-04-30 19:46:34.420 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_002)...
-2026-04-30 19:52:38.036 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 14015 chars (0 Wolfram tool call(s))
-2026-04-30 19:52:38.036 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 19:52:38.036 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 19:52:38.052 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: f58caf39-ee36-400e-af84-0366b9400553 (section_complete=False)
-2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: f58caf39-ee36-400e-af84-0366b9400553
-2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 11972 -> 11868 chars, new_string: 11972 -> 11868 chars)
-2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and'...
-2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 7951
-2026-04-30 19:52:38.052 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_002)...
-2026-04-30 19:53:11.368 - backend.compiler.validation.compiler_validator - INFO - Validation result: reject (coherence=False, rigor=False, placement=False)
-2026-04-30 19:53:11.368 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: construction)
-2026-04-30 19:53:11.368 - backend.compiler.core.compiler_coordinator - INFO - Construction rejected
-2026-04-30 19:53:11.368 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
-2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body, retry with feedback)
-2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=8754 chars
-2026-04-30 19:53:11.368 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 8754 chars → 8754 chars (markers preserved)
-2026-04-30 19:53:11.398 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=2583, brainstorm=74310, overhead=5000, rag_budget=139053
-2026-04-30 19:53:11.398 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 19:53:11.398 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
-2026-04-30 19:53:11.398 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 19:53:37.017 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 19:53:37.019 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
-2026-04-30 19:53:37.019 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.62s (coverage=0.30, tokens=1739)
-2026-04-30 19:53:37.019 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
-2026-04-30 19:53:37.019 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 19:53:37.019 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 321059 chars
-2026-04-30 19:53:37.047 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_003)...
-2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 11972 chars (0 Wolfram tool call(s))
-2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 20:04:01.711 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 30d56c2e-c869-4b79-b1db-090cd0194d17 (section_complete=False)
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 30d56c2e-c869-4b79-b1db-090cd0194d17
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 10228 -> 10226 chars, new_string: 10228 -> 10226 chars)
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial'...
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=570 | double_spaces=1 | first20='Since polynomial bou' | last20='orems in Section~IV.'
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=8754 | double_spaces=21 | first20='[HARD CODED PLACEHOL' | last20=' BE ABOVE THIS LINE]'
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Needle FULL:
-Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\pi_{C}|+|\varphi|$ (\texttt{polynomial\_simulation\_transitive}, Proof~7).
-
-This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and Extended Frege.  In particular, once a simulation edge $S \psimulates T$ has been verified, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars repr): 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\\pi_{C}|+|\\varphi|$ (\\texttt{polynomial\\_simulation\\_transitive}, Proof~7).\n\nThis preorder str'
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars repr): 'fied, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.'
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): '[HARD CODED PLACEHOLDER FOR THE ABSTRACT SECTION - TO BE WRITTEN AFTER THE INTRODUCTION IS COMPLETE]\n\n[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION - TO BE WRITTEN AFTER THE CONCLUSION SECTION IS C'
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'eorems not placed inline will appear here]\n[HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]\n\n[HARD CODED END-OF-PAPER MARK -- ALL CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    PARTIAL_MATCH: First 50 chars of needle found at haystack pos 7756
-2026-04-30 20:04:01.711 - backend.compiler.validation.compiler_validator - WARNING -    Haystack context at partial match: 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial'
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - EXACT_MATCH_FAILED - Starting diagnostics...
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    NEEDLE: length=570 | double_spaces=1 | first20='Since polynomial bou' | last20='orems in Section~IV.'
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    HAYSTACK: length=2504 | double_spaces=36 | first20='Abstract\n\nI. Introdu' | last20=' BE ABOVE THIS LINE]'
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - MATCH_FAILED_COMPLETELY - Deep diagnostic analysis:
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Needle FULL:
-Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\pi_{C}|+|\varphi|$ (\texttt{polynomial\_simulation\_transitive}, Proof~7).
-
-This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and Extended Frege.  In particular, once a simulation edge $S \psimulates T$ has been verified, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Needle (first 200 chars repr): 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\\pi_{C}|+|\\varphi|$ (\\texttt{polynomial\\_simulation\\_transitive}, Proof~7).\n\nThis preorder str'
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Needle (last 200 chars repr): 'fied, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.'
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (first 200 chars): 'Abstract\n\nI. Introduction\n   A. The Cook-Reckhow program and NP versus coNP\n   B. Verified proof complexity and the role of Lean 4\n   C. Overview of contributions\n   D. Roadmap\n\nII. Preliminaries and '
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Haystack (last 200 chars): 'pen formalization targets and future work\n\n[HARD CODED BRACKETED DESIGNATION THAT SHOWS END-OF-PAPER DESIGNATION MARK]\n[HARD CODED END-OF-OUTLINE MARK -- ALL OUTLINE CONTENT SHOULD BE ABOVE THIS LINE]'
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    NO_MATCH_FOUND: Text does not exist in document, even with whitespace/line-ending normalization
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    This suggests the model is referencing text that was never written or was from a different document version
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING -    Common causes: (1) Model hallucinated content, (2) Model referenced outline text instead of paper text, (3) Content was removed in prior edit
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - Pre-validation failed: old_string not found in document
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - WARNING - FULL old_string that failed to match:
-Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial in $|\pi_{C}|+|\varphi|$ (\texttt{polynomial\_simulation\_transitive}, Proof~7).
-
-This preorder structure underlies all later comparisons among Resolution, Cutting Planes, Frege, and Extended Frege.  In particular, once a simulation edge $S \psimulates T$ has been verified, any lower-bound result for $S$ automatically propagates to $T$, and any polynomial-boundedness result for $T$ propagates upward to $S$; we develop the associated transfer theorems in Section~IV.
-2026-04-30 20:04:01.726 - backend.compiler.validation.compiler_validator - INFO - Pre-validation rejected: old_string not found in document (pre-validation)
-2026-04-30 20:04:01.742 - backend.compiler.memory.compiler_rejection_log - INFO - Added rejection to log (mode: construction)
-2026-04-30 20:04:01.742 - backend.compiler.core.compiler_coordinator - INFO - Construction rejected
-2026-04-30 20:04:01.742 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
-2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body, retry with feedback)
-2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=8754 chars
-2026-04-30 20:04:01.742 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 8754 chars → 8754 chars (markers preserved)
-2026-04-30 20:04:01.758 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=2583, brainstorm=74310, overhead=5000, rag_budget=139053
-2026-04-30 20:04:01.758 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 20:04:01.758 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
-2026-04-30 20:04:01.758 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:04:27.281 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:04:27.297 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
-2026-04-30 20:04:27.297 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.54s (coverage=0.30, tokens=1739)
-2026-04-30 20:04:27.297 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
-2026-04-30 20:04:27.297 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 20:04:27.297 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 322306 chars
-2026-04-30 20:04:27.312 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_004)...
-2026-04-30 20:15:16.266 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 10878 chars (0 Wolfram tool call(s))
-2026-04-30 20:15:16.266 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 20:15:16.281 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 20:15:16.281 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 6ea8047a-c2c4-4a4f-bfa2-4162c71a2f92 (section_complete=False)
-2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 6ea8047a-c2c4-4a4f-bfa2-4162c71a2f92
-2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 8884 -> 8882 chars, new_string: 8884 -> 8882 chars)
-2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Since polynomial bounds are closed under addition and composition, the right-hand side is polynomial'...
-2026-04-30 20:15:16.281 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 7756
-2026-04-30 20:15:16.291 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_003)...
-2026-04-30 20:15:29.618 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-04-30 20:15:29.618 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=582, new_string_len=8882
-2026-04-30 20:15:29.618 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 8882 chars (conclusion boundary preserved)
-2026-04-30 20:15:29.618 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 3, 2139 words)
-2026-04-30 20:15:29.665 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-04-30 20:15:29.665 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 54 total chunks
-2026-04-30 20:15:30.103 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-04-30 20:15:30.103 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-04-30 20:15:30.108 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-04-30 20:15:30.108 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (2139 words)
-2026-04-30 20:15:30.108 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
-2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=17638 chars
-2026-04-30 20:15:30.108 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 17638 chars → 17638 chars (markers preserved)
-2026-04-30 20:15:30.139 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=5123, brainstorm=74310, overhead=5000, rag_budget=136513
-2026-04-30 20:15:30.139 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 20:15:30.139 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
-2026-04-30 20:15:30.139 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:15:55.850 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:15:55.853 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
-2026-04-30 20:15:55.853 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.71s (coverage=0.31, tokens=1739)
-2026-04-30 20:15:55.853 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
-2026-04-30 20:15:55.853 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 20:15:55.853 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 330093 chars
-2026-04-30 20:15:55.881 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_005)...
-2026-04-30 20:21:30.392 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\Pat\Desktop\MOTO-Autonomous-ASI-development-branch\backend\data\lean4_workspace
-2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 5202 chars (0 Wolfram tool call(s))
-2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 20:26:31.793 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 07747a60-615b-43b7-9046-3c705a0315d2 (section_complete=False)
-2026-04-30 20:26:31.793 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 07747a60-615b-43b7-9046-3c705a0315d2
-2026-04-30 20:26:31.793 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 4088 -> 4086 chars, new_string: 4088 -> 4086 chars)
-2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'Polynomial-time checkability follows because $\\operatorname{TseitinFalse}(\\varphi)$ is computable in'...
-2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 16937
-2026-04-30 20:26:31.809 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_004)...
-2026-04-30 20:26:39.116 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-04-30 20:26:39.116 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=285, new_string_len=4086
-2026-04-30 20:26:39.116 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 4086 chars (conclusion boundary preserved)
-2026-04-30 20:26:39.116 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 4, 2596 words)
-2026-04-30 20:26:39.166 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-04-30 20:26:39.166 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 67 total chunks
-2026-04-30 20:26:39.718 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-04-30 20:26:39.718 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-04-30 20:26:39.718 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-04-30 20:26:39.718 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (2596 words)
-2026-04-30 20:26:39.718 - backend.compiler.agents.high_context_submitter - INFO - Starting outline update review...
-2026-04-30 20:26:39.718 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:26:39.729 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
-2026-04-30 20:26:39.729 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
-2026-04-30 20:26:39.729 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 20:26:39.729 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=outline_update, query_length=14810
-2026-04-30 20:26:39.729 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt']
-2026-04-30 20:27:04.956 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt']
-2026-04-30 20:27:04.956 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 7 chunks from excluded sources (already direct-injected)
-2026-04-30 20:27:04.956 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=outline_update in 25.23s (coverage=0.49, tokens=9893)
-2026-04-30 20:27:04.956 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 62832 chars retrieved
-2026-04-30 20:27:04.956 - backend.compiler.agents.high_context_submitter - INFO - Building outline update prompt...
-2026-04-30 20:27:04.956 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 120460 chars
-2026-04-30 20:27:04.973 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_006)...
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 971 chars
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Outline update not needed
-2026-04-30 20:28:54.068 - backend.compiler.core.compiler_coordinator - INFO - No outline update needed
-2026-04-30 20:28:54.068 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: outline_update)
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements (focus=general)...
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 54105 chars
-2026-04-30 20:28:54.068 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_007)...
-2026-04-30 20:30:47.838 - backend.shared.openrouter_client - ERROR - OpenRouter unexpected error: Expecting value: line 523 column 1 (char 2871)
-2026-04-30 20:30:47.971 - backend.shared.api_client_manager - ERROR - OpenRouter error for role 'compiler_high_context': Expecting value: line 523 column 1 (char 2871), and no LM Studio fallback configured
-2026-04-30 20:30:47.971 - backend.compiler.core.compiler_coordinator - ERROR - Review context overflow: Expecting value: line 523 column 1 (char 2871)
-2026-04-30 20:30:47.986 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: review)
-2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Starting paper review for errors/improvements (focus=general)...
-2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
-2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
-2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Building review prompt (full outline + paper, no aggregator DB)...
-2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 54105 chars
-2026-04-30 20:30:47.986 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_008)...
-2026-04-30 20:30:54.975 - backend.shared.openrouter_client - ERROR - OpenRouter unexpected error: Expecting value: line 13 column 1 (char 66)
-2026-04-30 20:30:55.110 - backend.shared.api_client_manager - ERROR - OpenRouter error for role 'compiler_high_context': Expecting value: line 13 column 1 (char 66), and no LM Studio fallback configured
-2026-04-30 20:30:55.110 - backend.compiler.core.compiler_coordinator - ERROR - Review context overflow: Expecting value: line 13 column 1 (char 66)
-2026-04-30 20:30:55.127 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: review)
-2026-04-30 20:30:55.127 - backend.compiler.core.compiler_coordinator - INFO - Construction loop complete
-2026-04-30 20:30:55.127 - backend.compiler.core.compiler_coordinator - INFO - Starting rigor loop...
-2026-04-30 20:30:55.127 - backend.compiler.agents.high_param_submitter - INFO - Rigor cycle: Stage 1 - theorem discovery
-2026-04-30 20:30:55.147 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=rigor, query_length=16311
-2026-04-30 20:30:55.147 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt']
-2026-04-30 20:31:20.483 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt']
-2026-04-30 20:31:20.499 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 7 chunks from excluded sources (already direct-injected)
-2026-04-30 20:31:20.499 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=rigor in 25.35s (coverage=0.49, tokens=9949)
-2026-04-30 20:31:46.122 - backend.compiler.agents.high_param_submitter - INFO - Rigor cycle: Stage 2 - Lean 4 formalization (up to 5 attempts), retry_failure_id=compiler_rigor_4e20725b82af
-2026-04-30 20:31:46.139 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5141, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:47.136 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:47.136 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5141, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:49.137 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:49.142 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5141, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:49.275 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 1 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
-For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
-2026-04-30 20:31:49.275 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5225, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:50.276 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:50.276 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5225, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:52.272 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:52.272 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5225, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:52.411 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 2 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
-For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
-2026-04-30 20:31:52.411 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5314, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:53.428 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:53.429 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5314, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:55.429 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:55.430 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5314, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:55.564 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 3 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
-For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
-2026-04-30 20:31:55.564 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5403, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:56.564 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:56.564 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5403, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:58.566 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:58.566 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5403, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:58.699 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 4 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
-For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
-2026-04-30 20:31:58.699 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 1/3): model=openai/gpt-5.5, approx_tokens=5492, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:31:59.679 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:31:59.679 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 2/3): model=openai/gpt-5.5, approx_tokens=5492, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:32:01.684 - backend.shared.lm_studio_client - INFO - Retrying after 400 error...
-2026-04-30 20:32:01.684 - backend.shared.lm_studio_client - ERROR - LM Studio 400 Bad Request (attempt 3/3): model=openai/gpt-5.5, approx_tokens=5492, messages_count=1, error={
-    "error": {
-        "message": "No models loaded. Please load a model in the developer page or use the 'lms load' command.",
-        "type": "invalid_request_error",
-        "param": "model",
-        "code": null
-    }
-}
-2026-04-30 20:32:01.819 - backend.autonomous.agents.proof_formalization_agent - WARNING - ProofFormalizationAgent full-script attempt 5 failed for compiler_rigor_4e20725b82af: Client error '400 Bad Request' for url 'http://127.0.0.1:1234/v1/chat/completions'
-For more information check: https://developer.mozilla.org/en-US/docs/Web/HTTP/Status/400
-2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop: no theorem attempted this cycle (decline)
-2026-04-30 20:32:01.819 - backend.compiler.memory.compiler_rejection_log - INFO - Added decline to log (mode: rigor)
-2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Rigor cycle ended (decline: no more theorems or Lean failed)
-2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Rigor loop complete
-2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Starting construction loop...
-2026-04-30 20:32:01.819 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
-2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=21726 chars
-2026-04-30 20:32:01.819 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 21726 chars → 21726 chars (markers preserved)
-2026-04-30 20:32:01.851 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=6205, brainstorm=74310, overhead=5000, rag_budget=135431
-2026-04-30 20:32:01.851 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 20:32:01.851 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
-2026-04-30 20:32:01.851 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:32:27.066 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:32:27.066 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 55 chunks from excluded sources (already direct-injected)
-2026-04-30 20:32:27.066 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.22s (coverage=0.31, tokens=1739)
-2026-04-30 20:32:27.066 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 13639 chars retrieved
-2026-04-30 20:32:27.066 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 20:32:27.066 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 334181 chars
-2026-04-30 20:32:27.091 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_009)...
-2026-04-30 20:45:03.127 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 7064 chars (0 Wolfram tool call(s))
-2026-04-30 20:45:03.127 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 20:45:03.132 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 20:45:03.132 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 209b69f9-8c9c-48d1-818d-fd2fa54623e7 (section_complete=False)
-2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 209b69f9-8c9c-48d1-818d-fd2fa54623e7
-2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 6279 -> 6277 chars, new_string: 6279 -> 6277 chars)
-2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'This completes the verified infrastructure for propositional proof systems.\n\n'
-2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 21235
-2026-04-30 20:45:03.132 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_005)...
-2026-04-30 20:45:13.994 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-04-30 20:45:13.994 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=75, new_string_len=6277
-2026-04-30 20:45:13.994 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 6277 chars (conclusion boundary preserved)
-2026-04-30 20:45:14.003 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 5, 3325 words)
-2026-04-30 20:45:14.055 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-04-30 20:45:14.055 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 85 total chunks
-2026-04-30 20:45:14.741 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-04-30 20:45:14.741 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-04-30 20:45:14.741 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-04-30 20:45:14.741 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (3325 words)
-2026-04-30 20:45:14.741 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
-2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=28005 chars
-2026-04-30 20:45:14.741 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 28005 chars → 28005 chars (markers preserved)
-2026-04-30 20:45:14.775 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=7922, brainstorm=74310, overhead=5000, rag_budget=133714
-2026-04-30 20:45:14.775 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 20:45:14.775 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
-2026-04-30 20:45:14.775 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:45:40.673 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:45:40.675 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 54 chunks from excluded sources (already direct-injected)
-2026-04-30 20:45:40.677 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 25.90s (coverage=0.30, tokens=1562)
-2026-04-30 20:45:40.677 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 12229 chars retrieved
-2026-04-30 20:45:40.677 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 20:45:40.677 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 339050 chars
-2026-04-30 20:45:40.693 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_010)...
-2026-04-30 20:55:56.846 - backend.compiler.agents.high_context_submitter - INFO - LLM completion received: 7546 chars (0 Wolfram tool call(s))
-2026-04-30 20:55:56.846 - backend.compiler.agents.high_context_submitter - INFO - Parsing JSON response...
-2026-04-30 20:55:56.861 - backend.compiler.agents.high_context_submitter - INFO - JSON parsed successfully
-2026-04-30 20:55:56.861 - backend.compiler.agents.high_context_submitter - INFO - Construction submission generated: 254a7f73-ee41-4e48-a517-d664121ea839 (section_complete=False)
-2026-04-30 20:55:56.863 - backend.compiler.validation.compiler_validator - INFO - Validating construction submission: 254a7f73-ee41-4e48-a517-d664121ea839
-2026-04-30 20:55:56.863 - backend.compiler.validation.compiler_validator - INFO - Stripped placeholder text from submission (content: 6564 -> 6562 chars, new_string: 6564 -> 6562 chars)
-2026-04-30 20:55:56.911 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_START: mode=construction, operation=insert_after
-2026-04-30 20:55:56.911 - backend.compiler.validation.compiler_validator - INFO -    old_string preview: 'The Lean theorem \\texttt{quantitative\\_lower\\_bound\\_transfer\\_under\\_simulation} (Proof~6) verifies'...
-2026-04-30 20:55:56.911 - backend.compiler.validation.compiler_validator - INFO - PRE_VALIDATE_SUCCESS: old_string found uniquely at position 27464
-2026-04-30 20:55:56.913 - backend.compiler.validation.compiler_validator - INFO - Generating validation via api_client_manager (task_id=comp_val_006)...
-2026-04-30 20:56:05.370 - backend.compiler.validation.compiler_validator - INFO - Validation result: accept (coherence=True, rigor=True, placement=True)
-2026-04-30 20:56:05.370 - backend.compiler.core.compiler_coordinator - INFO - _apply_edit: operation=insert_after, old_string_len=125, new_string_len=6562
-2026-04-30 20:56:05.370 - backend.compiler.core.compiler_coordinator - INFO - Insert after: inserted 6562 chars (conclusion boundary preserved)
-2026-04-30 20:56:05.370 - backend.compiler.memory.paper_memory - INFO - Paper updated (version 6, 4110 words)
-2026-04-30 20:56:05.421 - backend.aggregator.core.rag_manager - INFO - Removed document: compiler_paper.txt
-2026-04-30 20:56:05.432 - backend.aggregator.ingestion.pipeline - INFO - Ingested compiler_paper.txt: 107 total chunks
-2026-04-30 20:56:06.384 - backend.aggregator.core.rag_manager - INFO - Added text: compiler_paper.txt
-2026-04-30 20:56:06.384 - backend.compiler.core.compiler_rag_manager - INFO - Paper re-chunked successfully
-2026-04-30 20:56:06.388 - backend.compiler.memory.compiler_rejection_log - INFO - Added acceptance to log (mode: construction)
-2026-04-30 20:56:06.388 - backend.compiler.core.compiler_coordinator - INFO - Construction accepted (4110 words)
-2026-04-30 20:56:06.388 - backend.compiler.core.compiler_coordinator - INFO - Loaded brainstorm content for retroactive corrections: 258469 chars
-2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - Starting construction submission generation (first=False, phase=body)
-2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - Loading outline and paper state...
-2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - State loaded: outline=2504 chars, paper=34569 chars
-2026-04-30 20:56:06.388 - backend.compiler.agents.high_context_submitter - INFO - Paper prepared for LLM: 34569 chars → 34569 chars (markers preserved)
-2026-04-30 20:56:06.422 - backend.compiler.agents.high_context_submitter - INFO - Context budget: max=221500, outline=554, paper=9712, brainstorm=74310, overhead=5000, rag_budget=131924
-2026-04-30 20:56:06.422 - backend.compiler.agents.high_context_submitter - INFO - Retrieving aggregator database evidence via RAG...
-2026-04-30 20:56:06.422 - backend.compiler.core.compiler_rag_manager - INFO - Starting RAG retrieval for mode=construction, query_length=15311
-2026-04-30 20:56:06.422 - backend.compiler.core.compiler_rag_manager - INFO - Excluding direct-injected sources: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:56:32.896 - backend.aggregator.core.rag_manager - INFO - RAG Stage 4/4: Excluding sources already direct-injected: ['compiler_outline.txt', 'compiler_paper.txt', 'brainstorm_topic_004.txt']
-2026-04-30 20:56:32.896 - backend.aggregator.core.rag_manager - INFO - RAG packing: Skipped 54 chunks from excluded sources (already direct-injected)
-2026-04-30 20:56:32.896 - backend.compiler.core.compiler_rag_manager - INFO - RAG retrieval complete for mode=construction in 26.47s (coverage=0.31, tokens=1562)
-2026-04-30 20:56:32.896 - backend.compiler.agents.high_context_submitter - INFO - RAG retrieval complete: 12229 chars retrieved
-2026-04-30 20:56:32.896 - backend.compiler.agents.high_context_submitter - INFO - Building construction prompt for phase: body...
-2026-04-30 20:56:32.896 - backend.compiler.agents.high_context_submitter - INFO - Prompt built: 345614 chars
-2026-04-30 20:56:32.925 - backend.compiler.agents.high_context_submitter - INFO - Generating LLM completion via api_client_manager (task_id=comp_hc_011)...

From bf002abaee85db2939da2bf4567bcf666e5eeef1 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 17:21:34 -0500
Subject: [PATCH 15/32] # Version 1.0.7

## Features
- Lean 4 integrated: the automated theorem generation pipeline is now complete, with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT-5.5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed a GUI status bug that showed LM Studio as "offline" when it was actually online.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 frontend/src/utils/autonomousProfiles.js | 64 ++++++++++++++++++++++++
 1 file changed, 64 insertions(+)

diff --git a/frontend/src/utils/autonomousProfiles.js b/frontend/src/utils/autonomousProfiles.js
index 94a0c90..057dfec 100644
--- a/frontend/src/utils/autonomousProfiles.js
+++ b/frontend/src/utils/autonomousProfiles.js
@@ -8,9 +8,11 @@ export const RECOMMENDED_PROFILE_KEY = 'recommended_slower_affordable_higher_kno
 export const RECOMMENDED_ALTERNATE_PROFILE_KEY = 'recommended_fast_affordable_mid';
 export const RECOMMENDED_LAB_FAST_PROFILE_KEY = 'recommended_lab_fast_costly_extra_high';
 export const RECOMMENDED_LAB_MAX_PROFILE_KEY = 'recommended_lab_slow_costly_max';
+export const RECOMMENDED_ENTRY_LAB_PROFILE_KEY = 'recommended_entry_lab_fast_less_affordable';
 export const RECOMMENDED_PROFILE_KEYS = [
   RECOMMENDED_PROFILE_KEY,
   RECOMMENDED_ALTERNATE_PROFILE_KEY,
+  RECOMMENDED_ENTRY_LAB_PROFILE_KEY,
   RECOMMENDED_LAB_FAST_PROFILE_KEY,
   RECOMMENDED_LAB_MAX_PROFILE_KEY,
 ];
@@ -198,6 +200,68 @@ export const RECOMMENDED_PROFILES = {
       maxOutputTokens: 65500,
     },
   },
+  [RECOMMENDED_ENTRY_LAB_PROFILE_KEY]: {
+    name: 'Fast, less affordable, higher knowledge',
+    numSubmitters: 3,
+    submitters: [
+      {
+        modelId: 'x-ai/grok-4.3',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 1000000,
+        maxOutputTokens: 128000,
+      },
+      {
+        modelId: 'moonshotai/kimi-k2.6',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 262000,
+        maxOutputTokens: 40000,
+      },
+      {
+        modelId: 'x-ai/grok-4.3',
+        provider: 'openrouter',
+        openrouterProvider: null,
+        lmStudioFallbackId: null,
+        contextWindow: 1000000,
+        maxOutputTokens: 128000,
+      },
+    ],
+    validator: {
+      modelId: 'x-ai/grok-4.1-fast',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 2000000,
+      maxOutputTokens: 30000,
+    },
+    highContext: {
+      modelId: 'x-ai/grok-4.3',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1000000,
+      maxOutputTokens: 128000,
+    },
+    highParam: {
+      modelId: 'x-ai/grok-4.3',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1000000,
+      maxOutputTokens: 128000,
+    },
+    critique: {
+      modelId: 'google/gemini-3.1-pro-preview',
+      provider: 'openrouter',
+      openrouterProvider: null,
+      lmStudioFallbackId: null,
+      contextWindow: 1048576,
+      maxOutputTokens: 65500,
+    },
+  },
   [RECOMMENDED_LAB_FAST_PROFILE_KEY]: {
     name: 'Lab grade, fast, costly (starts at ~$10 per hour), extra-high knowledge',
     numSubmitters: 3,

From 8710879c45d93669f4c7427a0eaf323c9adefe7c Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 18:09:20 -0500
Subject: [PATCH 16/32] # Version 1.0.7

## Features
- Lean 4 integrated: the automated theorem generation pipeline is now complete, with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT-5.5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed a GUI status bug that showed LM Studio as "offline" when it was actually online.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 ...program-directory-and-file-definitions.mdc |  4 +-
 backend/api/routes/proofs.py                  | 41 +++++++++++--------
 .../autonomous/MathematicalProofs.jsx         | 23 ++++++++---
 3 files changed, 45 insertions(+), 23 deletions(-)

diff --git a/.cursor/rules/program-directory-and-file-definitions.mdc b/.cursor/rules/program-directory-and-file-definitions.mdc
index 13eab9e..ff05a19 100644
--- a/.cursor/rules/program-directory-and-file-definitions.mdc
+++ b/.cursor/rules/program-directory-and-file-definitions.mdc
@@ -179,7 +179,7 @@ project-root/
 │   │       ├── openrouter.py            # OpenRouter API endpoints (global key, models, providers + endpoint metadata, LM Studio availability, **GET /api/model-cache** for model ID caching, **POST /api/openrouter/reset-exhaustion** to reset credit exhaustion mid-session)
 │   │       ├── websocket.py             # WebSocket for real-time updates (proxy auth validation in generic mode before accept)
 │   │       ├── features.py              # GET /api/features — shared build identity plus stable capability flags (`generic_mode`, `lm_studio_enabled`, `pdf_download_available`)
-│   │       ├── proofs.py                # Proof database + Lean 4/SMT runtime + manual proof-check + certificate export + dependency graph routes (all gated on `lean4_enabled`)
+│   │       ├── proofs.py                # Proof database + Lean 4/SMT runtime + manual proof-check + certificate export + dependency graph routes; listing proofs (`GET /`, `/novel`, `/known`, `/library*`) and certificate/lean downloads (`/{id}/certificate`, `/{id}/certificate.lean`) are always available regardless of `lean4_enabled`; dependency/graph routes and `/check` are gated on `lean4_enabled`; `/status` uses short timeouts so it never blocks the UI
 │   │       └── health.py                # GET /api/health — readiness/liveness probe with instance/build metadata
 │   │
 │   ├── data/                            # Persistent data storage
@@ -393,7 +393,7 @@ project-root/
 
 - `compiler.py`: Compiler control (start/stop/status), paper/outline access, critique management
 - `autonomous.py`: Autonomous research control (start/stop/clear/status), brainstorm/paper access, Tier 3 endpoints
-- `proofs.py`: Proof database listing, `/status` runtime readiness, `POST /settings` runtime flag updates, `POST /check` manual proof check, `/{id}/certificate[.lean]` certificate export, `/{id}/dependencies` + `/graph` + `/mathlib/{lemma}/dependents` graph/lineage queries (all above gated on `lean4_enabled`); `GET /library` + `GET /library/{session_id}/{proof_id}` cross-session proof library endpoints (NOT gated — read-only file access, always available).
+- `proofs.py`: Proof database listing (`GET /`, `/novel`, `/known`) and `/status` runtime readiness — always available, never gated. `/{id}/certificate` and `/{id}/certificate.lean` — always available (data is stored on disk; Lean version info populated only when Lean is enabled). `/status` uses `asyncio.wait_for` timeouts (5s Lean, 3s Z3) so the endpoint never hangs. `POST /settings` runtime flag updates. `POST /check` manual proof check, `/{id}/dependencies`, `/graph`, `/mathlib/{lemma}/dependents` graph/lineage queries — gated on `lean4_enabled`. `GET /library` + `GET /library/{session_id}/{proof_id}` cross-session proof library endpoints — always available.
 
 ### Frontend Components
 
diff --git a/backend/api/routes/proofs.py b/backend/api/routes/proofs.py
index 5ec114a..9dff94b 100644
--- a/backend/api/routes/proofs.py
+++ b/backend/api/routes/proofs.py
@@ -3,6 +3,7 @@
 """
 from __future__ import annotations
 
+import asyncio
 import logging
 from typing import Optional, Tuple
 
@@ -301,7 +302,11 @@ async def cleanup_known_proofs_from_files():
 
 @router.get("/status")
 async def get_proofs_status():
-    """Return Lean 4 availability and proof-database status."""
+    """Return Lean 4 availability and proof-database status.
+
+    Non-blocking: Lean workspace checks use a short timeout so the
+    endpoint always returns quickly even when Lean is unavailable.
+    """
     version = ""
     workspace_ready = False
     mathlib_commit = ""
@@ -310,15 +315,18 @@ async def get_proofs_status():
     smt_available = False
     manual_check_ready, manual_check_message = await _get_manual_check_status()
     if system_config.lean4_enabled:
-        client = get_lean4_client()
-        version = await client.get_version()
-        workspace_ready = await client.ensure_workspace()
-        mathlib_commit = client.get_mathlib_commit()
-        lsp_active = client.is_server_active()
+        try:
+            client = get_lean4_client()
+            version = await asyncio.wait_for(client.get_version(), timeout=5.0)
+            workspace_ready = await asyncio.wait_for(client.ensure_workspace(), timeout=5.0)
+            mathlib_commit = client.get_mathlib_commit()
+            lsp_active = client.is_server_active()
+        except (asyncio.TimeoutError, Exception) as exc:
+            logger.warning("Lean 4 status check timed out or failed: %s", exc)
 
     if system_config.smt_enabled:
         try:
-            z3_version = await get_smt_client().get_version()
+            z3_version = await asyncio.wait_for(get_smt_client().get_version(), timeout=3.0)
             lowered_version = z3_version.lower()
             smt_available = bool(z3_version) and "not found" not in lowered_version and "no such file" not in lowered_version
         except Exception as exc:
@@ -467,16 +475,20 @@ async def get_library_proof(session_id: str, proof_id: str):
 @router.get("/{proof_id}/certificate")
 async def get_proof_certificate(proof_id: str):
     """Return a machine-readable proof certificate JSON payload."""
-    if not system_config.lean4_enabled:
-        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Proof certificates are unavailable while Lean 4 is disabled."})
-
     proof = await proof_database.get_proof(proof_id)
     if proof is None:
         raise HTTPException(status_code=404, detail="Proof not found")
 
-    client = get_lean4_client()
-    lean_version = await client.get_version() if system_config.lean4_enabled else ""
-    mathlib_commit = client.get_mathlib_commit()
+    lean_version = ""
+    mathlib_commit = ""
+    if system_config.lean4_enabled:
+        try:
+            client = get_lean4_client()
+            lean_version = await client.get_version()
+            mathlib_commit = client.get_mathlib_commit()
+        except Exception:
+            pass
+
     lean_code = await proof_database.get_lean_code(proof_id)
     payload = {
         "proof_id": proof.proof_id,
@@ -507,9 +519,6 @@ async def get_proof_certificate(proof_id: str):
 @router.get("/{proof_id}/certificate.lean")
 async def get_proof_certificate_lean(proof_id: str):
     """Return the raw saved Lean file for a proof."""
-    if not system_config.lean4_enabled:
-        raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Proof certificates are unavailable while Lean 4 is disabled."})
-
     proof = await proof_database.get_proof(proof_id)
     if proof is None:
         raise HTTPException(status_code=404, detail="Proof not found")
diff --git a/frontend/src/components/autonomous/MathematicalProofs.jsx b/frontend/src/components/autonomous/MathematicalProofs.jsx
index cbf11ed..829f44c 100644
--- a/frontend/src/components/autonomous/MathematicalProofs.jsx
+++ b/frontend/src/components/autonomous/MathematicalProofs.jsx
@@ -87,17 +87,30 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
       setError(null);
       setProofGraphState(createEmptyGraphState());
 
-      const [proofsResponse, statusResponse, brainstormsResponse, papersResponse] = await Promise.all([
+      const [proofsResult, statusResult, brainstormsResult, papersResult] = await Promise.allSettled([
         api.getProofs(),
         api.getProofStatus(),
         api.getBrainstorms(),
         api.getPapers(),
       ]);
 
-      setProofs(proofsResponse.proofs || []);
-      setProofStatus(statusResponse);
-      setBrainstorms(brainstormsResponse.brainstorms || []);
-      setPapers(papersResponse.papers || []);
+      if (proofsResult.status === 'fulfilled') {
+        setProofs(proofsResult.value.proofs || []);
+      } else {
+        setError(`Failed to load proofs: ${proofsResult.reason?.message || 'Unknown error'}`);
+      }
+
+      if (statusResult.status === 'fulfilled') {
+        setProofStatus(statusResult.value);
+      }
+
+      if (brainstormsResult.status === 'fulfilled') {
+        setBrainstorms(brainstormsResult.value.brainstorms || []);
+      }
+
+      if (papersResult.status === 'fulfilled') {
+        setPapers(papersResult.value.papers || []);
+      }
     } catch (err) {
       setError(`Failed to load proofs: ${err.message}`);
     } finally {

From b6197b8671fdb6fc8168d5d6152623e4e1f56fbc Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 18:35:38 -0500
Subject: [PATCH 17/32] # Version 1.0.7

## Features
- Lean 4 Integrated: the automated theorem generation pipeline is now complete, with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% of the model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in every default profile that used it.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed a GUI status bug that showed LM Studio as "offline" even when it was available.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 backend/api/main.py                           |   2 +
 backend/api/routes/__init__.py                |   4 +-
 backend/api/routes/update.py                  |  70 +++++++
 frontend/src/App.jsx                          |  32 +---
 .../components/CritiqueNotificationStack.jsx  |   7 +-
 .../components/UpdateNotificationBanner.jsx   | 181 ++++++++++++++++++
 .../autonomous/ProofNotificationStack.jsx     |   5 +-
 frontend/src/index.css                        | 113 ++++++++++-
 frontend/src/services/api.js                  |  12 ++
 9 files changed, 391 insertions(+), 35 deletions(-)
 create mode 100644 backend/api/routes/update.py
 create mode 100644 frontend/src/components/UpdateNotificationBanner.jsx

diff --git a/backend/api/main.py b/backend/api/main.py
index 9a04f47..bc1c77b 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -22,6 +22,7 @@
     features,
     health,
     proofs,
+    update,
 )
 from backend.shared.build_info import get_build_info
 from backend.shared.lm_studio_client import lm_studio_client
@@ -291,6 +292,7 @@ async def _warm_start_lean4() -> None:
 app.include_router(proofs.router)
 app.include_router(openrouter.router)
 app.include_router(download.router)
+app.include_router(update.router)
 app.include_router(websocket.router)
 
 
diff --git a/backend/api/routes/__init__.py b/backend/api/routes/__init__.py
index c7f3682..512b263 100644
--- a/backend/api/routes/__init__.py
+++ b/backend/api/routes/__init__.py
@@ -1,4 +1,4 @@
 """API routes"""
-from . import aggregator, compiler, autonomous, websocket, boost, workflow, features, health, proofs
+from . import aggregator, compiler, autonomous, websocket, boost, workflow, features, health, proofs, update
 
-__all__ = ['aggregator', 'compiler', 'autonomous', 'websocket', 'boost', 'workflow', 'features', 'health', 'proofs']
+__all__ = ['aggregator', 'compiler', 'autonomous', 'websocket', 'boost', 'workflow', 'features', 'health', 'proofs', 'update']
diff --git a/backend/api/routes/update.py b/backend/api/routes/update.py
new file mode 100644
index 0000000..38854a4
--- /dev/null
+++ b/backend/api/routes/update.py
@@ -0,0 +1,70 @@
+"""
+Self-update routes — allows the frontend to trigger `git pull origin main`
+and poll progress in real time.
+"""
+from __future__ import annotations
+
+import asyncio
+import logging
+from pathlib import Path
+from typing import Any, Dict, List
+
+from fastapi import APIRouter
+
+router = APIRouter(tags=["update"])
+logger = logging.getLogger(__name__)
+
+_REPO_ROOT = Path(__file__).resolve().parents[3]
+
+_pull_state: Dict[str, Any] = {
+    "status": "idle",
+    "output_lines": [],
+    "returncode": None,
+}
+
+
+async def _run_pull() -> None:
+    """Execute git pull as an async subprocess, streaming output into _pull_state."""
+    global _pull_state
+    _pull_state = {"status": "running", "output_lines": [], "returncode": None}
+
+    try:
+        proc = await asyncio.create_subprocess_exec(
+            "git", "pull", "origin", "main",
+            cwd=str(_REPO_ROOT),
+            stdout=asyncio.subprocess.PIPE,
+            stderr=asyncio.subprocess.STDOUT,
+        )
+
+        assert proc.stdout is not None
+        while True:
+            line = await proc.stdout.readline()
+            if not line:
+                break
+            decoded = line.decode("utf-8", errors="replace").rstrip("\n")
+            _pull_state["output_lines"].append(decoded)
+
+        await proc.wait()
+        _pull_state["returncode"] = proc.returncode
+        _pull_state["status"] = "done" if proc.returncode == 0 else "error"
+    except Exception as exc:
+        logger.exception("git pull failed with exception")
+        _pull_state["output_lines"].append(f"Exception: {exc}")
+        _pull_state["returncode"] = -1
+        _pull_state["status"] = "error"
+
+
+@router.post("/api/update/pull")
+async def start_pull() -> Dict[str, Any]:
+    """Kick off a git pull. Returns immediately; poll /api/update/pull-status for progress."""
+    if _pull_state["status"] == "running":
+        return {"started": False, "reason": "A pull is already in progress."}
+
+    asyncio.create_task(_run_pull())
+    return {"started": True}
+
+
+@router.get("/api/update/pull-status")
+async def get_pull_status() -> Dict[str, Any]:
+    """Return current pull state including streamed output lines."""
+    return _pull_state
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index 4368309..a48fbff 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -28,6 +28,7 @@ import CritiqueNotificationStack from './components/CritiqueNotificationStack';
 import ProofNotificationStack from './components/autonomous/ProofNotificationStack';
 import CreditExhaustionNotificationStack from './components/CreditExhaustionNotificationStack';
 import HungConnectionNotificationStack from './components/HungConnectionNotificationStack';
+import UpdateNotificationBanner from './components/UpdateNotificationBanner';
 import PaperCritiqueModal from './components/PaperCritiqueModal';
 import { websocket } from './services/websocket';
 import { api, autonomousAPI, openRouterAPI } from './services/api';
@@ -2083,31 +2084,10 @@ function App() {
 
       {/* Update Notice Banner — dismissible per session, reappears on restart */}
       {updateNotice && !updateNoticeDismissed && (
-        <div className="update-notice-banner">
-          <div className="update-notice-content">
-            <span className="update-notice-icon">&#9432;</span>
-            <span className="update-notice-text">
-              <strong>Update available:</strong>{' '}
-              {updateNotice.installed_version} ({updateNotice.installed_commit})
-              {' '}&rarr;{' '}
-              {updateNotice.available_version} ({updateNotice.available_commit})
-              {' '}&mdash;{' '}
-              <span className="update-notice-detail">
-                {updateNotice.can_auto_apply
-                  ? 'Restart the launcher to apply this update.'
-                  : `Install layout: ${updateNotice.install_layout}. Pull the latest from GitHub main to update.`}
-              </span>
-            </span>
-          </div>
-          <button
-            className="update-notice-dismiss"
-            onClick={() => setUpdateNoticeDismissed(true)}
-            aria-label="Dismiss update notice"
-            title="Dismiss"
-          >
-            &#10005;
-          </button>
-        </div>
+        <UpdateNotificationBanner
+          notice={updateNotice}
+          onDismiss={() => setUpdateNoticeDismissed(true)}
+        />
       )}
       
       {/* CRITICAL: Boost buttons are ETERNAL - they NEVER disappear */}
@@ -2552,6 +2532,7 @@ function App() {
         notifications={proofNotifications}
         onDismiss={handleDismissProofNotification}
         onClickNotification={handleClickProofNotification}
+        panelCollapsed={workflowPanelCollapsed}
       />
       
       {/* Critique Notification Stack - Persists across all screens */}
@@ -2559,6 +2540,7 @@ function App() {
         notifications={critiqueNotifications}
         onDismiss={handleDismissNotification}
         onClickNotification={handleClickNotification}
+        panelCollapsed={workflowPanelCollapsed}
       />
       
       {/* Credit Exhaustion Notification Stack - Persists until user dismisses */}
diff --git a/frontend/src/components/CritiqueNotificationStack.jsx b/frontend/src/components/CritiqueNotificationStack.jsx
index 4b9d74f..b37a9fc 100644
--- a/frontend/src/components/CritiqueNotificationStack.jsx
+++ b/frontend/src/components/CritiqueNotificationStack.jsx
@@ -48,7 +48,7 @@ function getRatingColor(rating) {
  * - onDismiss: (id) => void - callback when notification is dismissed
  * - onClickNotification: (paper_id, paper_title) => void - callback when notification is clicked
  */
-export default function CritiqueNotificationStack({ notifications, onDismiss, onClickNotification }) {
+export default function CritiqueNotificationStack({ notifications, onDismiss, onClickNotification, panelCollapsed }) {
   if (!notifications || notifications.length === 0) {
     return null;
   }
@@ -58,12 +58,13 @@ export default function CritiqueNotificationStack({ notifications, onDismiss, on
       style={{
         position: 'fixed',
         bottom: '20px',
-        right: '20px',
+        right: panelCollapsed ? '20px' : '340px',
         zIndex: 999999,
         display: 'flex',
         flexDirection: 'column',
         gap: scalePx(8),
-        pointerEvents: 'none', // Allow clicks through container
+        pointerEvents: 'none',
+        transition: 'right 0.15s ease',
       }}
     >
       {notifications.map((notification, index) => (
diff --git a/frontend/src/components/UpdateNotificationBanner.jsx b/frontend/src/components/UpdateNotificationBanner.jsx
new file mode 100644
index 0000000..9104cff
--- /dev/null
+++ b/frontend/src/components/UpdateNotificationBanner.jsx
@@ -0,0 +1,181 @@
+import React, { useState, useEffect, useRef } from 'react';
+import { api } from '../services/api';
+
+const POLL_INTERVAL_MS = 1000;
+
+export default function UpdateNotificationBanner({ notice, onDismiss }) {
+  const [phase, setPhase] = useState('idle');
+  const [outputLines, setOutputLines] = useState([]);
+  const [errorMessage, setErrorMessage] = useState('');
+  const logRef = useRef(null);
+  const pollRef = useRef(null);
+
+  useEffect(() => {
+    return () => {
+      if (pollRef.current) clearInterval(pollRef.current);
+    };
+  }, []);
+
+  useEffect(() => {
+    if (logRef.current) {
+      logRef.current.scrollTop = logRef.current.scrollHeight;
+    }
+  }, [outputLines]);
+
+  const startPolling = () => {
+    pollRef.current = setInterval(async () => {
+      try {
+        const status = await api.getPullStatus();
+        setOutputLines(status.output_lines || []);
+        if (status.status === 'done') {
+          clearInterval(pollRef.current);
+          pollRef.current = null;
+          setPhase('success');
+        } else if (status.status === 'error') {
+          clearInterval(pollRef.current);
+          pollRef.current = null;
+          setErrorMessage(
+            (status.output_lines || []).slice(-5).join('\n') || 'Unknown error'
+          );
+          setPhase('error');
+        }
+      } catch {
+        clearInterval(pollRef.current);
+        pollRef.current = null;
+        setErrorMessage('Lost connection to backend while pulling.');
+        setPhase('error');
+      }
+    }, POLL_INTERVAL_MS);
+  };
+
+  const handlePull = async () => {
+    setPhase('pulling');
+    setOutputLines([]);
+    setErrorMessage('');
+    try {
+      const resp = await api.startPull();
+      if (!resp.started) {
+        setErrorMessage(resp.reason || 'Pull rejected by server.');
+        setPhase('error');
+        return;
+      }
+      startPolling();
+    } catch (err) {
+      setErrorMessage(err.message || 'Failed to start pull.');
+      setPhase('error');
+    }
+  };
+
+  const handleRetry = () => {
+    handlePull();
+  };
+
+  if (phase === 'idle') {
+    return (
+      <div className="update-notice-banner">
+        <div className="update-notice-content">
+          <span className="update-notice-icon">&#9432;</span>
+          <span className="update-notice-text">
+            <strong>Update available:</strong>{' '}
+            {notice.installed_version} ({notice.installed_commit})
+            {' '}&rarr;{' '}
+            {notice.available_version} ({notice.available_commit})
+          </span>
+          <div className="update-notice-actions">
+            <button
+              className="update-notice-pull-btn"
+              onClick={handlePull}
+            >
+              Update
+            </button>
+            <button
+              className="update-notice-dismiss"
+              onClick={onDismiss}
+              aria-label="Dismiss update notice"
+              title="Dismiss"
+            >
+              Dismiss
+            </button>
+          </div>
+        </div>
+      </div>
+    );
+  }
+
+  if (phase === 'pulling') {
+    return (
+      <div className="update-notice-banner update-notice-pulling">
+        <div className="update-notice-content">
+          <span className="update-notice-spinner" />
+          <span className="update-notice-text">
+            <strong>Pulling update...</strong>
+          </span>
+        </div>
+        <pre className="update-notice-log" ref={logRef}>
+          {outputLines.length > 0
+            ? outputLines.join('\n')
+            : 'Waiting for output...'}
+        </pre>
+      </div>
+    );
+  }
+
+  if (phase === 'success') {
+    return (
+      <div className="update-notice-banner update-notice-success">
+        <div className="update-notice-content">
+          <span className="update-notice-icon update-notice-icon-success">&#10003;</span>
+          <span className="update-notice-text">
+            <strong>Update applied!</strong>{' '}
+            Restart the backend server to take effect.
+          </span>
+          <button
+            className="update-notice-dismiss"
+            onClick={onDismiss}
+            aria-label="Dismiss update notice"
+            title="Dismiss"
+          >
+            Dismiss
+          </button>
+        </div>
+        <pre className="update-notice-log" ref={logRef}>
+          {outputLines.join('\n')}
+        </pre>
+      </div>
+    );
+  }
+
+  // phase === 'error'
+  return (
+    <div className="update-notice-banner update-notice-error">
+      <div className="update-notice-content">
+        <span className="update-notice-icon update-notice-icon-error">&#10007;</span>
+        <span className="update-notice-text">
+          <strong>Update failed.</strong>{' '}
+          {errorMessage}
+        </span>
+        <div className="update-notice-actions">
+          <button
+            className="update-notice-pull-btn"
+            onClick={handleRetry}
+          >
+            Retry
+          </button>
+          <button
+            className="update-notice-dismiss"
+            onClick={onDismiss}
+            aria-label="Dismiss update notice"
+            title="Dismiss"
+          >
+            Dismiss
+          </button>
+        </div>
+      </div>
+      {outputLines.length > 0 && (
+        <pre className="update-notice-log" ref={logRef}>
+          {outputLines.join('\n')}
+        </pre>
+      )}
+    </div>
+  );
+}
diff --git a/frontend/src/components/autonomous/ProofNotificationStack.jsx b/frontend/src/components/autonomous/ProofNotificationStack.jsx
index 6843f57..b4cda04 100644
--- a/frontend/src/components/autonomous/ProofNotificationStack.jsx
+++ b/frontend/src/components/autonomous/ProofNotificationStack.jsx
@@ -47,7 +47,7 @@ function getTierStyle(tier) {
   return TIER_STYLES[tier] || TIER_STYLES.mathematical_discovery;
 }
 
-export default function ProofNotificationStack({ notifications, onDismiss, onClickNotification }) {
+export default function ProofNotificationStack({ notifications, onDismiss, onClickNotification, panelCollapsed }) {
   if (!notifications || notifications.length === 0) {
     return null;
   }
@@ -57,12 +57,13 @@ export default function ProofNotificationStack({ notifications, onDismiss, onCli
       style={{
         position: 'fixed',
         bottom: scalePx(116),
-        right: '20px',
+        right: panelCollapsed ? '20px' : '340px',
         zIndex: 999998,
         display: 'flex',
         flexDirection: 'column',
         gap: scalePx(8),
         pointerEvents: 'none',
+        transition: 'right 0.15s ease',
       }}
     >
       {notifications.map((notification) => {
diff --git a/frontend/src/index.css b/frontend/src/index.css
index 0b0d539..9054c22 100644
--- a/frontend/src/index.css
+++ b/frontend/src/index.css
@@ -2235,7 +2235,6 @@ button.danger:hover {
 .update-notice-banner {
   display: flex;
   align-items: center;
-  justify-content: space-between;
   gap: 1rem;
   padding: 0.6rem 1.2rem;
   background: linear-gradient(135deg, rgba(30, 255, 28, 0.12) 0%, rgba(30, 200, 28, 0.08) 100%);
@@ -2244,6 +2243,25 @@ button.danger:hover {
   font-size: 0.88rem;
   line-height: 1.45;
   z-index: 50;
+  flex-wrap: wrap;
+}
+
+.update-notice-banner.update-notice-pulling {
+  background: linear-gradient(135deg, rgba(59, 130, 246, 0.12) 0%, rgba(59, 130, 246, 0.06) 100%);
+  border-bottom-color: rgba(59, 130, 246, 0.4);
+  color: #bfdbfe;
+}
+
+.update-notice-banner.update-notice-success {
+  background: linear-gradient(135deg, rgba(34, 197, 94, 0.14) 0%, rgba(34, 197, 94, 0.07) 100%);
+  border-bottom-color: rgba(34, 197, 94, 0.5);
+  color: #bbf7d0;
+}
+
+.update-notice-banner.update-notice-error {
+  background: linear-gradient(135deg, rgba(239, 68, 68, 0.12) 0%, rgba(239, 68, 68, 0.06) 100%);
+  border-bottom-color: rgba(239, 68, 68, 0.4);
+  color: #fecaca;
 }
 
 .update-notice-content {
@@ -2260,23 +2278,80 @@ button.danger:hover {
   flex-shrink: 0;
 }
 
+.update-notice-icon-success {
+  color: #22c55e;
+}
+
+.update-notice-icon-error {
+  color: #ef4444;
+}
+
 .update-notice-text strong {
   color: #1eff1c;
 }
 
+.update-notice-pulling .update-notice-text strong {
+  color: #93c5fd;
+}
+
+.update-notice-success .update-notice-text strong {
+  color: #4ade80;
+}
+
+.update-notice-error .update-notice-text strong {
+  color: #f87171;
+}
+
 .update-notice-detail {
   color: #a0d89e;
 }
 
+.update-notice-actions {
+  display: flex;
+  align-items: center;
+  gap: 0.5rem;
+  flex-shrink: 0;
+}
+
+.update-notice-pull-btn {
+  background: rgba(30, 255, 28, 0.2);
+  border: 1px solid rgba(30, 255, 28, 0.5);
+  border-radius: 4px;
+  color: #1eff1c;
+  font-size: 0.82rem;
+  font-weight: 600;
+  cursor: pointer;
+  padding: 0.3rem 0.75rem;
+  line-height: 1;
+  transition: background 0.15s, border-color 0.15s;
+}
+
+.update-notice-pull-btn:hover {
+  background: rgba(30, 255, 28, 0.35);
+  border-color: rgba(30, 255, 28, 0.8);
+}
+
+.update-notice-error .update-notice-pull-btn {
+  background: rgba(239, 68, 68, 0.2);
+  border-color: rgba(239, 68, 68, 0.5);
+  color: #f87171;
+}
+
+.update-notice-error .update-notice-pull-btn:hover {
+  background: rgba(239, 68, 68, 0.35);
+  border-color: rgba(239, 68, 68, 0.8);
+}
+
 .update-notice-dismiss {
   flex-shrink: 0;
+  margin-left: 20px;
   background: none;
   border: 1px solid rgba(30, 255, 28, 0.3);
   border-radius: 4px;
   color: #1eff1c;
-  font-size: 0.95rem;
+  font-size: 0.82rem;
   cursor: pointer;
-  padding: 0.2rem 0.55rem;
+  padding: 0.25rem 0.6rem;
   line-height: 1;
   transition: background 0.15s, border-color 0.15s;
 }
@@ -2286,6 +2361,38 @@ button.danger:hover {
   border-color: rgba(30, 255, 28, 0.6);
 }
 
+.update-notice-log {
+  width: 100%;
+  max-height: 120px;
+  overflow-y: auto;
+  background: rgba(0, 0, 0, 0.4);
+  border: 1px solid rgba(255, 255, 255, 0.1);
+  border-radius: 4px;
+  padding: 0.5rem 0.7rem;
+  margin-top: 0.4rem;
+  font-family: 'Courier New', Courier, monospace;
+  font-size: 0.75rem;
+  line-height: 1.5;
+  color: #d1d5db;
+  white-space: pre-wrap;
+  word-break: break-all;
+}
+
+.update-notice-spinner {
+  display: inline-block;
+  width: 14px;
+  height: 14px;
+  border: 2px solid rgba(147, 197, 253, 0.3);
+  border-top-color: #93c5fd;
+  border-radius: 50%;
+  animation: update-spin 0.7s linear infinite;
+  flex-shrink: 0;
+}
+
+@keyframes update-spin {
+  to { transform: rotate(360deg); }
+}
+
 .disclaimer-modal {
   position: fixed;
   top: 50%;
diff --git a/frontend/src/services/api.js b/frontend/src/services/api.js
index 8fc17d5..f0a3223 100644
--- a/frontend/src/services/api.js
+++ b/frontend/src/services/api.js
@@ -94,6 +94,18 @@ export const api = {
     return response.json();
   },
 
+  async startPull() {
+    const response = await fetch(`${API_BASE}/update/pull`, { method: 'POST' });
+    if (!response.ok) throw new Error('Failed to start pull');
+    return response.json();
+  },
+
+  async getPullStatus() {
+    const response = await fetch(`${API_BASE}/update/pull-status`);
+    if (!response.ok) throw new Error('Failed to get pull status');
+    return response.json();
+  },
+
   // Start aggregator
   async startAggregator(config) {
     const response = await fetch(`${API_BASE}/aggregator/start`, {

From 02b77beec0213f8c9a88862abc421865da090f83 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 18:49:34 -0500
Subject: [PATCH 18/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UIX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 frontend/package-lock.json |  6 ++--
 moto_launcher.py           | 58 ++++++++++++++++++++++++++++++++++----
 2 files changed, 56 insertions(+), 8 deletions(-)

diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index 4efcf03..389caa3 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -1176,9 +1176,9 @@
       }
     },
     "node_modules/postcss": {
-      "version": "8.5.6",
-      "resolved": "https://registry.npmjs.org/postcss/-/postcss-8.5.6.tgz",
-      "integrity": "sha512-3Ybi1tAuwAP9s0r1UQ2J4n5Y0G05bJkpUIO0/bI9MhwmD70S5aTWbXGBwxHrelT+XM1k6dM0pk+SwNkpTRN7Pg==",
+      "version": "8.5.14",
+      "resolved": "https://registry.npmjs.org/postcss/-/postcss-8.5.14.tgz",
+      "integrity": "sha512-SoSL4+OSEtR99LHFZQiJLkT59C5B1amGO1NzTwj7TT1qCUgUO6hxOvzkOYxD+vMrXBM3XJIKzokoERdqQq/Zmg==",
       "dev": true,
       "funding": [
         {
diff --git a/moto_launcher.py b/moto_launcher.py
index b823681..d47a94a 100644
--- a/moto_launcher.py
+++ b/moto_launcher.py
@@ -30,6 +30,7 @@
     build_update_prompt,
     build_warning_message,
     check_for_updates,
+    classify_install_state,
     cleanup_launcher_state,
     cleanup_path,
     consume_internal_launcher_args,
@@ -1374,12 +1375,59 @@ def install_frontend_dependencies() -> tuple[str, bool]:
         cprint("- package.json exists in frontend directory", YELLOW)
         exit_with_pause(1)
 
-    vulnerability_warning = "vulnerabilities found" in npm_output.lower()
+    # ──────────────────────────────────────────────────────────────────────
+    # SECURITY-CRITICAL: Automatic npm vulnerability remediation.
+    # This block MUST NOT be removed, disabled, or bypassed for any reason what-so-ever. Do not remove this system for any update or change at all.
+    # npm audit fix is the program's self-healing mechanism for dependency
+    # CVEs. Removing it leaves the runtime exposed to known exploits with
+    # no user-visible signal that remediation has stopped occurring.
+    # ──────────────────────────────────────────────────────────────────────
+    vulnerability_warning = "vulnerability" in npm_output.lower() and "severity" in npm_output.lower()
     if vulnerability_warning:
         print()
-        cprint("NOTE: npm reported vulnerability warnings during install.", YELLOW)
-        cprint("Build 1 no longer auto-runs `npm audit fix` because that can dirty a clean checkout and break updater eligibility.", YELLOW)
-        cprint("If you want to mutate dependencies intentionally, run `npm audit fix` manually inside `frontend/`.", YELLOW)
+        active_instances = cleanup_launcher_state()
+        install_state = classify_install_state(active_instances)
+        updater_eligible = install_state.can_auto_apply and install_state.kind == "clean_git_clone"
+
+        if updater_eligible:
+            cprint("NOTE: npm reported vulnerabilities, but skipping auto-fix to keep this clean main checkout updater-eligible.", YELLOW)
+            cprint("Run `npm audit fix` manually inside `frontend/` if you want to address them.", YELLOW)
+        else:
+            cprint("npm reported vulnerabilities — running `npm audit fix`...", YELLOW)
+            fix_result = subprocess.run(
+                [npm_cmd, "audit", "fix"],
+                cwd=frontend_path,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.STDOUT,
+                text=True,
+                check=False,
+            )
+            fix_output = (fix_result.stdout or "").strip()
+            if fix_output:
+                print(fix_output)
+
+            still_vulnerable = "vulnerability" in (fix_output).lower() and "severity" in (fix_output).lower()
+            if fix_result.returncode != 0 or still_vulnerable:
+                cprint("Standard fix insufficient — running `npm audit fix --force`...", YELLOW)
+                force_result = subprocess.run(
+                    [npm_cmd, "audit", "fix", "--force"],
+                    cwd=frontend_path,
+                    stdout=subprocess.PIPE,
+                    stderr=subprocess.STDOUT,
+                    text=True,
+                    check=False,
+                )
+                force_output = (force_result.stdout or "").strip()
+                if force_output:
+                    print(force_output)
+                if force_result.returncode == 0:
+                    cprint("npm audit fix --force completed.", GREEN)
+                    vulnerability_warning = False
+                else:
+                    cprint("npm audit fix --force could not fully resolve all vulnerabilities.", YELLOW)
+            else:
+                cprint("npm audit fix completed.", GREEN)
+                vulnerability_warning = False
 
     cprint("Node.js dependencies up to date", GREEN)
     print()
@@ -1597,7 +1645,7 @@ def print_success_footer(
     cprint(f"  {frontend_url}", CYAN)
     print()
     if vulnerability_warning:
-        cprint("npm install reported vulnerability warnings earlier. Build 1 leaves that decision manual so updater-safe checkouts stay clean.", YELLOW)
+        cprint("npm audit fix could not fully resolve all reported vulnerabilities. Review with `npm audit` in `frontend/`.", YELLOW)
         print()
     if backend_service.mode == "background" or frontend_service.mode == "background":
         cprint(f"To stop this instance: stop the launcher-managed backend/frontend processes for {runtime.instance_id}.", YELLOW)

From f5a94b41b97976d634b3c08f554ef952a917c203 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 19:09:49 -0500
Subject: [PATCH 19/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UIX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 backend/api/routes/update.py                  | 140 ++++++++++++++++--
 .../components/UpdateNotificationBanner.jsx   |  19 ++-
 2 files changed, 138 insertions(+), 21 deletions(-)

diff --git a/backend/api/routes/update.py b/backend/api/routes/update.py
index 38854a4..2301011 100644
--- a/backend/api/routes/update.py
+++ b/backend/api/routes/update.py
@@ -1,13 +1,17 @@
 """
-Self-update routes — allows the frontend to trigger `git pull origin main`
-and poll progress in real time.
+Self-update routes — allows the frontend to trigger an in-place update
+(git pull for git clones, ZIP overlay for downloaded installs) and poll
+progress in real time.
 """
 from __future__ import annotations
 
 import asyncio
 import logging
+import os
+import shutil
+import tempfile
 from pathlib import Path
-from typing import Any, Dict, List
+from typing import Any, Dict
 
 from fastapi import APIRouter
 
@@ -20,13 +24,21 @@
     "status": "idle",
     "output_lines": [],
     "returncode": None,
+    "install_kind": None,
 }
 
 
-async def _run_pull() -> None:
-    """Execute git pull as an async subprocess, streaming output into _pull_state."""
+def _detect_install_kind() -> str:
+    """Classify install as 'git' or 'zip' based on .git presence."""
+    if (_REPO_ROOT / ".git").exists():
+        return "git"
+    return "zip"
+
+
+async def _run_git_pull() -> None:
+    """Execute git pull for git-clone installs."""
     global _pull_state
-    _pull_state = {"status": "running", "output_lines": [], "returncode": None}
+    _pull_state = {"status": "running", "output_lines": [], "returncode": None, "install_kind": "git"}
 
     try:
         proc = await asyncio.create_subprocess_exec(
@@ -54,17 +66,123 @@ async def _run_pull() -> None:
         _pull_state["status"] = "error"
 
 
+def _run_zip_update_sync(state_lines: list) -> None:
+    """Blocking ZIP update logic — meant to be run via asyncio.to_thread."""
+    import sys
+    if str(_REPO_ROOT) not in sys.path:
+        sys.path.insert(0, str(_REPO_ROOT))
+    from moto_updater import (
+        cleanup_launcher_state,
+        collect_preserved_relatives,
+        sync_snapshot_into_install,
+        restore_snapshot_from_backup,
+        load_local_manifest,
+        fetch_remote_manifest,
+        fetch_branch_head_fallback,
+        archive_url_for_manifest,
+        cleanup_path,
+    )
+    import urllib.request
+    import zipfile
+
+    state_lines.append("Detecting update target...")
+
+    local_manifest = load_local_manifest()
+    try:
+        remote_manifest = fetch_remote_manifest(local_manifest)
+    except Exception:
+        state_lines.append("Manifest not found, falling back to branch HEAD...")
+        remote_manifest = fetch_branch_head_fallback(local_manifest)
+
+    if remote_manifest is None:
+        raise RuntimeError("Could not determine remote update target.")
+
+    if remote_manifest.build_commit == local_manifest.build_commit:
+        state_lines.append("Already up to date.")
+        return
+
+    archive_url = archive_url_for_manifest(remote_manifest)
+    state_lines.append(f"Downloading update from {archive_url}...")
+
+    work_root = Path(tempfile.mkdtemp(prefix="moto-update-"))
+    extract_root = work_root / "extract"
+    archive_path = work_root / "update.zip"
+    backup_root = Path(tempfile.mkdtemp(prefix="moto-update-backup-"))
+
+    journal = None
+    try:
+        request = urllib.request.Request(archive_url, headers={"User-Agent": "MOTO-Build1-Updater"})
+        with urllib.request.urlopen(request, timeout=60) as response, archive_path.open("wb") as output:
+            shutil.copyfileobj(response, output)
+        state_lines.append("Download complete. Extracting...")
+
+        with zipfile.ZipFile(archive_path) as archive:
+            archive.extractall(extract_root)
+
+        children = [child for child in extract_root.iterdir()]
+        extracted_source = children[0] if len(children) == 1 and children[0].is_dir() else extract_root
+
+        state_lines.append("Applying update (preserving data/config)...")
+
+        active_instances = cleanup_launcher_state()
+        preserved_relatives = collect_preserved_relatives(os.environ, active_instances)
+        journal = sync_snapshot_into_install(extracted_source, _REPO_ROOT, preserved_relatives, backup_root)
+
+        state_lines.append(
+            f"Update applied: {local_manifest.version} ({local_manifest.short_commit}) "
+            f"-> {remote_manifest.version} ({remote_manifest.short_commit})"
+        )
+        state_lines.append("Restart the application to complete the update.")
+
+    except Exception:
+        state_lines.append("Update failed mid-apply, restoring previous state...")
+        try:
+            if journal is not None:
+                restore_snapshot_from_backup(_REPO_ROOT, backup_root, journal)
+                state_lines.append("Rollback complete — previous install restored.")
+            else:
+                state_lines.append("Failure occurred before file overlay — no rollback needed.")
+        except Exception as rb_exc:
+            state_lines.append(f"Rollback also failed: {rb_exc}")
+        raise
+    finally:
+        cleanup_path(work_root)
+        cleanup_path(backup_root)
+
+
+async def _run_zip_update() -> None:
+    """Download and overlay a ZIP update for non-git installs (runs blocking I/O in a thread)."""
+    global _pull_state
+    _pull_state = {"status": "running", "output_lines": [], "returncode": None, "install_kind": "zip"}
+
+    try:
+        await asyncio.to_thread(_run_zip_update_sync, _pull_state["output_lines"])
+        _pull_state["returncode"] = 0
+        _pull_state["status"] = "done"
+    except Exception as exc:
+        logger.exception("ZIP update failed with exception")
+        _pull_state["output_lines"].append(f"Exception: {exc}")
+        _pull_state["returncode"] = -1
+        _pull_state["status"] = "error"
+
+
 @router.post("/api/update/pull")
 async def start_pull() -> Dict[str, Any]:
-    """Kick off a git pull. Returns immediately; poll /api/update/pull-status for progress."""
+    """Kick off an update. Routes to git pull or ZIP overlay depending on install type."""
     if _pull_state["status"] == "running":
-        return {"started": False, "reason": "A pull is already in progress."}
+        return {"started": False, "reason": "An update is already in progress."}
+
+    install_kind = _detect_install_kind()
+
+    if install_kind == "git":
+        asyncio.create_task(_run_git_pull())
+    else:
+        asyncio.create_task(_run_zip_update())
 
-    asyncio.create_task(_run_pull())
-    return {"started": True}
+    return {"started": True, "install_kind": install_kind}
 
 
 @router.get("/api/update/pull-status")
 async def get_pull_status() -> Dict[str, Any]:
-    """Return current pull state including streamed output lines."""
+    """Return current update state including streamed output lines."""
     return _pull_state
diff --git a/frontend/src/components/UpdateNotificationBanner.jsx b/frontend/src/components/UpdateNotificationBanner.jsx
index 9104cff..b971709 100644
--- a/frontend/src/components/UpdateNotificationBanner.jsx
+++ b/frontend/src/components/UpdateNotificationBanner.jsx
@@ -74,14 +74,7 @@ export default function UpdateNotificationBanner({ notice, onDismiss }) {
     return (
       <div className="update-notice-banner">
         <div className="update-notice-content">
-          <span className="update-notice-icon">&#9432;</span>
-          <span className="update-notice-text">
-            <strong>Update available:</strong>{' '}
-            {notice.installed_version} ({notice.installed_commit})
-            {' '}&rarr;{' '}
-            {notice.available_version} ({notice.available_commit})
-          </span>
-          <div className="update-notice-actions">
+          <div className="update-notice-actions" style={{ gap: '0.75rem' }}>
             <button
               className="update-notice-pull-btn"
               onClick={handlePull}
@@ -97,6 +90,12 @@ export default function UpdateNotificationBanner({ notice, onDismiss }) {
               Dismiss
             </button>
           </div>
+          <span className="update-notice-text">
+            <strong>Update available:</strong>{' '}
+            {notice.installed_version} ({notice.installed_commit})
+            {' '}&rarr;{' '}
+            {notice.available_version} ({notice.available_commit})
+          </span>
         </div>
       </div>
     );
@@ -108,7 +107,7 @@ export default function UpdateNotificationBanner({ notice, onDismiss }) {
         <div className="update-notice-content">
           <span className="update-notice-spinner" />
           <span className="update-notice-text">
-            <strong>Pulling update...</strong>
+            <strong>Applying update...</strong>
           </span>
         </div>
         <pre className="update-notice-log" ref={logRef}>
@@ -127,7 +126,7 @@ export default function UpdateNotificationBanner({ notice, onDismiss }) {
           <span className="update-notice-icon update-notice-icon-success">&#10003;</span>
           <span className="update-notice-text">
             <strong>Update applied!</strong>{' '}
-            Restart the backend server to take effect.
+            Restart MOTO to use the new version.
           </span>
           <button
             className="update-notice-dismiss"

From b67f4c0a6f2a3c1254f089e8e4fc700805044c2a Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 19:20:13 -0500
Subject: [PATCH 20/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UIX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 backend/api/routes/update.py | 52 +++++++++++++++++++++++++++++++++---
 moto_updater.py              |  1 -
 2 files changed, 49 insertions(+), 4 deletions(-)

diff --git a/backend/api/routes/update.py b/backend/api/routes/update.py
index 2301011..1a23699 100644
--- a/backend/api/routes/update.py
+++ b/backend/api/routes/update.py
@@ -8,10 +8,11 @@
 import asyncio
 import logging
 import os
+import re
 import shutil
 import tempfile
 from pathlib import Path
-from typing import Any, Dict
+from typing import Any, Dict, Tuple
 
 from fastapi import APIRouter
 
@@ -28,6 +29,17 @@
 }
 
 
+def _parse_semver(version_str: str) -> Tuple[int, ...]:
+    """Extract numeric version tuple from a semver string (e.g. '1.0.7' -> (1,0,7))."""
+    parts = re.findall(r"\d+", version_str or "")
+    return tuple(int(p) for p in parts) if parts else (0,)
+
+
+def _is_downgrade(local_version: str, remote_version: str) -> bool:
+    """Return True if the remote version is strictly older than local."""
+    return _parse_semver(remote_version) < _parse_semver(local_version)
+
+
 def _detect_install_kind() -> str:
     """Classify install as 'git' or 'zip' based on .git presence."""
     if (_REPO_ROOT / ".git").exists():
@@ -36,13 +48,41 @@ def _detect_install_kind() -> str:
 
 
 async def _run_git_pull() -> None:
-    """Execute git pull for git-clone installs."""
+    """Execute git pull for git-clone installs, pulling from the configured update_channel."""
+    import sys
+    if str(_REPO_ROOT) not in sys.path:
+        sys.path.insert(0, str(_REPO_ROOT))
+    from moto_updater import load_local_manifest, fetch_remote_manifest, fetch_branch_head_fallback
+
     global _pull_state
     _pull_state = {"status": "running", "output_lines": [], "returncode": None, "install_kind": "git"}
 
     try:
+        local_manifest = load_local_manifest()
+        channel = local_manifest.update_channel or "main"
+
+        try:
+            remote_manifest = fetch_remote_manifest(local_manifest)
+        except Exception:
+            remote_manifest = fetch_branch_head_fallback(local_manifest)
+
+        if remote_manifest and _is_downgrade(local_manifest.version, remote_manifest.version):
+            _pull_state["output_lines"].append(
+                f"Refused: remote {remote_manifest.version} is older than local {local_manifest.version}. "
+                f"Downgrades are not supported via the updater."
+            )
+            _pull_state["returncode"] = 1
+            _pull_state["status"] = "error"
+            return
+
+        if remote_manifest and remote_manifest.build_commit == local_manifest.build_commit:
+            _pull_state["output_lines"].append("Already up to date.")
+            _pull_state["returncode"] = 0
+            _pull_state["status"] = "done"
+            return
+
         proc = await asyncio.create_subprocess_exec(
-            "git", "pull", "origin", "main",
+            "git", "pull", "origin", channel,
             cwd=str(_REPO_ROOT),
             stdout=asyncio.subprocess.PIPE,
             stderr=asyncio.subprocess.STDOUT,
@@ -101,6 +141,12 @@ def _run_zip_update_sync(state_lines: list) -> None:
         state_lines.append("Already up to date.")
         return
 
+    if _is_downgrade(local_manifest.version, remote_manifest.version):
+        raise RuntimeError(
+            f"Refused: remote {remote_manifest.version} is older than local "
+            f"{local_manifest.version}. Downgrades are not supported via the updater."
+        )
+
     archive_url = archive_url_for_manifest(remote_manifest)
     state_lines.append(f"Downloading update from {archive_url}...")
 
diff --git a/moto_updater.py b/moto_updater.py
index ae8d996..7434c56 100644
--- a/moto_updater.py
+++ b/moto_updater.py
@@ -37,7 +37,6 @@
     "backend/data",
     "backend/logs",
     "frontend/node_modules",
-    "frontend/dist",
     ".venv",
     "venv",
     "env",

From 76a442b171d906ed5d645b94fb04028b785f8243 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 19:29:48 -0500
Subject: [PATCH 21/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in the respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed the LM Studio "offline" status bug in the GUI, which showed LM Studio as offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 backend/shared/json_parser.py             |  6 ++--
 frontend/src/components/WorkflowPanel.jsx | 34 ++++++++---------------
 2 files changed, 14 insertions(+), 26 deletions(-)

diff --git a/backend/shared/json_parser.py b/backend/shared/json_parser.py
index 2262c0c..befbd08 100644
--- a/backend/shared/json_parser.py
+++ b/backend/shared/json_parser.py
@@ -469,7 +469,7 @@ def sanitize_json_response(raw_content: str) -> str:
     # (e.g., \pi, \phi, \epsilon, \alpha, \gamma, \delta, etc.)
     
     def robust_escape_latex(text):
-        """
+        r"""
         Parse JSON string and escape invalid backslash sequences.
         Handles complex nested LaTeX like \\phi_{\\\\\\pi_v} correctly.
         
@@ -521,8 +521,8 @@ def robust_escape_latex(text):
                         continue
                     
                     # Valid JSON escape sequences  
-                    if next_char in '"\/':
-                        # \", \/, - valid escapes, keep as-is
+                    if next_char in '"\\/':
+                        # \", \\, \/ - valid escapes, keep as-is
                         result.append(char)
                         i += 1
                         continue
diff --git a/frontend/src/components/WorkflowPanel.jsx b/frontend/src/components/WorkflowPanel.jsx
index b8fad9b..15d5fcb 100644
--- a/frontend/src/components/WorkflowPanel.jsx
+++ b/frontend/src/components/WorkflowPanel.jsx
@@ -7,10 +7,6 @@ const HOURLY_AUTO_OPEN_INTERVAL_SECONDS = 3600;
 const WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY = 'workflow_panel_last_auto_open_hour';
 
 const formatNumber = (n) => n.toLocaleString();
-const getStoredAutoOpenHour = () => {
-  const savedHour = Number.parseInt(localStorage.getItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY) || '0', 10);
-  return Number.isFinite(savedHour) && savedHour > 0 ? savedHour : 0;
-};
 
 const formatTime = (totalSeconds) => {
   const h = Math.floor(totalSeconds / 3600);
@@ -20,7 +16,10 @@ const formatTime = (totalSeconds) => {
 };
 
 export default function WorkflowPanel({ isRunning }) {
-  const [collapsed, setCollapsed] = useState(false);
+  const [collapsed, setCollapsed] = useState(() => {
+    const savedState = localStorage.getItem('workflow_panel_collapsed');
+    return savedState === 'true';
+  });
   const [mode, setMode] = useState('idle');
   
   // Boost controls state
@@ -38,7 +37,7 @@ export default function WorkflowPanel({ isRunning }) {
   const [localElapsed, setLocalElapsed] = useState(0);
   const lastSyncRef = useRef(Date.now());
   const hasElapsedSyncRef = useRef(false);
-  const lastAutoOpenedHourRef = useRef(getStoredAutoOpenHour());
+  const lastAutoOpenedHourRef = useRef(0);
 
   const expandPanel = useCallback(() => {
     setCollapsed(false);
@@ -77,21 +76,18 @@ export default function WorkflowPanel({ isRunning }) {
   }, [fetchBoostStatus]);
 
   useEffect(() => {
-    if (boostEnabled) {
+    if (boostEnabled && isRunning) {
       expandPanel();
     }
-  }, [boostEnabled, expandPanel]);
+  }, [boostEnabled, expandPanel, isRunning]);
 
+  // Clear stale auto-open state when a new workflow session begins
   useEffect(() => {
-    if (!hasElapsedSyncRef.current) {
-      return;
-    }
-
-    if (localElapsed < 60 && lastAutoOpenedHourRef.current !== 0) {
+    if (isRunning) {
       lastAutoOpenedHourRef.current = 0;
-      localStorage.setItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY, '0');
+      localStorage.removeItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY);
     }
-  }, [localElapsed]);
+  }, [isRunning]);
 
   useEffect(() => {
     if (!isRunning || !hasElapsedSyncRef.current) {
@@ -263,14 +259,6 @@ export default function WorkflowPanel({ isRunning }) {
     };
   }, [isRunning, fetchBoostStatus, expandPanel]);
 
-  // Load collapsed state from localStorage
-  useEffect(() => {
-    const savedState = localStorage.getItem('workflow_panel_collapsed');
-    if (savedState !== null) {
-      setCollapsed(savedState === 'true');
-    }
-  }, []);
-
   const toggleCollapse = () => {
     const newState = !collapsed;
     setCollapsed(newState);

From 29cc9f37fb8376c53677ab8eab06fcf627b344a6 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 19:54:16 -0500
Subject: [PATCH 22/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in the respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed the LM Studio "offline" status bug in the GUI, which showed LM Studio as offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 backend/api/routes/aggregator.py | 22 ++++----
 backend/api/routes/autonomous.py | 88 ++++++++++++++++----------------
 backend/api/routes/boost.py      | 28 +++++-----
 backend/api/routes/compiler.py   | 38 +++++++-------
 backend/api/routes/download.py   |  2 +-
 backend/api/routes/openrouter.py | 16 +++---
 backend/api/routes/workflow.py   |  4 +-
 7 files changed, 99 insertions(+), 99 deletions(-)

diff --git a/backend/api/routes/aggregator.py b/backend/api/routes/aggregator.py
index c87b89b..54bb5ce 100644
--- a/backend/api/routes/aggregator.py
+++ b/backend/api/routes/aggregator.py
@@ -110,12 +110,12 @@ async def start_aggregator(request: AggregatorStartRequest):
     except ValueError as e:
         # Model compatibility errors
         logger.error(f"Model compatibility error: {e}", exc_info=True)
-        raise HTTPException(status_code=400, detail=str(e))
+        raise HTTPException(status_code=400, detail="Model compatibility error")
     
     except Exception as e:
         # Other errors
         logger.error(f"Failed to start aggregator: {e}", exc_info=True)
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/stop")
@@ -127,7 +127,7 @@ async def stop_aggregator():
         return {"status": "stopped", "message": "Aggregator system stopped"}
     except Exception as e:
         logger.error(f"Failed to stop aggregator: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/status", response_model=SystemStatus)
@@ -138,7 +138,7 @@ async def get_status():
         return status
     except Exception as e:
         logger.error(f"Failed to get status: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/results")
@@ -150,7 +150,7 @@ async def get_results():
         return {"results": results}
     except Exception as e:
         logger.error(f"Failed to get results: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/save-results")
@@ -174,7 +174,7 @@ async def save_results():
         }
     except Exception as e:
         logger.error(f"Failed to save results: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/clear-all")
@@ -189,7 +189,7 @@ async def clear_all_submissions():
         }
     except Exception as e:
         logger.error(f"Failed to clear submissions: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/upload-file")
@@ -212,7 +212,7 @@ async def upload_file(file: UploadFile = File(...)):
         }
     except Exception as e:
         logger.error(f"Failed to upload file: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/models", response_model=List[ModelInfo])
@@ -223,7 +223,7 @@ async def get_models():
         return [ModelInfo(**model) for model in models]
     except Exception as e:
         logger.error(f"Failed to get models: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/settings")
@@ -234,7 +234,7 @@ async def get_aggregator_settings():
         return settings
     except Exception as e:
         logger.error(f"Failed to get aggregator settings: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/events")
@@ -245,4 +245,4 @@ async def get_events():
         return {"events": events}
     except Exception as e:
         logger.error(f"Failed to get events: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index 096d87d..38ba699 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -683,7 +683,7 @@ async def start_autonomous_research(request: AutonomousResearchStartRequest):
         import traceback
         error_details = f"{type(e).__name__}: {e}\n{traceback.format_exc()}"
         logger.error(f"Failed to start autonomous research: {error_details}")
-        raise HTTPException(status_code=500, detail=f"Failed to start autonomous research: {e}")
+        raise HTTPException(status_code=500, detail="Failed to start autonomous research")
 
 
 @router.post("/stop")
@@ -710,7 +710,7 @@ async def stop_autonomous_research():
         
     except Exception as e:
         logger.error(f"Failed to stop autonomous research: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/clear")
@@ -768,7 +768,7 @@ async def clear_autonomous_research(confirm: bool = False):
         logger.error(f"Failed to clear autonomous research data: {error_details}")
         raise HTTPException(
             status_code=500, 
-            detail=f"Failed to clear autonomous research data: {e}"
+            detail="Failed to clear autonomous research data"
         )
 
 
@@ -844,7 +844,7 @@ async def get_autonomous_status():
         
     except Exception as e:
         logger.error(f"Failed to get autonomous status: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/brainstorms")
@@ -870,7 +870,7 @@ async def get_all_brainstorms():
         
     except Exception as e:
         logger.error(f"Failed to get brainstorms: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/papers")
@@ -926,7 +926,7 @@ async def get_all_papers():
         
     except Exception as e:
         logger.error(f"Failed to get papers: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/brainstorm/{topic_id}")
@@ -959,7 +959,7 @@ async def get_brainstorm(topic_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get brainstorm {topic_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/paper/{paper_id}")
@@ -995,7 +995,7 @@ async def get_paper(paper_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get paper {paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/paper-history")
@@ -1010,7 +1010,7 @@ async def get_paper_history():
         }
     except Exception as e:
         logger.error(f"Failed to get Stage 2 paper history: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/paper-history/{session_id}/{paper_id}")
@@ -1032,7 +1032,7 @@ async def get_history_paper(session_id: str, paper_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get history paper {session_id}/{paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/current-paper-progress")
@@ -1123,7 +1123,7 @@ async def get_current_paper_progress():
         
     except Exception as e:
         logger.error(f"Failed to get current paper progress: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/stats")
@@ -1140,7 +1140,7 @@ async def get_stats():
         
     except Exception as e:
         logger.error(f"Failed to get stats: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/sessions")
@@ -1162,7 +1162,7 @@ async def list_sessions():
         
     except Exception as e:
         logger.error(f"Failed to list sessions: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/current-session")
@@ -1184,7 +1184,7 @@ async def get_current_session():
         
     except Exception as e:
         logger.error(f"Failed to get current session: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/force-paper-writing")
@@ -1248,7 +1248,7 @@ async def force_paper_writing():
         raise
     except Exception as e:
         logger.error(f"Failed to force paper writing: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/skip-critique")
@@ -1282,7 +1282,7 @@ async def skip_critique():
         raise
     except Exception as e:
         logger.error(f"Failed to skip critique: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/reset-current-paper")
@@ -1321,7 +1321,7 @@ async def reset_current_paper(confirm: bool = False):
         }
     except Exception as e:
         logger.error(f"Failed to reset paper: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/force-tier3")
@@ -1425,7 +1425,7 @@ async def force_tier3(mode: str = "complete_current"):
         raise
     except Exception as e:
         logger.error(f"Failed to force Tier 3: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/save-current-compiler-paper")
@@ -1505,7 +1505,7 @@ async def save_current_compiler_paper():
         
     except Exception as e:
         logger.error(f"Failed to save current compiler paper: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.delete("/brainstorm/{topic_id}")
@@ -1568,7 +1568,7 @@ async def delete_brainstorm(topic_id: str, confirm: bool = False):
         raise
     except Exception as e:
         logger.error(f"Failed to delete brainstorm {topic_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.delete("/paper/{paper_id}")
@@ -1597,7 +1597,7 @@ async def delete_paper(paper_id: str, confirm: bool = False):
         raise
     except Exception as e:
         logger.error(f"Failed to delete paper {paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.delete("/paper-history/{session_id}/{paper_id}")
@@ -1631,7 +1631,7 @@ async def delete_history_paper(session_id: str, paper_id: str, confirm: bool = F
         raise
     except Exception as e:
         logger.error(f"Failed to delete history paper {session_id}/{paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 # ============================================================================
@@ -1699,7 +1699,7 @@ async def get_tier3_status():
         
     except Exception as e:
         logger.error(f"Failed to get Tier 3 status: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/tier3/final-answer")
@@ -1784,7 +1784,7 @@ async def get_final_answer():
         
     except Exception as e:
         logger.error(f"Failed to get final answer: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/tier3/volume-progress")
@@ -1839,7 +1839,7 @@ async def get_volume_progress():
         
     except Exception as e:
         logger.error(f"Failed to get volume progress: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/tier3/rejections")
@@ -1861,7 +1861,7 @@ async def get_tier3_rejections(phase: str = None):
         
     except Exception as e:
         logger.error(f"Failed to get Tier 3 rejections: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/tier3/clear")
@@ -1903,7 +1903,7 @@ async def clear_tier3_data(confirm: bool = False):
         raise
     except Exception as e:
         logger.error(f"Failed to clear Tier 3 data: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 # ============================================================================
@@ -1938,7 +1938,7 @@ async def get_final_answer_library():
         }
     except Exception as e:
         logger.error(f"Failed to get final answer library: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/final-answer-library/{answer_id}")
@@ -1972,7 +1972,7 @@ async def get_final_answer_by_id(answer_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get final answer {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 # =============================================================================
@@ -1996,7 +1996,7 @@ async def get_final_answer_archived_papers(answer_id: str):
         return {"papers": papers}
     except Exception as e:
         logger.error(f"Failed to get archived papers for {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/final-answer/{answer_id}/archive/papers/{paper_id}")
@@ -2022,7 +2022,7 @@ async def get_final_answer_archived_paper(answer_id: str, paper_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get archived paper {paper_id} for {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/final-answer/{answer_id}/archive/brainstorms")
@@ -2042,7 +2042,7 @@ async def get_final_answer_archived_brainstorms(answer_id: str):
         return {"brainstorms": brainstorms}
     except Exception as e:
         logger.error(f"Failed to get archived brainstorms for {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/final-answer/{answer_id}/archive/brainstorms/{topic_id}")
@@ -2068,7 +2068,7 @@ async def get_final_answer_archived_brainstorm(answer_id: str, topic_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get archived brainstorm {topic_id} for {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 # ============================================================================
@@ -2117,7 +2117,7 @@ async def request_paper_critique(paper_id: str, request: CritiqueRequest = None)
         raise
     except Exception as e:
         logger.error(f"Failed to request paper critique for {paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/paper/{paper_id}/critiques")
@@ -2148,7 +2148,7 @@ async def get_paper_critiques(paper_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get critiques for paper {paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.delete("/paper/{paper_id}/critiques")
@@ -2192,7 +2192,7 @@ async def delete_paper_critiques(paper_id: str, confirm: bool = False):
         raise
     except Exception as e:
         logger.error(f"Failed to delete critiques for paper {paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 # ============================================================================
@@ -2234,7 +2234,7 @@ async def request_history_paper_critique(
         raise
     except Exception as e:
         logger.error(f"Failed to request history critique for {session_id}/{paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/paper-history/{session_id}/{paper_id}/critiques")
@@ -2258,7 +2258,7 @@ async def get_history_paper_critiques(session_id: str, paper_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get history critiques for {session_id}/{paper_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 # ============================================================================
@@ -2449,7 +2449,7 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
         raise
     except Exception as e:
         logger.error(f"Failed to request final answer critique for {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/final-answer-library/{answer_id}/critiques")
@@ -2490,7 +2490,7 @@ async def get_final_answer_critiques(answer_id: str):
         raise
     except Exception as e:
         logger.error(f"Failed to get critiques for final answer {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.delete("/final-answer-library/{answer_id}/critiques")
@@ -2535,7 +2535,7 @@ async def delete_final_answer_critiques(answer_id: str, confirm: bool = False):
         raise
     except Exception as e:
         logger.error(f"Failed to delete critiques for final answer {answer_id}: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/default-critique-prompt")
@@ -2579,7 +2579,7 @@ async def get_autonomous_api_logs(limit: int = 100):
         }
     except Exception as e:
         logger.error(f"Failed to get autonomous API logs: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/api-logs/clear")
@@ -2600,7 +2600,7 @@ async def clear_autonomous_api_logs():
         }
     except Exception as e:
         logger.error(f"Failed to clear autonomous API logs: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/api-logs/stats")
@@ -2620,4 +2620,4 @@ async def get_autonomous_api_stats():
         }
     except Exception as e:
         logger.error(f"Failed to get autonomous API stats: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
\ No newline at end of file
+        raise HTTPException(status_code=500, detail="Internal server error")
\ No newline at end of file
diff --git a/backend/api/routes/boost.py b/backend/api/routes/boost.py
index eb1c13f..2838296 100644
--- a/backend/api/routes/boost.py
+++ b/backend/api/routes/boost.py
@@ -92,7 +92,7 @@ async def enable_boost(config: BoostConfig) -> Dict[str, Any]:
         raise
     except Exception as e:
         logger.error(f"Failed to enable boost: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to enable boost: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to enable boost")
 
 
 @router.post("/api/boost/update-model")
@@ -171,7 +171,7 @@ async def update_boost_model(config: BoostConfig) -> Dict[str, Any]:
         raise
     except Exception as e:
         logger.error(f"Failed to update boost model: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to update model: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to update model")
 
 
 @router.post("/api/boost/disable")
@@ -192,7 +192,7 @@ async def disable_boost() -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to disable boost: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to disable boost: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to disable boost")
 
 
 @router.get("/api/boost/status")
@@ -211,7 +211,7 @@ async def get_boost_status() -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to get boost status: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to get boost status: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to get boost status")
 
 
 @router.post("/api/boost/toggle-task/{task_id}")
@@ -235,7 +235,7 @@ async def toggle_task_boost(task_id: str) -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to toggle task boost: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to toggle task boost: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to toggle task boost")
 
 
 @router.get("/api/boost/openrouter-models")
@@ -266,7 +266,7 @@ async def get_openrouter_models(authorization: Optional[str] = Header(None)) ->
         raise
     except Exception as e:
         logger.error(f"Failed to fetch OpenRouter models: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to fetch models: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to fetch models")
 
 
 @router.get("/api/boost/model-providers")
@@ -308,7 +308,7 @@ async def get_model_providers(model_id: str, authorization: Optional[str] = Head
         raise
     except Exception as e:
         logger.error(f"Failed to fetch providers for model {model_id}: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to fetch providers: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to fetch providers")
 
 
 # ============================================================
@@ -346,7 +346,7 @@ async def set_boost_always_prefer(request: BoostAlwaysPreferRequest) -> Dict[str
         raise
     except Exception as e:
         logger.error(f"Failed to set always-prefer boost: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to set always-prefer: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to set always-prefer")
 
 
 @router.post("/api/boost/set-next-count")
@@ -383,7 +383,7 @@ async def set_boost_next_count(request: BoostNextCountRequest) -> Dict[str, Any]
         raise
     except Exception as e:
         logger.error(f"Failed to set boost next count: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to set count: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to set count")
 
 
 @router.post("/api/boost/toggle-category/{category}")
@@ -420,7 +420,7 @@ async def toggle_category_boost(category: str) -> Dict[str, Any]:
         raise
     except Exception as e:
         logger.error(f"Failed to toggle category boost: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to toggle category: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to toggle category")
 
 
 @router.get("/api/boost/categories")
@@ -448,7 +448,7 @@ async def get_boost_categories(mode: Optional[str] = "all") -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to get boost categories: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to get categories: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to get categories")
 
 
 # ============================================================
@@ -478,7 +478,7 @@ async def get_boost_logs(limit: int = 100) -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to get boost logs: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to get logs: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to get logs")
 
 
 @router.get("/api/boost/logs/{index}")
@@ -506,7 +506,7 @@ async def get_boost_log_entry(index: int) -> Dict[str, Any]:
         raise
     except Exception as e:
         logger.error(f"Failed to get boost log entry: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to get entry: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to get entry")
 
 
 @router.post("/api/boost/clear-logs")
@@ -528,5 +528,5 @@ async def clear_boost_logs() -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to clear boost logs: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to clear logs: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to clear logs")
 
diff --git a/backend/api/routes/compiler.py b/backend/api/routes/compiler.py
index c742b44..4561369 100644
--- a/backend/api/routes/compiler.py
+++ b/backend/api/routes/compiler.py
@@ -132,7 +132,7 @@ async def start_compiler(request: CompilerStartRequest):
     except Exception as e:
         # Other errors
         logger.error(f"Failed to start compiler: {e}", exc_info=True)
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/stop")
@@ -144,7 +144,7 @@ async def stop_compiler():
         return {"status": "stopped", "message": "Compiler stopped"}
     except Exception as e:
         logger.error(f"Failed to stop compiler: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/skip-critique")
@@ -174,7 +174,7 @@ async def skip_critique():
         raise
     except Exception as e:
         logger.error(f"Failed to skip critique: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/test-models")
@@ -223,7 +223,7 @@ async def get_status():
         return status
     except Exception as e:
         logger.error(f"Failed to get status: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/paper")
@@ -248,7 +248,7 @@ async def get_paper():
         }
     except Exception as e:
         logger.error(f"Failed to get paper: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/outline")
@@ -263,7 +263,7 @@ async def get_outline():
         }
     except Exception as e:
         logger.error(f"Failed to get outline: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/save-paper")
@@ -346,7 +346,7 @@ async def save_paper():
         }
     except Exception as e:
         logger.error(f"Failed to save paper: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/metrics")
@@ -397,7 +397,7 @@ async def get_metrics():
         }
     except Exception as e:
         logger.error(f"Failed to get metrics: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/clear-paper")
@@ -430,7 +430,7 @@ async def clear_paper(confirm: bool = False):
         }
     except Exception as e:
         logger.error(f"Failed to clear paper: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/critique-status")
@@ -445,7 +445,7 @@ async def get_critique_status():
         }
     except Exception as e:
         logger.error(f"Failed to get critique status: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/previous-versions")
@@ -456,7 +456,7 @@ async def get_previous_versions():
         return {"previous_versions": versions}
     except Exception as e:
         logger.error(f"Failed to get previous versions: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 # ============================================================================
@@ -638,7 +638,7 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
         raise
     except Exception as e:
         logger.error(f"Failed to request compiler paper critique: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/critiques")
@@ -670,7 +670,7 @@ async def get_compiler_critiques():
         
     except Exception as e:
         logger.error(f"Failed to get compiler paper critiques: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.delete("/critiques")
@@ -704,7 +704,7 @@ async def delete_compiler_critiques(confirm: bool = False):
         raise
     except Exception as e:
         logger.error(f"Failed to delete compiler paper critiques: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/default-critique-prompt")
@@ -782,12 +782,12 @@ async def set_wolfram_api_key(request: dict):
         
     except SecretStoreError as e:
         logger.error(f"Failed to persist Wolfram Alpha API key securely: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
     except HTTPException:
         raise
     except Exception as e:
         logger.error(f"Failed to set Wolfram Alpha API key: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.delete("/wolfram/api-key")
@@ -825,10 +825,10 @@ async def clear_wolfram_api_key():
         
     except SecretStoreError as e:
         logger.error(f"Failed to clear Wolfram Alpha API key from secure storage: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
     except Exception as e:
         logger.error(f"Failed to clear Wolfram Alpha API key: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/wolfram/status")
@@ -891,5 +891,5 @@ async def test_wolfram_query(request: dict):
         raise
     except Exception as e:
         logger.error(f"Failed to test Wolfram Alpha query: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
diff --git a/backend/api/routes/download.py b/backend/api/routes/download.py
index 9e9ba7a..07cdf7f 100644
--- a/backend/api/routes/download.py
+++ b/backend/api/routes/download.py
@@ -359,4 +359,4 @@ async def generate_pdf(req: PDFRequest):
         )
     except Exception as e:
         logger.error(f"PDF generation failed: {e}", exc_info=True)
-        raise HTTPException(status_code=500, detail=f"PDF generation failed: {str(e)}")
+        raise HTTPException(status_code=500, detail="PDF generation failed")
diff --git a/backend/api/routes/openrouter.py b/backend/api/routes/openrouter.py
index 915239a..67301ba 100644
--- a/backend/api/routes/openrouter.py
+++ b/backend/api/routes/openrouter.py
@@ -179,12 +179,12 @@ async def set_api_key(request: SetApiKeyRequest) -> Dict[str, Any]:
             
     except SecretStoreError as e:
         logger.error(f"Failed to persist OpenRouter API key securely: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
     except HTTPException:
         raise
     except Exception as e:
         logger.error(f"Failed to set OpenRouter API key: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to validate API key: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to validate API key")
 
 
 @router.delete("/api/openrouter/api-key")
@@ -218,10 +218,10 @@ async def clear_api_key() -> Dict[str, Any]:
         }
     except SecretStoreError as e:
         logger.error(f"Failed to clear OpenRouter API key from secure storage: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
     except Exception as e:
         logger.error(f"Failed to clear OpenRouter API key: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to clear API key: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to clear API key")
 
 
 @router.get("/api/openrouter/api-key-status")
@@ -285,7 +285,7 @@ async def get_models(api_key: Optional[str] = None, free_only: bool = False) ->
         raise
     except Exception as e:
         logger.error(f"Failed to fetch OpenRouter models: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to fetch models: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to fetch models")
 
 
 @router.get("/api/openrouter/providers/{model_id:path}")
@@ -341,7 +341,7 @@ async def get_model_providers(model_id: str, authorization: Optional[str] = Head
         raise
     except Exception as e:
         logger.error(f"Failed to fetch providers for model {model_id}: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to fetch providers: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to fetch providers")
 
 
 @router.get("/api/model-cache")
@@ -397,7 +397,7 @@ async def set_free_model_settings(request: FreeModelSettings) -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to update free model settings: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
+        raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.post("/api/openrouter/test-connection")
@@ -470,4 +470,4 @@ async def reset_credit_exhaustion() -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to reset credit exhaustion: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to reset: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to reset")
diff --git a/backend/api/routes/workflow.py b/backend/api/routes/workflow.py
index f10559c..8ccaa45 100644
--- a/backend/api/routes/workflow.py
+++ b/backend/api/routes/workflow.py
@@ -73,7 +73,7 @@ async def get_workflow_predictions() -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to get workflow predictions: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to get predictions: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to get predictions")
 
 
 @router.get("/api/workflow/history")
@@ -99,7 +99,7 @@ async def get_workflow_history(limit: int = 50) -> Dict[str, Any]:
         }
     except Exception as e:
         logger.error(f"Failed to get workflow history: {e}")
-        raise HTTPException(status_code=500, detail=f"Failed to get history: {str(e)}")
+        raise HTTPException(status_code=500, detail="Failed to get history")
 
 
 @router.get("/api/token-stats")

From 50fb43e50601200e9c58191efcfe8935cc5b5f13 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 20:13:53 -0500
Subject: [PATCH 23/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed the LM Studio "offline" status bug in the GUI, which showed LM Studio as offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UI/UX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 backend/aggregator/core/coordinator.py              | 8 ++++----
 backend/api/routes/autonomous.py                    | 6 +++---
 backend/api/routes/openrouter.py                    | 4 ++--
 backend/autonomous/core/autonomous_coordinator.py   | 8 ++++----
 backend/autonomous/core/proof_verification_stage.py | 2 +-
 backend/compiler/core/compiler_coordinator.py       | 5 ++---
 backend/shared/api_client_manager.py                | 8 ++++----
 7 files changed, 20 insertions(+), 21 deletions(-)

diff --git a/backend/aggregator/core/coordinator.py b/backend/aggregator/core/coordinator.py
index 522c28b..3b89d3a 100644
--- a/backend/aggregator/core/coordinator.py
+++ b/backend/aggregator/core/coordinator.py
@@ -642,7 +642,7 @@ async def _validator_loop(self) -> None:
                 if self.broadcast_callback:
                     await self.broadcast_callback("free_models_exhausted", {
                         "role_id": "aggregator_validator",
-                        "message": str(e),
+                        "message": "All free models exhausted, waiting to retry",
                     })
                 await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
             except Exception as e:
@@ -744,7 +744,7 @@ async def _single_model_workflow(self) -> None:
                 if self.broadcast_callback:
                     await self.broadcast_callback("free_models_exhausted", {
                         "role_id": "aggregator_single_model",
-                        "message": str(e),
+                        "message": "All free models exhausted, waiting to retry",
                     })
                 await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
             except Exception as e:
@@ -1024,7 +1024,7 @@ async def _perform_cleanup_review(self) -> None:
             logger.error(f"Cleanup review failed: {e}", exc_info=True)
             await self._broadcast("cleanup_review_error", {
                 "review_number": self.cleanup_reviews_performed,
-                "error": str(e)
+                "error": "Cleanup review encountered an internal error"
             })
     
     async def _on_training_update(self) -> None:
@@ -1110,7 +1110,7 @@ async def _rechunk_training_data(self) -> None:
         except Exception as e:
             logger.error(f"Incremental re-chunking FAILED: {e}", exc_info=True)
             await self._broadcast("rechunk_error", {
-                "error": str(e),
+                "error": "Incremental re-chunking failed",
                 "message": "Incremental re-chunking failed but system continues"
             })
         finally:
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index 38ba699..8f6fb79 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -753,12 +753,12 @@ async def clear_autonomous_research(confirm: bool = False):
                 logger.error(f"Critical errors during clear: {error_msg}")
                 raise HTTPException(
                     status_code=500, 
-                    detail=f"Failed to clear critical data (brainstorms/papers/RAG). Error: {error_msg}"
+                    detail="Failed to clear critical data (brainstorms/papers/RAG)"
                 )
             else:
                 # Generic RuntimeError - treat as failure
                 logger.error(f"Error during clear: {error_msg}")
-                raise HTTPException(status_code=500, detail=error_msg)
+                raise HTTPException(status_code=500, detail="Failed to clear autonomous research data")
         
     except HTTPException:
         raise
@@ -1406,7 +1406,7 @@ async def force_tier3(mode: str = "complete_current"):
             # Actual failure to initiate/run Tier 3
             raise HTTPException(
                 status_code=500,
-                detail=result.get("message", "Failed to trigger Tier 3 final answer generation")
+                detail="Failed to trigger Tier 3 final answer generation"
             )
         
         # Success cases: "initiated", "no_answer_known", or "complete"
diff --git a/backend/api/routes/openrouter.py b/backend/api/routes/openrouter.py
index 67301ba..5289f2c 100644
--- a/backend/api/routes/openrouter.py
+++ b/backend/api/routes/openrouter.py
@@ -80,7 +80,7 @@ async def check_lm_studio_availability() -> Dict[str, Any]:
             "has_models": False,
             "model_count": 0,
             "models": [],
-            "error": str(e)
+            "error": "Failed to check LM Studio availability"
         }
 
 
@@ -436,7 +436,7 @@ async def test_connection(request: SetApiKeyRequest) -> Dict[str, Any]:
             "success": True,  # Endpoint worked
             "connected": False,
             "model_count": 0,
-            "message": f"Failed to connect: {str(e)}"
+            "message": "Failed to connect to OpenRouter"
         }
 
 
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index 6f960bf..3e1f9fa 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -1996,7 +1996,7 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                 logger.warning(f"AutonomousCoordinator: all free models exhausted: {e}")
                 await self._broadcast("free_models_exhausted", {
                     "role_id": "autonomous",
-                    "message": str(e),
+                    "message": "All free models exhausted, waiting to retry",
                 })
                 await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
 
@@ -2399,7 +2399,7 @@ async def _resume_research_loop_after_tier3(self) -> None:
                 logger.warning(f"Resumed research: all free models exhausted: {e}")
                 await self._broadcast("free_models_exhausted", {
                     "role_id": "autonomous_resumed",
-                    "message": str(e),
+                    "message": "All free models exhausted, waiting to retry",
                 })
                 await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
 
@@ -3642,8 +3642,8 @@ async def force_tier3_final_answer(self, mode: str = "complete_current") -> dict
             return {"success": False, "result": "error", "message": "Invalid mode or state"}
             
         except Exception as e:
-            logger.error(f"Error forcing Tier 3: {e}")
-            return {"success": False, "result": "error", "message": str(e)}
+            logger.error(f"Error forcing Tier 3: {e}", exc_info=True)
+            return {"success": False, "result": "error", "message": "An internal error occurred during Tier 3 processing"}
     
     def _should_run_completion_review(self) -> bool:
         """Check if completion review should run.
diff --git a/backend/autonomous/core/proof_verification_stage.py b/backend/autonomous/core/proof_verification_stage.py
index 9975b52..c19178c 100644
--- a/backend/autonomous/core/proof_verification_stage.py
+++ b/backend/autonomous/core/proof_verification_stage.py
@@ -797,7 +797,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                     "novel_count": result.novel_count,
                     "verified_count": result.verified_count,
                     "total_candidates": result.total_candidates,
-                    "message": str(exc),
+                    "message": "Proof verification encountered an error",
                 },
             )
             return result
diff --git a/backend/compiler/core/compiler_coordinator.py b/backend/compiler/core/compiler_coordinator.py
index 1dd5494..9d0964d 100644
--- a/backend/compiler/core/compiler_coordinator.py
+++ b/backend/compiler/core/compiler_coordinator.py
@@ -707,7 +707,7 @@ async def _main_workflow(self) -> None:
             logger.warning(f"Compiler: all free models exhausted: {e}")
             await self._broadcast("free_models_exhausted", {
                 "role_id": "compiler",
-                "message": str(e),
+                "message": "All free models exhausted, waiting to retry",
             })
             await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
             if self.is_running:
@@ -716,8 +716,7 @@ async def _main_workflow(self) -> None:
             logger.error(f"Compiler workflow error: {e}", exc_info=True)
             self.is_running = False
             await self._broadcast("compiler_error", {
-                "error": str(e),
-                "traceback": traceback.format_exc(),
+                "error": "Compiler workflow encountered an internal error",
                 "mode": self.current_mode,
                 "total_submissions": self.total_submissions
             })
diff --git a/backend/shared/api_client_manager.py b/backend/shared/api_client_manager.py
index 5b34592..cfbbe7e 100644
--- a/backend/shared/api_client_manager.py
+++ b/backend/shared/api_client_manager.py
@@ -559,7 +559,7 @@ async def generate_completion(
                     "error_type": "privacy_policy",
                     "model": boost_model,
                     "role_id": role_id,
-                    "message": str(e),
+                    "message": "Model requires privacy policy acceptance",
                     "solution_url": "https://openrouter.ai/settings/privacy",
                     "solution_text": (
                         "To use free models on OpenRouter:\n\n"
@@ -616,7 +616,7 @@ async def generate_completion(
                 logger.warning(f"Boost credits exhausted for task {task_id}, using primary model")
                 await self._broadcast("boost_credits_exhausted", {
                     "task_id": task_id,
-                    "message": str(e)
+                    "message": "Boost credits exhausted, falling back to primary model"
                 })
                 # Continue to primary model routing below
                 
@@ -874,7 +874,7 @@ async def generate_completion(
                         "error_type": "privacy_policy",
                         "model": openrouter_model,
                         "role_id": role_id,
-                        "message": str(e),
+                        "message": "Model requires privacy policy acceptance",
                         "solution_url": "https://openrouter.ai/settings/privacy",
                         "solution_text": (
                             "To use free models on OpenRouter:\n\n"
@@ -966,7 +966,7 @@ async def generate_completion(
                     await self._broadcast("openrouter_fallback", {
                         "role_id": role_id,
                         "reason": "credit_exhaustion",
-                        "message": str(e),
+                        "message": "Credits exhausted, falling back to alternative model",
                         "fallback_model": fallback_model
                     })
                     

From f2791b4e3cf7e9d0b0c029f9e9a570571a24f233 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 22:40:38 -0500
Subject: [PATCH 24/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UIX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 .cursor/rules/api-key-controls.mdc  |  2 +-
 README.md                           |  4 +--
 backend/shared/boost_manager.py     | 56 -----------------------------
 backend/shared/lean4_client.py      | 48 +++++++++++++++++++++----
 backend/shared/openrouter_client.py |  2 +-
 moto_launcher.py                    | 11 ++++++
 6 files changed, 57 insertions(+), 66 deletions(-)

diff --git a/.cursor/rules/api-key-controls.mdc b/.cursor/rules/api-key-controls.mdc
index 5817784..7ab5b02 100644
--- a/.cursor/rules/api-key-controls.mdc
+++ b/.cursor/rules/api-key-controls.mdc
@@ -45,7 +45,7 @@ Enables OpenRouter integration with automatic LM Studio fallback (default mode)
 
 #### OpenRouterClient (`backend/shared/openrouter_client.py`)
 - Async HTTP client. Base URL: `https://openrouter.ai/api/v1`
-- App Attribution Headers: `HTTP-Referer: https://intrafere.com/moto-autonomous-home-ai/`, `X-Title: MOTO Deep Research Harness`
+- App Attribution Headers: `HTTP-Referer: https://intrafere.com/moto-autonomous-home-ai/`, `X-Title: MOTO Autonomous ASI`
 - Credit exhaustion detection: HTTP 402 OR error messages containing "credit", "insufficient", "balance", "quota", "key limit", "limit exceeded"
 - Raises `CreditExhaustionError` on exhaustion (no retries). Retries transient errors (max 3).
 - Temperature=0.0 default. No stop sequences (removed — caused premature truncation with certain models).
diff --git a/README.md b/README.md
index 1f0e7ae..3da2ffb 100644
--- a/README.md
+++ b/README.md
@@ -1,5 +1,5 @@
 # MOTO Autonomous ASI
-## An Autonomous Prototype Superintelligence - Automated Theory Generation with Lean 4 Mathematics Verification
+## An Autonomous Prototype Superintelligence - Automated Theorem Generation with Lean 4 Mathematics Proof Verification
 **Version: 1.0.7**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
@@ -66,7 +66,7 @@ Before installation, you need:
    - If using OpenRouter, then download and load at least one model (e.g., DeepSeek, Llama, Qwen - older models and some models below 12 billion parameters may struggle; however, it is always worth a try!)
    - **Load the LM Studio RAG agent [optional but HIGHLY recommended for much faster outputs/answers]**: Load the embedding model `nomic-ai/nomic-embed-text-v1.5` in your LM Studio "Developer" tab (server tab) (search for "nomic-ai/nomic-embed-text-v1.5" to download it in the LM Studio downloads center). Please note: you may need to enable "Power User" or "Developer" to see this developer tab - this server will let you load the amount and capacity of simultaneous models that your PC will support. In this developer tab is where you load both your nomic-ai embedding agent and any optional local hosted agents you want to use in the program (e.g., GPT OSS 20b, DeepSeek 32B, etc.). **If you do not download LM Studio and enable the Nomic agent the system will run much slower and cost slightly more due to having to use the paid service OpenRouter for RAG calls.**
    - Start the local server (port 1234)
-4. **If using cloud AI - Get an OpenRouter API key**: Sign up at OpenRouter.ai and get a paid or free API key to use the most powerful cloud models available from your favorite providers. OpenRouter may also offer a certain amount of free API calls per day with your account key. When you download the MOTO deep research harness, you can see which models are free by checking the "show only free models" check box(es) in the MOTO app settings.
+4. **If using cloud AI - Get an OpenRouter API key**: Sign up at OpenRouter.ai and get a paid or free API key to use the most powerful cloud models available from your favorite providers. OpenRouter may also offer a certain amount of free API calls per day with your account key. When you download MOTO Autonomous ASI, you can see which models are free by checking the "show only free models" check box(es) in the MOTO app settings.
 5. **On first startup, pick your provider path**: After you acknowledge the disclaimer, MOTO will prompt you to either enter an OpenRouter key or confirm that LM Studio is running. If you save an OpenRouter key there, the recommended default autonomous profile is applied immediately so you can open Settings and see it already selected.
 
 ### Installation
diff --git a/backend/shared/boost_manager.py b/backend/shared/boost_manager.py
index 1390f98..d26f883 100644
--- a/backend/shared/boost_manager.py
+++ b/backend/shared/boost_manager.py
@@ -160,62 +160,6 @@ def _save_state(self) -> None:
         except Exception as e:
             logger.warning(f"Failed to save boost state: {e}")
     
-    def _load_state(self) -> None:
-        """Load persisted boost state from disk."""
-        try:
-            if os.path.exists(BOOST_STATE_FILE):
-                with open(BOOST_STATE_FILE, 'r', encoding='utf-8') as f:
-                    state = json.load(f)
-                
-                # Restore boost config if it was enabled
-                if state.get('enabled') and state.get('model_id'):
-                    self.boost_config = BoostConfig(
-                        enabled=True,
-                        openrouter_api_key=state.get('api_key', ''),
-                        boost_model_id=state.get('model_id'),
-                        boost_provider=state.get('provider'),
-                        boost_context_window=state.get('context_window', 131072),
-                        boost_max_output_tokens=state.get('max_output_tokens', 25000)
-                    )
-                
-                # Restore boost modes
-                self.boost_next_count = state.get('boost_next_count', 0)
-                self.boosted_categories = set(state.get('boosted_categories', []))
-                self.boost_always_prefer = state.get('boost_always_prefer', False)
-                self.boosted_task_ids = set(state.get('boosted_task_ids', []))
-                
-                logger.info(f"Loaded boost state: enabled={state.get('enabled')}, model={state.get('model_id')}, "
-                           f"next_count={self.boost_next_count}, categories={len(self.boosted_categories)}, "
-                           f"always_prefer={self.boost_always_prefer}")
-        except Exception as e:
-            logger.warning(f"Failed to load boost state: {e}")
-    
-    def _save_state(self) -> None:
-        """Persist current boost state to disk."""
-        try:
-            # Ensure data directory exists
-            os.makedirs(os.path.dirname(BOOST_STATE_FILE), exist_ok=True)
-            
-            state = {
-                'enabled': self.boost_config is not None and self.boost_config.enabled,
-                'model_id': self.boost_config.boost_model_id if self.boost_config else None,
-                'provider': self.boost_config.boost_provider if self.boost_config else None,
-                'context_window': self.boost_config.boost_context_window if self.boost_config else 131072,
-                'max_output_tokens': self.boost_config.boost_max_output_tokens if self.boost_config else 25000,
-                'api_key': self.boost_config.openrouter_api_key if self.boost_config else '',
-                'boost_next_count': self.boost_next_count,
-                'boosted_categories': list(self.boosted_categories),
-                'boost_always_prefer': self.boost_always_prefer,
-                'boosted_task_ids': list(self.boosted_task_ids)
-            }
-            
-            with open(BOOST_STATE_FILE, 'w', encoding='utf-8') as f:
-                json.dump(state, f, indent=2)
-            
-            logger.debug("Boost state saved to disk")
-        except Exception as e:
-            logger.warning(f"Failed to save boost state: {e}")
-    
     def set_broadcast_callback(self, callback: Callable) -> None:
         """Set callback for broadcasting WebSocket events."""
         self._broadcast_callback = callback
diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
index 2c6a2e0..4e5c8c2 100644
--- a/backend/shared/lean4_client.py
+++ b/backend/shared/lean4_client.py
@@ -395,6 +395,26 @@ def _workspace_unavailable_result(self, *, tactic_script: bool = False) -> Lean4
             )
         return Lean4Result(success=False, error_output=error_output)
 
+    @staticmethod
+    def _is_stale_lake_state(output: str) -> bool:
+        """Detect Lake errors caused by a stale .lake directory from a prior failed clone."""
+        text = (output or "").lower()
+        return (
+            "url has changed" in text
+            or "exited with code 128" in text
+            or ("delete" in text and "packages" in text and "manually" in text)
+        )
+
+    def _wipe_lake_directory(self) -> None:
+        """Remove the .lake directory to give lake update a clean slate."""
+        lake_dir = self.workspace_dir / ".lake"
+        if lake_dir.exists():
+            try:
+                shutil.rmtree(lake_dir)
+                logger.info("Removed stale .lake directory at %s", lake_dir)
+            except OSError as exc:
+                logger.warning("Failed to remove .lake directory at %s: %s", lake_dir, exc)
+
     async def _repair_workspace_after_infrastructure_error(self, output: str) -> bool:
         logger.warning(
             "Lean 4 workspace infrastructure error detected; invalidating workspace cache and refetching Mathlib artifacts. Diagnostic: %s",
@@ -403,6 +423,7 @@ async def _repair_workspace_after_infrastructure_error(self, output: str) -> boo
         async with self._workspace_lock:
             self._workspace_unhealthy_error = ""
             self._workspace_ready = False
+            self._wipe_lake_directory()
             repaired = await self._ensure_workspace_locked()
             if not repaired:
                 self._mark_workspace_unhealthy(output)
@@ -473,12 +494,27 @@ async def _ensure_workspace_locked(self) -> bool:
                 timeout=max(system_config.lean4_proof_timeout, 120),
             )
             if update_rc != 0:
-                self._mark_workspace_unhealthy(update_stderr or update_stdout)
-                logger.warning(
-                    "Lean 4 workspace update failed: %s",
-                    (update_stderr or update_stdout).strip(),
-                )
-                return False
+                combined_update_output = "\n".join(
+                    part for part in (update_stdout, update_stderr) if part
+                ).strip()
+                lake_dir = self.workspace_dir / ".lake"
+                if lake_dir.exists() and self._is_stale_lake_state(combined_update_output):
+                    logger.warning(
+                        "lake update failed due to stale .lake state; wiping .lake directory and retrying."
+                    )
+                    self._wipe_lake_directory()
+                    update_rc, update_stdout, update_stderr = await self._run_process(
+                        [lake_cmd, "update"],
+                        cwd=self.workspace_dir,
+                        timeout=max(system_config.lean4_proof_timeout, 120),
+                    )
+                if update_rc != 0:
+                    self._mark_workspace_unhealthy(update_stderr or update_stdout)
+                    logger.warning(
+                        "Lean 4 workspace update failed: %s",
+                        (update_stderr or update_stdout).strip(),
+                    )
+                    return False
 
             # The project's lean-toolchain MUST match Mathlib's pinned toolchain,
             # otherwise `lake exe cache get` refuses to download the prebuilt
diff --git a/backend/shared/openrouter_client.py b/backend/shared/openrouter_client.py
index 6533957..60c4bdf 100644
--- a/backend/shared/openrouter_client.py
+++ b/backend/shared/openrouter_client.py
@@ -34,7 +34,7 @@ class OpenRouterClient:
     # App attribution for OpenRouter leaderboards
     # See: https://openrouter.ai/docs/app-attribution
     APP_URL = "https://intrafere.com/moto-autonomous-home-ai/"
-    APP_TITLE = "MOTO Deep Research Harness"
+    APP_TITLE = "MOTO Autonomous ASI"
     
     def __init__(self, api_key: str):
         self.api_key = api_key
diff --git a/moto_launcher.py b/moto_launcher.py
index d47a94a..ce24dc9 100644
--- a/moto_launcher.py
+++ b/moto_launcher.py
@@ -1228,6 +1228,17 @@ def install_lean4(
         print()
         return
 
+    if sys.platform == "win32":
+        try:
+            subprocess.run(
+                ["git", "config", "--global", "core.longpaths", "true"],
+                check=False,
+                stdout=subprocess.DEVNULL,
+                stderr=subprocess.DEVNULL,
+            )
+        except Exception:
+            pass
+
     workspace_dir = Path(runtime.data_root) / "lean4_workspace"
     try:
         _write_lean_workspace_files(workspace_dir)

From 85907a50828a918ffcdf58f49927aa47f92a09b6 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 22:48:45 -0500
Subject: [PATCH 25/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UIX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 backend/autonomous/memory/proof_database.py | 15 +++++++++------
 1 file changed, 9 insertions(+), 6 deletions(-)

diff --git a/backend/autonomous/memory/proof_database.py b/backend/autonomous/memory/proof_database.py
index 817a5e4..b2bff96 100644
--- a/backend/autonomous/memory/proof_database.py
+++ b/backend/autonomous/memory/proof_database.py
@@ -16,7 +16,7 @@
 
 from backend.shared.config import system_config
 from backend.shared.models import FailedProofCandidate, ProofCandidate, ProofRecord
-from backend.shared.path_safety import validate_single_path_component
+from backend.shared.path_safety import resolve_path_within_root, validate_single_path_component
 from backend.autonomous.prompts.proof_prompts import format_failure_hints_for_injection
 
 logger = logging.getLogger(__name__)
@@ -768,20 +768,23 @@ async def get_library_proof(self, session_id: str, proof_id: str) -> Optional[Di
         if session_id == "legacy":
             proofs_dir = Path(system_config.data_dir) / "proofs"
         else:
-            proofs_dir = Path(system_config.auto_sessions_base_dir) / validate_single_path_component(session_id, "session ID") / "proofs"
+            safe_session = validate_single_path_component(session_id, "session ID")
+            proofs_dir = resolve_path_within_root(
+                Path(system_config.auto_sessions_base_dir), safe_session, "proofs"
+            )
 
         if not proofs_dir.exists():
             return None
 
         safe_id = validate_single_path_component(proof_id, "proof ID")
-        record_path = proofs_dir / f"proof_{safe_id}.json"
-        lean_path = proofs_dir / f"proof_{safe_id}_lean.lean"
+        record_path = resolve_path_within_root(proofs_dir, f"proof_{safe_id}.json")
+        lean_path = resolve_path_within_root(proofs_dir, f"proof_{safe_id}_lean.lean")
 
         if not record_path.exists():
             return None
 
         try:
-            async with aiofiles.open(record_path, "r", encoding="utf-8") as handle:
+            async with aiofiles.open(str(record_path), "r", encoding="utf-8") as handle:
                 proof_data = json.loads(await handle.read())
         except Exception as exc:
             logger.error("Failed to read proof %s from session %s: %s", proof_id, session_id, exc)
@@ -790,7 +793,7 @@ async def get_library_proof(self, session_id: str, proof_id: str) -> Optional[Di
         lean_code = ""
         if lean_path.exists():
             try:
-                async with aiofiles.open(lean_path, "r", encoding="utf-8") as handle:
+                async with aiofiles.open(str(lean_path), "r", encoding="utf-8") as handle:
                     lean_code = await handle.read()
             except Exception:
                 lean_code = str(proof_data.get("lean_code", "") or "")

From be951f4bb72d55f55c1daf4d880377eb20747a54 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Mon, 4 May 2026 23:04:17 -0500
Subject: [PATCH 26/32] # Version 1.0.7

## Features
- Lean 4 Integrated: Automated theorem generation pipeline completed with Lean 4 proof verification as the final validation step. This new mechanic includes the MOTO ASI's primary Top-P exploration mechanic for feedback/retry and deeper exploration on proof retry attempts.
- New autonomous proof pipeline modules: proof identification, lemma search, proof formalization, dependency extraction, novelty checking, proof database, and a dedicated proof verification stage.
- New proof surfaces in the GUI: Mathematical Proofs panel, Proof Graph visualization, and a Proof notification stack.
- New backend routes: `/api/health`, `/api/features`, `/api/update-notice`, and a full proofs API (proof database, Lean 4 status, manual proof checks, certificate export).
- Docker support: first-class `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh` for hosted/generic-mode deployments.
- Ubuntu 24.04 launcher: new `Launch MOTO.sh` bootstrapper that provisions a repo-local `.venv` and runs the shared Python launcher.
- Launcher and updater infrastructure rewritten in Python (`moto_launcher.py`, `moto_updater.py`) with a new `moto-update-manifest.json` describing version, build commit, and API contract version for update comparison.
- Generic/hosted mode added, with `requirements-generic.txt`, hosted-proxy authentication helpers (`backend/api/proxy_auth.py`), a Lean-free / Z3-free hosted contract, and a dedicated `fastembed` embedding provider for hosted environments.
- Auto-fill OpenRouter context window from model context length.
- Auto-cap OpenRouter max output to the lower of 20% model context or the smallest available host output cap.
- The program now supports parallel program runtimes.
- New automated test suite under `tests/` covering the Lean 4 client, launcher/updater, rigor Lean placement validator, compiler marker visibility, Wolfram tool loop, paper memory appendix, and more.

## Changes
- Kimi K2.6 replaced Kimi K2.5 in any respective default profiles.
- DeepSeek V4 Pro replaced DeepSeek V3.2 in the respective default profiles using DeepSeek.
- Inception 2 Mercury added as a supplementary 4th parallel brainstorm submitter in the fast affordable profile.
- Applied the new OpenRouter auto-fill and host-cap logic across Aggregator, Compiler, Autonomous Research, and Boost settings.
- Added concise rule coverage for proof verification checkpoints, manual proof checks, proof APIs/events, session-aware proof storage, and proof graph/dependency surfaces.
- Documented Lean 4 / SMT runtime gating, Lean-authoritative verification, and the hosted Lean-free/Z3-free contract.
- Updated `.gitignore` with `backend/data/proofs/` (keep-pattern), `backend/data/lean4_workspace/` (blanket), and `backend/data/elan/` (blanket) to keep the Lean toolchain installer and workspace out of the repo, plus a new `backend/data/proofs/.gitkeep`.
- Balanced fast submitters with slow submitters; any individual submitter role that has more than 4 submissions in the queue pauses while the others continue.
- Added 2 "lab grade" tier default profiles featuring SOTA models such as Opus 4.7, GPT 5-5 Pro, and Grok 4.20 Multi-Agent. Runtime cost estimates range from $20 per hour to $60 per hour or greater for each respective profile.
- Replaced the legacy `_moto_internal_launcher.ps1` bootstrap with the cross-platform `moto_launcher.py` entrypoint.
- Trimmed the MIT LICENSE appendix (the non-legal AI-generated-content advisory block that followed the `---` divider); the MIT license text itself is unchanged.

## Bug Fixes
- OpenRouter provider lookups now return endpoint metadata instead of only host names.
- Fixed LM Studio "offline" status bug in GUI which showed LM Studio offline when it was not.
- Silenced the ECONNREFUSED noise during startup while preserving real errors.
- Fixed disclaimer GUI resolution bug discovered by @asimog.
- Added GUI UIX optimizations proposed by @asimog.
- Fixed tab switching screen orientation bug.
---
 frontend/src/App.jsx                      |  4 +-
 frontend/src/components/WorkflowPanel.jsx | 89 +++++++----------------
 2 files changed, 29 insertions(+), 64 deletions(-)

diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index a48fbff..56a16aa 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -231,7 +231,7 @@ function App() {
   // Track WorkflowPanel collapse state for sliding boost buttons
   const [workflowPanelCollapsed, setWorkflowPanelCollapsed] = useState(() => {
     const savedState = localStorage.getItem('workflow_panel_collapsed');
-    return savedState === 'true';
+    return savedState !== 'false';
   });
 
   // Update notice banner state (dismissible per session, re-appears on restart)
@@ -2039,7 +2039,7 @@ function App() {
   useEffect(() => {
     const handleStorageChange = () => {
       const savedState = localStorage.getItem('workflow_panel_collapsed');
-      setWorkflowPanelCollapsed(savedState === 'true');
+      setWorkflowPanelCollapsed(savedState !== 'false');
     };
     
     const interval = setInterval(handleStorageChange, 500);
diff --git a/frontend/src/components/WorkflowPanel.jsx b/frontend/src/components/WorkflowPanel.jsx
index fdfa1a6..4b45212 100644
--- a/frontend/src/components/WorkflowPanel.jsx
+++ b/frontend/src/components/WorkflowPanel.jsx
@@ -3,8 +3,7 @@ import { websocket } from '../services/websocket';
 import { boostAPI, workflowAPI } from '../services/api';
 import './WorkflowPanel.css';
 
-const HOURLY_AUTO_OPEN_INTERVAL_SECONDS = 3600;
-const WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY = 'workflow_panel_last_auto_open_hour';
+const AUTO_OPEN_DELAY_SECONDS = 600;
 
 const formatNumber = (n) => n.toLocaleString();
 
@@ -16,10 +15,7 @@ const formatTime = (totalSeconds) => {
 };
 
 export default function WorkflowPanel({ isRunning }) {
-  const [collapsed, setCollapsed] = useState(() => {
-    const savedState = localStorage.getItem('workflow_panel_collapsed');
-    return savedState === 'true';
-  });
+  const [collapsed, setCollapsed] = useState(true);
   const [mode, setMode] = useState('idle');
   
   // Boost controls state
@@ -36,15 +32,31 @@ export default function WorkflowPanel({ isRunning }) {
   const [showPerModel, setShowPerModel] = useState(false);
   const [localElapsed, setLocalElapsed] = useState(0);
   const lastSyncRef = useRef(Date.now());
-  const hasElapsedSyncRef = useRef(false);
-  const lastAutoOpenedHourRef = useRef(0);
+
+  // Auto-open: pop open exactly once, 10 minutes after user presses Start.
+  // No persistence. Resets every time isRunning goes true.
+  const hasPoppedThisSession = useRef(false);
 
   const expandPanel = useCallback(() => {
     setCollapsed(false);
     localStorage.setItem('workflow_panel_collapsed', 'false');
   }, []);
 
-  // Fetch boost status and categories when running
+  useEffect(() => {
+    if (isRunning) {
+      hasPoppedThisSession.current = false;
+    }
+  }, [isRunning]);
+
+  useEffect(() => {
+    if (!isRunning || hasPoppedThisSession.current) return;
+    if (localElapsed >= AUTO_OPEN_DELAY_SECONDS) {
+      expandPanel();
+      hasPoppedThisSession.current = true;
+    }
+  }, [isRunning, localElapsed, expandPanel]);
+
+  // Fetch boost status and categories
   const fetchBoostStatus = useCallback(async () => {
     try {
       const statusResponse = await boostAPI.getStatus();
@@ -54,8 +66,6 @@ export default function WorkflowPanel({ isRunning }) {
         setBoostedCategories(statusResponse.status.boosted_categories || []);
         setBoostAlwaysPrefer(statusResponse.status.boost_always_prefer || false);
       }
-      
-      // Always fetch all categories (no mode filter)
       const categoriesResponse = await boostAPI.getCategories('all');
       if (categoriesResponse.success) {
         setAvailableCategories(categoriesResponse.categories || []);
@@ -65,54 +75,12 @@ export default function WorkflowPanel({ isRunning }) {
     }
   }, []);
 
-  // Fetch boost status on mount and when running state changes
-  // ETERNAL: Always fetch boost status, even when not running
   useEffect(() => {
     fetchBoostStatus();
-    
-    // Poll boost status periodically (every 5 seconds)
     const interval = setInterval(fetchBoostStatus, 5000);
     return () => clearInterval(interval);
   }, [fetchBoostStatus]);
 
-  useEffect(() => {
-    if (boostEnabled && isRunning) {
-      expandPanel();
-    }
-  }, [boostEnabled, expandPanel, isRunning]);
-
-  // Clear stale auto-open state when a new workflow session begins
-  useEffect(() => {
-    if (isRunning) {
-      lastAutoOpenedHourRef.current = 0;
-      localStorage.removeItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY);
-    }
-  }, [isRunning]);
-
-  useEffect(() => {
-    if (!isRunning || !hasElapsedSyncRef.current) {
-      return;
-    }
-
-    const elapsedHours = Math.floor(localElapsed / HOURLY_AUTO_OPEN_INTERVAL_SECONDS);
-    if (elapsedHours < 1 || elapsedHours <= lastAutoOpenedHourRef.current) {
-      return;
-    }
-
-    if (collapsed) {
-      expandPanel();
-    }
-
-    lastAutoOpenedHourRef.current = elapsedHours;
-    localStorage.setItem(WORKFLOW_PANEL_AUTO_OPEN_HOUR_KEY, elapsedHours.toString());
-  }, [collapsed, expandPanel, isRunning, localElapsed]);
-
-  useEffect(() => {
-    if (!isEditingBoostNext) {
-      setBoostNextInput(boostNextCount > 0 ? boostNextCount.toString() : '');
-    }
-  }, [boostNextCount, isEditingBoostNext]);
-
   useEffect(() => {
     if (!isEditingBoostNext) {
       setBoostNextInput(boostNextCount > 0 ? boostNextCount.toString() : '');
@@ -160,13 +128,10 @@ export default function WorkflowPanel({ isRunning }) {
 
   // Token stats: initial fetch on mount and when isRunning changes
   useEffect(() => {
-    hasElapsedSyncRef.current = false;
-
     const fetchTokenStats = async () => {
       try {
         const resp = await workflowAPI.getTokenStats();
         if (resp.success) {
-          hasElapsedSyncRef.current = true;
           setTokenStats(resp);
           setLocalElapsed(resp.elapsed_seconds || 0);
           lastSyncRef.current = Date.now();
@@ -179,7 +144,6 @@ export default function WorkflowPanel({ isRunning }) {
   // Token stats: listen for real-time WebSocket updates
   useEffect(() => {
     const handleTokenUpdate = (data) => {
-      hasElapsedSyncRef.current = true;
       setTokenStats(data);
       setLocalElapsed(data.elapsed_seconds || 0);
       lastSyncRef.current = Date.now();
@@ -235,7 +199,6 @@ export default function WorkflowPanel({ isRunning }) {
 
     const handleBoostEnabled = () => {
       setBoostEnabled(true);
-      expandPanel();
       fetchBoostStatus();
     };
 
@@ -263,12 +226,14 @@ export default function WorkflowPanel({ isRunning }) {
       websocket.off('boost_disabled', handleBoostDisabled);
       websocket.off('boost_always_prefer_updated', handleAlwaysPreferUpdated);
     };
-  }, [isRunning, fetchBoostStatus, expandPanel]);
+  }, [isRunning, fetchBoostStatus]);
 
   const toggleCollapse = () => {
-    const newState = !collapsed;
-    setCollapsed(newState);
-    localStorage.setItem('workflow_panel_collapsed', newState.toString());
+    setCollapsed(prev => {
+      const next = !prev;
+      localStorage.setItem('workflow_panel_collapsed', next.toString());
+      return next;
+    });
   };
 
   // REMOVED: Conditional rendering that hid panel when no workflow running

From dec7b7d832b1b5094f09ea83a9bc19bf6608e844 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Tue, 5 May 2026 08:01:20 -0500
Subject: [PATCH 27/32] # Version 1.0.7 Bug Fix

## Bug Fixes
Fixed Mathlib/git bootstrap bug caused by an overly restrictive timeout on `lake update` and the Mathlib cache download.
---
 backend/shared/lean4_client.py | 21 ++++++++++++---------
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
index 4e5c8c2..79ab9c0 100644
--- a/backend/shared/lean4_client.py
+++ b/backend/shared/lean4_client.py
@@ -304,7 +304,7 @@ async def _run_process(
         args: list[str],
         *,
         cwd: Path,
-        timeout: int,
+        timeout: Optional[int] = None,
     ) -> tuple[int, str, str]:
         process = await asyncio.create_subprocess_exec(
             *args,
@@ -313,7 +313,10 @@ async def _run_process(
             stderr=asyncio.subprocess.PIPE,
         )
         try:
-            stdout_bytes, stderr_bytes = await asyncio.wait_for(process.communicate(), timeout=timeout)
+            if timeout is not None:
+                stdout_bytes, stderr_bytes = await asyncio.wait_for(process.communicate(), timeout=timeout)
+            else:
+                stdout_bytes, stderr_bytes = await process.communicate()
         except asyncio.CancelledError:
             process.kill()
             await process.communicate()
@@ -488,10 +491,10 @@ async def _ensure_workspace_locked(self) -> bool:
         if needs_bootstrap or not self._workspace_ready:
             logger.info("Bootstrapping Lean 4 workspace at %s", self.workspace_dir)
 
+            # NO TIMEOUT: lake update clones the multi-GB Mathlib repo. Do NOT add a timeout here.
             update_rc, update_stdout, update_stderr = await self._run_process(
                 [lake_cmd, "update"],
                 cwd=self.workspace_dir,
-                timeout=max(system_config.lean4_proof_timeout, 120),
             )
             if update_rc != 0:
                 combined_update_output = "\n".join(
@@ -503,10 +506,10 @@ async def _ensure_workspace_locked(self) -> bool:
                         "lake update failed due to stale .lake state; wiping .lake directory and retrying."
                     )
                     self._wipe_lake_directory()
+                    # NO TIMEOUT: lake update clones the multi-GB Mathlib repo. Do NOT add a timeout here.
                     update_rc, update_stdout, update_stderr = await self._run_process(
                         [lake_cmd, "update"],
                         cwd=self.workspace_dir,
-                        timeout=max(system_config.lean4_proof_timeout, 120),
                     )
                 if update_rc != 0:
                     self._mark_workspace_unhealthy(update_stderr or update_stdout)
@@ -528,10 +531,10 @@ async def _ensure_workspace_locked(self) -> bool:
                 logger.info(
                     "Aligned workspace lean-toolchain with Mathlib; re-running lake update."
                 )
+                # NO TIMEOUT: lake update clones the multi-GB Mathlib repo. Do NOT add a timeout here.
                 update_rc, update_stdout, update_stderr = await self._run_process(
                     [lake_cmd, "update"],
                     cwd=self.workspace_dir,
-                    timeout=max(system_config.lean4_proof_timeout, 120),
                 )
                 if update_rc != 0:
                     self._mark_workspace_unhealthy(update_stderr or update_stdout)
@@ -564,13 +567,14 @@ async def _fetch_mathlib_cache(
         lake_cmd: str,
         cwd: Path,
     ) -> tuple[int, str, str]:
-        """Fetch Mathlib's cache, retrying once after pruning corrupt downloads."""
-        timeout = max(system_config.lean4_proof_timeout, 600)
+        """Fetch Mathlib's cache, retrying once after pruning corrupt downloads.
+
+        NO TIMEOUT: This downloads ~6 GB of prebuilt olean files. Do NOT add a timeout.
+        """
         cache_args = [lake_cmd, "exe", "cache", "get"]
         cache_rc, cache_stdout, cache_stderr = await self._run_process(
             cache_args,
             cwd=cwd,
-            timeout=timeout,
         )
         if cache_rc == 0:
             return cache_rc, cache_stdout, cache_stderr
@@ -593,7 +597,6 @@ async def _fetch_mathlib_cache(
         return await self._run_process(
             cache_args,
             cwd=cwd,
-            timeout=timeout,
         )
 
     @staticmethod

From 377c127b818dce2bc1d20b409926a46a0e032f7b Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Tue, 5 May 2026 08:46:36 -0500
Subject: [PATCH 28/32] # Version 1.0.7 Bug Fix

## Bug Fixes
Fixed Mathlib/git bug caused by an overly restrictive timeout.
---
 backend/shared/lean4_client.py | 15 ++++++++++++---
 1 file changed, 12 insertions(+), 3 deletions(-)

diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
index 79ab9c0..0d1ffd1 100644
--- a/backend/shared/lean4_client.py
+++ b/backend/shared/lean4_client.py
@@ -103,6 +103,11 @@ def _output_contains_sorry_warning(output: str) -> bool:
     "imports are out of date",
     "invalid or corrupt .olean",
     "invalid or corrupt olean",
+    "setup-file",
+)
+
+_LEAN_WORKSPACE_COMBINED_MARKERS: tuple[tuple[str, ...], ...] = (
+    ("no such file or directory", ".lake"),
 )
 
 # Markdown fence markers the LLM occasionally emits inside the `lean_code`
@@ -364,9 +369,13 @@ def _combined_process_output(stdout: str, stderr: str) -> str:
     def _is_workspace_infrastructure_error(output: str) -> bool:
         text = output or ""
         lowered = text.lower()
-        return bool(_OLEAN_OBJECT_FILE_MISSING_RE.search(text)) or any(
-            marker in lowered for marker in _LEAN_WORKSPACE_ERROR_MARKERS
-        )
+        if bool(_OLEAN_OBJECT_FILE_MISSING_RE.search(text)):
+            return True
+        if any(marker in lowered for marker in _LEAN_WORKSPACE_ERROR_MARKERS):
+            return True
+        if any(all(part in lowered for part in combo) for combo in _LEAN_WORKSPACE_COMBINED_MARKERS):
+            return True
+        return False
 
     @staticmethod
     def _format_workspace_infrastructure_error(output: str) -> str:

From 501e8cb7aeb54aa48b4b8309fb3e218a41fa214b Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Tue, 5 May 2026 09:33:47 -0500
Subject: [PATCH 29/32] # Version 1.0.7 Bug Fix

## Bug Fixes
Fixed Mathlib and Lean 4 co-dependence bug that was disrupting some users' proof generation.
---
 backend/shared/lean4_client.py | 47 +++++++++++++++++++++++++++++++---
 1 file changed, 44 insertions(+), 3 deletions(-)

diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
index 0d1ffd1..b90cb02 100644
--- a/backend/shared/lean4_client.py
+++ b/backend/shared/lean4_client.py
@@ -6,8 +6,11 @@
 import asyncio
 import json
 import logging
+import os
 import re
 import shutil
+import stat
+import time
 import uuid
 from contextlib import suppress
 from dataclasses import dataclass
@@ -420,12 +423,27 @@ def _is_stale_lake_state(output: str) -> bool:
     def _wipe_lake_directory(self) -> None:
         """Remove the .lake directory to give lake update a clean slate."""
         lake_dir = self.workspace_dir / ".lake"
-        if lake_dir.exists():
+        if not lake_dir.exists():
+            return
+        for attempt in range(3):
             try:
-                shutil.rmtree(lake_dir)
+                shutil.rmtree(lake_dir, onerror=self._rmtree_onerror)
                 logger.info("Removed stale .lake directory at %s", lake_dir)
+                return
             except OSError as exc:
-                logger.warning("Failed to remove .lake directory at %s: %s", lake_dir, exc)
+                if attempt < 2:
+                    time.sleep(1)
+                else:
+                    logger.warning("Failed to remove .lake directory at %s after 3 attempts: %s", lake_dir, exc)
+
+    @staticmethod
+    def _rmtree_onerror(func: Any, path: str, exc_info: Any) -> None:
+        """Handle permission errors during rmtree by clearing read-only and retrying."""
+        try:
+            os.chmod(path, stat.S_IWRITE)
+            func(path)
+        except Exception:
+            pass
 
     async def _repair_workspace_after_infrastructure_error(self, output: str) -> bool:
         logger.warning(
@@ -566,6 +584,29 @@ async def _ensure_workspace_locked(self) -> bool:
                 )
                 return False
 
+            # Sanity check: verify the cache is actually usable before marking ready.
+            # lake exe cache get can report success while files are missing on disk.
+            # NO TIMEOUT: First-time elaboration of `import Mathlib` against a fresh
+            # olean cache can take too long on a cold machine even when all
+            # files are present. A timeout here would false-report failure, wipe a
+            # valid .lake directory, and loop forever. Do NOT add a timeout.
+            sanity_rc, sanity_stdout, sanity_stderr = await self._run_process(
+                [lake_cmd, "env", self.lean_path or self._resolve_executable("lean"),
+                 root_file_path.name],
+                cwd=self.workspace_dir,
+            )
+            if sanity_rc != 0:
+                sanity_output = self._combined_process_output(sanity_stdout, sanity_stderr)
+                if self._is_workspace_infrastructure_error(sanity_output):
+                    logger.warning(
+                        "Lean 4 workspace sanity check failed — Mathlib cache is incomplete. "
+                        "Wiping .lake and marking unhealthy. Details: %s",
+                        sanity_output[:500],
+                    )
+                    self._wipe_lake_directory()
+                self._mark_workspace_unhealthy(sanity_output)
+                return False
+
         self._workspace_ready = True
         self._workspace_unhealthy_error = ""
         return True

From cb8eca8338e0ac9adeece7b2d9639f6ea42e1d7c Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Tue, 5 May 2026 12:36:13 -0500
Subject: [PATCH 30/32] # Version 1.0.7 Bug Fix

## Bug Fixes
Fixed Mathlib and Lean 4 co-dependence bug that was disrupting some users' proof generation.
---
 backend/shared/lean4_client.py |  60 ++++-
 randomlog.txt                  | 467 +++++++++++++++++++++++++++++++++
 2 files changed, 522 insertions(+), 5 deletions(-)

diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
index b90cb02..310d4b3 100644
--- a/backend/shared/lean4_client.py
+++ b/backend/shared/lean4_client.py
@@ -113,6 +113,25 @@ def _output_contains_sorry_warning(output: str) -> bool:
     ("no such file or directory", ".lake"),
 )
 
+# Lean emits "bad import" when an `import` statement references a module whose
+# .lean source doesn't exist. This is NOT an infrastructure error — it means the
+# proof code has a wrong/stale module path (e.g. Mathlib reorganised its tree).
+# We must NOT let this trigger the expensive workspace-repair loop.
+_BAD_IMPORT_RE = re.compile(
+    r"(?:bad import|unknown module|could not find module)[^\n]*",
+    re.IGNORECASE,
+)
+_BAD_IMPORT_HINT = (
+    "HINT: One or more `import` statements reference Mathlib modules that do not "
+    "exist in the current Mathlib version. Mathlib4 frequently reorganises its "
+    "module tree. Common renames include:\n"
+    "  • Mathlib.Analysis.NormedSpace.Banach → Mathlib.Analysis.Normed.Operator.Banach\n"
+    "  • Mathlib.Analysis.NormedSpace.OperatorNorm → Mathlib.Analysis.Normed.Operator.NormedSpace\n"
+    "  • Mathlib.Topology.MetricSpace.BanachFixedPoint → Mathlib.Topology.MetricSpace.Contracting\n"
+    "Use `import Mathlib` (imports everything) or check the current Mathlib4 source tree "
+    "for the correct module path."
+)
+
 # Markdown fence markers the LLM occasionally emits inside the `lean_code`
 # JSON field even when instructed to return raw code. Strip them defensively so
 # Lean 4 does not fail to parse the generated file on a stray ```lean line.
@@ -372,6 +391,12 @@ def _combined_process_output(stdout: str, stderr: str) -> str:
     def _is_workspace_infrastructure_error(output: str) -> bool:
         text = output or ""
         lowered = text.lower()
+
+        # A "bad import" is a proof-level error (stale/renamed Mathlib module),
+        # not infrastructure failure. Short-circuit to avoid the repair loop.
+        if _BAD_IMPORT_RE.search(text):
+            return False
+
         if bool(_OLEAN_OBJECT_FILE_MISSING_RE.search(text)):
             return True
         if any(marker in lowered for marker in _LEAN_WORKSPACE_ERROR_MARKERS):
@@ -812,6 +837,21 @@ def _annotate_no_goals_hint(error_output: str) -> str:
             return error_output
         return f"{_NO_GOALS_HINT}\n\n{error_output}"
 
+    @staticmethod
+    def _annotate_bad_import_hint(error_output: str) -> str:
+        """Prepend a hint when Lean reports a bad/unknown import.
+
+        This tells the LLM that module paths have been renamed and suggests
+        alternatives, preventing it from assuming the workspace is broken.
+        """
+        if not error_output:
+            return error_output
+        if not _BAD_IMPORT_RE.search(error_output):
+            return error_output
+        if _BAD_IMPORT_HINT in error_output:
+            return error_output
+        return f"{_BAD_IMPORT_HINT}\n\n{error_output}"
+
     @staticmethod
     def _format_tactic_lines(tactic_list: list[str]) -> list[str]:
         lines: list[str] = []
@@ -989,7 +1029,9 @@ async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
         error_output = combined_output or "Lean 4 rejected the proof without additional diagnostics."
         return Lean4Result(
             success=False,
-            error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+            error_output=self._annotate_bad_import_hint(
+                self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output))
+            ),
             goal_states=goal_states,
             raw_stderr=stderr.strip(),
         )
@@ -1152,10 +1194,14 @@ async def _run_tactic_script_once(
         error_output = tactic_error_slice or combined_output or "Lean 4 rejected the tactic script without additional diagnostics."
         return Lean4Result(
             success=False,
-            error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+            error_output=self._annotate_bad_import_hint(
+                self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output))
+            ),
             goal_states=goal_states,
             raw_stderr=stderr.strip(),
-            tactic_error_slice=self._annotate_no_goals_hint(tactic_error_slice),
+            tactic_error_slice=self._annotate_bad_import_hint(
+                self._annotate_no_goals_hint(tactic_error_slice)
+            ),
             failing_tactic_index=failing_tactic_index,
         )
 
@@ -1573,10 +1619,14 @@ def _result_from_diagnostics(
 
         return Lean4Result(
             success=False,
-            error_output=self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output)),
+            error_output=self._annotate_bad_import_hint(
+                self._annotate_no_goals_hint(self._prioritize_errors_in_output(error_output))
+            ),
             goal_states=goal_states,
             raw_stderr=raw_stderr,
-            tactic_error_slice=self._annotate_no_goals_hint(tactic_error_slice),
+            tactic_error_slice=self._annotate_bad_import_hint(
+                self._annotate_no_goals_hint(tactic_error_slice)
+            ),
             failing_tactic_index=failing_tactic_index,
         )
 
diff --git a/randomlog.txt b/randomlog.txt
index e69de29..d5c1c74 100644
--- a/randomlog.txt
+++ b/randomlog.txt
@@ -0,0 +1,467 @@
+2026-05-05 09:37:18.716 - backend.api.middleware - INFO - Using default CORS origins: ['http://localhost:5173', 'http://127.0.0.1:5173', 'http://localhost:8000', 'http://127.0.0.1:8000']
+2026-05-05 09:37:18.716 - backend.api.middleware - INFO - Middleware configured
+INFO:     Started server process [15848]
+INFO:     Waiting for application startup.
+2026-05-05 09:37:18.777 - backend.api.main - INFO - Starting ASI Aggregator System instance 'default' (data_dir=C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data, logs_dir=C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\logs)
+2026-05-05 09:37:18.783 - backend.api.main - INFO - Secret store active: namespaced_instance=False
+2026-05-05 09:37:20.433 - backend.shared.api_client_manager - INFO - OpenRouter client initialized
+2026-05-05 09:37:20.433 - backend.api.main - INFO - Restored OpenRouter API key from secure backend storage
+2026-05-05 09:37:20.446 - backend.api.main - INFO - No Wolfram Alpha API key found in secure backend storage for this namespace
+2026-05-05 09:37:20.465 - backend.shared.lm_studio_client - INFO - Successfully connected to LM Studio. Found 4 models.
+2026-05-05 09:37:20.465 - backend.api.main - INFO - No resumable session found - using legacy paths
+2026-05-05 09:37:20.465 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\proofs
+2026-05-05 09:37:20.465 - backend.api.main - INFO - ASI Aggregator System ready
+2026-05-05 09:37:20.497 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
+INFO:     Application startup complete.
+INFO:     Uvicorn running on http://0.0.0.0:8000 (Press CTRL+C to quit)
+INFO:     127.0.0.1:62649 - "WebSocket /ws" [accepted]
+2026-05-05 09:37:28.127 - backend.api.routes.websocket - INFO - WebSocket connected. Total connections: 1
+INFO:     connection open
+2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 1 (Main Submitter): model=x-ai/grok-4.3, context=1000000, max_tokens=128000
+2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 2 : model=moonshotai/kimi-k2.6, context=262000, max_tokens=40000
+2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 3 : model=x-ai/grok-4.3, context=1000000, max_tokens=128000
+2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Validator: model=x-ai/grok-4.1-fast, context=2000000, max_tokens=30000
+2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous coordinator initializing with 3 submitters
+2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 1 (Main Submitter): model=x-ai/grok-4.3, context=1000000
+2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 2 : model=moonshotai/kimi-k2.6, context=262000
+2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 3 : model=x-ai/grok-4.3, context=1000000
+2026-05-05 09:37:33.493 - backend.autonomous.memory.session_manager - INFO - Session initialized: explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
+2026-05-05 09:37:33.493 - backend.autonomous.memory.session_manager - INFO - Session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
+2026-05-05 09:37:33.493 - backend.autonomous.core.autonomous_coordinator - INFO - New session initialized: explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
+2026-05-05 09:37:33.493 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms
+2026-05-05 09:37:33.493 - backend.autonomous.memory.paper_library - INFO - Paper library using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\papers
+2026-05-05 09:37:33.493 - backend.autonomous.memory.research_metadata - INFO - Research metadata using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
+2026-05-05 09:37:33.493 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\final_answer
+2026-05-05 09:37:33.493 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\proofs
+2026-05-05 09:37:33.493 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms
+2026-05-05 09:37:33.509 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\papers
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'user_research_prompt' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'base_user_research_prompt' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_framing_active' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_framing_context' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_framing_reasoning' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_runtime_config' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'brainstorms' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'papers' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'next_topic_id' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'next_paper_id' to research metadata
+2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - User research prompt updated
+2026-05-05 09:37:33.527 - backend.autonomous.memory.research_metadata - INFO - Research metadata initialized
+2026-05-05 09:37:33.543 - backend.autonomous.memory.autonomous_rejection_logs - INFO - Autonomous rejection logs initialized
+2026-05-05 09:37:33.543 - backend.autonomous.core.autonomous_coordinator - INFO - Resetting RAG state for fresh autonomous research mode...
+2026-05-05 09:37:33.543 - backend.autonomous.core.autonomous_rag_manager - INFO - Resetting AutonomousRAGManager tracking state...
+2026-05-05 09:37:33.543 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager state reset
+2026-05-05 09:37:33.543 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
+2026-05-05 09:37:33.560 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
+2026-05-05 09:37:33.576 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
+2026-05-05 09:37:33.577 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
+2026-05-05 09:37:33.593 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
+2026-05-05 09:37:33.610 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
+2026-05-05 09:37:33.610 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
+2026-05-05 09:37:33.626 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
+2026-05-05 09:37:33.677 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
+2026-05-05 09:37:33.677 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
+2026-05-05 09:37:33.677 - backend.autonomous.core.autonomous_coordinator - INFO - RAG state reset and cleared for autonomous mode
+2026-05-05 09:37:33.677 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms
+2026-05-05 09:37:33.677 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\papers
+2026-05-05 09:37:33.677 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager initialized
+2026-05-05 09:37:33.677 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\final_answer
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_selector': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_completion_reviewer': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_reference_selector': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_title_selector': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_validator': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_redundancy_checker': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_brainstorm': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_brainstorm': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_framing_gate': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_brainstorm': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_paper': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_paper': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_paper': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_novelty': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_brainstorm': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_brainstorm': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_brainstorm': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_paper': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.692 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_paper': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.692 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_paper': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.693 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_certainty_assessor': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.693 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_format_selector': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.693 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_volume_organizer': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:33.693 - backend.autonomous.core.autonomous_coordinator - INFO - Configured Tier 3 Final Answer agents with api_client_manager
+2026-05-05 09:37:33.693 - backend.autonomous.core.autonomous_coordinator - INFO - No interrupted workflow found - checking for incomplete papers
+2026-05-05 09:37:33.693 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator initialized
+2026-05-05 09:37:33.710 - backend.shared.api_client_manager - INFO - Autonomous API logger callback set
+2026-05-05 09:37:33.710 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous API logging enabled
+2026-05-05 09:37:33.710 - backend.shared.token_tracker - INFO - TokenTracker reset
+2026-05-05 09:37:33.710 - backend.shared.token_tracker - INFO - TokenTracker timer started
+2026-05-05 09:37:33.710 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator started
+2026-05-05 09:37:42.744 - backend.autonomous.core.autonomous_coordinator - INFO - Starting topic exploration phase (target: 5 candidates)
+2026-05-05 09:37:42.744 - backend.aggregator.memory.shared_training - INFO - Brainstorm database file doesn't exist yet: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms\exploration_candidates.txt
+2026-05-05 09:37:42.744 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
+2026-05-05 09:37:42.759 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 1000000, Validator: 2000000
+2026-05-05 09:37:42.759 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 3 submitters with models ['x-ai/grok-4.3', 'moonshotai/kimi-k2.6', 'x-ai/grok-4.3'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
+2026-05-05 09:37:43.544 - backend.aggregator.core.coordinator - INFO - Currently loaded models: ['text-embedding-nomic-embed-text-v1.5']
+2026-05-05 09:37:43.544 - backend.aggregator.core.coordinator - INFO - Context window configuration:
+  - Submitter 1: 1000000 tokens (model: x-ai/grok-4.3)
+  - Submitter 2: 262000 tokens (model: moonshotai/kimi-k2.6)
+  - Submitter 3: 1000000 tokens (model: x-ai/grok-4.3)
+  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
+2026-05-05 09:37:43.544 - backend.aggregator.memory.shared_training - INFO - Created new shared training file
+2026-05-05 09:37:43.544 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
+2026-05-05 09:37:43.561 - backend.aggregator.memory.event_log - INFO - Created new event log file
+2026-05-05 09:37:43.561 - backend.aggregator.memory.local_training - INFO - Created new rejection log for submitter 1
+2026-05-05 09:37:43.561 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model x-ai/grok-4.3
+2026-05-05 09:37:43.561 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:43.561 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=x-ai/grok-4.3, provider=openrouter, context=1000000
+2026-05-05 09:37:43.561 - backend.aggregator.memory.local_training - INFO - Created new rejection log for submitter 2
+2026-05-05 09:37:43.570 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model moonshotai/kimi-k2.6
+2026-05-05 09:37:43.570 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=moonshotai/kimi-k2.6, provider=openrouter, context=262000
+2026-05-05 09:37:43.570 - backend.aggregator.memory.local_training - INFO - Created new rejection log for submitter 3
+2026-05-05 09:37:43.570 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model x-ai/grok-4.3
+2026-05-05 09:37:43.570 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=x-ai/grok-4.3, provider=openrouter, context=1000000
+2026-05-05 09:37:43.570 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
+2026-05-05 09:37:43.570 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
+2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 3 submitters
+2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
+2026-05-05 09:37:43.576 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
+2026-05-05 09:37:43.576 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
+2026-05-05 09:37:43.577 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
+2026-05-05 09:37:43.577 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
+2026-05-05 09:37:43.577 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
+2026-05-05 09:37:43.577 - backend.autonomous.core.autonomous_coordinator - INFO - Exploration aggregator started with parallel submitters
+2026-05-05 09:37:43.577 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
+2026-05-05 09:37:43.876 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
+2026-05-05 09:37:43.877 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
+2026-05-05 09:37:43.877 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
+2026-05-05 09:38:04.127 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 8ad7c7a9-5bac-4d75-b43b-d97e86b604bf (iteration 1)
+2026-05-05 09:38:04.976 - backend.aggregator.core.coordinator - INFO - Validator iteration 22 - batch validating 1 submissions: ['8ad7c7a9-5bac-4d75-b43b-d97e86b604bf']
+2026-05-05 09:38:13.593 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
+2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:38:13.593 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
+2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 1)
+2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
+2026-05-05 09:38:13.600 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 4 total chunks
+2026-05-05 09:38:13.611 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 1/5 candidates accepted
+2026-05-05 09:38:13.760 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
+2026-05-05 09:38:13.760 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
+2026-05-05 09:38:23.076 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission c4e0cff3-864a-4369-b923-c566bf2591af (iteration 1)
+2026-05-05 09:38:23.625 - backend.aggregator.core.coordinator - INFO - Validator iteration 33 - batch validating 1 submissions: ['c4e0cff3-864a-4369-b923-c566bf2591af']
+2026-05-05 09:38:35.643 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
+2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:38:35.643 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 1)
+2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 2)
+2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
+2026-05-05 09:38:35.643 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 2 total chunks
+2026-05-05 09:38:35.768 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
+2026-05-05 09:38:35.768 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
+2026-05-05 09:38:37.629 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 2/5 candidates accepted
+2026-05-05 09:38:47.097 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission fd6f9a4b-8e0a-45cb-b816-0ac7a0b2b575 (iteration 2)
+2026-05-05 09:38:47.707 - backend.aggregator.core.coordinator - INFO - Validator iteration 46 - batch validating 1 submissions: ['fd6f9a4b-8e0a-45cb-b816-0ac7a0b2b575']
+2026-05-05 09:38:55.508 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
+2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:38:55.508 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 2)
+2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 3)
+2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
+2026-05-05 09:38:55.508 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 2 total chunks
+2026-05-05 09:38:55.625 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
+2026-05-05 09:38:55.625 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
+2026-05-05 09:38:55.625 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 3/5 candidates accepted
+2026-05-05 09:39:05.825 - backend.shared.json_parser - ERROR - JSON TRUNCATION DETECTED: Model hit max_tokens during generation. Response has 1 unclosed braces, in_string=True. Response length: 743 chars. Last completed property at char 525: ...'obabilistic certificates for admissible lossiness?",\n  "reasoning": "This candidate is substantively'...
+2026-05-05 09:39:05.825 - backend.shared.json_parser - ERROR - JSON TRUNCATION DETECTED: Incomplete JSON structure. open_braces=1, open_brackets=0, in_string=True. Response length: 743 chars. Model hit max_tokens during generation.
+2026-05-05 09:39:05.825 - backend.shared.json_parser - ERROR - parse_json: JSON response truncated at max_tokens: incomplete structure with 1 unclosed braces, 0 unclosed brackets, in_string=True. Response length: 743 chars. Model needs to generate more concise output that fits within token limits.
+2026-05-05 09:39:05.825 - backend.aggregator.agents.submitter - INFO - Submitter 3: Initial JSON parse failed, attempting conversational retry
+2026-05-05 09:39:32.192 - backend.shared.lean4_client - INFO - Updated workspace lean-toolchain: 'leanprover/lean4:stable' -> 'leanprover/lean4:v4.30.0-rc2'
+2026-05-05 09:39:32.192 - backend.shared.lean4_client - INFO - Aligned workspace lean-toolchain with Mathlib; re-running lake update.
+2026-05-05 09:39:49.573 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 9c50c080-d45f-4b57-bbd5-759ca83d9313 (iteration 3)
+2026-05-05 09:39:49.622 - backend.aggregator.core.coordinator - INFO - Validator iteration 101 - batch validating 1 submissions: ['9c50c080-d45f-4b57-bbd5-759ca83d9313']
+2026-05-05 09:39:59.057 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
+2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:39:59.057 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 3)
+2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 4)
+2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
+2026-05-05 09:39:59.057 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 1 total chunks
+2026-05-05 09:39:59.140 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
+2026-05-05 09:39:59.140 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
+2026-05-05 09:39:59.657 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 4/5 candidates accepted
+2026-05-05 09:40:15.356 - backend.aggregator.agents.submitter - INFO - Submitter 3: First retry succeeded!
+2026-05-05 09:40:15.356 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 918a44e9-acb1-4680-9c48-01dbe53780d1 (iteration 2)
+2026-05-05 09:40:16.123 - backend.aggregator.core.coordinator - INFO - Validator iteration 119 - batch validating 1 submissions: ['918a44e9-acb1-4680-9c48-01dbe53780d1']
+2026-05-05 09:40:26.339 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
+2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:40:26.354 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 2)
+2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 5)
+2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
+2026-05-05 09:40:26.355 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 3 total chunks
+2026-05-05 09:40:26.439 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
+2026-05-05 09:40:26.439 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
+2026-05-05 09:40:27.678 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 5/5 candidates accepted
+2026-05-05 09:40:27.679 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: Target of 5 candidates reached
+2026-05-05 09:40:27.679 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
+2026-05-05 09:40:27.679 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
+2026-05-05 09:40:27.691 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
+2026-05-05 09:40:27.694 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
+2026-05-05 09:40:27.694 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 121
+2026-05-05 09:40:27.694 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 121 iterations - is_running=False
+2026-05-05 09:40:27.695 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
+2026-05-05 09:40:27.696 - backend.autonomous.core.autonomous_coordinator - INFO - Topic exploration complete: 5 candidates accepted
+2026-05-05 09:40:27.696 - backend.autonomous.core.autonomous_coordinator - INFO - Exploration: Restored shared_training_memory state
+2026-05-05 09:40:27.696 - backend.autonomous.core.autonomous_coordinator - INFO - Topic selection attempt 1
+2026-05-05 09:40:27.696 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generating topic selection with model x-ai/grok-4.3 (prompt=2689t, task_id=agg_sub1_000)
+2026-05-05 09:40:56.939 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generated submission - action=new_topic
+2026-05-05 09:40:56.939 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Validating topic selection with model x-ai/grok-4.1-fast (prompt=1406t, task_id=agg_val_000)
+2026-05-05 09:41:04.810 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Decision=accept
+2026-05-05 09:41:04.828 - backend.autonomous.memory.brainstorm_memory - INFO - Created new brainstorm: topic_001
+2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - Created new brainstorm: topic_001
+2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - No papers available for pre-brainstorm reference selection
+2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - Selected 0 reference papers for brainstorm
+2026-05-05 09:41:04.845 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
+2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - Per-paper model tracking enabled for brainstorm topic_001
+2026-05-05 09:41:04.845 - backend.aggregator.memory.shared_training - INFO - Reloaded 0 insights from C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms\brainstorm_topic_001.txt (submission count: 0)
+2026-05-05 09:41:04.855 - backend.autonomous.core.autonomous_coordinator - INFO - Reloaded 0 existing submissions from brainstorm database
+2026-05-05 09:41:04.855 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
+2026-05-05 09:41:04.855 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 1000000, Validator: 2000000
+2026-05-05 09:41:04.856 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 3 submitters with models ['x-ai/grok-4.3', 'moonshotai/kimi-k2.6', 'x-ai/grok-4.3'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
+2026-05-05 09:41:05.527 - backend.aggregator.core.coordinator - INFO - Currently loaded models: ['text-embedding-nomic-embed-text-v1.5']
+2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Context window configuration:
+  - Submitter 1: 1000000 tokens (model: x-ai/grok-4.3)
+  - Submitter 2: 262000 tokens (model: moonshotai/kimi-k2.6)
+  - Submitter 3: 1000000 tokens (model: x-ai/grok-4.3)
+  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
+2026-05-05 09:41:05.528 - backend.aggregator.memory.shared_training - INFO - Loaded 0 existing insights from shared training (submission count: 0)
+2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
+2026-05-05 09:41:05.528 - backend.aggregator.memory.event_log - INFO - Loaded 5 events from event log
+2026-05-05 09:41:05.528 - backend.aggregator.memory.local_training - INFO - Loaded 0 rejections for submitter 1
+2026-05-05 09:41:05.528 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model x-ai/grok-4.3
+2026-05-05 09:41:05.528 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=x-ai/grok-4.3, provider=openrouter, context=1000000
+2026-05-05 09:41:05.528 - backend.aggregator.memory.local_training - INFO - Loaded 0 rejections for submitter 2
+2026-05-05 09:41:05.528 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model moonshotai/kimi-k2.6
+2026-05-05 09:41:05.528 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=moonshotai/kimi-k2.6
+2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=moonshotai/kimi-k2.6, provider=openrouter, context=262000
+2026-05-05 09:41:05.538 - backend.aggregator.memory.local_training - INFO - Loaded 0 rejections for submitter 3
+2026-05-05 09:41:05.539 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model x-ai/grok-4.3
+2026-05-05 09:41:05.539 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=x-ai/grok-4.3
+2026-05-05 09:41:05.539 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=x-ai/grok-4.3, provider=openrouter, context=1000000
+2026-05-05 09:41:05.539 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
+2026-05-05 09:41:05.539 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast
+2026-05-05 09:41:05.539 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
+2026-05-05 09:41:05.539 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 3 submitters
+2026-05-05 09:41:05.540 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
+2026-05-05 09:41:05.540 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
+2026-05-05 09:41:05.540 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
+2026-05-05 09:41:05.541 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
+2026-05-05 09:41:05.541 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
+2026-05-05 09:41:05.541 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
+2026-05-05 09:41:05.541 - backend.autonomous.core.autonomous_coordinator - INFO - Aggregator started for brainstorm topic_001
+2026-05-05 09:41:05.541 - backend.autonomous.core.autonomous_coordinator - INFO - Starting fresh brainstorm with 0 acceptances
+2026-05-05 09:41:05.541 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
+2026-05-05 09:41:05.545 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
+2026-05-05 09:41:05.545 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
+2026-05-05 09:41:05.555 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
+2026-05-05 09:41:33.088 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission cfd4829a-3a5f-4ea2-8dfb-7dfcc0c5d377 (iteration 1)
+2026-05-05 09:41:33.570 - backend.aggregator.core.coordinator - INFO - Validator iteration 29 - batch validating 1 submissions: ['cfd4829a-3a5f-4ea2-8dfb-7dfcc0c5d377']
+2026-05-05 09:41:41.931 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
+2026-05-05 09:41:41.936 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:41:41.936 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
+2026-05-05 09:41:41.937 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 1)
+2026-05-05 09:41:41.938 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:41:41.938 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:41:41.938 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
+2026-05-05 09:41:41.938 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 13 total chunks
+2026-05-05 09:41:42.205 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
+2026-05-05 09:41:42.205 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
+2026-05-05 09:42:00.104 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission eb653b63-2e14-42df-87c8-971f683d4b54 (iteration 1)
+2026-05-05 09:42:00.952 - backend.aggregator.core.coordinator - INFO - Validator iteration 49 - batch validating 1 submissions: ['eb653b63-2e14-42df-87c8-971f683d4b54']
+2026-05-05 09:42:25.104 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
+2026-05-05 09:42:25.104 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:42:25.120 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 1)
+2026-05-05 09:42:25.121 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 2)
+2026-05-05 09:42:25.122 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:42:25.122 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:42:25.122 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
+2026-05-05 09:42:25.124 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 6 total chunks
+2026-05-05 09:42:25.304 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
+2026-05-05 09:42:25.304 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
+2026-05-05 09:42:46.150 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 1752a022-ebc0-44e7-854c-77c34bcc134f (iteration 2)
+2026-05-05 09:42:46.161 - backend.aggregator.core.coordinator - INFO - Validator iteration 71 - batch validating 1 submissions: ['1752a022-ebc0-44e7-854c-77c34bcc134f']
+2026-05-05 09:43:15.187 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission rejected (consecutive: 1)
+2026-05-05 09:43:15.187 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 1 (total: 1)
+2026-05-05 09:43:41.573 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 4ce1ad0e-18a7-4855-a408-ad71e44a2bad (iteration 2)
+2026-05-05 09:43:42.251 - backend.aggregator.core.coordinator - INFO - Validator iteration 99 - batch validating 1 submissions: ['4ce1ad0e-18a7-4855-a408-ad71e44a2bad']
+2026-05-05 09:43:59.534 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
+2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:43:59.534 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 2)
+2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 3)
+2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
+2026-05-05 09:43:59.550 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 5 total chunks
+2026-05-05 09:43:59.699 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
+2026-05-05 09:43:59.699 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
+2026-05-05 09:44:28.808 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 15b0c73a-a6c3-40b4-9ea5-dfa7b351ba61 (iteration 3)
+2026-05-05 09:44:29.665 - backend.aggregator.core.coordinator - INFO - Validator iteration 130 - batch validating 1 submissions: ['15b0c73a-a6c3-40b4-9ea5-dfa7b351ba61']
+2026-05-05 09:44:48.360 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission f5754b90-663f-4778-a822-927137536d11 (iteration 3)
+2026-05-05 09:44:57.829 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
+2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:44:57.829 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 2)
+2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 4)
+2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
+2026-05-05 09:44:57.829 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 3 total chunks
+2026-05-05 09:44:57.845 - backend.aggregator.core.coordinator - INFO - Validator iteration 131 - batch validating 1 submissions: ['f5754b90-663f-4778-a822-927137536d11']
+2026-05-05 09:44:57.948 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
+2026-05-05 09:44:57.948 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
+2026-05-05 09:45:26.368 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
+2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:45:26.368 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 3)
+2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 5)
+2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
+2026-05-05 09:45:26.368 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 8 total chunks
+2026-05-05 09:45:26.512 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
+2026-05-05 09:45:26.512 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
+2026-05-05 09:45:57.396 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 9863bbde-134c-4777-b6d7-4fdc20b73076 (iteration 4)
+2026-05-05 09:45:57.554 - backend.aggregator.core.coordinator - INFO - Validator iteration 163 - batch validating 1 submissions: ['9863bbde-134c-4777-b6d7-4fdc20b73076']
+2026-05-05 09:46:17.543 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #6
+2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
+2026-05-05 09:46:17.543 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 3)
+2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 6)
+2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
+2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
+2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
+2026-05-05 09:46:17.543 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 8 total chunks
+2026-05-05 09:46:17.694 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
+2026-05-05 09:46:17.694 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
+2026-05-05 09:46:33.252 - backend.api.routes.autonomous - INFO - Manual override: Forcing paper writing for brainstorm topic_001
+2026-05-05 09:46:33.252 - backend.autonomous.core.autonomous_coordinator - INFO - MANUAL OVERRIDE: Forcing paper writing for brainstorm topic_001
+2026-05-05 09:46:33.252 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
+2026-05-05 09:46:33.252 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
+2026-05-05 09:46:33.252 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
+2026-05-05 09:46:33.264 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
+2026-05-05 09:46:33.264 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 179
+2026-05-05 09:46:33.264 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 179 iterations - is_running=False
+2026-05-05 09:46:33.264 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
+2026-05-05 09:46:33.264 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm aggregator stopped by manual override
+2026-05-05 09:46:34.169 - backend.autonomous.core.autonomous_coordinator - INFO - Manual override detected - transitioning to paper writing
+2026-05-05 09:47:50.131 - backend.autonomous.agents.lemma_search_agent - INFO - Built Mathlib declaration index with 169436 entries
+2026-05-05 09:47:53.453 - backend.shared.lean4_client - WARNING - Lean 4 LSP unhealthy; falling back to subprocess mode: startup failed:
+2026-05-05 09:47:53.469 - backend.shared.lean4_client - INFO - Lean 4 LSP reader exited after idle shutdown
+2026-05-05 09:50:57.464 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
+2026-05-05 09:55:59.235 - backend.shared.lean4_client - WARNING - Lean 4 workspace infrastructure error detected; invalidating workspace cache and refetching Mathlib artifacts. Diagnostic: LEAN 4 WORKSPACE ERROR: Mathlib cache/workspace repair failed. This is an infrastructure problem, not a proof error. Lean reported missing or invalid compiled Mathlib artifacts. Original diagnostic: MOTOProofCheck_170b6342efa846cf8f8beb216ddbccca.lean:1:0: error: object file 'C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace\.lake\packages\mathlib\.lake\build\lib\lean\Mathlib\Analysis\SpecialFunctions\Integrals.olean' of module Mathlib.Analysis.SpecialFunctions.Integrals does not exist
+2026-05-05 09:57:32.423 - backend.shared.lean4_client - INFO - Removed stale .lake directory at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace\.lake
+2026-05-05 09:57:32.439 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
+2026-05-05 09:57:32.870 - backend.shared.lm_studio_client - WARNING - 'lms ps' timed out after 10s
+2026-05-05 09:57:32.906 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
+2026-05-05 09:57:36.296 - backend.shared.lean4_client - WARNING - Lean 4 workspace update failed: error: compiled configuration is invalid; run with '-R' to reconfigure
+
+
+P
+9:37:42 AM
+Proof framing enabled for this research run
+◉
+9:37:42 AM
+Topic exploration started (target: 5 candidates)
+✓
+9:38:13 AM
+Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 1)
+◈
+9:38:13 AM
+Exploration candidate 1/5 accepted:
+✓
+9:38:35 AM
+Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 2)
+◈
+9:38:37 AM
+Exploration candidate 2/5 accepted:
+✓
+9:38:55 AM
+Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 3)
+◈
+9:38:55 AM
+Exploration candidate 3/5 accepted:
+✓
+9:39:59 AM
+Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 4)
+◈
+9:39:59 AM
+Exploration candidate 4/5 accepted:
+✓
+9:40:26 AM
+Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 5)
+◈
+9:40:27 AM
+Exploration candidate 5/5 accepted:
+✓
+9:40:27 AM
+Topic exploration complete: 5 candidates collected from 5 attempts
+»
+9:41:04 AM
+Topic selected: How can the resolvent kernel and successive approximation theory for Volterra integral equations of the second kind be generalized to families of operators with time- or state-dependent coupling parameters, yielding explicit a-priori bounds on the deviation between solutions of the fully coupled system and those of its partly or fully decoupled truncations, thereby furnishing rigorous guarantees for controlled lossiness in variably-coupled computational models?
+✓
+9:41:41 AM
+Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 1)
+✓
+9:42:25 AM
+Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 2)
+✗
+9:43:15 AM
+Submitter 1 [grok-4.3]: ✗ REJECTED (total: 1)
+✓
+9:43:59 AM
+Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 3)
+✓
+9:44:57 AM
+Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 4)
+✓
+9:45:26 AM
+Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 5)
+✓
+9:46:17 AM
+Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 6)
+▶
+9:46:33 AM
+Manual override: Forcing paper writing for topic_001 (6 submissions)
+◌
+9:46:34 AM
+Proof check started for brainstorm topic_001
+#
+9:47:18 AM
+Proof check found 4 theorem candidate(s)
+>
+9:48:19 AM
+Proof attempt 1 started: Let V(ε) be the one-parameter family of Volterra operators (V(ε)x)(t) := ∫_0^t K(t,s; ε λ(t,s)) x(s) ds for ε ∈ [0,1]. Let x(ε) solve x = f + V(ε)x in C([0,T];X). Then the deviation δ = x(1) − x(0) admits the representation δ(t) = ∫_0^1 R_ε (∂V/∂ε(ε) x(ε))(t) dε, and under the uniform bound ||K|| ≤ M and Lipschitz constant L of K w.r.t. its coupling argument, ||δ(t)|| ≤ L ||λ||_∞ ||f|| (t exp(M t) − (exp(M t)−1)/M).
+>
+9:49:01 AM
+Proof attempt 1 started: Equip C([0,T];X) with the weighted norm |||x|||_\alpha := sup_t ||x(t)|| e^{-\alpha t}. Under linear growth and Lipschitz conditions on the kernel with constants M and L, the nonlinear Volterra map x ↦ f + V(x) is a contraction of ratio L/\alpha whenever \alpha > L. Consequently there exists a unique global solution satisfying ||x(t)|| ≤ C_\alpha exp(\alpha t). For a decoupled truncation V_0 the deviation δ satisfies the explicit weighted-norm bound |||δ|||_\alpha ≤ (ε_∞ / ((1 − L/\alpha) \alpha)) |||x_0|||_\alpha, which optimizes the exponential growth rate over admissible \alpha.
+>
+9:49:26 AM
+Proof attempt 1 started: Let x and x_0 be the solutions corresponding to coupling functions λ and λ_0 ≡ 0 on selected blocks. Using the Neumann series expansions x = ∑ V_λ^n f and x_0 = ∑ V_0^n f, the deviation admits the telescoping representation δ = ∑_{n=1}^∞ (V_λ^n − V_0^n) f. Under the Lipschitz assumption on K, ||V_λ^n − V_0^n|| ≤ n M^{n−1} ε with ε ≤ L T ||λ||_∞, yielding the explicit bound ||δ(t)|| ≤ (ε t / (1 − M t)^2) exp(M t) ||f||_∞ for t < 1/M. The same telescoping argument produces a strictly sharper estimate than the crude resolvent bound whenever the support of λ − λ_0 has small measure.
+>
+9:49:41 AM
+Proof attempt 1 started: For the block-structured Volterra operator T_λ = T_d + ΔT with measurable coupling λ : [0,T]×[0,T] → [0,1], the deviation δ = x − x_0 between the fully coupled and decoupled solutions satisfies the inhomogeneous Volterra equation δ = T_λ δ + ΔT x_0. The resolvent representation then gives the explicit integral bound ||δ(t)|| ≤ C ∫_0^t ε(s) exp(M t) ds, where ε(s) = sup_{u≤s} |λ(s,u)| · M_c(s) measures the effective coupling strength and C depends only on M and ||f||. The same bound continues locally for state-dependent λ(t,s,x(s)) as long as the solution remains inside a ball where the local Lipschitz constant is controlled.
+⚠
+9:55:51 AM
+Proof attempt 1 failed: MOTOProofCheck_4c04f51444d44489bd5de26445f30c60.lean:11:8: error: No goals to be solved MOTOProofCheck_4c04f51444d44489bd5de26445f30c60.lean:17:10: error(lean.unknownIdentifier): Unknown identifier `deriv_sub` MOTOProofCheck_4c04f51444d44489bd5de26445f30c60.lean:27:25: error(lean.invalidField): Invalid field `monotoneOn_of_deriv_nonneg`: The environment does not contain `Function.monotoneOn_of_deriv_nonneg`, so it is not possible to project the field `monotoneOn_of_deriv_nonneg` from an expressi...
+>
+9:55:51 AM
+Proof attempt 2 started: Let V(ε) be the one-parameter family of Volterra operators (V(ε)x)(t) := ∫_0^t K(t,s; ε λ(t,s)) x(s) ds for ε ∈ [0,1]. Let x(ε) solve x = f + V(ε)x in C([0,T];X). Then the deviation δ = x(1) − x(0) admits the representation δ(t) = ∫_0^1 R_ε (∂V/∂ε(ε) x(ε))(t) dε, and under the uniform bound ||K|| ≤ M and Lipschitz constant L of K w.r.t. its coupling argument, ||δ(t)|| ≤ L ||λ||_∞ ||f|| (t exp(M t) − (exp(M t)−1)/M).
+⚠
+9:57:36 AM
+Proof attempt 2 failed: LEAN 4 WORKSPACE ERROR: Mathlib cache/workspace repair failed. This is an infrastructure problem, not a proof error. Lean reported missing or invalid compiled Mathlib artifacts. Original diagnostic: error: compiled configuration is invalid; run with '-R' to reconfigure
\ No newline at end of file

From 06298fc647e267117e7468bb019a4563275dde69 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Sun, 17 May 2026 18:49:21 -0500
Subject: [PATCH 31/32] # MOTO v1.0.8

## Features
  - Added LeanOJ Proof Solver as a third standalone mode with dedicated model profiles, cumulative brainstorming, proof storming, skip-brainstorm control, and Lean 4-verified final template solving.
  - Added hosted/generic-mode runtime support with an API-only sandbox contract, FastEmbed embeddings, OpenRouter-only inference, and capability flags for the hosted web wrapper.
  - Added pruned-paper preservation and history downloads so context-excluded Stage 2 papers remain reviewable by users.
  - Added "supercharge" mode that incorporates a mini-version of Top-P exploration at the individual model level, increasing a model's intelligence before its final constituent answer within the harness itself. This has the largest impact on LM Studio and budget model users who are running smaller models.
  - The brainstorm mechanic for all modes can now produce Lean 4 proofs in the brainstorm stage if relevant to the user's prompt.

## Changes
  - Optimized proof-solving prompt flow to work directly toward the user prompt/template instead of only building exploratory context.
  - Added statement-alignment validation so Lean-accepted proof code must correspond to the intended theorem candidate before storage or placement.
  - Added shared proof registration and integrity gates across autonomous proof verification, compiler rigor mode, and LeanOJ.
  - Updated project rules to document hosted runtime behavior, LeanOJ, and shared proof-integrity architecture.
  - Added shared post-Lean proof integrity checks for autonomous paper proofs, compiler rigor mode, and LeanOJ.
  - Compatible models screen is now on all settings.
  - Added "Major mathematical discovery" validator ranking category for proofs and relabeled the gold category to "Minor Mathematical Discovery". Users are now able to tell which discoveries are major vs minor as per their validator model's direction injection review.
  - Optimized and audited .cursor rules folder to assist vibe coders and forks.
  - Parallel-run harness roles now utilize a temperature ladder such as 0, 0.2, 0.4, and 0.8 for concurrent LM Studio API calls on models loaded with multiple slots.
  - Expanded OpenRouter model/provider settings, raw settings tooling, and automated context settings to avoid provider outliers that disrupted automatic context sizing.
  - Improved API logging, boost routing visibility, and live activity UI for long-running workflow state.
  - Improved autonomous proof verification and paper context handling during brainstorm-to-paper and resume flows.
  - Improved compiler rigor, critique, and Wolfram tool flows.
  - Updated launchers, updater metadata, and Linux hosted entrypoint behavior.
  - Refreshed documentation, rules, ignore files, and test coverage.

## Bug Fixes
  - Hardened desktop API access with loopback defaults, token-authenticated HTTP routes, one-time WebSocket tickets, and CSRF-style origin checks.
  - Hardened hosted proxy auth with signed body-hash headers so unauthenticated request bodies are not buffered before rejection.
  - Hardened workflow startup, provider error handling, and log redaction paths for safer default and hosted operation.
  - Fixed Boost secret persistence so OpenRouter keys are no longer written to boost state and restored Boost reports when a key is needed.
  - Locked Z3 executable configuration to trusted startup settings and rejected runtime `z3_path` proof-settings input.
  - Hardened final-answer archive access against nested paper/brainstorm path traversal.
  - Hardened PDF export by sanitizing server-side HTML, enforcing size caps, disabling JavaScript, and blocking external Chromium requests.
  - Redacted API/Boost logs by default so full prompts, responses, Wolfram tool results, and legacy full payloads are not exposed through log routes.
  - Sanitized OpenRouter/provider error bodies before logging or surfacing them to avoid leaking echoed prompts or keys.
  - Removed OpenRouter API keys from model-list query strings and require headers or stored runtime keys instead.
  - Disabled hosted self-update mutation and made workflow start checks atomic across top-level modes.
  - Reduced proof-status path disclosure by returning safe Lean/Z3 path labels instead of absolute local paths.
  - Fixed retry transcript hygiene so private model thought/channel tokens cannot poison retries, memory, or RAG context.
  - Fixed Mathlib and Lean 4 co-dependence bug that disrupted some users' proof generation.
  - Rejected fake proof devices (`axiom`, `constant`, `opaque`) introduced by generated Lean code unless already present in the source/template context.
  - Fixed LeanOJ skip-brainstorm handling so the skip request is not consumed before the brainstorm phase.
  - Fixed generic API helper path handling so configured API bases are respected.
  - Fixed API call logs so standard model calls are recorded alongside boosted calls.
  - Fixed OS hover pop-up layering showing behind neighboring boxes.
  - Fixed OpenRouter credit exhaustion causing proofs to be skipped if the user ran out during the proof creation step.
  - Fixed RAG lock release on cancelled embedding/indexing tasks so resumed research cannot stall.
  - Fixed autonomous paper writer resume so completed brainstorms restart at the proof/paper handoff instead of zero.
  - Fixed manual Lean 4 proof checks so they use the currently selected role models instead of stale brainstorm or paper generation models.
  - Fixed Lean 4 proof completion UI so finished proof passes show accurate live activity counts.

  Authored by Patrick White, Patrick@Intrafere.com
---
 .cursor/rules/api-key-controls.mdc            |   62 +-
 .cursor/rules/hosted-web-contract.mdc         |  193 +
 .cursor/rules/json-prompt-design.mdc          |  331 +-
 ...interaction-and-rule-interaction-rules.mdc |   20 +-
 ...-aggregator-tool-design-specifications.mdc |   11 +-
 ...-and-part-2-cointeraction-architecture.mdc |   23 +-
 ...t-2-compiler-tool-design-specification.mdc |   41 +-
 .../rules/part-3-autonomous-research-mode.mdc |  152 +-
 ...program-directory-and-file-definitions.mdc |  107 +-
 .../rules/rag-design-for-overall-program.mdc  |   52 +-
 .dockerignore                                 |    2 +-
 .gitattributes                                |   16 +
 .gitignore                                    |    4 +
 HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md        |  400 ++
 LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md       |   25 +
 LEANOJ_PROBLEM_11_PROMPT.md                   |   34 +
 README.md                                     |   39 +-
 backend/aggregator/agents/submitter.py        |  112 +-
 backend/aggregator/agents/validator.py        |   24 +-
 backend/aggregator/core/coordinator.py        |  267 +-
 backend/aggregator/core/queue_manager.py      |   43 +-
 backend/aggregator/core/rag_manager.py        |  134 +-
 backend/aggregator/memory/local_training.py   |   16 +-
 .../aggregator/prompts/submitter_prompts.py   |   64 +-
 .../aggregator/prompts/validator_prompts.py   |   99 +-
 backend/api/main.py                           |   30 +
 backend/api/middleware.py                     |  122 +-
 backend/api/proxy_auth.py                     |   77 +-
 backend/api/routes/__init__.py                |    4 +-
 backend/api/routes/aggregator.py              |  159 +-
 backend/api/routes/autonomous.py              |  529 +-
 backend/api/routes/boost.py                   |   37 +-
 backend/api/routes/compiler.py                |  268 +-
 backend/api/routes/download.py                |  162 +-
 backend/api/routes/leanoj.py                  |  392 ++
 backend/api/routes/openrouter.py              |   16 +-
 backend/api/routes/proofs.py                  |   83 +-
 backend/api/routes/update.py                  |   12 +-
 backend/api/routes/websocket.py               |   46 +-
 backend/api/routes/workflow.py                |    7 +-
 .../agents/final_answer/certainty_assessor.py |    3 +-
 .../autonomous/agents/lemma_search_agent.py   |    3 +
 .../autonomous/agents/paper_title_selector.py |    8 +-
 .../agents/proof_formalization_agent.py       |    5 +
 .../agents/proof_identification_agent.py      |    5 +
 .../autonomous/core/autonomous_coordinator.py |  929 ++-
 .../autonomous/core/autonomous_rag_manager.py |   18 +
 backend/autonomous/core/proof_novelty.py      |   13 +-
 backend/autonomous/core/proof_registration.py |  216 +
 .../core/proof_verification_stage.py          |  375 +-
 .../memory/autonomous_api_logger.py           |  160 +-
 .../autonomous/memory/final_answer_memory.py  |   64 +-
 backend/autonomous/memory/paper_library.py    |  506 +-
 backend/autonomous/memory/proof_database.py   |   56 +-
 .../autonomous/memory/research_metadata.py    |   45 +-
 backend/autonomous/memory/session_manager.py  |  217 +-
 .../autonomous/prompts/completion_prompts.py  |   24 +-
 .../prompts/final_answer_prompts.py           |   20 +
 .../prompts/paper_continuation_prompts.py     |   13 +-
 .../prompts/paper_redundancy_prompts.py       |   15 +-
 .../prompts/paper_reference_prompts.py        |   38 +-
 .../paper_title_exploration_prompts.py        |    5 +
 .../autonomous/prompts/paper_title_prompts.py |    7 +
 backend/autonomous/prompts/proof_prompts.py   |  123 +-
 .../prompts/topic_exploration_prompts.py      |   14 +-
 backend/autonomous/prompts/topic_prompts.py   |   19 +-
 .../validation/paper_redundancy_checker.py    |   22 +-
 backend/compiler/agents/critique_submitter.py |  294 +-
 .../compiler/agents/high_context_submitter.py |   71 +-
 .../compiler/agents/high_param_submitter.py   |  231 +-
 backend/compiler/core/compiler_coordinator.py |  967 +---
 backend/compiler/memory/paper_memory.py       |  130 +-
 .../compiler/prompts/construction_prompts.py  |   77 +-
 backend/compiler/prompts/critique_prompts.py  | 1032 +---
 backend/compiler/prompts/outline_prompts.py   |   13 +
 backend/compiler/prompts/review_prompts.py    |    2 +
 backend/compiler/prompts/rigor_prompts.py     |   63 +-
 .../compiler/validation/compiler_validator.py |  256 +-
 backend/leanoj/__init__.py                    |    1 +
 backend/leanoj/core/__init__.py               |    1 +
 backend/leanoj/core/leanoj_context.py         |  829 +++
 backend/leanoj/core/leanoj_coordinator.py     | 5084 +++++++++++++++++
 backend/leanoj/prompts.py                     | 1009 ++++
 backend/shared/api_client_manager.py          |  440 +-
 backend/shared/boost_logger.py                |  144 +-
 backend/shared/boost_manager.py               |   95 +-
 backend/shared/brainstorm_proof_gate.py       |  341 ++
 backend/shared/build_info.py                  |    2 +-
 backend/shared/config.py                      |   40 +-
 backend/shared/json_parser.py                 |  302 +-
 backend/shared/lean4_client.py                |   35 +-
 backend/shared/lean_proof_integrity.py        |  233 +
 backend/shared/lm_studio_client.py            |  285 +-
 backend/shared/log_redaction.py               |   29 +
 backend/shared/model_error_utils.py           |   39 +
 backend/shared/models.py                      |  225 +-
 backend/shared/openrouter_client.py           |  103 +-
 backend/shared/smt_client.py                  |    7 +-
 backend/shared/wolfram_alpha_client.py        |    8 +-
 backend/shared/workflow_start_guard.py        |   23 +
 frontend/index.html                           |    2 +-
 frontend/package-lock.json                    |    4 +-
 frontend/package.json                         |    2 +-
 frontend/src/App.jsx                          | 1003 +++-
 frontend/src/components/ApiCallLogs.jsx       |  412 ++
 frontend/src/components/BoostControlModal.jsx |   52 +-
 .../components/CritiqueNotificationStack.jsx  |    8 +-
 frontend/src/components/HelpTooltip.jsx       |   18 +-
 .../components/HighlightedModelsSidebar.jsx   |  200 +
 frontend/src/components/LiveActivityFeed.jsx  |   69 +
 .../src/components/PaperCritiqueModal.jsx     |    9 +-
 .../src/components/ProofStrengthBadge.jsx     |   18 +
 frontend/src/components/RawSettingsEditor.jsx |   39 +
 frontend/src/components/WorkflowPanel.css     |    9 +
 frontend/src/components/WorkflowPanel.jsx     |   16 +-
 .../aggregator/AggregatorInterface.jsx        |   18 +-
 .../aggregator/AggregatorSettings.jsx         |  633 +-
 .../autonomous/AutonomousResearch.css         |  245 +-
 .../AutonomousResearchInterface.jsx           |   29 +-
 .../autonomous/AutonomousResearchLogs.jsx     |  407 +-
 .../autonomous/AutonomousResearchSettings.jsx |  540 +-
 .../components/autonomous/BrainstormList.jsx  |    7 +-
 .../autonomous/FinalAnswerLibrary.css         |   77 +
 .../autonomous/FinalAnswerLibrary.jsx         |  141 +-
 .../autonomous/MathematicalProofs.css         |  108 +-
 .../autonomous/MathematicalProofs.jsx         |   69 +-
 .../components/autonomous/PaperLibrary.jsx    |   77 +-
 .../src/components/autonomous/ProofGraph.css  |    5 +
 .../src/components/autonomous/ProofGraph.jsx  |    1 +
 .../components/autonomous/ProofLibrary.css    |   84 +
 .../components/autonomous/ProofLibrary.jsx    |   54 +-
 .../autonomous/ProofNotificationStack.jsx     |   14 +-
 .../autonomous/Stage2PaperHistory.css         |   43 +
 .../autonomous/Stage2PaperHistory.jsx         |  144 +-
 .../components/compiler/CompilerInterface.jsx |  154 +-
 .../src/components/compiler/CompilerLogs.jsx  |   82 +-
 .../components/compiler/CompilerSettings.jsx  |  659 ++-
 .../src/components/compiler/LivePaper.jsx     |   79 +-
 .../components/leanoj/LeanOJBrainstorms.jsx   |  265 +
 .../src/components/leanoj/LeanOJInterface.jsx |  170 +
 frontend/src/components/leanoj/LeanOJLogs.jsx |   20 +
 .../components/leanoj/LeanOJMasterProof.css   |  167 +
 .../components/leanoj/LeanOJMasterProof.jsx   |  207 +
 .../leanoj/LeanOJMathematicalProofs.jsx       |  312 +
 .../components/leanoj/LeanOJProofLibrary.jsx  |  352 ++
 .../src/components/leanoj/LeanOJSettings.jsx  |  840 +++
 frontend/src/components/leanoj/index.js       |    7 +
 frontend/src/components/settings-common.css   |  114 +
 frontend/src/hooks/useProofCheckRuntime.js    |   91 +-
 frontend/src/index.css                        |   70 +
 frontend/src/index.jsx                        |    3 +-
 frontend/src/services/api.js                  |  202 +-
 frontend/src/services/websocket.js            |   32 +-
 frontend/src/utils/activityStyles.js          |  320 ++
 frontend/src/utils/autonomousProfiles.js      |  163 +-
 frontend/src/utils/downloadHelpers.js         |    8 +-
 frontend/src/utils/leanojProfiles.js          |  278 +
 frontend/src/utils/openRouterSelection.js     |  347 +-
 frontend/src/utils/runtimeConfig.js           |   74 +
 frontend/vite.config.js                       |    2 +-
 Launch MOTO.sh => linux-ubuntu-launcher.sh    |    2 +-
 moto-update-manifest.json                     |    4 +-
 moto_launcher.py                              |   14 +-
 moto_updater.py                               |    2 +-
 package.json                                  |    2 +-
 randomlog.txt                                 |  467 --
 tests/test_lean4_client.py                    |    6 +-
 tests/test_leanoj_coordinator.py              | 2255 ++++++++
 tests/test_wolfram_tool_loop.py               |    2 +-
 169 files changed, 25987 insertions(+), 5891 deletions(-)
 create mode 100644 .cursor/rules/hosted-web-contract.mdc
 create mode 100644 .gitattributes
 create mode 100644 HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md
 create mode 100644 LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md
 create mode 100644 LEANOJ_PROBLEM_11_PROMPT.md
 create mode 100644 backend/api/routes/leanoj.py
 create mode 100644 backend/autonomous/core/proof_registration.py
 create mode 100644 backend/leanoj/__init__.py
 create mode 100644 backend/leanoj/core/__init__.py
 create mode 100644 backend/leanoj/core/leanoj_context.py
 create mode 100644 backend/leanoj/core/leanoj_coordinator.py
 create mode 100644 backend/leanoj/prompts.py
 create mode 100644 backend/shared/brainstorm_proof_gate.py
 create mode 100644 backend/shared/lean_proof_integrity.py
 create mode 100644 backend/shared/log_redaction.py
 create mode 100644 backend/shared/model_error_utils.py
 create mode 100644 backend/shared/workflow_start_guard.py
 create mode 100644 frontend/src/components/ApiCallLogs.jsx
 create mode 100644 frontend/src/components/HighlightedModelsSidebar.jsx
 create mode 100644 frontend/src/components/LiveActivityFeed.jsx
 create mode 100644 frontend/src/components/ProofStrengthBadge.jsx
 create mode 100644 frontend/src/components/RawSettingsEditor.jsx
 create mode 100644 frontend/src/components/leanoj/LeanOJBrainstorms.jsx
 create mode 100644 frontend/src/components/leanoj/LeanOJInterface.jsx
 create mode 100644 frontend/src/components/leanoj/LeanOJLogs.jsx
 create mode 100644 frontend/src/components/leanoj/LeanOJMasterProof.css
 create mode 100644 frontend/src/components/leanoj/LeanOJMasterProof.jsx
 create mode 100644 frontend/src/components/leanoj/LeanOJMathematicalProofs.jsx
 create mode 100644 frontend/src/components/leanoj/LeanOJProofLibrary.jsx
 create mode 100644 frontend/src/components/leanoj/LeanOJSettings.jsx
 create mode 100644 frontend/src/components/leanoj/index.js
 create mode 100644 frontend/src/utils/activityStyles.js
 create mode 100644 frontend/src/utils/leanojProfiles.js
 rename Launch MOTO.sh => linux-ubuntu-launcher.sh (94%)
 delete mode 100644 randomlog.txt
 create mode 100644 tests/test_leanoj_coordinator.py

diff --git a/.cursor/rules/api-key-controls.mdc b/.cursor/rules/api-key-controls.mdc
index 7ab5b02..dd3d8ec 100644
--- a/.cursor/rules/api-key-controls.mdc
+++ b/.cursor/rules/api-key-controls.mdc
@@ -1,5 +1,5 @@
 ---
-alwaysApply: false
+alwaysApply: true
 ---
 
 # API Key Controls & Workflow Management System
@@ -11,12 +11,16 @@ Enables OpenRouter integration with automatic LM Studio fallback (default mode)
 **Key Features:**
 - **Per-Role OpenRouter Selection**: Each role independently uses LM Studio or OpenRouter (default mode); all roles use OpenRouter in generic mode
 - **Global OpenRouter API Key**: Single key for all per-role OpenRouter selections within one running backend instance. Boost can reuse it when no explicit boost-only override key is provided.
-- **OpenRouter Auto-Fill**: OpenRouter selectors auto-fill context window from model `context_length` and auto-fill max output tokens as `min(20% of model context_length, smallest available host max_completion_tokens)`
+- **OpenRouter Auto-Fill**: OpenRouter selectors fetch provider endpoint metadata and compute host-aware context/output settings from a capable endpoint set. Auto mode must ignore known weak hosts (currently Venice) and low/missing-cap outliers before computing context/max-output; manual host selection uses that exact host.
+- **OpenRouter Reasoning Effort**: Every OpenRouter role exposes a visible reasoning-effort selector. Default `auto` sends maximum OpenRouter reasoning effort (`xhigh`) through the normalized `reasoning.effort` request object; users may lower it or set `none`.
 - **LM Studio Fallback** (default mode only): Optional fallback per role on credit exhaustion
 - **Free Model Cooldown Handling**: SERIAL BOTTLENECK pause, free model looping, and auto-selector backup (see below)
-- **Boost Mode**: Selective task acceleration via two modes, using either an explicit boost override key or the active global OpenRouter key:
+- **Boost Mode**: Selective task acceleration via next-count, category, always-prefer, and per-task routing controls, using either an explicit boost override key or the active global OpenRouter key:
   - **Boost Next X Calls**: Counter-based, next X API calls regardless of task ID
-  - **Category Boost**: Role-based, boosts all calls for specific role categories (Aggregator and Compiler only; Autonomous agents inherit from their parent roles automatically)
+  - **Category Boost**: Role-based, boosts all calls for specific role categories across Aggregator, Compiler, Autonomous/proof, and LeanOJ roles
+  - **Always Prefer Boost**: Attempts boost for every API call, falling back to the primary route on boost failure
+  - **Per-Task Toggle**: Legacy task-ID boost controls for individual workflow tasks
+- **Supercharge**: Per-role setting that wraps one role answer as 4 parallel diversified full answer attempts plus a 5th same-model deterministic synthesis answer. If Boost applies, all 5 calls use the Boost route/model/provider/settings.
 - **System works without LM Studio**: Defaults to OpenRouter when LM Studio unavailable; generic mode never attempts LM Studio
 
 ## Mode-Specific Behavior
@@ -39,7 +43,20 @@ Enables OpenRouter integration with automatic LM Studio fallback (default mode)
 **Boost is a ROUTING decision, NOT a CONCURRENCY decision.**
 - Boost affects which API endpoint is used, NOT whether submitters run in parallel or serial
 - Aggregation submitters ALWAYS run in parallel regardless of boost status (unless single-model mode)
-- Single-model mode: triggered when all submitters AND validator use the SAME configured model ID. Boost routing does NOT trigger single-model mode.
+- LeanOJ topic and brainstorm submitters ALWAYS run in parallel regardless of boost/provider routing; validation batches up to 3 topics/submissions.
+- Single-model mode: triggered when all submitters AND validator use the SAME configured model ID, except when LM Studio has multiple loaded same-base numeric `:#` instances (for example `model:1`, `model:2`) for that model; in that case submitters may run in parallel and the LM Studio client routes independent calls to idle sibling instances. Boost routing does NOT trigger single-model mode.
+
+### Supercharge
+
+**Supercharge is a per-role answer-quality wrapper, NOT a routing mode.**
+- `ModelConfig.supercharge_enabled` and related request fields control it per role.
+- Frontend Supercharge controls are developer-mode-only; start/generate request payloads must force Supercharge off unless developer mode is active.
+- `api_client_manager.generate_completion()` is the only implementation choke point: roles with Supercharge enabled run 4 parallel full answer attempts, then a 5th synthesis call that receives the original messages plus the prior 4 outputs and returns the single role answer.
+- Calls 1-4 must be full answer attempts in the original role format/schema, not short notes.
+- Calls 1-4 intentionally violate the default deterministic temperature rule with the fixed ladder `[0.0, 0.2, 0.4, 0.8]` so concurrent candidates diversify; the synthesis call stays `temperature=0.0`.
+- The synthesis call must produce the final answer in the exact original required format/schema and must not mention Supercharge or candidate attempts.
+- Tool-call requests (`tools` or `tool_choice`) bypass Supercharge because assistant/tool turn pairing must remain exact.
+- If Boost applies to the original task, all 5 Supercharge calls force the same Boost mode and Boost config first; Boost failures are strict for Supercharge and must not silently mix in the primary route. `boost_next_count` is consumed once for the successful boosted overall Supercharge answer, not once per internal attempt.
 
 ### Backend Core
 
@@ -48,11 +65,19 @@ Enables OpenRouter integration with automatic LM Studio fallback (default mode)
 - App Attribution Headers: `HTTP-Referer: https://intrafere.com/moto-autonomous-home-ai/`, `X-Title: MOTO Autonomous ASI`
 - Credit exhaustion detection: HTTP 402 OR error messages containing "credit", "insufficient", "balance", "quota", "key limit", "limit exceeded"
 - Raises `CreditExhaustionError` on exhaustion (no retries). Retries transient errors (max 3).
-- Temperature=0.0 default. No stop sequences (removed — caused premature truncation with certain models).
+- Temperature=0.0 default except Supercharge candidate attempts and parallel brainstorm submitter lanes. No stop sequences (removed — caused premature truncation with certain models).
 - Exposes both model-level metadata (`/models`) and provider endpoint metadata (`/models/{author}/{slug}/endpoints`) so the UI can compute safe host-aware OpenRouter auto-fill values.
+- Auto-routed calls include a provider `ignore` list for known weak hosts so OpenRouter can still fall back across capable providers. Explicit user-selected providers use `provider.order=[provider]` with `allow_fallbacks=false` so requests cannot silently fall back to a host whose limits were not used for settings.
 
 #### APIClientManager (`backend/shared/api_client_manager.py`)
-- Central router for all API calls: boost check → role's OpenRouter (with resettable fallback) → LM Studio (default mode) or OpenRouter-only (generic mode)
+- Central router for all API calls: optional Supercharge wrapper → boost check → role's OpenRouter (with resettable fallback) → LM Studio (default mode) or OpenRouter-only (generic mode)
+- Temperature policy exceptions live here: Supercharge attempts use `[0.0, 0.2, 0.4, 0.8]`; parallel brainstorm submitter lanes use `[0.0, 0.1, ..., 0.9]`. Validators, compiler roles, proof/final roles, JSON retries, and single-model sequential submitters stay `0.0`.
+- LM Studio instance sharing lives below this router in `lm_studio_client.generate_completion()`: only default-mode LM Studio calls can share same-base loaded numeric `:#` siblings, response metadata must preserve both the configured model and effective instance, and state-sensitive workflow ordering must not change.
+- Raw provider/model transport output must never be replayed into MOTO retry prompts, feedback memory, accepted memory, RAG, or durable context. Conversational retries are required, but failed-output context must first pass `sanitize_model_output_for_retry_context()` so only reusable visible answer text remains. The sanitizer strips known private thought/channel/control tokens only as transport scaffolding outside visible JSON/string content, not ordinary visible Lean/math/operator syntax such as `<|` or literal visible marker text such as `<|channel>final` / `<channel|>` inside content.
+- Parser exception strings that are inserted into retry prompts must not contain raw response excerpts; raw excerpts are allowed only in logs/observability surfaces that are never reused as model context.
+- Observability surfaces must default to metadata/previews with secret redaction. Provider keys, URL query keys, Wolfram query/result text, and full prompt/response bodies must not be persisted or broadcast unless an explicit trusted debug path opts in. Legacy full-payload log fields are scrubbed from persisted API logs on logger startup.
+- Tool-call assistant/tool protocol turns are the only exception where exact assistant content/structure may need preservation; ordinary JSON retry assistant turns are not tool protocol turns and must use sanitized retry context.
+- Generic mode must normalize or reject LM Studio role configs and must never fall through to `lm_studio_client.generate_completion()`, even if a direct API caller submits legacy `provider="lm_studio"` or an LM fallback value.
 - Generic mode: `get_embeddings()` early-returns to `FastEmbedProvider` before the LM Studio → OpenRouter fallback chain
 - Tracks fallback state per role: `_role_fallback_state: Dict[str, str]`
 - `reset_openrouter_fallbacks()`: Resets all roles originally configured for OpenRouter back from LM Studio fallback. Called automatically on API key set, or manually via reset endpoint.
@@ -60,12 +85,15 @@ Enables OpenRouter integration with automatic LM Studio fallback (default mode)
 
 **CRITICAL REQUIREMENT - Role Configuration:**
 - **EVERY role calling `api_client_manager.generate_completion()` MUST be configured via `api_client_manager.configure_role()`**
-- This includes: aggregator submitters/validator, compiler submitters/validator/critique, autonomous agents, Tier 3 final answer agents
+- This includes: aggregator submitters/validator, compiler submitters/validator/critique, autonomous agents, Tier 3 final answer agents, and LeanOJ roles/topic/brainstorm submitters
+- Role configs must preserve `supercharge_enabled` when copied into proof snapshots, manual proof helpers, child Aggregator/Compiler coordinators, and LeanOJ grouped roles.
 - **Proof agents (Part 3, optional)** do NOT have standalone role configs. `ProofVerificationStage` reuses the stored `ProofRuntimeConfigSnapshot` (brainstorm submitter, high-context submitter, validator) captured by `autonomous_coordinator._build_proof_runtime_config_snapshot()` and persisted via `research_metadata.set_proof_runtime_config()`. Manual `POST /api/proofs/check` requires `lean4_enabled=True` AND a seeded snapshot — start autonomous research once to seed it.
 
 **Boost Mode Priority** (`should_use_boost(task_id)`):
 1. Boost Next X: `boost_next_count > 0` → True
-2. Category Boost: `_extract_role_prefix(task_id) in boosted_categories` → True
+2. Always Prefer Boost: `always_prefer_boost=True` → True
+3. Category Boost: `_extract_role_prefix(task_id) in boosted_categories` → True
+4. Per-Task Toggle: exact task ID is enabled → True
 
 **Counter Decrement:** `boost_next_count` decrements ONLY on successful boost API calls. Failed/exhausted calls do NOT decrement.
 
@@ -78,16 +106,18 @@ Enables OpenRouter integration with automatic LM Studio fallback (default mode)
 - `compiler_high_param` → "Compiler High-Param"
 - `compiler_validator` → "Compiler Validator"
 - `autonomous_*` → "Autonomous"
+- `proof_*` / `autonomous_proof_*` → proof-specific categories
+- `leanoj_*` → LeanOJ topic, brainstorm, subproof, final-solver, and validator categories; LeanOJ path-decision tasks are absorbed into Final Solver boost routing
 
 #### BoostManager (`backend/shared/boost_manager.py`)
-- Singleton. Key methods: `set_boost_config`, `clear_boost`, `set_boost_next_count`, `toggle_category_boost`, `should_use_boost` (main check for coordinators), `consume_boost_count` (only after successful boost call)
-- Boost can use an **explicit override** OpenRouter API key, or it falls back to the active global OpenRouter key. A temporary `OpenRouterClient` is created per boosted task and closed immediately after.
+- Singleton. Key methods: `set_boost_config`, `clear_boost`, `set_boost_next_count`, `toggle_category_boost`, `set_always_prefer`, `toggle_task_boost`, `should_use_boost` (main check for coordinators), `consume_boost_count` (only after successful boost call)
+- Boost can use an **explicit override** OpenRouter API key in process memory only, or it falls back to the active global OpenRouter key. Boost state persistence must never write provider key material; legacy persisted boost keys are scrubbed on load. A temporary `OpenRouterClient` is created per boosted task and closed immediately after.
 - **Autonomous agent task ID inheritance**: All autonomous orchestration agents use parent role task ID prefixes — Topic Selector/Completion Reviewer/Reference Selector/Paper Title Selector/Tier 3 agents use `agg_sub1_*`; Topic Validator/Redundancy Checker use `agg_val_*`. Boosting a parent role automatically covers all autonomous agents that run on that model. **Proof agents are the exception**: they use their own prefixes (`proof_id_*`, `proof_lemma_*`, `proof_form_*`, `proof_novelty_*`, `proof_framing_gate_*`) because they run under the `autonomous_proof_*` role IDs with distinct runtime-snapshot configs; Aggregator/Validator category boosts do NOT cover proof agents.
 
 #### BoostLogger (`backend/shared/boost_logger.py`)
 - Singleton. Log file resolves under the active instance data root (default desktop path: `backend/data/boost_api_log.txt`)
 - Methods: `log_api_call`, `get_logs(limit)`, `clear_logs`, `get_stats`
-- Boost logs are merged into the main API call log view; boost endpoints remain available for boost-only debugging.
+- Boost logs are merged into the main API call log view; persisted/default route output must avoid provider keys and raw full prompt/response bodies.
 
 #### Workflow Task Generation (Internal Backend Tracking)
 Coordinators track task IDs internally for boost routing. The frontend does NOT display predicted task lists.
@@ -144,7 +174,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - `POST /api/openrouter/reset-exhaustion` — Reset all credit exhaustion flags + role fallback states mid-session
 - `DELETE /api/openrouter/api-key` — Clear key
 - `GET /api/openrouter/api-key-status` — `{ has_key, enabled }`
-- `GET /api/openrouter/models` — Available models (also caches free models for rotation)
+- `GET /api/openrouter/models` — Available models (also caches free models for rotation); temporary keys must use `Authorization: Bearer`, never URL query parameters
 - `GET /api/openrouter/providers/{model_id}` — Providers + endpoint metadata for model
 - `GET /api/openrouter/free-model-settings` — `{ looping_enabled, auto_selector_enabled, ... }`
 - `POST /api/openrouter/free-model-settings` — Update free model settings (body: `FreeModelSettings`)
@@ -176,7 +206,7 @@ Predictions refresh: after initialization, each task completion, mode switches,
 - `looping_enabled` — rotate to next available free model on rate limit (highest context first)
 - `auto_selector_enabled` — fall back to `openrouter/free` (131072 context) when all free models exhausted
 
-**Rotation chain** (in `api_client_manager._try_free_model_rotation()` called from RateLimitError handler):
+**Rotation chain** (in `api_client_manager._try_free_model_rotation()` called from RateLimitError handler; keep optional `tools` / `tool_choice` passed through when that helper is used):
 1. If `looping_enabled`: **iterate through ALL** non-rate-limited free models (highest context first) using `tried_models` set to avoid re-trying. On each `RateLimitError`, refresh rate-limited dict and continue to next model. On `CreditExhaustionError`, stop looping.
 2. If all looping candidates exhausted and `auto_selector_enabled`: try `openrouter/free`
 3. If still failed: check LM Studio fallback (default mode only; generic mode skips this)
@@ -214,6 +244,6 @@ Predictions refresh: after initialization, each task completion, mode switches,
 
 **Hosted generic mode (no keyring):** Provider keys are env-injected at sandbox launch and/or set via proxied MOTO API routes. `secret_store` persistence is bypassed; keys live in sandbox memory only. Re-injection required after sandbox recreation. `OPENROUTER_API_KEY` env var auto-loaded during lifespan if present.
 
-**localStorage:** `workflow_panel_collapsed`, `aggregatorConfig`, `compiler_settings`, `autonomousConfig` (includes `freeModelLooping`, `freeModelAutoSelector`). When `MOTO_FRONTEND_STORAGE_PREFIX` / `VITE_MOTO_STORAGE_PREFIX` is active, these keys are automatically namespaced per instance.
+**localStorage:** `workflow_panel_collapsed`, `aggregatorConfig`, `compiler_settings`, `autonomousConfig` (includes `freeModelLooping`, `freeModelAutoSelector`, per-role Supercharge settings). When `MOTO_FRONTEND_STORAGE_PREFIX` / `VITE_MOTO_STORAGE_PREFIX` is active, these keys are automatically namespaced per instance.
 
-**Session (in-memory):** fallback state per role, boosted task IDs, boost next count, boosted categories, completed task IDs, free model manager state. Boost logs and boost state persist under the active instance data root (`boost_api_log.txt`, `boost_state.json`) and are merged into the main API call log view.
+**Session (in-memory):** fallback state per role, boosted task IDs, boost next count, boosted categories, completed task IDs, free model manager state, and any explicit Boost override key. Boost override keys must never be persisted to `boost_state.json`; legacy plaintext keys are ignored/scrubbed on load. Boost logs and non-secret boost routing state persist under the active instance data root (`boost_api_log.txt`, `boost_state.json`) and are merged into the main API call log view. API call logs store previews/metadata by default; full prompt/response payload persistence is debug opt-in only, and provider/model error logs must report shape/status metadata instead of raw response bodies.
diff --git a/.cursor/rules/hosted-web-contract.mdc b/.cursor/rules/hosted-web-contract.mdc
new file mode 100644
index 0000000..6715d90
--- /dev/null
+++ b/.cursor/rules/hosted-web-contract.mdc
@@ -0,0 +1,193 @@
+---
+description: Hybrid deployment contract — generic_mode, hosted sandbox, proxy auth, web-team boundary, updater policy
+alwaysApply: true
+---
+
+# Hybrid Deployment Contract (intrafere.ai / Hosted Web Product)
+
+MOTO is ONE codebase serving TWO deployment targets. A single `generic_mode` boolean switches between them. All features, fixes, and improvements ship to both targets simultaneously.
+
+## Two Deployment Targets
+
+- **Default mode (`generic_mode=False`)**: GitHub open-source release. Desktop app with `.bat`/`.ps1` launcher. LM Studio + OpenRouter. User runs locally.
+- **Generic mode (`generic_mode=True`)**: Hosted web backend. API-only sandbox on Blaxel, fronted by the Intrafere website/control plane on AWS. FastEmbed embeddings, OpenRouter-only LLM inference, no LM Studio dependency.
+
+## Two-Team Boundary (Strict)
+
+| Team | Repo | Owns |
+|------|------|------|
+| **Upgrade Team** | MOTO repo | `generic_mode` conditional branches, FastEmbed provider, hosted runtime contract, proxy auth plumbing, `/api/features`, `/api/health`, build metadata, desktop launchers + updater contract |
+| **Web Team** | Separate repo | Website frontend, Clerk auth, Stripe billing, AWS control plane, Blaxel sandbox lifecycle, same-domain proxy, dashboard update UX, CI/CD image pipeline |
+
+The Web Team consumes MOTO as a pre-built image. They never commit into the MOTO repo. Their website wraps private MOTO sandboxes — handles auth, billing, proxying, and instance lifecycle while MOTO handles all research orchestration.
+
+## Hosted Container Artifacts
+
+- The MOTO repo provides the canonical hosted container files: `Dockerfile`, `.dockerignore`, and `docker/entrypoint.sh`.
+- Those files define the API-only `python:3.12-slim` generic-mode runtime contract. Image publish, rollout, and redeploy automation still belong to the separate Web Team repo.
+
+## The `generic_mode` Flag
+
+`SystemConfig` field in `backend/shared/config.py`:
+```python
+generic_mode: bool = False
+```
+
+Toggled via `MOTO_GENERIC_MODE=true` env var (read explicitly in `main.py` lifespan, not via Pydantic auto-mapping, to avoid adding an env_prefix to SystemConfig).
+
+When `False`: program behaves as the existing open-source desktop release. When `True`: activates conditional code paths. No existing default-mode behavior is modified.
+
+## Decision Points
+
+1. **`api_client_manager.get_embeddings()`** — generic mode early-returns to in-process `FastEmbedProvider` before the LM Studio → OpenRouter fallback chain
+2. **`rag_manager.py`** — generic mode skips global RAG lock for embedding calls (FastEmbed is in-process/thread-safe); ChromaDB write locking remains in both modes; synchronous ChromaDB calls and CPU-heavy RAG scoring must run off the FastAPI event loop
+3. **`main.py` lifespan** — generic mode skips LM Studio connection test; auto-loads `OPENROUTER_API_KEY` from env if present
+4. **`openrouter.py` LM Studio availability** — generic mode returns `{available: false, generic_mode: true}` without pinging LM Studio
+5. **`download.py` PDF** — generic mode returns `501` (Playwright/Chromium not installed in hosted image)
+6. **Frontend** — calls `GET /api/features` on mount; when `generic_mode=True`, hides all LM Studio UI, defaults everything to OpenRouter
+7. **`middleware.py` + `websocket.py`** — generic mode validates internal proxy auth (`X-Moto-*` signed headers) on all non-allowlisted routes
+8. **Long-running workflow isolation** — research/proof/RAG/Lean jobs may run in background tasks, but must not block the FastAPI event loop that serves GUI/status/health/API-key routes
+
+## Instance-Scoped Runtime Contract (Both Modes)
+
+One process pair = one MOTO instance (local or sandbox). Env inputs:
+- `MOTO_INSTANCE_ID`, `MOTO_BACKEND_HOST`/`HOST`, `MOTO_BACKEND_PORT`/`PORT`
+- `MOTO_DATA_ROOT`, optional `MOTO_LOG_ROOT`, optional `MOTO_SECRET_NAMESPACE`
+- optional `MOTO_FRONTEND_STORAGE_PREFIX`, optional `MOTO_CORS_ORIGINS`, optional `MOTO_LM_STUDIO_BASE_URL`
+- Default desktop launches bind backend and bundled Vite frontend to loopback and require `MOTO_DESKTOP_API_TOKEN` / `VITE_MOTO_DESKTOP_API_TOKEN` on protected HTTP routes. Desktop WebSockets use one-time tickets minted by authenticated `POST /api/ws-ticket`; hosted generic mode continues to use proxy HMAC auth instead.
+
+Hosted sandboxes reuse this exact contract (`MOTO_DATA_ROOT=/app/backend/data`). No separate hosted-only env model.
+
+## Proxy Auth Contract (Generic Mode Only)
+
+Browser reaches sandboxes only through the authenticated control-plane proxy, never via direct sandbox URLs.
+
+- **Proxy path**: `https://app.intrafere.com/instances/{instance_id}/moto/api/...` and `wss://.../moto/ws`
+- Proxy strips `/instances/{instance_id}/moto` prefix before forwarding
+- Control plane injects signed headers: `X-Moto-Instance-Id`, `X-Moto-Proxy-Timestamp`, `X-Moto-Proxy-Signature`, and `X-Moto-Body-SHA256` for body-capable protected requests
+- Signature payload binds `{instance_id}`, `{timestamp}`, uppercase method, stripped path, raw query string, and the `X-Moto-Body-SHA256` value (empty hash for WebSockets/bodyless requests)
+- Sandbox validates the instance ID match, timestamp skew ≤60s, HMAC digest, and query string; verifies that the signed body hash matches the actual received request body; and rejects replayed signatures inside the accepted skew window
+- Protected hosted HTTP requests with `Content-Length` above `MOTO_GENERIC_MAX_REQUEST_BYTES` / `GENERIC_MAX_REQUEST_BYTES` (default 16 MiB) are rejected before route handling; the control-plane proxy should enforce the same or stricter body-size cap before forwarding
+- If `generic_mode=True` and `MOTO_INSTANCE_ID` or `MOTO_INTERNAL_PROXY_SECRET` is missing: fail closed at startup
+- Allowlisted without proxy auth: `GET /health`, `GET /api/health`, `GET /api/features`, `OPTIONS` preflight
+- `Authorization` header is NOT reused for sandbox auth (existing MOTO routes use it for OpenRouter key passthrough)
+
+Implementation: centralized in `middleware.py` (HTTP) and `websocket.py` (before `accept()`). No per-route auth changes.
+
+## `/api/features` Endpoint (Both Modes)
+
+Build 0 lands the public identity subset first. Returns:
+```python
+{
+    "version": str,
+    "build_commit": str,  # authoritative update key
+    "update_channel": "main",
+    "api_contract_version": "build5-v12",
+    "generic_mode": bool,
+    "lm_studio_enabled": bool,
+    "pdf_download_available": bool,
+}
+```
+
+The current Build 5 runtime preserves the four identity fields while exposing the stable capability flags above. Build 5 v12 replaces compiler critique rewrite WebSocket events with `self_review_appended` and changes post-body critique output to a validated appended self-review section. Later hosted work may extend `/api/features` with additional capability flags such as `max_submitters` and `tier3_available`, but the existing fields above remain stable and `api_contract_version` must bump when that happens.
+
+Must remain capability-only. Must NOT expose per-user or per-instance state (e.g. whether an OpenRouter key is set).
+
+## `/api/health` Endpoint
+
+Richer readiness alias of `/health`. Available in both modes. Hosted sandboxes use it for liveness/readiness probes.
+
+## FastAPI Responsiveness Contract
+
+GUI loads, hosted control-plane probes, and desktop status polling share the same FastAPI app as long-running MOTO workflows. Any code reachable from background research/proof tasks must preserve event-loop responsiveness:
+
+- Do not run synchronous ChromaDB operations, large in-memory RAG scoring, Lean temp-file writes/deletes, workspace repair deletes, subprocess waits, or `time.sleep()` on the event loop.
+- Use async subprocess APIs for external tools and `asyncio.to_thread()` for unavoidable synchronous filesystem, ChromaDB, or CPU-heavy scoring work.
+- Status/health/capability/key-status endpoints must be fast-lane routes: return cached/in-memory state only and must not trigger Lean, ChromaDB scans, OpenRouter model-list fetches, or large session-directory walks.
+- Do not paper over event-loop starvation with multiple Uvicorn workers unless coordinator state, WebSockets, and runtime memory have first been externalized; current singleton coordinators assume one backend process per instance.
+
+## Embedding Strategy (Generic Mode)
+
+FastEmbed by Qdrant — in-process ONNX Runtime, `nomic-embed-text-v1.5` INT8, ~200 MB RAM, no PyTorch.
+
+- Dependency in `requirements-generic.txt` (additive, not in main `requirements.txt`)
+- `fastembed_provider.py` (~30 lines) wraps the library; lazy-imported so default installs are unaffected
+- If `generic_mode=True` and `fastembed` is missing: fail fast with clear error
+- Batch query variant optimization: `_vector_search()` batches all query embeddings into one `get_embeddings()` call (benefits both modes)
+
+## Dependency Handling
+
+`requirements-generic.txt`:
+```
+-r requirements.txt
+fastembed>=0.3.6
+onnxruntime>=1.18.0,<2.0
+```
+Hosted image installs both files but does NOT run `playwright install chromium`.
+
+## Frontend Serving (Generic Mode)
+
+Sandbox is API-only. The MOTO React frontend is NOT served from the hosted sandbox. The Web Team builds their own frontend (website + dashboard + embedded MOTO UI). In default mode, the bundled frontend is served by Vite / static build as today.
+
+## PDF Download
+
+- Default mode: `POST /api/download/pdf` works via Playwright, but submitted HTML is untrusted; server-side rendering must sanitize/allowlist content, enforce PDF-specific size caps, disable JavaScript, keep Chromium sandboxing enabled, and block external browser network requests
+- Generic mode: returns `501` ("PDF generation unavailable in web mode. Use raw text download.")
+- Web Team may implement client-side PDF in their frontend independently
+
+## Secret Handling (Generic Mode)
+
+- Desktop default: `secret_store.py` uses OS keyring, restored on startup
+- Hosted generic mode: provider keys are env-injected at sandbox launch and/or set via proxied MOTO API routes. `secret_store` persistence is bypassed; keys live in sandbox memory only. Re-injection required after sandbox recreation.
+- Generic-mode OpenRouter and Wolfram routes update runtime memory only; they do not write to or clear the desktop keyring.
+- Control plane NEVER stores, logs, or persists user provider keys in its own database
+
+## Data Persistence
+
+- `backend/data/` is the default desktop working set
+- Hosted: `MOTO_DATA_ROOT=/app/backend/data` so Blaxel storage mounts to one unambiguous path
+- ChromaDB SQLite files stay on Blaxel sandbox storage (local file semantics required)
+- Sandbox recall/resume returns the same filesystem state; redeploy/recreate advances to the newest image
+- Uploads: server-side enforcement of `.txt` only, 5 MB max, filename sanitization, path traversal rejection
+
+## Updater Policy
+
+- **Authoritative update source**: GitHub `main` branch (not GitHub Releases)
+- **Desktop**: launcher compares local build metadata against GitHub `main`. Auto-apply is only for clean `origin/main` git checkouts or ZIP/extracted installs with no launcher-managed instances still running. ZIP updates preserve active data/log roots, instance storage, launcher state, env files, and keyring-related namespaces.
+- **Hosted**: sandboxes do NOT self-mutate. Redeploy/recreate uses the latest approved `main`-derived image. Recall/resume keeps the existing image. Hosted `POST /api/update/pull` must return unavailable instead of attempting in-place update.
+- **Build metadata**: `version`, `build_commit`, `update_channel`, and `api_contract_version` exposed via `/api/features`; the committed `main`-branch manifest lives at `moto-update-manifest.json`
+
+## Canonical Runtime Baselines
+
+- **Desktop release**: Windows (release-blocking); Ubuntu 24.04 LTS (validation target, separate launcher effort)
+- **Hosted sandbox**: Debian/glibc via `python:3.12-slim`
+- **Unsupported**: Alpine/musl (Python + ONNX + Chroma stack needs glibc)
+
+## What Stays the Same (Both Modes)
+
+All RAG pipeline logic, coordinator logic, prompt engineering, WebSocket routing, paper/brainstorm/outline memory management, ChromaDB usage, and REST route surface remain shared. Generic mode adds proxy auth and hides LM Studio options; proof execution routes may exist but must report disabled/unavailable capability unless the required runtime flags and toolchains are present.
+
+## Integration Contract Rule
+
+Any REST shape, auth contract, or WebSocket event change that affects the website must update **code, this rule, the live `/openapi.json` schema, and `api_contract_version` in `/api/features`** in the same approved `main` merge. The live backend's `GET /openapi.json` is the machine-readable REST schema contract.
+
+## Proof Integration Contract (Builds 1-5, optional, gated off by default)
+
+All Lean 4 and SMT behavior is gated on three runtime flags (`lean4_enabled`, `lean4_lsp_enabled`, `smt_enabled`). All three default to false and stay silent when disabled. Hosted sandboxes ship with them disabled.
+
+- **Hosted image stays Lean-free and Z3-free.** No Lean toolchain, no `z3` binary, and no Python wheel for either is permitted in `Dockerfile`, `docker/entrypoint.sh`, or `requirements-generic.txt`. Proof features are desktop-opt-in only for the current contract.
+- **Lean 4 remains authoritative** for every stored proof. The `Lean4Result` contract is unchanged by SMT; SMT (when enabled) produces tactic hints consumed by the formalization agent, never a standalone proof artifact.
+- **Subprocess fallback must keep working** when `lean4_lsp_enabled=False`. LSP is a latency optimization, not a replacement.
+- **Proof routes under `/api/proofs/*`** are additive to the hosted REST contract: `GET /api/proofs` (list), `GET /api/proofs/novel`, `GET /api/proofs/status`, `POST /api/proofs/settings`, `POST /api/proofs/check` (manual check), `GET /api/proofs/{id}`, `GET /api/proofs/{id}/certificate[.lean]`, `GET /api/proofs/{id}/dependencies`, `GET /api/proofs/graph`, `GET /api/proofs/mathlib/{lemma_name}/dependents` (Build 5).
+- **LeanOJ routes** are additive to the hosted REST contract in `build5-v6`: start/resume, stop, status, clear, skip-brainstorm, force-brainstorm, master-proof draft/edit summaries, current-run proofs, and cross-session proof library endpoints live under `/api/leanoj/*`.
+- **Pruned Stage 2 paper routes** are additive in `build5-v6`: pruned papers are removed from model context/RAG but remain downloadable under `/api/auto-research/paper-history/pruned*`; hard deletion is limited to explicit delete-all-pruned endpoints.
+- **LeanOJ live-activity WebSocket events** include model-call failure/retry progress, initial topic generation/validation, recursive brainstorm progress, brainstorm submitter/queue/batch-validation events, sufficiency/phase-limit events, master-proof edit validation/applied/rejected events, final semantic-review rejection, and final-attempt-cycle exhaustion.
+- **Compiler critique WebSocket events** include validated critique progress and `self_review_appended`; partial/total rewrite events are no longer emitted by the active critique flow.
+- **Proof WebSocket events** are part of the web-surface contract: `proof_framing_decided`, `proof_check_started`, `proof_check_complete`, `proof_check_no_candidates`, `proof_check_candidates_found`, `mathlib_lemmas_suggested`, `proof_attempt_started`, `proof_verified`, `proof_attempt_failed`, `proof_attempts_exhausted`, `proof_retry_started`, `proof_retry_scheduled`, `novel_proof_discovered`, `known_proof_verified`, `proof_dependency_added`, `smt_check_started`, `smt_check_complete`. `proof_verified` is emitted only after proof registration/reuse and includes `proof_id`.
+- **Proof certificate exports stay text-based** (`.lean` source + JSON metadata). No binary-only proof artifacts.
+- **Proof runtime config snapshot** (`ProofRuntimeConfigSnapshot`) is persisted via `research_metadata` so manual `POST /api/proofs/check` can run without an active autonomous session; required state is `lean4_enabled=True` AND a seeded snapshot.
+- **`api_contract_version` bumps** apply the same way to proof additions as to the base contract: any new proof route or event added after Build 5 must bump the contract version in the same merge.
+
+## Hosting Ownership
+
+Intrafere operates the hosted service; the sandbox back-end runs on Blaxel.
diff --git a/.cursor/rules/json-prompt-design.mdc b/.cursor/rules/json-prompt-design.mdc
index 5715730..3748820 100644
--- a/.cursor/rules/json-prompt-design.mdc
+++ b/.cursor/rules/json-prompt-design.mdc
@@ -164,16 +164,30 @@ CORRECT RESPONSE:
 - Improve validator rigor (currently lacks evaluation depth)
 - Maintain existing prompt assembly order: System → JSON Schema → User Prompt → Context → RAG → Final Instruction
 - **MATH VARIANT**: Citation requirements REMOVED. Focus on mathematical rigor, logical correctness, and established mathematical principles. Models with web search capabilities are encouraged to use them for verification. Validation is purely AI-driven.
+- **Proof Prompt Relevance Boundary**: Every automated proof JSON prompt must treat the USER RESEARCH PROMPT as the primary filter. Candidate identification returns every prompt-relevant, non-trivial theorem worth attempting, ordered by usefulness to the user prompt first and novelty/formalization value second. Never impose an artificial theorem-count cap unless explicitly requested.
 - **Compiler Outline Injection**: The compiler outline is always fully injected (never truncated, never RAGed) for all modes because it provides the structural framework for document construction and validation.
-- **TEMPERATURE POLICY**: All prompts use temperature=0.0 (deterministic generation). The system's evolving context provides sufficient diversity. This applies to ALL agents.
+- **TEMPERATURE POLICY**: Default all prompts to `temperature=0.0`. Only two exceptions are allowed: Supercharge candidate attempts and parallel brainstorm submitter lanes. Validators, compiler roles, proof/final roles, and JSON retries must stay deterministic.
+- **Supercharge Schema Preservation**: Per-role Supercharge calls generate 4 full answer attempts plus a 5th synthesis answer. Candidate attempts must be sanitized to reusable visible answer text before the 5th call; private thought/channel/control transcript text must never be fed into synthesis, retries, feedback memory, accepted memory, or RAG. The synthesis prompt must place the final instruction after the candidate block, treat candidates as optional working material, and preserve the original task's exact output contract; if the original role expects JSON, the 5th answer must output only valid JSON in that same schema and must not mention Supercharge or candidate attempts.
 - **NATURAL COMPLETION POLICY**: Models stop naturally when JSON response is complete. No stop sequences enforced. `sanitize_json_response()` handles trailing whitespace. **CRITICAL**: Truncated JSON (unclosed braces/brackets) raises ValueError - no repair attempted.
 - **JSON Response Preprocessing**: All LLM responses preprocessed by `sanitize_json_response()` in `backend/shared/json_parser.py`. See implementation for complete sanitization pipeline: strips reasoning tokens/markdown/control tokens, handles LaTeX escapes (pre-escapes dangerous commands), escapes control chars in strings, rejects truncated JSON, detects pure reasoning text. Enhanced error logging with diagnostics. Array responses auto-extract `data[0]`.
+- **Retry Transcript Hygiene**: Raw provider/model transport output must never enter retry prompts, feedback memory, accepted memory, RAG, synthesis prompts, or durable context. Keep conversational retries, but replay only `sanitize_model_output_for_retry_context()` output, which strips known leading private thought/channel/control transcript scaffolding while preserving useful visible malformed JSON/output excerpts and literal tags/operators inside visible content. Channel/control markers must be treated as transport scaffolding only when detected outside visible JSON/string content; sanitization must not treat ordinary Lean/math/operator text such as `<|`, or literal visible text such as `<think>`, `<thought>`, `<|channel>final`, or `<channel|>`, as a control token when it appears inside visible content. Exact assistant/tool protocol turns are the only exception.
 - **No Startup Compatibility Testing**: Models trusted to work. JSON sanitizer handles all quirks automatically. Model configs cached on first success.
 - **Reasoning Field Extraction**: Agent code checks BOTH `content` and `reasoning` fields for model compatibility.
 - **Centralized JSON Parsing**: All agents use `parse_json()` from `backend/shared/json_parser.py`. Exceptions: memory modules loading system-written files use direct `json.loads()`.
+- **LeanOJ JSON Retry**: LeanOJ proof-solver roles also use centralized `parse_json()` and must retry malformed/non-object JSON before treating a role call as failed. During each configured final-attempt cycle, malformed model output is recorded as failed proof feedback and the loop continues until Lean verifies, the cycle is exhausted, or the operator stops; provider credit exhaustion/no-fallback configuration errors are non-retryable resumable pauses, not proof feedback.
+- **LeanOJ Batch Validation JSON**: LeanOJ brainstorm validation may receive 2-3 submissions and must return `{"decisions": [...]}` with one ordered binary accept/reject decision per submission. Accepted brainstorm decisions should classify `context_role` as `active_plan`, `verified_hint`, `refuted_construction`, or `scratch`; topic validation may receive 2-3 topics and must return ordered `{"decisions": [...]}` entries keyed by `topic_number`. Initial topic validation accepts only broad locked foundation questions that cover `answer n`, lower construction, upper proof, exact LeanOJ semantics, and Lean formalization; reject narrow lemma/tactic/bound/repair topics.
+- **LeanOJ Brainstorm Prune JSON**: LeanOJ prune-review prompts must ask whether any accepted brainstorm memory should be removed or updated because it is `outdated`, `redundant`, wrong, harmful, or superseded. Do not pressure the reviewer to remove content: keep the conservative `"none"` default, allow at most one operation, and preserve any idea with unique proof-solving value. Prune validation should accept deletes/edits only when the operation clearly improves the proof-solving database under those criteria.
+- **LeanOJ Final Context Routing**: Final-solver direct proof context is limited to verified standalone subproofs plus accepted notes explicitly classified as `active_plan`. Ordinary accepted brainstorm notes default to `scratch`, and accepted idea artifact records must persist `context_role` metadata across resume/reload. Lean-accepted partial scaffolds with `sorry`/`admit` and failed final attempts cannot seed `master_proof.lean` unless explicitly marked high-value/master-seed eligible. The final solver may receive the most recent 5 final attempts only as compact execution feedback to avoid repeating failed edits; this feedback is not proof evidence. Failed/refuted constructions are not proof evidence: pass them only through the compact `refuted_construction_warnings` / “DO NOT USE” channel.
+- **LeanOJ Master-Proof Editing JSON**: The final solver edits durable `master_proof.lean` with `{"action":"edit_proof","needs_more_time":true|false,"operation":"full_content|replace|insert_after|delete","old_string":"exact unique proof text","new_string":"Lean code","reasoning":"..."}`. `master_proof.lean` must contain the current chosen proof route only, not accumulated competing/refuted constructions. Final solver prompts must not expose path-transition choices, raw `need_more_brainstorming`, final-cycle failed-attempt counts, or any `stuck_needs_brainstorm` action. They may expose compact recent execution feedback such as Lean errors, stale `old_string` rejections, JSON truncation, and watchdog/no-progress notices. Required corrections from recent feedback must take priority over unrelated new additions, fresh routes, or speculative helpers; new additions are allowed only when they directly implement the required correction or helper code needed for that correction. Phase transitions are selected only by the discrete path-decision mode. Legacy `{"lean_code":...}` is compatibility only.
+- **LeanOJ Master-Proof Lean Gate**: A master proof edit must never be persisted merely because the string edit applies. After structural edit application and any required shortening validation, the updated proof is checked in memory first. `needs_more_time=true` edits run Lean with placeholders allowed but still must parse/typecheck, preserve the original template/declarations, and pass forbidden-device integrity checks. `needs_more_time=false` edits run Lean with no placeholders, then final template integrity, answer adequacy, semantic review, and registration. Lean/template failure rejects the edit, preserves the prior master proof and shortening-backup metadata, and feeds the Lean diagnostics (`error_output`, diagnostic output, goal states, raw stderr when present) back to the final solver.
+- **LeanOJ Master-Proof Shortening Validation JSON**: Material-shortening edits to `master_proof.lean` must be reviewed before the Lean gate by `leanoj_master_proof_edit_validator` using `{"decision":"accept","reasoning":"...","feedback_to_submitter":""}` or `{"decision":"reject","reasoning":"...","feedback_to_submitter":"precise correction"}`. Rejection preserves the prior proof and becomes direct final-solver feedback. Validator acceptance is not proof acceptance: shortening backup/redo state and `master_proof.lean` persistence happen only after the accepted edit also passes the Lean/template gate. The edit validator must reject changes that ignore required corrections in favor of unrelated new additions, and rejection feedback must instruct the submitter to fix the required corrections before new addition attempts.
+- **LeanOJ Final Semantic Review JSON**: After Lean accepts final code and deterministic integrity checks pass, the Final Proof Solver must review the Lean-accepted code against the full LeanOJ problem prompt/template using `{"solved":true,"reasoning":"..."}` or `{"solved":false,"continuation_feedback":"...","reasoning":"..."}`. Rejection is continuation feedback, not verified success.
+- **LeanOJ Formalization Semantics Guardrail**: LeanOJ planning, proof-editing, validation, and final-review prompts must state that the Lean template is the formal source of truth, template operations must not be silently reinterpreted to match informal olympiad intuition (e.g. `Nat` subtraction truncates), proposed formulas/constructions should be sanity-checked against the exact Lean predicate on small cases when feasible, and Lean acceptance alone must not be claimed as solving the informal problem unless the formal/informal correspondence is justified.
+- **Shared Post-Lean Proof Integrity Gate**: Lean 4 is authoritative for proof checking, but proof outputs still pass `backend/shared/lean_proof_integrity.py` before storage/placement. This shared gate rejects newly introduced `axiom`/`constant`/`opaque` proof devices and uses statement-alignment validation so a Lean-accepted proof cannot be stored for an unrelated or user-prompt-irrelevant `ProofCandidate.statement`.
+- **LeanOJ Proof Validation Boundary**: Lean 4 is authoritative formal checking for LeanOJ success, but LLM validators still gate planning decisions, Lean-accepted subproof relevance, and final semantic review. A compiled subproof must not be stored as verified run context unless it matches the requested subproof/role; a compiled final solution must not stop the run unless it preserves the template and the Final Proof Solver confirms it solves the actual prompt rather than a formal loophole.
 - **Specialized Retry for Pure Reasoning Text**: When "No JSON found" error, aggregator submitter uses specialized retry: (1) Don't think step-by-step, (2) Start with `{` immediately, (3) Raw JSON only. See `backend/aggregator/agents/submitter.py`.
 - **Standard LaTeX-Focused Retry**: Retry prompts explain HOW to escape LaTeX properly. **LaTeX IS allowed** - just escape backslashes once (`\mathbb` → `\\mathbb`). DO NOT double-escape. For `old_string`: copy EXACTLY from document, just escape backslashes.
-- **Retry Context Overflow Prevention (CRITICAL)**: Truncate failed output to ~2000 chars before retry. Calculate if retry fits context window. Fall back to simple re-prompt if too large. Set `max_tokens` explicitly (never `None`). NEVER auto-increase beyond user limits. Applies to: `submitter.py`, `validator.py`, `high_param_submitter.py`, `compiler_validator.py`.
+- **Retry Context Overflow Prevention (CRITICAL)**: Sanitize failed output, then truncate to ~2000 chars before retry. Parser exception messages that are inserted into retry prompts must report failure type/structure only and must not include raw output excerpts. Calculate if retry fits context window. Fall back to simple re-prompt if too large. Set `max_tokens` explicitly (never `None`). NEVER auto-increase beyond user limits. Applies to: `submitter.py`, `validator.py`, `high_context_submitter.py`, `high_param_submitter.py`, `compiler_validator.py`.
 
 ## Internal Content Warning (Required in All Prompts)
 
@@ -227,6 +241,7 @@ WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified inte
 - `backend/autonomous/prompts/paper_redundancy_prompts.py`
 - `backend/autonomous/prompts/paper_continuation_prompts.py`
 - `backend/autonomous/prompts/final_answer_prompts.py`
+- `backend/autonomous/prompts/proof_prompts.py`
 
 **Note:** The prompt structure examples in the sections below show the core task-specific content. The INTERNAL CONTENT WARNING block is ALWAYS inserted between the role description and the "YOUR TASK:" section in the actual code.
 
@@ -245,13 +260,20 @@ def get_validator_system_prompt() -> str:
     return """You are a validation agent in an AI cluster. Your role is to evaluate mathematical submissions and decide whether they should be added to the shared knowledge base.
 
 YOUR TASK:
-Tell me if the addition of the new submission increases potential solution availability in a significant way and/or provides a valuable solution space-constraint that narrows where we need to search in a significant way.
+Decide whether the submission provides the strongest rigorous progress currently justified toward solving the user's problem, with highest priority given to direct solutions, direct partial solutions, impossibility results, exact reductions, or sharp constraints.
+
+Essentially, you are evaluating whether the training database becomes more useful toward directly answering the user's mathematical prompt with this submission added than it was without it.
 
-Essentially, you are evaluating whether the training database becomes more useful toward finding mathematical solutions with this submission added than it was without it.
+Note: You are not generating solutions yourself. You are judging whether this submission directly solves, partially solves, refutes, or materially enables the user's problem better than the current knowledge base does.
 
-Note: You are not generating solutions yourself - you are assessing if there are new solutions potentially available if we add this submission to the training database, or if the solution space becomes stronger in any way.
+META-PHASE EXCEPTION:
+If the USER PROMPT explicitly says TOPIC EXPLORATION PHASE or PAPER TITLE EXPLORATION PHASE, evaluate the submission as the requested candidate artifact, not as a direct solution:
+- TOPIC EXPLORATION PHASE: accept a candidate brainstorm question if it is specific, distinct, relevant, grounded, and aimed at a strong direct-answer path
+- PAPER TITLE EXPLORATION PHASE: accept a candidate title if it is accurate, specific, distinct, professional, and foregrounds direct answer-bearing content when justified
+- Do NOT reject these meta-phase submissions merely because they are questions or titles rather than mathematical solutions
 
 EVALUATION CRITERIA - Consider:
+- Does the submission directly answer, partially answer, refute, or sharply constrain the user's problem or a necessary subproblem?
 - Does the submission add genuinely new information or perspectives beyond what is already accepted?
 - Does the submission connect existing mathematical concepts in novel ways?
 - Does the submission provide concrete methods, theorems, proofs, or mathematical techniques?
@@ -263,9 +285,9 @@ EVALUATION CRITERIA - Consider:
 
 VALIDATION DECISION RULES:
 A submission should be ACCEPTED if it:
-1. Increases potential solution availability in a significant way, OR
-2. Provides valuable solution space constraints that narrow where to search, OR
-3. Offers novel mathematical insights not present in existing accepted submissions, OR
+1. Directly solves, partially solves, or proves a meaningful impossibility/limitation result for the user's problem or a necessary subproblem, OR
+2. Provides valuable solution space constraints that sharply narrow where a direct answer can lie, OR
+3. Offers rigorous enabling insights not present in existing accepted submissions when a stronger direct step is not yet available, OR
 4. Presents rigorous mathematical arguments based on established principles
 
 A submission should be REJECTED if it:
@@ -451,9 +473,15 @@ YOUR TASK:
 Evaluate EACH submission INDEPENDENTLY to determine if it would make a valuable cumulative addition to the shared knowledge base.
 
 Independent Assessment:
-For each submission, ask: "Does this submission increase potential solution availability or provide valuable constraints, considering only the existing database (not the other submission in this batch)?"
+For each submission, ask: "Does this submission provide the strongest rigorous direct progress currently justified toward the user's problem, considering only the existing database (not the other submission in this batch)?"
 
-Essentially, you are evaluating whether the training database becomes more useful toward finding mathematical solutions with each submission added than it was without it.
+Essentially, you are evaluating whether the training database becomes more useful toward directly answering the user's mathematical prompt with each submission added than it was without it.
+
+META-PHASE EXCEPTION:
+If the USER PROMPT explicitly says TOPIC EXPLORATION PHASE or PAPER TITLE EXPLORATION PHASE, evaluate each submission as the requested candidate artifact, not as a direct solution:
+- TOPIC EXPLORATION PHASE: accept a candidate brainstorm question if it is specific, distinct, relevant, grounded, and aimed at a strong direct-answer path
+- PAPER TITLE EXPLORATION PHASE: accept a candidate title if it is accurate, specific, distinct, professional, and foregrounds direct answer-bearing content when justified
+- Do NOT reject these meta-phase submissions merely because they are questions or titles rather than mathematical solutions
 
 EVALUATION CRITERIA (Apply to EACH submission independently):
 - Does the submission add genuinely new information or perspectives beyond what is already accepted?
@@ -466,9 +494,9 @@ EVALUATION CRITERIA (Apply to EACH submission independently):
 
 VALIDATION DECISION RULES (for each submission):
 A submission should be ACCEPTED if it:
-1. Increases potential solution availability in a significant way, OR
-2. Provides valuable solution space constraints that narrow where to search, OR
-3. Offers novel mathematical insights not present in existing accepted submissions, OR
+1. Directly solves, partially solves, or proves a meaningful impossibility/limitation result for the user's problem or a necessary subproblem, OR
+2. Provides valuable solution space constraints that sharply narrow where a direct answer can lie, OR
+3. Offers rigorous enabling insights not present in existing accepted submissions when a stronger direct step is not yet available, OR
 4. Presents rigorous mathematical arguments based on established principles
 
 A submission should be REJECTED if it:
@@ -599,9 +627,15 @@ YOUR TASK:
 Evaluate EACH submission INDEPENDENTLY to determine if it would make a valuable cumulative addition to the shared knowledge base.
 
 Independent Assessment:
-For each of the three submissions, ask: "Does this submission increase potential solution availability or provide valuable constraints, considering only the existing database (not the other submissions in this batch)?"
+For each of the three submissions, ask: "Does this submission provide the strongest rigorous direct progress currently justified toward the user's problem, considering only the existing database (not the other submissions in this batch)?"
+
+Essentially, you are evaluating whether the training database becomes more useful toward directly answering the user's mathematical prompt with each submission added than it was without it.
 
-Essentially, you are evaluating whether the training database becomes more useful toward finding mathematical solutions with each submission added than it was without it.
+META-PHASE EXCEPTION:
+If the USER PROMPT explicitly says TOPIC EXPLORATION PHASE or PAPER TITLE EXPLORATION PHASE, evaluate each submission as the requested candidate artifact, not as a direct solution:
+- TOPIC EXPLORATION PHASE: accept a candidate brainstorm question if it is specific, distinct, relevant, grounded, and aimed at a strong direct-answer path
+- PAPER TITLE EXPLORATION PHASE: accept a candidate title if it is accurate, specific, distinct, professional, and foregrounds direct answer-bearing content when justified
+- Do NOT reject these meta-phase submissions merely because they are questions or titles rather than mathematical solutions
 
 EVALUATION CRITERIA (Apply to EACH submission independently):
 - Does the submission add genuinely new information or perspectives beyond what is already accepted?
@@ -614,9 +648,9 @@ EVALUATION CRITERIA (Apply to EACH submission independently):
 
 VALIDATION DECISION RULES (for each submission):
 A submission should be ACCEPTED if it:
-1. Increases potential solution availability in a significant way, OR
-2. Provides valuable solution space constraints that narrow where to search, OR
-3. Offers novel mathematical insights not present in existing accepted submissions, OR
+1. Directly solves, partially solves, or proves a meaningful impossibility/limitation result for the user's problem or a necessary subproblem, OR
+2. Provides valuable solution space constraints that sharply narrow where a direct answer can lie, OR
+3. Offers rigorous enabling insights not present in existing accepted submissions when a stronger direct step is not yet available, OR
 4. Presents rigorous mathematical arguments based on established principles
 
 A submission should be REJECTED if it:
@@ -1652,79 +1686,37 @@ Output your response ONLY as JSON in this exact format:
 
 ---
 
-## 8. CRITIQUE & REWRITE PHASE (POST-BODY CONSTRUCTION)
+## 8. CRITIQUE & SELF-REVIEW PHASE (POST-BODY CONSTRUCTION)
 
 **File:** `backend/compiler/prompts/critique_prompts.py`
 
 ### Overview
 
-After the body section is complete (before conclusion), the system enters a **Critique Phase** that reuses the aggregator infrastructure to collect peer review feedback. This phase ensures the body section is mathematically sound and properly aligned before proceeding.
+After the body section is complete (before conclusion), the system enters a **Critique Phase** that collects validator-approved self-review notes. Accepted critiques are appended to the paper transparently instead of rewriting paper content.
 
 ### Workflow
 
-1. **Critique Aggregation** (5 total attempts required):
+1. **Critique Aggregation** (3 total attempts required):
    - Single critique submitter generates peer review feedback on body section
-   - **Decline Mechanism**: Submitter can assess "no critique needed" when body is academically acceptable (counts toward 5 total attempts)
+   - **Decline Mechanism**: Submitter can assess "no critique needed" when body is academically acceptable (counts toward 3 total attempts)
    - Validator validates critiques/declines (accept/reject with feedback loop)
    - Pruning occurs every 7 acceptances (same as aggregator cleanup review)
-   - Target: 5 total attempts (accepted + rejected + declined attempts)
+   - Target: 3 total attempts (accepted + rejected + declined attempts)
    - Uses aggregator workflow with critique-specific prompts
 
-2. **Rewrite Decision**:
-   - If at least 1 critique accepted: Critique submitter reviews all accepted critiques + accumulated history from previous failed versions
-   - If 0 critiques accepted: Skip rewrite, move to next section
-   - Decides: "rewrite" (major issues found) or "continue" (minor/incorrect critiques)
-   - Validator validates the decision (accept/reject with retry loop)
-   - Decision includes optional new title and new outline
-
-3. **Rewrite Execution** (if approved):
-   - Mark rewrite as pending (counter increments only after first successful acceptance)
-   - Three execution paths based on decision:
-     - **CONTINUE**: Proceed to conclusion (critiques minor/incorrect)
-     - **PARTIAL_REVISION**: **ITERATIVE** edits - proposes ONE edit at a time, validates, applies, then proposes next edit
-     - **TOTAL_REWRITE**: Clear body section completely and rebuild from scratch
-   - Update title if changed (increment version number)
-   - Update outline if changed
-   - **CONTEXT FOR BOTH PARTIAL_REVISION AND TOTAL_REWRITE**:
-     - Pre-critique paper (paper snapshot from START of critique phase - shows what failed)
-     - Current accepted critique feedback (ONLY accepted, not rejected critiques)
-     - ALL critiques from ALL previous failed versions (accumulated feedback history)
-     - Original aggregator database
-     - Reference papers (if applicable)
-
-4. **Version Loop**:
-   - If rewrite_count >= 1 (completed rewrites): Skip critique phase entirely, proceed to conclusion
-   - Rewrite counts as "completed" only after first successful body acceptance
-   - Single completed rewrite cycle is sufficient for convergence
+2. **Self-Review Append**:
+   - If at least 1 critique is accepted: append accepted critiques as `AI Self-Review and Limitations`
+   - If 0 critiques are accepted: move to conclusion without adding the section
+   - The section is placed after compiler/appended proof material when present, otherwise after conclusion
+   - Critiques never trigger partial rewrites, total rewrites, body clearing, title changes, or outline updates
 
 ### Rationale
 
-**Why partial revision is ITERATIVE (one edit at a time):**
-- Allows the model to see the result of each edit before proposing the next
-- Each edit is validated individually for correctness
-- Prevents cascading failures from a batch of edits
-- Model can see pre-critique paper AND current paper to understand what started vs where we are
-- More precise control over the revision process
-
-**Why partial revision is preferred:**
-- Most critiques identify specific, localized issues that can be fixed with targeted edits
-- Preserves coherence in sections that are already correct
-- Faster than full body rewrite
-- Reduces risk of introducing new errors in previously sound sections
-- More efficient use of model context and computation
-
-**Why total rewrite is last resort:**
-- Total rewrites are difficult and can introduce errors in areas that were previously correct
-- Even with feedback, rewriting from scratch can lose coherence
-- Should only be used when issues are too pervasive for targeted edits
-- Catastrophic flaws (fundamental math errors throughout, complete misalignment) justify total rewrite
-- Now receives full context: pre-critique paper + accepted critiques, so rewrite is informed
-
-**Why maximum 1 rewrite:**
-- Prevents infinite rewrite loops on difficult topics
-- Forces convergence to best-effort result after single revision attempt
-- Accumulated feedback ensures the revision benefits from all critique history
-- Single rewrite cycle is sufficient with partial revision option available
+**Why append rather than rewrite:**
+- Preserves the validated paper content and proof placement.
+- Keeps model-discovered limitations visible to readers.
+- Avoids rewrite loops and accidental loss of correct content.
+- Presents the AI self-review as honest, visible provenance rather than as hidden revision pressure.
 
 ### Decline Mechanism (Academically Acceptable Body)
 
@@ -1740,9 +1732,9 @@ After the body section is complete (before conclusion), the system enters a **Cr
 - Mathematical rigor meets academic standards
 
 **Behavior When Target Met**:
-- If NO accepted critiques: Skip rewrite, transition directly to conclusion
-- If accepted critiques exist: Run rewrite decision
-- Rationale: With only 5 attempts, no early termination mechanism is needed
+- If NO accepted critiques: transition directly to conclusion
+- If accepted critiques exist: append `AI Self-Review and Limitations`, then transition to conclusion
+- Rationale: With only 3 attempts, no early termination mechanism is needed
 
 ### Complete Prompt Structure - Critique Generation
 
@@ -1819,84 +1811,6 @@ Output as JSON:
 """
 ```
 
-### Complete Prompt Structure - Rewrite Decision
-
-**Function:** `get_rewrite_decision_system_prompt()`
-
-```python
-def get_rewrite_decision_system_prompt() -> str:
-    return """You are reviewing aggregated peer review critiques to decide if body needs revision.
-
-[... INTERNAL CONTENT WARNING ...]
-
-YOUR TASK:
-The peer review phase collected critiques through multiple attempts. ALL accepted critiques from the CURRENT version are provided below (typically 1-3 accepted out of 5 total attempts).
-
-**ACCUMULATED CRITIQUE HISTORY**: If this is not the first critique phase (rewrite_count > 0), you will also see critiques from ALL previous failed versions, labeled as "FAILED - REWRITTEN". Use this accumulated feedback to understand what went wrong in past attempts and avoid repeating mistakes.
-
-Review all critiques and decide:
-
-DECISION OPTIONS:
-1. CONTINUE - Minor/incorrect critiques
-2. PARTIAL_REVISION - Fixable issues, you will propose edits ONE AT A TIME in iterative loop
-3. TOTAL_REWRITE - Catastrophic flaws, rebuild from scratch (last resort)
-
-CONTINUE if:
-- Minor issues
-- Incorrect critiques
-- Small gaps addressable in review
-
-PARTIAL_REVISION if:
-- Specific sections have fixable errors
-- Missing content can be inserted at specific locations
-- Most of body is sound, only targeted fixes needed
-- NOTE: You will then propose edits ONE AT A TIME (not all at once)
-
-TOTAL_REWRITE if (ONLY AS LAST RESORT):
-- Fundamental mathematical errors pervasive throughout
-- Body fundamentally misaligned with paper title
-- Structural problems require complete reorganization
-- Issues too widespread for targeted edits
-- NOTE: Rewrite will have full context (pre-critique paper + accepted critiques)
-
-FOR ANY REVISION:
-- Can change title (if scope drift)
-- Can update outline (if structure needs changes)
-- For PARTIAL_REVISION: Edit operations are proposed iteratively (not in this decision)
-
-Output as JSON:
-{
-  "decision": "continue | partial_revision | total_rewrite",
-  "new_title": "New title or null",
-  "new_outline": "Updated outline or null",
-  "reasoning": "Detailed explanation"
-}
-"""
-```
-
-### Iterative Edit Prompt Structure (for PARTIAL_REVISION)
-
-**Function:** `get_iterative_edit_system_prompt()`
-
-When PARTIAL_REVISION is chosen, the system enters an iterative edit loop. Each iteration:
-1. Shows pre-critique paper (original state before this revision cycle)
-2. Shows current paper (after any edits applied so far)
-3. Shows accepted critique feedback
-4. Shows edits already applied
-5. Requests ONE edit proposal
-
-```json
-{
-  "operation": "replace | insert_after | delete",
-  "old_string": "Exact text to find in CURRENT paper",
-  "new_string": "Replacement text",
-  "reasoning": "Which critique issue this addresses",
-  "more_edits_needed": true | false
-}
-```
-
-The loop continues until `more_edits_needed=false` or max iterations (20) reached.
-
 ### Assembly in `build_critique_prompt()`
 
 ```python
@@ -1938,35 +1852,6 @@ The loop continues until `more_edits_needed=false` or max iterations (20) reache
 }
 ```
 
-**Rewrite Decision:**
-```json
-{
-  "decision": "continue | partial_revision | total_rewrite",
-  "new_title": "New title or null",
-  "new_outline": "Updated outline or null",
-  "reasoning": "Detailed explanation"
-}
-```
-
-**Iterative Edit (for partial_revision loop):**
-```json
-{
-  "operation": "replace | insert_after | delete",
-  "old_string": "Exact text to find",
-  "new_string": "Replacement text",
-  "reasoning": "Which critique this addresses",
-  "more_edits_needed": true | false
-}
-```
-
-**Rewrite Decision Validation:**
-```json
-{
-  "decision": "accept or reject",
-  "reasoning": "Why decision is or isn't justified"
-}
-```
-
 ---
 
 ## 9. COMPILER RIGOR PROMPTS (LEAN 4 THEOREM FLOW)
@@ -1979,30 +1864,35 @@ The loop continues until `more_edits_needed=false` or max iterations (20) reache
 
 ### Four-Stage Architecture
 
-The rigor loop no longer edits paper text. Each rigor cycle runs four stages, with the coordinator owning the validator loop and the appendix fallback:
+The rigor loop no longer edits paper text directly during discovery/formalization. Each rigor cycle runs four stages, with the coordinator owning inline validator attempts and appendix routing:
 
 **Stage 1: Theorem discovery (unvalidated)** — `build_rigor_theorem_discovery_prompt`
 - High-param submitter reads the full writing context (outline direct-injected, paper direct-injected when it fits, RAG for the rest per the offload priority excluding `compiler_outline.txt` + `compiler_paper.txt`).
 - Sees `EXISTING VERIFIED PROOFS` block (from `proof_database.get_all_proofs()`) so it does not re-propose already-verified theorems.
 - Sees `OPEN LEMMA TARGETS` block (from `proof_database.get_recent_failure_hints()`) as optional retry candidates.
-- Decides whether a theorem is worth attempting. Decline ends the rigor cycle.
+- Decides whether a user-prompt-relevant theorem is worth attempting. Decline ends the rigor cycle.
+- Discovery is explicitly allowed to construct extension theorems from partial paper work, the current outline, supporting context, or the user prompt when helpful to paper construction and/or the user's goal. It is not limited to exact claims already present in the current paper.
+- Discovery must classify `theorem_origin` as `existing_paper_claim`, `extension_from_partial_work`, or `extension_from_user_prompt`, and must set `placement_preference` to `inline` or `appendix_only`. Extension-derived theorems must use `appendix_only`.
 
 **Stage 2: Lean 4 formalization** — reuses `ProofFormalizationAgent.prove_candidate(max_attempts=5)` from autonomous mode
 - Up to 5 Lean 4 attempts with error-feedback chaining (failing tactic + goal states + raw Lean diagnostics fed back into each retry).
 - Broadcasts `proof_attempt_started` / `proof_verified` / `proof_attempt_failed` / `proof_check_complete` events with `source_type="compiler_rigor"` so the existing autonomous-mode proof UI lights up for free.
 - All-5-fail: candidate is recorded via `proof_database.record_failed_candidate` (becomes a future open lemma target) and the cycle ends as a decline.
 
-**Stage 3: Novelty classification + persistence** — shared `assess_proof_novelty` helper from `backend/autonomous/core/proof_novelty.py`
+**Stage 3: Post-Lean integrity + novelty classification + persistence** — shared `validate_full_lean_proof_integrity` helper from `backend/shared/lean_proof_integrity.py`, then shared `assess_proof_novelty` helper from `backend/autonomous/core/proof_novelty.py`
+- Rejects Lean-accepted proofs that introduce new fake proof devices (`axiom`, `constant`, `opaque`) not present in the source context.
+- Rejects Lean-accepted proofs that do not align with the intended theorem statement.
 - Classifies the verified proof as novel or known.
 - `proof_database.add_proof(record)` stores it with `source_type="paper"`, `source_id=f"compiler_rigor:{session}"`.
 - Novel proofs automatically enter the highest-priority direct-injection block on the next submitter instantiation (via `proof_database.inject_into_prompt`).
 - Non-novel proofs stay in the database, visible through `/api/proofs/*` for future reference-selection UI flows.
 
-**Stage 4: Placement (2 attempts + appendix fallback)** — `build_rigor_placement_prompt`
-- Submitter proposes an inline edit that introduces the theorem with an explicit "verified in Lean 4, see Appendix A, <proof_id>" marker.
+**Stage 4: Placement routing (inline attempts OR appendix-only)** — `build_rigor_placement_prompt`
+- If `placement_preference="appendix_only"`, inline placement is skipped and the verified theorem is appended directly to the Theorems Appendix with `placement_outcome="appendix_requested"`.
+- If `placement_preference="inline"`, submitter proposes an inline edit that introduces the theorem with an explicit "verified in Lean 4, see Appendix A, <proof_id>" marker.
 - Validator uses the new `rigor_lean_placement` mode: judges placement and narrative only; `rigor_check` is **forced to True** regardless of LLM output (Lean 4 is the source of mathematical truth).
 - Up to 2 placement attempts; attempt 2 receives the validator's rejection feedback via `validator_rejection_feedback` field.
-- On double rejection (or when attempt 1 is not produced), the theorem is appended to the **Theorems Appendix** via `paper_memory.append_to_theorems_appendix(...)`. Counts as a `rigor_acceptance` because the math is preserved.
+- On double rejection (or when attempt 1 is not produced), the theorem is appended to the **Theorems Appendix** via `paper_memory.append_to_theorems_appendix(...)` with `placement_outcome="appendix_fallback"`. Counts as a `rigor_acceptance` because the math is preserved.
 
 ### Stage 1 JSON Schema (discovery)
 
@@ -2011,7 +1901,9 @@ The rigor loop no longer edits paper text. Each rigor cycle runs four stages, wi
   "needs_theorem_work": true,
   "theorem_statement": "precise statement with explicit hypotheses",
   "formal_sketch": "concrete Mathlib tactics / lemmas that look promising",
-  "source_excerpt": "2-6 sentences from the paper that motivate this theorem",
+  "source_excerpt": "2-6 sentences of motivating paper/outline/context/user-prompt basis",
+  "theorem_origin": "existing_paper_claim | extension_from_partial_work | extension_from_user_prompt",
+  "placement_preference": "inline | appendix_only",
   "retry_existing_failure_id": "theorem_id from OPEN LEMMA TARGETS if retrying, empty otherwise",
   "reasoning": "why this theorem is the best target right now OR why no theorem"
 }
@@ -2024,11 +1916,15 @@ Decline form:
   "theorem_statement": "",
   "formal_sketch": "",
   "source_excerpt": "",
+  "theorem_origin": "",
+  "placement_preference": "",
   "retry_existing_failure_id": "",
   "reasoning": "why declining"
 }
 ```
 
+Placement preference rule: `extension_from_partial_work` and `extension_from_user_prompt` MUST resolve to `appendix_only` even if the model emits `inline`. Existing paper claims may use `inline` when the theorem strengthens local prose, or `appendix_only` when it is useful but would distract from the body.
+
 ### Stage 4 JSON Schema (placement)
 
 ```json
@@ -2060,7 +1956,7 @@ Each entry written by `format_theorem_appendix_entry(...)` (helper in `backend/c
 
 ```
 Theorem (proof_XXX) [Novel | Known] - <theorem_name or proof_id>
-Status: verified by Lean 4 (<inline | appendix_fallback>)
+Status: verified by Lean 4 (<inline | appendix_requested | appendix_fallback>)
 Statement: <natural-language theorem statement>
 Lean 4 proof:
 <full Lean 4 source>
@@ -2306,7 +2202,7 @@ Part 3 introduces autonomous topic selection, brainstorm-to-paper workflows, and
 
 **File:** `backend/autonomous/prompts/topic_exploration_prompts.py`
 
-**Purpose:** Before topic selection, collect 5 validated candidate brainstorm questions using the full Part 1 aggregator infrastructure (parallel submitters, batch validation up to 3). Uses `build_exploration_user_prompt()` to frame the standard aggregator as a candidate question generator.
+**Purpose:** Before topic selection, collect 5 validated candidate brainstorm questions using the full Part 1 aggregator infrastructure (parallel submitters, batch validation up to 3). Uses `build_exploration_user_prompt()` to frame the standard aggregator as a candidate question generator, with a preference for candidate questions that maximize the chance of a rigorous direct answer rather than merely broad exploration.
 
 **Architecture:** Reuses `AggregatorCoordinator` — no custom JSON schemas. Standard aggregator submitter/validator prompts handle generation and validation. The exploration user prompt provides the framing context (research goal, existing brainstorms/papers, diversity requirement).
 
@@ -2757,7 +2653,7 @@ All proof prompts pass `temperature=0.0`.
 
 **Function:** `build_proof_framing_gate_prompt(user_prompt)`
 
-**Purpose:** One-shot decision at autonomous start — decides whether the research program should activate the full proof pipeline. Errs on the side of `true` whenever there is meaningful mathematical substance.
+**Purpose:** One-shot decision at autonomous start — decides whether the research program should activate the full proof pipeline. Errs on the side of `true` whenever formal proof can materially help answer the user's prompt.
 
 ```json
 {
@@ -2776,7 +2672,7 @@ All proof prompts pass `temperature=0.0`.
 
 **Function:** `build_proof_identification_prompt(user_prompt, source_type, source_id, source_content)`
 
-**Purpose:** Novelty-seeking gate that extracts the most promising non-trivial theorem candidates from a brainstorm or paper. Rejects trivial identities and textbook restatements. Returns at most 5 candidates ranked by novelty potential.
+**Purpose:** User-prompt relevance gate that extracts every prompt-relevant, non-trivial theorem candidate from a brainstorm or paper. Rejects off-prompt curiosities, trivial identities, and textbook restatements. Orders candidates by direct usefulness to the user prompt first, then novelty/formalization value. No artificial theorem-count cap.
 
 ```json
 {
@@ -2786,23 +2682,23 @@ All proof prompts pass `temperature=0.0`.
       "theorem_id": "thm_1",
       "statement": "natural-language theorem statement",
       "formal_sketch": "optional note about assumptions, notation, or likely Lean formalization strategy",
-      "novelty_rationale": "why this theorem is non-trivial and worth formalizing"
+      "novelty_rationale": "why this theorem helps the user prompt and is worth formalizing"
     }
   ]
 }
 ```
 
 **Field requirements:**
-- `has_provable_theorems`: Boolean. `true` when at least one non-trivial novel-potential theorem is present.
-- `theorems`: Array of candidates, ranked by novelty potential. **Maximum 5 entries.** Empty array when `has_provable_theorems` is `false`.
+- `has_provable_theorems`: Boolean. `true` when at least one prompt-relevant, non-trivial theorem is present.
+- `theorems`: Array of every prompt-relevant candidate, ordered by direct usefulness to the user prompt first and novelty/formalization value second. Empty array when `has_provable_theorems` is `false`.
 - `theorem_id`: Stable string identifier such as `"thm_1"`, `"thm_2"`, etc.
 - `statement`: Natural-language theorem statement. Required.
 - `formal_sketch`: Optional Lean formalization hints, assumptions, or notation notes.
-- `novelty_rationale`: Brief explanation of why this theorem is non-trivial and worth the cost of Lean verification. Required for each candidate.
+- `novelty_rationale`: Brief explanation of why this theorem helps the USER RESEARCH PROMPT and is worth the cost of Lean verification. Required for each candidate.
 
-**What to extract:** Novel theorems, bold conjectures that can be sharpened, non-obvious connections/bounds/structural results, ambitious claims (the formalization agent narrows if needed).
+**What to extract:** Theorems, supporting lemmas, sharpened conjectures, non-obvious bounds, and structural results that materially help answer, support, or advance the USER RESEARCH PROMPT.
 
-**What to reject:** Trivial identities (e.g. `n + 0 = n`), standard Mathlib restatements, results closable by a single tactic (`simp`, `omega`, `norm_num`, `decide`, `rfl`), tautologies, definitional equalities.
+**What to reject:** Off-prompt mathematical curiosities, trivial identities (e.g. `n + 0 = n`), standard Mathlib restatements, results closable by a single tactic (`simp`, `omega`, `norm_num`, `decide`, `rfl`), tautologies, definitional equalities.
 
 ---
 
@@ -2910,20 +2806,24 @@ All proof prompts pass `temperature=0.0`.
 
 **Function:** `build_proof_novelty_prompt(user_prompt, theorem_statement, lean_code, existing_novel_proofs)`
 
-**Purpose:** Post-verification novelty gate — classifies a Lean-4-verified theorem as novel or known. Does NOT re-check validity. Errs on the side of recognizing novelty for results that required multi-step reasoning or non-trivial formalization work.
+**Purpose:** Post-verification novelty gate — classifies a Lean-4-verified theorem into a novelty tier. Does NOT re-check validity. Errs on the side of recognizing novelty for results that required multi-step reasoning, non-trivial formalization work, or original proof strategy.
 
 ```json
 {
-  "is_novel": true,
+  "novelty_tier": "mathematical_discovery",
   "reasoning": "brief explanation"
 }
 ```
 
 **Field requirements:**
-- `is_novel`: Boolean. `true` → proof enters the highest-priority direct-injection block for all subsequent brainstorm/paper submitters via `proof_database.get_novel_proofs_for_injection()`. `false` → stored in the database but not injected.
+- `novelty_tier`: One of `not_novel`, `novel_formulation`, `novel_variant`, `mathematical_discovery`, or `major_mathematical_discovery`. A proof classified in any tier except `not_novel` enters the highest-priority direct-injection block for all subsequent brainstorm/paper submitters via `proof_database.get_novel_proofs_for_injection()`. Proofs classified as `not_novel` are stored in the database but not injected.
 - `reasoning`: Always required.
 
-**Novel criteria (any one sufficient):** Result not in Mathlib or standard textbooks; new connection/bound/structural insight; formalizes a previously unverified conjecture; non-trivial composition of known results yielding something new; original relative to the existing stored proofs.
+**Novelty tiers:**
+- `novel_formulation`: The mathematical result is historically known, but this Lean 4 formalization or mechanized proof is novel for the research program.
+- `novel_variant`: A non-trivial reformulation, restructuring, generalization, different proof strategy, weaker hypotheses, stronger conclusion, or original composition based on known material.
+- `mathematical_discovery`: A new theorem, bound, connection, structural insight, formally verified conjecture, or independently publishable/citable mathematical contribution.
+- `major_mathematical_discovery`: A possible field-level breakthrough that may be competitive for a major prize or medal in a related field if confirmed and accepted by domain experts. This sits above ordinary `mathematical_discovery`.
 
 **Not novel:** Direct Mathlib restatement; trivial identity or tautology; closable by a single standard tactic (`simp`, `omega`, `norm_num`, `decide`, `rfl`); duplicates an already-stored novel proof.
 
@@ -2936,16 +2836,17 @@ These core requirements apply across all prompt types:
 1. **Internal Content Warning**: All system prompts include the standardized skepticism warning block
 2. **Concrete Format Examples**: Every prompt includes correct/wrong format examples with visual indicators
 3. **Structured Rejection Feedback**: Validators use the standardized rejection format (Reason/Issue/What I Saw/Expected/Fix)
-4. **Compiler Outline Injection**: The compiler outline is always fully injected (never RAGed) for structural framework
-5. **Temperature Policy**: All prompts use temperature=0.0 where API calls allow (deterministic generation) - the context in the program from feedback, etc provide enough variance to avoid looping.
-6. **JSON Preprocessing**: All LLM responses preprocessed by `sanitize_json_response()`
-7. **Exact String Matching**: Document edits use exact verbatim matches with conservative consecutive fuzzy matching fallback for model escaping quirks (85% consecutive + tail anchor + uniqueness required)
-8. **Phase-Based Construction**: Papers written in order: Body → Conclusion → Introduction → Abstract
-9. **Required Sections**: 
+4. **Direct-Solution Preference**: Prompts should prefer the strongest rigorous direct progress toward the user's goal (direct solutions, direct partial solutions, impossibility results, exact reductions, or sharp constraints) and use indirect support only when no stronger direct step is currently justified. Meta-phases such as topic exploration and paper title exploration still output candidates, but those candidates are judged by direct-answer potential instead of being rejected for not being solutions themselves.
+5. **Compiler Outline Injection**: The compiler outline is always fully injected (never RAGed) for structural framework
+6. **Temperature Policy**: Default `temperature=0.0`; only Supercharge candidates and parallel brainstorm submitter lanes may use explicit diversity temperatures. Validators, compiler roles, proof/final roles, and JSON retries stay `0.0`.
+7. **JSON Preprocessing**: All LLM responses preprocessed by `sanitize_json_response()`
+8. **Exact String Matching**: Document edits use exact verbatim matches with conservative consecutive fuzzy matching fallback for model escaping quirks (85% consecutive + tail anchor + uniqueness required)
+9. **Phase-Based Construction**: Papers written in order: Body → Conclusion → Introduction → Abstract
+10. **Required Sections**:
    - **OUTLINE**: Must include Introduction, Body, Conclusion (Abstract is optional - can be "Abstract", "I. Abstract", or "0. Abstract")
    - **PAPER CONSTRUCTION**: Always writes Abstract → Introduction → Body → Conclusion (Abstract is always written during construction phase regardless of outline)
-10. **No Placeholder Output**: Submissions must never contain placeholder markers
-11. **Placeholder Resume Repair**: When resuming from existing paper, missing placeholders are automatically added via `paper_memory.ensure_placeholders_exist()` to prevent "old_string not found" failures
-12. **Fake Placeholder Detection**: System distinguishes real section content from model-inserted fake placeholder text (FULL content >300 chars = real; <300 chars with keywords = fake) to prevent confusion during marker repair
+11. **No Placeholder Output**: Submissions must never contain placeholder markers
+12. **Placeholder Resume Repair**: When resuming from existing paper, missing placeholders are automatically added via `paper_memory.ensure_placeholders_exist()` to prevent "old_string not found" failures
+13. **Fake Placeholder Detection**: System distinguishes real section content from model-inserted fake placeholder text (FULL content >300 chars = real; <300 chars with keywords = fake) to prevent confusion during marker repair
 
 ---
diff --git a/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc b/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc
index 312e9ca..242f663 100644
--- a/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc
+++ b/.cursor/rules/main-rule-3-code-interaction-and-rule-interaction-rules.mdc
@@ -4,7 +4,7 @@ alwaysApply: true
 
 # Code and Rule Interaction Rules
 
-1.) Never introduce a new wait to hault the program unless specifically directed by the user. The program is designed to run until its goal completion or the operator presses stop. Infinite loops are probabalistically avoided due to the feedback mechanics.
+1.) Never introduce a new hidden wait/halt, automatic stop, or loop-disabling cap unless specifically directed by the user or already defined by these rules as an explicit safety valve/user-configurable checkpoint. RALPH/MOTO is designed to run until goal completion or until the operator presses stop; infinite loops are intentional and are probabilistically steered by feedback mechanics, not disabled by agent edits.
 
 2.) Always remove and cleanup old code, do not comment out code or leave broken/unused code in this program unless specifically directed by the user.
 
@@ -18,6 +18,20 @@ alwaysApply: true
 
 7.) Any REST shape, auth contract, WebSocket event, or `/api/features` capability change that affects the web wrapper must update **code, the relevant rule(s), and `api_contract_version` in `/api/features`** in the same approved merge. The live backend's `GET /openapi.json` is the machine-readable REST schema contract.
 
-8.) Only ONE workflow mode may be active at a time (Aggregator, Compiler, or Autonomous Research). This constraint applies identically in both default mode and generic mode.
+8.) Only ONE workflow mode may be active at a time (Aggregator, Compiler, Autonomous Research, or LeanOJ Proof Solver). This constraint applies identically in both default mode and generic mode. Start conflict checks must be serialized and include pending/background-task activity flags such as `autonomous_coordinator.is_active`, not only persisted `state.is_running` fields.
 
-9.) Lean 4 and SMT features are always gated on `lean4_enabled`, `lean4_lsp_enabled`, and `smt_enabled` runtime flags. All three default false, must stay silent and side-effect-free when disabled, and must never ship Lean or Z3 toolchains or Python wheels into `requirements-generic.txt`, `Dockerfile`, or `docker/entrypoint.sh` (hosted image stays Lean-free and Z3-free). Lean 4 is authoritative for every stored proof; SMT contributes hints only.
+9.) Lean 4 and SMT features are always gated on `lean4_enabled`, `lean4_lsp_enabled`, and `smt_enabled` runtime flags. All three default false, must stay silent and side-effect-free when disabled, and must never ship Lean or Z3 toolchains or Python wheels into `requirements-generic.txt`, `Dockerfile`, or `docker/entrypoint.sh` (hosted image stays Lean-free and Z3-free). Lean 4 is the authoritative formal check for every stored proof and is required for LeanOJ final solutions; SMT contributes hints only. Z3 executable paths are trusted startup/operator configuration only, must be rejected as runtime API input, and must resolve to a `z3`/`z3.exe` executable. Automated proof candidates must directly serve the user prompt, not merely be non-trivial or novel.
+
+10.) LeanOJ initial topic generation and brainstorm submitters always run in parallel and feed one validator that batch-validates up to 3 topics/submissions. Initial topic candidates/selection must be broad locked foundation questions covering the whole LeanOJ solution route, not narrow sublemma/tactic/local-repair topics. Recursive brainstorming has no separate recursive-topic prepass and must not re-inject the initial selected topic as active steering context; it uses the shared accepted proof-memory database plus the current proof/failure context. Accepted brainstorm memory must preserve occurrence-specific chronological metadata even for duplicate idea text. Never implement active LeanOJ topic or brainstorm phases as round-robin/serial submitter calls; one hung submitter must not halt the phase.
+
+11.) LeanOJ stop/crash/restart is resumable by default. `Clear Progress` / `/api/leanoj/clear?confirm=true` is the only intentional reset path. Start/restart should choose the best matching/resumable persisted session by proof context, not blindly create a new session or pick the latest file.
+
+12.) LeanOJ OpenRouter credit exhaustion or no-fallback provider configuration errors are non-retryable pauses, not proof-attempt failures. Do not let API credit/config failures inflate final proof attempt loops.
+
+13.) LeanOJ/RALPH final-proof loop checkpoints may only be user-configurable feedback checkpoints, not hidden loop shutdowns. The durable `master_proof.lean` is the authoritative working draft, and every accepted master-proof edit must pass an in-memory Lean gate before persistence: `needs_more_time=true` runs Lean with `sorry`/`admit` placeholders allowed but still requires parse/typecheck, template preservation, and no fake proof devices; `needs_more_time=false` runs Lean placeholder-free and then final semantic review against the user prompt/template before the run stops as verified. Final-proof mode is edit-only: it must not be offered, shown, or taught `stuck_needs_brainstorm`, raw `need_more_brainstorming`, failed-attempt counts, or any path transition. It may see the most recent 5 final attempts as compact execution feedback (Lean errors, stale edit rejections, JSON truncation, watchdog/no-progress notices) so it can avoid repeating failed edits. Lean/template rejection, semantic-review rejection, conservative no-progress/stale-edit watchdog feedback, and validator rejection of non-progressive shortening edits must preserve the master proof and persist structured continuation feedback; non-user-forced no-progress handoffs should gather recursive brainstorm context before re-entering final mode.
+
+14.) LeanOJ/RALPH final verification must remain placeholder-free, but Lean-accepted scaffolds containing `sorry`/`admit` should be saved as partial proofs for future context. Partial proofs are citable incomplete references only; never count them as verified solutions and never accept fake `axiom`/`constant`/`opaque` proof devices.
+
+15.) Parent/user-selected phases have hierarchy precedence over child branches. When a parent phase starts (LeanOJ forced final loop, autonomous paper writing, Tier 3 final answer/final selection), lower-tier brainstorm/topic/path child tasks must stop or be ignored. LeanOJ `Skip Brainstorm` locks the run into the final loop until the configured final-attempt cycle is exhausted; model/path requests for more brainstorming cannot override that user action early. `Force Brainstorm` is a separate explicit user override that returns to recursive brainstorming while preserving proof progress.
+
+16.) LeanOJ prompt flows must guard formal/informal mismatches: treat the Lean template as the formal source of truth, do not silently reinterpret operations such as `Nat` subtraction, sanity-check exact-template formulas on small cases when feasible, and never claim Lean acceptance alone proves the informal problem unless that correspondence is justified.
diff --git a/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc b/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
index f0b5171..702551f 100644
--- a/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
+++ b/.cursor/rules/part-1-aggregator-tool-design-specifications.mdc
@@ -46,7 +46,7 @@ Validator processes 1, 2, or 3 submissions simultaneously using batch-specific p
 
 **Submission context injection**: Direct inject if fits. If too large: RAG the submission as file, keep user prompt direct. If user prompt + RAG'd submission still too large: RAG all user-prompt files. If user prompt itself too large after all RAG: halt with error + diagnostic.
 
-**Hosted upload enforcement (generic mode)**: Server-side validation of `.txt` only, 5 MB max, filename sanitization, path traversal rejection. Applied in both modes but critical for hosted sandboxes where the control plane proxies uploads.
+**Upload/path enforcement**: Server-side validation of `.txt` only, 5 MB max, filename sanitization, path traversal rejection. Upload responses return logical filenames, not absolute host paths. Public Aggregator starts resolve `uploaded_files` only under `user_uploads`; internal autonomous reference-paper context may opt into trusted data-root file references via an explicit coordinator flag.
 
 ## Context Allocation
 
@@ -66,16 +66,21 @@ No context carryover between prompts (only system-intended DB/submission transfe
 
 User selects model per role. Multiple roles can share a model. Models load with user-set context sizes.
 
+Per-role Supercharge is optional. When enabled for a submitter or validator, `api_client_manager.generate_completion()` runs 4 parallel full answer attempts for that role call, then a 5th same-model synthesis call and returns only the synthesis result. Supercharge candidate attempts intentionally use temperatures `[0.0, 0.2, 0.4, 0.8]` to diversify parallel outputs; synthesis remains `0.0`. Candidate attempts are sanitized to reusable visible answer text before synthesis; private thought/channel/control transcript text must never be fed back as feedback, brainstorm memory, or synthesis context. The synthesis prompt frames candidates as optional working material: the model may use one, combine several, ignore all, or write a stronger new answer, while preserving the original role output contract. If Boost applies to that role/task, all internal Supercharge calls use the Boost config first. Tool-call requests bypass Supercharge.
+
+Parallel brainstorm submitter lanes intentionally use temperatures `[0.0, 0.1, ..., 0.9]` by submitter index so every parallel set includes a deterministic lane and increasing exploration lanes. This applies only to parallel submitter generation. Validators, compiler roles, JSON retries, and single-model sequential submitters remain `0.0`.
+
 ## Single-Model Mode
 When ALL submitters AND validator use the same model → single-model mode:
 - Submitters run SEQUENTIALLY (S1 → S2 → ... → Sn)
 - Validator processes all queued submissions after each full submitter round
 - Prevents queue overflow from parallel tasks flooding when LLM completes
+- Exception: if LM Studio reports multiple loaded same-base numeric `:#` instances for that model, submitters may still run in parallel while the LM Studio client routes independent calls to idle sibling instances.
 - Boost does NOT affect single-model detection (routing only, not model config)
 
 ## Multi-Submitter Configuration
 
-Per-submitter: provider (LM Studio / OpenRouter in default mode; OpenRouter only in generic mode), model, OpenRouter host provider, LM Studio fallback (default mode only), context window, max output tokens. UI: "Number of Submitters" selector (1-10), "Copy Main to All" button.
+Per-submitter: provider (LM Studio / OpenRouter in default mode; OpenRouter only in generic mode), model, OpenRouter host provider, LM Studio fallback (default mode only), context window, max output tokens, and Supercharge checkbox. UI: "Number of Submitters" selector (1-10), "Copy Main to All" button.
 
 OpenRouter auto-fill rule: selecting an OpenRouter model auto-fills from endpoint metadata only. Context window uses the smallest relevant host `context_length`; max output tokens use `min(20% of that host context, smallest relevant host max_completion_tokens)`. If `max_prompt_tokens` is available, shrink usable context to respect it. If endpoint caps are incomplete, preserve current values (no guessing).
 
@@ -89,7 +94,7 @@ Accepted submissions database: never truncated. Live preview shows exact non-tru
 
 Every 7th acceptance (`total_acceptances % 7 == 0`, minimum 7 before first review):
 
-**Phase 1**: Validator reviews ALL accepted submissions, identifies AT MOST ONE for removal (redundant, contradicted, superseded, or provides no unique value).
+**Phase 1**: Validator reviews the accepted-submissions database and identifies AT MOST ONE for removal (redundant, contradicted, superseded, or provides no unique value). If the complete database fits, it is direct-injected in full. If it does not fit, cleanup must use the normal direct-first/RAG fallback path instead of skipping or truncating; the review is then evidence-bounded by retrieved context.
 
 **Phase 2** (only if removal proposed): Validator self-validates its removal proposal. Conservative default: if uncertain, reject removal. If validated: execute removal + full RAG rebuild (all shared-training sources are dropped and re-indexed from the post-removal file so deleted content is no longer retrievable).
 
diff --git a/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc b/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
index b50a2d5..35a3455 100644
--- a/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
+++ b/.cursor/rules/part-1-and-part-2-cointeraction-architecture.mdc
@@ -6,12 +6,12 @@ alwaysApply: true
 
  This describes additional architecture for the synergy between the part 1 database aggregator tool and part 2 aggregator-compiler tool. Both modes operate identically in default and generic deployment — the only difference is provider availability (see `hosted-web-contract.mdc` for details on generic mode).
 
- NOTE: This is a continuously-running program that does not stop itself, the user selects the aggregator to start, then starts the compiler when they desire, and then the user choses when to turn off each selective mode by turning the off switch. There is no "solution stop token" as in normal AI solution generation.
+ NOTE: This is a continuously-running program that does not stop itself; the user selects one top-level workflow mode to run and turns it off when desired. There is no "solution stop token" as in normal AI solution generation.
  
  
  ## Aggregator start-up workflow
 1.) The aggregator runs initially with no compiler running.
-2.) The compiler does not begin running until the user starts it manually. Aggregator can run on its own for a head-start for as long as the operator would like. If the operator desires the aggregator can also run by itself without any compilation.
+2.) The compiler does not begin running until the user starts it manually, and current code enforces that Aggregator, Compiler, Autonomous Research, and LeanOJ Proof Solver are mutually exclusive top-level modes. Aggregator can run on its own without any compilation.
 
 ## GUI Design
 
@@ -40,22 +40,34 @@ The live-constructing compiler-written paper should be viewable in one tab and a
 
 **Use Case**: User may have domain knowledge that the brainstorm has explored sufficient territory before the automatic 10-acceptance interval, saving time and allowing manual control over the autonomous workflow.
 
-## Multi-Submitter Architecture (Aggregator Only)
+## Hierarchy / Parent Action Precedence
 
-**Distinction**: Multiple submitters are only available for the Aggregator (Part 1 and Part 3 brainstorm aggregation). The Compiler (Part 2) uses a fixed single-submitter sequential Markov chain workflow.
+Parent workflow actions override child agents immediately. Manual paper writing, forced Tier 3, LeanOJ forced final solving, and final selection phases must stop or fence off any lower-tier brainstorm/topic/path workers before continuing. Never allow stale child outputs to change phase after a parent action has taken ownership.
+
+## Multi-Submitter Architecture (Aggregator and LeanOJ)
+
+**Distinction**: Multiple submitters are available for the Aggregator (Part 1 and Part 3 brainstorm aggregation) and LeanOJ topic/brainstorm phases. The Compiler (Part 2) uses a fixed single-submitter sequential Markov chain workflow.
 
 ### Aggregator Multi-Submitter (Part 1 & Part 3)
 - Configurable 1-10 parallel submitters (default: 3)
 - Each submitter can have its own model, context window, and max output tokens
 - Enables multi-model exploration of different solution basins simultaneously
+- Parallel submitter generation uses the shared temperature ladder `[0.0, 0.1, ..., 0.9]` by submitter index; single-model sequential submitters and validators stay `0.0`.
+- If all submitters and the validator are configured with the same LM Studio model ID, the Aggregator normally uses single-model sequential mode. Exception: when LM Studio reports multiple loaded same-base numeric `:#` instances for that model, submitters may run in parallel and `lm_studio_client` routes independent calls to idle sibling instances while the validator remains ordered.
 - Single validator maintains coherent Markov chain evolution for database alignment
 - UI labels: "Submitter 1 (Main Submitter)", "Submitter 2", "Submitter 3", etc.
 - "Copy Main to All" button for quick configuration
 
+### LeanOJ Topic/Brainstorm Multi-Submitter
+- Configurable 1-10 parallel submitters generate initial topics and brainstorm ideas
+- One validator batch-validates up to 3 completed topics or submissions at a time; initial topics must be broad locked foundation questions for the whole LeanOJ solution route, not narrow lemma/tactic/repair targets
+- Parallel topic/brainstorm submitters use the shared temperature ladder `[0.0, 0.1, ..., 0.9]` by submitter index; LeanOJ validators, final solver, semantic review, and retry/repair calls stay `0.0`.
+- No round-robin/serial submitter awaiting; a hung submitter must not block other submitters or validation
+
 ### Compiler Single-Submitter (Part 2)
 - Fixed 2-submitter architecture (NOT configurable):
   - **High-Context Submitter**: Handles outline_create, outline_update, construction, review modes. During construction, may invoke the Wolfram Alpha tool up to 20 times per submission when `system_config.wolfram_alpha_enabled=true`.
-  - **High-Parameter Submitter**: Handles rigor mode. Rigor is the **Lean-4-verified-theorem flow**: discovery → up to 5 Lean 4 formalization attempts (with error feedback) → novelty classification → placement (2 attempts, validator uses `rigor_lean_placement` mode forcing `rigor_check=True`) → Theorems Appendix fallback. The compiler writes verified proofs directly into the shared `proof_database` (same database used by autonomous mode); novel proofs automatically enter the highest-priority direct-injection block on the next submitter instantiation.
+  - **High-Parameter Submitter**: Handles rigor mode. Rigor is the **Lean-4-verified-theorem flow**: user-prompt-relevant discovery (including explicit extension theorems from partial paper work / outline / supporting context / user prompt when helpful) → up to 5 Lean 4 formalization attempts (with error feedback) → novelty classification → placement routing. Existing-paper-claim theorems may go through inline placement (2 attempts, validator uses `rigor_lean_placement` mode forcing `rigor_check=True`); extension-derived theorems are forced to `placement_preference="appendix_only"` and appended directly to the Theorems Appendix (`placement_outcome="appendix_requested"`). Inline failures still use Theorems Appendix fallback. The compiler writes verified proofs directly into the shared `proof_database` (same database used by autonomous mode); novel proofs automatically enter the highest-priority direct-injection block on the next submitter instantiation.
 - Sequential Markov chain workflow (only one submission at a time)
 - Each compiler submitter has its own model, context, and max token settings (separate from aggregator)
 - UI shows these as separate "High-Context Submitter" and "High-Parameter Submitter" sections
@@ -65,6 +77,7 @@ The live-constructing compiler-written paper should be viewable in one tab and a
 ## Additional Traits Shared Between Aggregator-Submitters and Compiler-Submitters
 
 - The JSON of aggregator-subbmiters and compiler-submitters should include a "reasoning:" request below its "submission:" line. (This forces the submitter to explain the thoughts behind there reasoning and can also reveal deception for additional context for the validator.)
+- MOTO conversational retries must preserve useful failed-output context, but never raw provider/model transcript text. Any assistant replay or reusable feedback/memory excerpt must be sanitized to remove known private thought/channel/control transport scaffolding first while preserving visible mathematical/Lean syntax such as `<|` and literal marker text inside JSON/string content. Parser error strings sent back to models must not include raw output excerpts. Exact tool-call assistant/tool protocol turns are the only exception.
 
 ## API Call Output Notes (User-Configurable)
 - **All `max_tokens` limits are user-configurable via GUI settings** (like context window sizes). Users can adjust these per model role based on their specific models' capabilities.
diff --git a/.cursor/rules/part-2-compiler-tool-design-specification.mdc b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
index b397819..9406396 100644
--- a/.cursor/rules/part-2-compiler-tool-design-specification.mdc
+++ b/.cursor/rules/part-2-compiler-tool-design-specification.mdc
@@ -31,9 +31,11 @@ Before every `_pre_validate_exact_string_match()`, system calls `paper_memory.en
 
 **Provider Selection**: Each compiler role (validator, high-context, high-param, critique submitter) can independently use LM Studio or OpenRouter with optional host provider and LM Studio fallback (default mode). In generic mode, all roles use OpenRouter only; LM Studio options are hidden in the frontend.
 
-**Export Behavior**: Raw text export available in both modes. PDF export (`POST /api/download/pdf`) is desktop-only — generic mode returns `501` (Playwright/Chromium not installed in hosted image).
+**Supercharge**: Each compiler role has an optional Supercharge checkbox. Checked roles run 4 full answer attempts plus a 5th same-model synthesis answer through `api_client_manager.generate_completion()`. If Boost applies, every internal Supercharge call uses the Boost route/model/provider settings first. Tool-call requests bypass Supercharge; this is especially important for the Wolfram-enabled construction loop.
 
-**Aggregator RAG refresh**: Every 10 accepted aggregator submissions (not immediate like aggregator).
+**Export Behavior**: Raw text export available in both modes. PDF export (`POST /api/download/pdf`) is desktop-only — generic mode returns `501` (Playwright/Chromium not installed in hosted image). Server-side PDF rendering must treat submitted HTML as untrusted: sanitize/allowlist content and block external network requests from Playwright.
+
+**Aggregator RAG refresh**: In manual Part 2 runs, the compiler refreshes its aggregator RAG every 10 accepted aggregator submissions (not immediately, unlike the aggregator). Autonomous/Tier 3 compiler runs do not start the manual aggregator monitor because the parent autonomous tier owns the active brainstorm/reference context.
 
 **Enhanced Rejection Feedback Format** (`compiler_rejection_log.py`):
 - Header: "🚫 REJECTED BECAUSE: [Failure Reason]"
@@ -97,20 +99,19 @@ Body content is ALWAYS inserted BEFORE CONCLUSION_PLACEHOLDER. `_apply_edit()` a
 - 4× HC construction → validator
 - 1× HC outline update → validator *(skipped if body complete)*
 - 2× HC review → validator
-- 1× HP rigor → validator *(skipped if body complete)*
+- Then, if body is still active, run the HP Lean-4 theorem-search rigor loop until the first decline. Each successful rigor cycle lands one verified theorem inline or in the Theorems Appendix, then the rigor loop may continue; this is no longer exactly one HP pass.
 
 **Rigor Mode (Lean 4 verified theorems, 4-stage)**:
 The rigor loop no longer rewrites prose. Each rigor cycle:
-- Stage 1 (HP, unvalidated): theorem discovery - using the full writing context, decide if a theorem worth formalizing exists that is not already verified; return `needs_theorem_work=false` to decline and end the rigor loop.
+- Stage 1 (HP, unvalidated): theorem discovery - using the full writing context, decide if a user-prompt-relevant theorem worth formalizing exists that is not already verified; return `needs_theorem_work=false` to decline and end the rigor loop. Discovery is explicitly allowed to construct extension theorems from partial paper work, the outline, supporting context, or the user prompt when helpful to paper construction and/or the user's goal, not only exact claims already written in the current paper.
+- Stage 1 output includes `theorem_origin` (`existing_paper_claim`, `extension_from_partial_work`, `extension_from_user_prompt`) and `placement_preference` (`inline`, `appendix_only`). Extension-derived theorems MUST be forced to `appendix_only`; existing-paper-claim theorems may be inline or appendix-only.
 - Stage 2: `ProofFormalizationAgent.prove_candidate(max_attempts=5)` - up to 5 Lean 4 attempts with error-feedback chaining. On 5 failures: record the candidate via `proof_database.record_failed_candidate` so future cycles see it as an open lemma target; end the rigor cycle as a decline.
 - Stage 3: novelty classification via the shared `assess_proof_novelty` helper; `proof_database.add_proof` persists the verified proof. Novel proofs automatically enter the highest-priority direct-injection block (`proof_database.inject_into_prompt`) on the next submitter instantiation. Non-novel proofs remain available through `/api/proofs` for future user-driven reference selection.
-- Stage 4: placement - HP model proposes an inline edit that introduces the theorem with an explicit "verified in Lean 4" marker and an appendix cross-reference. Validator uses the new `rigor_lean_placement` mode which forces `rigor_check=True` (Lean 4 is the source of mathematical truth) and judges placement/narrative only. Up to 2 placement attempts (attempt 2 gets validator rejection feedback).
-- Appendix fallback: if both placement attempts fail, the verified theorem is appended to the **Theorems Appendix** block (`THEOREMS_APPENDIX_START` / `THEOREMS_APPENDIX_END` bracket markers in `paper_memory.py`). Still counts as a `rigor_acceptance` because the math is preserved.
+- Stage 4: placement - if `placement_preference="inline"`, HP model proposes an inline edit that introduces the theorem with an explicit "verified in Lean 4" marker and an appendix cross-reference. Validator uses `rigor_lean_placement` mode which forces `rigor_check=True` (Lean 4 is the source of mathematical truth) and judges placement/narrative only. Up to 2 placement attempts (attempt 2 gets validator rejection feedback).
+- Appendix routing: if `placement_preference="appendix_only"`, skip inline placement and append directly to the **Theorems Appendix** with `placement_outcome="appendix_requested"`. If inline placement is attempted but both placement attempts fail, append with `placement_outcome="appendix_fallback"`. Both outcomes count as `rigor_acceptance` because the math is preserved.
 - Loop 2 ends on first **decline** (no theorem found OR 5 Lean attempts failed OR Lean 4 disabled). Every verified theorem lands somewhere so there is no "rejection" outcome at the loop level.
 - Config gate: `system_config.lean4_enabled=false` → every rigor cycle declines immediately.
 
-**Decline Mechanisms:**
-- `outline_update`: `needs_update: boolean`
 **Decline Mechanisms:**
 - `outline_update`: `needs_update: boolean`
 - `construction`: `needs_construction: boolean`
@@ -133,24 +134,22 @@ Detection via `_is_body_complete()` in `compiler_coordinator.py`.
 
 ## Critique Phase (Post-Body, Pre-Conclusion)
 
-**"5 total attempts"** = accepted + rejected + declined (not just accepted).
-
-**Max 1 completed rewrite**. Rewrite "completed" only after first successful body acceptance post-rewrite. After 1 completed rewrite, critique phase is skipped entirely.
+**"3 total attempts"** = accepted + rejected + declined (not just accepted).
 
 **Workflow:**
-1. If `rewrite_count >= 1` completed rewrites → skip critique, proceed to conclusion
-2. Critique aggregation: target 5 total attempts
-3. Pre-critique snapshot of paper body
-4. If 5 attempts with ≥1 accepted → rewrite decision; if 0 accepted → skip rewrite
-5. Decisions: **CONTINUE** (minor/incorrect critiques) | **PARTIAL_REVISION** (iterative one-edit-at-a-time loop until `more_edits_needed=false`) | **TOTAL_REWRITE** (catastrophic flaws only)
+1. Critique aggregation: target 3 total attempts
+2. Submitter may critique or decline; validator still validates every critique/decline
+3. If accepted critiques exist, append them to the paper as `AI Self-Review and Limitations`
+4. If 0 critiques are accepted, proceed without adding the section
+5. Transition to conclusion; critique never rewrites paper content
 
-Context for rewrites: pre-critique paper + accepted critiques only (rejected excluded) + accumulated history from prior failed versions.
+The self-review section is inserted after the compiler Theorems Appendix when present, otherwise after the paper conclusion and before the paper anchor. Later autonomous proof appends must stay before this self-review section.
 
-**Decline**: Submitter can assess "no critique needed" if body is academically acceptable (no errors, complete, meets rigor). If 0 accepted critiques at end of 5 attempts → skip rewrite.
+**Decline**: Submitter can assess "no critique needed" if body is academically acceptable (no errors, complete, meets rigor). If no critiques are accepted after 3 attempts, no self-review section is appended.
 
 **Skip Critique (User Override)**: `POST /api/compiler/skip-critique` — available only during active critique phase (`in_critique_phase=True`). Immediately ends critique, transitions to conclusion, broadcasts `critique_phase_skipped` with `reason: "user_override"`. Irreversible.
 
-**WebSocket Events:** `critique_phase_started`, `critique_progress`, `critique_accepted`, `critique_rejected`, `critique_decline_accepted`, `critique_decline_rejected`, `critique_removed`, `critique_phase_ended`, `critique_phase_skipped`, `rewrite_decision_rejected`, `body_rewrite_started`, `phase_transition`, `phase_completion_signal`
+**WebSocket Events:** `critique_phase_started`, `critique_progress`, `critique_accepted`, `critique_rejected`, `critique_decline_accepted`, `critique_decline_rejected`, `critique_removed`, `self_review_appended`, `critique_phase_ended`, `critique_phase_skipped`, `phase_transition`, `phase_completion_signal`
 
 ---
 
@@ -207,11 +206,11 @@ Prevents models' fake placeholder text (e.g., "XI. Conclusion\n*placeholder*") f
 
 Per-role context windows (all user-configurable, default 131072):
 - Validator, High-Context Submitter, High-Parameter Submitter: 131072 tokens each
-- **Settings flow**: All compiler modules read from `system_config.compiler_*` at runtime. The caller that creates `CompilerCoordinator` MUST write settings to `system_config` before init (manual mode: `/api/compiler/start`; autonomous mode: `autonomous_coordinator.py` before `CompilerCoordinator()` creation).
+- **Settings flow**: All compiler modules read from `system_config.compiler_*` at runtime. The caller that creates `CompilerCoordinator` MUST write settings to `system_config` before init (manual mode: `/api/compiler/start`; autonomous mode: `autonomous_coordinator.py` before `CompilerCoordinator()` creation). Per-role Supercharge flags must be passed through `ModelConfig`, not `system_config`.
 - **OpenRouter auto-fill**: Selecting an OpenRouter model auto-fills from endpoint metadata only. Context window uses the smallest relevant host `context_length`; max output tokens use `min(20% of that host context, smallest relevant host max_completion_tokens)`. If `max_prompt_tokens` is available, shrink usable context to respect it. If endpoint caps are incomplete, preserve current values (no guessing).
 - Rigor mode dynamically adjusts RAG budget if outline + system prompts exceed available context
 - Construction mode dynamically adjusts RAG budget when brainstorm content is present: `rag_budget = max(5000, max_allowed - outline_tokens - paper_tokens - brainstorm_tokens - 5000_overhead)`. Brainstorm always direct-injected at full fidelity; RAG evidence scales to fit remaining budget.
-- **Wolfram Alpha as a construction tool**: During `HighContextSubmitter.submit_construction` (body / conclusion / introduction / abstract), when `system_config.wolfram_alpha_enabled=true`, the writer may invoke the `wolfram_alpha_query` OpenAI-compatible tool up to **20 times per submission** to verify factual / computational claims before writing them. On budget exhaustion, the loop forces finalization with tools disabled. Tool audit trail lives in `CompilerSubmission.metadata["wolfram_calls"]`. The validator is not re-invoking Wolfram; it just sees the audit trail. Wolfram tool is NOT available in `outline_create`, `outline_update`, `review`, or the rigor loop.
+- **Wolfram Alpha as a construction tool**: During `HighContextSubmitter.submit_construction` (body / conclusion / introduction / abstract), when `system_config.wolfram_alpha_enabled=true`, the writer may invoke the `wolfram_alpha_query` OpenAI-compatible tool up to **20 times per submission** to verify factual / computational claims before writing them. On budget exhaustion, the loop forces finalization with tools disabled. Tool replies remain model-visible, but logs/WebSocket events expose only redacted metadata and lengths; paper credits store counts only. Wolfram tool is NOT available in `outline_create`, `outline_update`, `review`, or the rigor loop.
 
 **Context rules:** User prompt ALWAYS direct injected. Direct injection first; RAG only when doesn't fit. ~85% RAG retrieval, ~15% direct injections. Halt with error if user prompt exceeds context_window - minimum_RAG_allocation.
 
diff --git a/.cursor/rules/part-3-autonomous-research-mode.mdc b/.cursor/rules/part-3-autonomous-research-mode.mdc
index 091a96e..0b4599b 100644
--- a/.cursor/rules/part-3-autonomous-research-mode.mdc
+++ b/.cursor/rules/part-3-autonomous-research-mode.mdc
@@ -42,6 +42,8 @@ The autonomous coordinator USES actual Part 1 aggregator infrastructure for brai
 - Configures with topic-specific database path (`auto_brainstorms/brainstorm_{topic_id}.txt` under the active instance data root; default desktop path: `backend/data/auto_brainstorms/brainstorm_{topic_id}.txt`)
 - Runs configurable 1-10 submitters + 1 validator workflow (default 3 submitters)
 - Each submitter can have its own model, context window, and max output tokens for multi-model exploration
+- Each role can independently enable Supercharge; child Aggregator coordinators must preserve `supercharge_enabled` from the autonomous role configs.
+- Parallel brainstorm/topic/title exploration submitters inherit the Part 1 temperature ladder; autonomous validators and compiler/final-answer roles stay at temperature `0.0`.
 - SINGLE validator maintains coherent Markov chain evolution (same constraint as Part 1)
 - Monitors acceptance count for completion triggers (every 10 acceptances)
 - Handles pruning (every 7 acceptances) automatically via aggregator
@@ -55,6 +57,7 @@ The autonomous coordinator USES actual Part 1 aggregator infrastructure for brai
 - Stops aggregator when completion review decides to write paper
 - **Phase enforcement**: Construction submitter must check current phase before declaring completion
 - **Premature decline rejection**: Coordinator rejects declines if required sections are missing based on current phase
+- **Parent precedence**: Forced paper writing and forced Tier 3 must stop active child aggregators before the parent tier continues; local exploration/title aggregators must be tracked so they can be stopped.
 
 ### Part 2 Compiler Integration (Tier 2)
 The autonomous coordinator USES actual Part 2 compiler infrastructure for paper compilation:
@@ -68,11 +71,13 @@ Compiler submitters may selectively use, synthesize beyond, or depart from brain
 
 **Critical Implementation Details**:
 - **system_config propagation (REQUIRED)**: Before creating `CompilerCoordinator`, autonomous mode MUST write all compiler context/token settings to `system_config` (e.g., `system_config.compiler_high_context_context_window = self._high_context_context`). Compiler modules read from `system_config` at init — the manual `/api/compiler/start` route does this, but autonomous mode bypasses that route and must do it explicitly. Applies to both `_compile_paper_from_brainstorm()` and `_compile_tier3_paper()`.
+- **Supercharge propagation (REQUIRED)**: Autonomous mode must preserve per-role `supercharge_enabled` for brainstorm submitters, validator, high-context, high-param, critique submitter, proof runtime snapshots, and child Compiler/Aggregator coordinators. This setting lives in role configs / `ModelConfig`, not `system_config`.
 - Constrains section order: Body → Conclusion → Introduction → Abstract
-- Paper is considered complete when abstract is detected in paper content
-- Uses regex patterns to detect and extract abstract section
+- Paper is considered complete when the abstract phase receives an explicit `section_complete: true`
+- Regex patterns may still extract abstract text for metadata, but do not drive phase completion
 - Reference papers are RAG'ed with brainstorm having higher direct injection priority
 - Outline is ALWAYS fully injected (never RAGed) for structural framework integrity
+- Autonomous/Tier 3 compiler runs must not start the manual Part 1 aggregator monitor; the parent tier owns all brainstorm/reference context.
 
 ---
 
@@ -282,12 +287,6 @@ JSON schemas defined in `json-prompt-design.mdc`. Two-step: submitter requests p
 - System intelligently handles large papers via RAG when needed
 - Maximum 3 papers enforced across the topic-cycle selection modes
 
-### Context for Pre-Brainstorm Reference Selection
-- User's high-level research prompt (direct injection)
-- Current brainstorm topic prompt (direct injection)
-- ALL Tier 2 paper titles + abstracts (direct injection if fits, RAG if too large)
-- Instruction: "Select papers that would help inform and enhance exploration of this brainstorm topic"
-
 ### Key Design Points
 - **Same references persist**: References selected here are used for BOTH brainstorming AND paper writing
 - **Additional selection later**: AI can select MORE references (up to 3 total) before paper writing
@@ -318,13 +317,14 @@ The autonomous brainstorm aggregator inherits batch validation from Part 1 infra
 1. **Topic-Specific Database**: Writes to `auto_brainstorms/brainstorm_{topic_id}.txt` under the active instance data root (default desktop path: `backend/data/auto_brainstorms/brainstorm_{topic_id}.txt`) instead of `rag_shared_training.txt`
 2. **No User-Provided Topic Prompt**: Uses the AI-generated brainstorm topic prompt
 3. **Completion Tracking**: Tracks acceptance count (including removals) for completion review trigger
-4. **Hard Limit**: 30 accepted submissions (FORCE transition to paper writing, no completion review)
+4. **Deletion Safety**: An active/current brainstorm must not be deleted while autonomous research or its aggregator is running; if its metadata or database disappears, aggregation must stop and clear stale coordinator pointers rather than recreate an invisible DB.
+5. **Hard Limit**: 30 accepted submissions (FORCE transition to paper writing, no completion review)
    - Purpose: Prevents runaway brainstorms from accumulating indefinitely
    - Trigger: After each acceptance, check if count >= 30
    - Behavior: Immediately transition to paper writing, skip completion review
    - WebSocket event: `brainstorm_hard_limit_reached`
    - **TOTAL across all rounds**: When `continue_existing` resumes an incomplete brainstorm, the 30-cap applies to the TOTAL acceptance count (prior + new). The aggregator loop tracks a `resume_acceptance_base` offset so `_acceptance_count` always reflects the true total. If a topic already has >= 30 acceptances on entry, aggregation is skipped entirely and paper writing is forced immediately.
-5. **Rejection Hard Limit**: 10 consecutive rejections (with minimum 5 acceptances) FORCE transition to paper writing
+6. **Rejection Hard Limit**: 10 consecutive rejections (with minimum 5 acceptances) FORCE transition to paper writing
    - Purpose: Prevents infinite rejection loops when brainstorm is exhausted
    - Trigger: After rejection, check if consecutive rejections >= 10 AND acceptances >= 5
    - Behavior: Immediately transition to paper writing, skip completion review
@@ -500,30 +500,6 @@ Same two-step browsing workflow as pre-brainstorm selection (expand request →
 
 **Prompts**: `paper_title_exploration_prompts.py` — `build_title_exploration_user_prompt()` frames the aggregation task for candidate title generation with context: user prompt, topic, brainstorm summary, existing papers, reference papers.
 
-### Paper Title Exploration (Pre-Title Candidate Brainstorm)
-
-**Purpose**: Before committing to a paper title, the system collects 5 validated candidate titles using the Part 1 aggregator infrastructure. The final title selection then chooses from candidates, synthesizes them, or proposes a new title with justification.
-
-**Architecture**: Uses `AggregatorCoordinator` from Part 1 — same parallel submitters + batch validator, but with **cleanup/pruning disabled** (`enable_cleanup_review=False`) since target is only 5 candidates.
-
-**Applies to EVERY paper creation**: Tier 2 papers (1/2/3 from brainstorm), Tier 3 short-form, Tier 3 gap/intro/conclusion chapters.
-
-**Workflow**:
-1. Aggregator starts with all configured submitters running in parallel
-2. Submitters generate candidate paper titles as standard submissions
-3. Validator checks quality, relevance, and DIVERSITY (rejects near-duplicates)
-4. Accepted candidates accumulate in temp title DB
-5. Coordinator stops at 5 acceptances (or 15 consecutive rejections safety valve)
-6. Reads title DB, formats as candidate list for final title selection
-
-**Temp DB**: `title_candidates_{topic_id}.txt` in brainstorms dir (cleaned up after phase)
-
-**WebSocket Events**: `paper_title_exploration_started`, `paper_title_exploration_progress`, `paper_title_exploration_complete`
-
-**Crash Recovery**: On resume, exploration restarts fresh (short phase, no state to preserve).
-
-**Prompts**: `paper_title_exploration_prompts.py` — `build_title_exploration_user_prompt()` frames the aggregation task for candidate title generation with context: user prompt, topic, brainstorm summary, existing papers, reference papers.
-
 ### Paper Title Selection
 
 **Context**:
@@ -618,24 +594,17 @@ The validator will REJECT any outline missing these required sections or with in
 - Cannot skip to conclusion/introduction/abstract
 
 **Critique Phase (Post-Body, Pre-Conclusion)**:
-- **Maximum Rewrites**: 1 completed rewrite allowed. Rewrite counts as "completed" only after first successful body acceptance. After 1 completed rewrite, critique phase is skipped.
-- **Pre-Critique Snapshot**: Paper body snapshotted at critique phase start (for rewrite context)
-- **Triggered**: Automatically when body construction completes (unless rewrite_count >= 1 completed rewrites)
+- **Triggered**: Automatically when body construction completes
 - **Purpose**: Peer review body section before proceeding to conclusion
-- **Target**: 5 total attempts (accepted + rejected + declined)
+- **Target**: 3 total attempts (accepted + rejected + declined)
 - **Decline Mechanism**: Submitter can assess "no critique needed" if body is academically acceptable (no mathematical errors, all outline requirements met, proper rigor)
-- **Skip Rewrite**: If 5 total attempts complete with 0 accepted critiques, skip rewrite phase and continue to conclusion
-- **Rewrite Decision**: If 5 total attempts reached with ≥1 acceptance, submitter decides: continue / partial_revision / total_rewrite
-- **Decision Options**:
-  - **CONTINUE**: Critiques minor/incorrect, proceed to conclusion
-  - **PARTIAL_REVISION**: **ITERATIVE** edits - proposes ONE edit at a time, validates, applies, sees result, then proposes next. Context includes pre-critique paper + current paper + accepted critiques.
-  - **TOTAL_REWRITE**: Clear entire body and rebuild from scratch (catastrophic flaws only). Receives pre-critique paper + accepted critiques for context.
-- **Accumulated History**: All critiques from all previous failed versions are provided to rewrite decision
-- **Context for Rewrites**: Pre-critique paper (shows what failed) + accepted critiques ONLY (rejected critiques NOT included)
-- **JSON Schema**: `{"critique_needed": true/false, "submission": "...", "reasoning": "..."}` for critiques; `{"decision": "continue|partial_revision|total_rewrite", "new_title": null, "new_outline": null, "reasoning": "..."}` for rewrite decision (note: edit_operations removed, now iterative)
+- **Self-Review Append**: If accepted critiques exist after 3 attempts, append them as `AI Self-Review and Limitations`; if 0 critiques are accepted, continue without the section
+- **No Rewrites**: Critiques never trigger partial revision, total rewrite, body clearing, title changes, or outline updates
+- **Placement**: Self-review is final reader-facing content after the compiler Theorems Appendix/proof section when present, otherwise after the conclusion; later proof appends must stay before self-review
+- **JSON Schema**: `{"critique_needed": true/false, "submission": "...", "reasoning": "..."}` for critiques only
 
 **Skip Critique Phase (User Override)**:
-- **Purpose**: Allow users to manually skip the critique/rewrite phase and proceed directly to conclusion
+- **Purpose**: Allow users to manually skip the critique/self-review phase and proceed directly to conclusion
 - **API Endpoint**: `POST /api/auto-research/skip-critique`
 - **Availability**: Any time during Tier 2 paper writing
 - **Behavior**:
@@ -765,8 +734,8 @@ When abstract is written and validated, the paper is considered COMPLETE. Additi
    - Uses validator model from current session configuration
    - Calculates average rating: `(novelty + correctness + impact) / 3`
    - Saves critique to paper's critique storage
-   - If average rating ≥ 7.0, emits `high_score_critique` WebSocket event
-   - Frontend displays popup notification (max 3, FIFO queue)
+   - If average rating ≥ 6.25, emits `high_score_critique` WebSocket event
+   - Frontend displays popup notification (max 3, FIFO queue) and recovers missed high-score popups from saved paper critique badges on reload/poll
    - Non-blocking: errors logged but don't affect paper completion
    - See "Auto-Critique Popup Notifications" section below for details
 
@@ -798,9 +767,9 @@ JSON schema defined in `json-prompt-design.mdc`. Fields: `should_remove` (bool),
    - Maximum 1 removal per review cycle
 
 5. **Execution**:
-   - If removal validated: Move paper to `auto_papers/archive/` under the active instance data root (default desktop path: `backend/data/auto_papers/archive/`)
-   - Update metadata to mark as "archived"
-   - Update statistics
+   - If removal validated: prune the paper into `auto_papers/pruned/` (or the session `papers/pruned/` directory) with `pruned_paper_{paper_id}*` filenames and a top-of-file `PRUNED PAPER - REMOVED FROM MODEL CONTEXT` banner
+   - Update metadata to mark `status="pruned"`, store prune reason/actor/time, and remove active RAG sources for that paper
+   - Pruned papers are excluded from all future model context/reference selection, but remain visible and downloadable for the user until they explicitly delete all pruned papers
 
 ### Return to Topic Selection / Brainstorm Multi-Paper Continuation
 
@@ -1031,10 +1000,10 @@ Wolfram Alpha Verifications: 3 queries
 
 **Wolfram Alpha Verification Tracking**:
 - Wolfram Alpha API calls are tracked separately from LLM API calls
-- Only ACCEPTED Wolfram verifications are counted (where result was added to paper via validated rigor submission)
+- Only Wolfram calls attached to accepted construction submissions are counted in paper credits
 - Displayed in MODEL CREDITS section below LLM model list
 - Format: "Wolfram Alpha Verifications: N queries"
-- Tracking happens in `compiler_coordinator._submit_and_validate_rigor()` after validator acceptance
+- Tracking happens in `compiler_coordinator._track_submission_wolfram_calls()` after validator acceptance
 - If no Wolfram calls made, this line is omitted from credits
 - **Graceful edge case handling**: Credits show even if only Wolfram calls exist (no model tracking data), or if only model calls exist (no Wolfram calls)
 
@@ -1049,7 +1018,7 @@ class PaperMetadata(BaseModel):
 
 **PaperModelTracker Class** (`backend/autonomous/memory/paper_model_tracker.py`):
 - `track_call(model_id)`: Record an API call for a model
-- `track_wolfram_call(query)`: Record a Wolfram Alpha verification
+- `track_wolfram_call(query)`: Increment the Wolfram verification count; query text is not persisted for credits
 - `get_wolfram_call_count()`: Get total Wolfram queries
 - `has_tracking_data()`: Returns True if any model calls OR Wolfram calls exist (handles edge cases gracefully)
 - `get_models_dict()`: Get Dict[str, int] for metadata storage
@@ -1220,10 +1189,12 @@ Main component for displaying Tier 3 status and content:
   - Back button to return to list
 
 **API Endpoints**:
-- `GET /auto-research/final-answer/{answer_id}/archive/papers` - List archived papers
-- `GET /auto-research/final-answer/{answer_id}/archive/papers/{paper_id}` - Get paper details
-- `GET /auto-research/final-answer/{answer_id}/archive/brainstorms` - List archived brainstorms
-- `GET /auto-research/final-answer/{answer_id}/archive/brainstorms/{topic_id}` - Get brainstorm details
+- `GET /api/auto-research/final-answer/{answer_id}/archive/papers` - List archived papers
+- `GET /api/auto-research/final-answer/{answer_id}/archive/papers/{paper_id}` - Get paper details
+- `GET /api/auto-research/final-answer/{answer_id}/archive/brainstorms` - List archived brainstorms
+- `GET /api/auto-research/final-answer/{answer_id}/archive/brainstorms/{topic_id}` - Get brainstorm details
+
+Archive IDs are untrusted path components. Resolve `answer_id`, `paper_id`, and `topic_id` with `validate_single_path_component()` / `resolve_path_within_root()` before reading archived files.
 
 **Design Principles**:
 - Non-intrusive: Button is discrete, not prominently displayed
@@ -1249,17 +1220,17 @@ Main component for displaying Tier 3 status and content:
 
 Runs automatically after every completed brainstorm (Tier 1) and every completed paper (Tier 2 / Tier 3 chapter), gated on `system_config.lean4_enabled`. Silent no-op when disabled.
 
-**Proof Framing Gate (one-shot, at autonomous start)**: When `lean4_enabled`, the coordinator runs `_run_proof_framing_gate()` before research begins. A single LLM call on the user prompt decides `is_proof_amenable` (`build_proof_framing_gate_prompt` → `autonomous_proof_framing_gate` role). The gate errs on the side of `true` — it returns `false` only when the prompt is purely empirical, engineering-focused, or has no meaningful mathematical content. If `true`, `PROOF_FRAMING_CONTEXT` (which directs submissions to pursue **novel, non-trivial** theorems and explicitly discourages standard identities and Mathlib restatements) is appended to every subsequent submitter prompt via `_append_proof_framing()` and persisted to workflow state for crash recovery. Decision is broadcast via `proof_framing_decided`. Silent no-op when disabled or when the prompt is not proof-amenable.
+**Proof Framing Gate (one-shot, at autonomous start)**: When `lean4_enabled`, the coordinator runs `_run_proof_framing_gate()` before research begins. A single LLM call on the user prompt decides `is_proof_amenable` (`build_proof_framing_gate_prompt` → `autonomous_proof_framing_gate` role). The gate errs on the side of `true` when formal proof can help the user's prompt — it returns `false` when the prompt is purely empirical, engineering-focused, or has no meaningful prompt-relevant mathematical content. If `true`, `PROOF_FRAMING_CONTEXT` (which directs submissions to pursue theorems/lemmas/formalizations that directly answer, support, or advance the user prompt, with novelty/non-triviality valuable only inside that boundary) is appended to every subsequent submitter prompt via `_append_proof_framing()` and persisted to workflow state for crash recovery. Decision is broadcast via `proof_framing_decided`. Silent no-op when disabled or when the prompt is not proof-amenable.
 
 **Pipeline** (`backend/autonomous/core/proof_verification_stage.py`):
-1. **Candidate identification** — `ProofIdentificationAgent` (`build_proof_identification_prompt`) extracts up to 5 novel, non-trivial theorem candidates from brainstorm or paper content, ranked by novelty potential. Trivial identities, textbook restatements, and single-tactic-closable results are filtered out at this stage before any Lean 4 cost is incurred.
-2. **Optional Mathlib lemma search** — `MathlibLemmaSearchAgent` surfaces relevant existing lemmas into the formalization prompt
+1. **Candidate identification** — `ProofIdentificationAgent` (`build_proof_identification_prompt`) extracts every prompt-relevant, non-trivial theorem candidate from brainstorm or paper content. Candidates are ordered by direct usefulness to the user prompt first, then novelty/formalization value; there is no artificial theorem-count cap. Trivial identities, off-prompt curiosities, textbook restatements, and single-tactic-closable results are filtered out before any Lean 4 cost is incurred.
+2. **Optional Mathlib lemma search** — `MathlibLemmaSearchAgent` surfaces relevant existing lemmas into the formalization prompt, tied to the target theorem and user prompt
 3. **Optional SMT early-exit** — when `smt_enabled`, `SmtClient` classifies candidates conservatively; successful SMT results become Lean tactic hints (nativeDecide / omega / decide style), never stored as standalone proofs
 4. **Lean 4 formalization attempts** — two-phase retry: up to 3 full-proof attempts via `ProofFormalizationAgent.prove_candidate`, then up to 2 multi-tactic script attempts via `prove_candidate_tactic_script` (5 total per candidate). Prior `FailedProofCandidate` failure hints from `proof_database.inject_failure_hints_into_prompt()` thread into each retry.
 5. **Novelty check** — `autonomous_proof_novelty` role compares verified proof against existing proof library
-6. **Storage** — `proof_database.add_proof()` persists novel and known proofs as session-aware records (`proofs_index.json`, `proof_<id>.json`, `proof_<id>_lean.lean`) with extracted `ProofDependency` records and reverse Mathlib usage index. Verified proofs are also appended as a "Verified Proofs" section at the bottom of the source brainstorm DB and/or paper file via `append_proofs_section()`. Cross-session read access is provided by `proof_database.list_proof_library()` (all sessions, novelty-filtered) and `proof_database.get_library_proof(session_id, proof_id)`, consumed by the `ProofLibrary` UI component and `/api/proofs/library` endpoints.
+6. **Storage** — `proof_registration.register_verified_lean_proof()` uses `proof_database.add_proof_if_absent()` to atomically persist novel and known proofs as session-aware records (`proofs_index.json`, `proof_<id>.json`, `proof_<id>_lean.lean`) with extracted `ProofDependency` records and reverse Mathlib usage index. Duplicate detection is scoped to source type/id + normalized theorem statement + normalized Lean code and must return `duplicate=True` to callers so source files are not appended twice. If `proofs_index.json` is corrupt, rebuild from existing `proof_*.json` record files instead of replacing the library with an empty index. Verified proofs are appended as a "Verified Proofs" section at the bottom of the source brainstorm DB and/or paper file via `append_proofs_section()` only for non-duplicate novel records. Cross-session read access is provided by `proof_database.list_proof_library()` (all sessions, novelty-filtered) and `proof_database.get_library_proof(session_id, proof_id)`, consumed by the `ProofLibrary` UI component and `/api/proofs/library` endpoints.
 
-**Parallelism (two-phase execution per stage run)**: Steps 2–4 above (the per-candidate "Phase A" pipeline: lemma search → optional SMT hint → `prove_candidate` → `prove_candidate_tactic_script` → `proof_attempts_exhausted` broadcast on failure) run concurrently across *all* identified candidates inside a single `ProofVerificationStage.run()` invocation, bounded by `system_config.proof_max_parallel_candidates` (default 6, env: `MOTO_PROOF_MAX_PARALLEL_CANDIDATES` / `PROOF_MAX_PARALLEL_CANDIDATES`) via an `asyncio.Semaphore`. Phase A parallelizes agent/model work, but actual Lean 4 subprocess verification is serialized by `Lean4Client` behind a shared execution lock so all candidates queue one-at-a-time against the shared Mathlib workspace; LSP mode remains independently serialized by its operation lock and subprocess fallback uses the same shared queue. The identification stage (step 1) caps candidates at 5 and filters trivial/well-known results before Phase A begins, so Phase A only processes genuinely novel-potential theorems. Completed candidates are consumed by the driver loop through `asyncio.as_completed`, and steps 5–6 (the "Phase B" post-processing: novelty assessment, `add_proof`, dependency extraction via `ProofDependencyExtractor`, `append_proofs_section`, `novel_proof_discovered` / `known_proof_verified` broadcast, `record_failed_candidate` for brainstorm failures) are performed strictly **one-at-a-time** in Phase-A completion order inside that driver loop so later candidates can observe earlier stored proofs as MOTO dependencies. Each Phase-A task instantiates its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` so the per-agent `task_sequence` counter cannot collide across concurrent candidates. 
If any Phase-A task raises `FreeModelExhaustedError` (or any other exception), the driver cancels all still-running sibling tasks and re-raises so the coordinator's recovery path runs with no orphaned background API calls. `should_stop` is plumbed into each Phase-A pipeline and checked before each Phase-B pass, so a stop-request short-circuits cleanly without leaking tasks.
+**Parallelism (two-phase execution per stage run)**: Steps 2–4 above (the per-candidate "Phase A" pipeline: lemma search → optional SMT hint → `prove_candidate` → `prove_candidate_tactic_script` → `proof_attempts_exhausted` broadcast on failure) run concurrently across *all* identified candidates inside a single `ProofVerificationStage.run()` invocation, bounded by `system_config.proof_max_parallel_candidates` (default 6, env: `MOTO_PROOF_MAX_PARALLEL_CANDIDATES` / `PROOF_MAX_PARALLEL_CANDIDATES`) via an `asyncio.Semaphore`. Phase A parallelizes agent/model work, but actual Lean 4 subprocess verification is serialized by `Lean4Client` behind a shared execution lock so all candidates queue one-at-a-time against the shared Mathlib workspace; LSP mode remains independently serialized by its operation lock and subprocess fallback uses the same shared queue. The identification stage (step 1) filters off-prompt, trivial, and well-known results before Phase A begins, so Phase A only processes prompt-relevant theorem candidates. Completed candidates are consumed by the driver loop through `asyncio.as_completed`, and steps 5–6 (the "Phase B" post-processing: novelty assessment, `add_proof`, dependency extraction via `ProofDependencyExtractor`, `append_proofs_section`, `novel_proof_discovered` / `known_proof_verified` broadcast, `record_failed_candidate` for brainstorm failures) are performed strictly **one-at-a-time** in Phase-A completion order inside that driver loop so later candidates can observe earlier stored proofs as MOTO dependencies. Each Phase-A task instantiates its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` so the per-agent `task_sequence` counter cannot collide across concurrent candidates. If any Phase-A task raises `FreeModelExhaustedError` (or any other exception), the driver cancels all still-running sibling tasks and re-raises so the coordinator's recovery path runs with no orphaned background API calls. 
`should_stop` is plumbed into each Phase-A pipeline and checked before each Phase-B pass, so a stop-request short-circuits cleanly without leaking tasks.
 
 **Rigor mode is NOT parallelized** (compiler Part 2): `submit_rigor_lean_theorem()` runs one candidate per rigor cycle by design (discovery → 5 Lean attempts → novelty → placement) and the outer `_rigor_loop` drives cycles serially so each proven theorem can land in the paper before the next discovery sees updated context. The parallel candidate pipeline lives only in `ProofVerificationStage`.
 
@@ -1269,11 +1240,11 @@ Runs automatically after every completed brainstorm (Tier 1) and every completed
 
 **Subprocess vs LSP**: `lean4_client` runs Lean via subprocess by default. When `lean4_lsp_enabled`, a persistent LSP-style process reduces cold-start overhead; the subprocess path remains the fallback and must keep working when LSP is disabled. Missing/corrupt Mathlib `.olean` diagnostics are infrastructure failures, not proof failures: the client must re-check workspace readiness inside the serialized Lean execution queue, invalidate readiness when the cache is bad, refetch the Mathlib cache, retry the same Lean check once, and return a distinct `LEAN 4 WORKSPACE ERROR` if repair still fails. Future checks may attempt repair again after external fixes or transient failures clear, but the current failed check must not burn proof attempts as ordinary Lean feedback.
 
-**Manual proof checks** (Build 5): `POST /api/proofs/check` reuses `ProofVerificationStage.run_manual()` with the stored `ProofRuntimeConfigSnapshot` (brainstorm / paper / validator role configs captured during autonomous startup). Readiness is surfaced via `/api/proofs/status.manual_check_ready` + `manual_check_message`. Required state: `lean4_enabled=True` AND a runtime snapshot must exist (start autonomous research once to seed it).
+**Manual proof checks** (Build 5): `POST /api/proofs/check` reuses `ProofVerificationStage.run_manual()` with the stored `ProofRuntimeConfigSnapshot` (brainstorm / paper / validator role configs captured during autonomous startup). Manual checks may target any brainstorm with content, including in-progress brainstorms; papers remain completed-only. Readiness is surfaced via `/api/proofs/status.manual_check_ready` + `manual_check_message`. Required state: `lean4_enabled=True` AND a runtime snapshot must exist (start autonomous research once to seed it).
 
 **Proof runtime config snapshot** (`research_metadata.set_proof_runtime_config`): Captures a `ProofRuntimeConfigSnapshot` with three `ProofRoleConfigSnapshot` entries — `brainstorm` (from first aggregator submitter config), `paper` (from high-context submitter config), `validator` (from validator config). Each holds provider, model_id, openrouter_provider, lm_studio_fallback_id, context_window, and max_output_tokens. Lets manual checks run without an active autonomous session.
 
-**Proof WebSocket events** (all broadcast through the standard `/api/ws` stream):
+**Proof WebSocket events** (all broadcast through the standard `/api/ws` stream). `proof_verified` is emitted only after the proof has passed integrity checks and has been registered/reused in the proof database; payloads include `proof_id`.
 - `proof_framing_decided`
 - `proof_check_started`, `proof_check_complete`, `proof_check_no_candidates`
 - `proof_check_candidates_found`, `mathlib_lemmas_suggested`
@@ -1293,10 +1264,11 @@ Runs automatically after every completed brainstorm (Tier 1) and every completed
 7. Proof certificates stay text-based (`.lean` source + JSON metadata) — no binary artifacts
 8. Hosted/generic mode keeps `lean4_enabled` and `smt_enabled` default false and the hosted image stays Lean-free and Z3-free (no proof binaries in the `python:3.12-slim` runtime)
 9. Proof framing gate runs once per autonomous start and only when `lean4_enabled`; the resulting `proof_framing_active` flag and `PROOF_FRAMING_CONTEXT` are persisted in workflow state for crash recovery
-10. Candidate identification (`build_proof_identification_prompt`) is a novelty-seeking gate — it rejects trivial identities, textbook restatements, and single-tactic-closable results, and returns **at most 5** candidates ranked by novelty potential. Every candidate that passes this gate is attempted — Phase A is bounded by `proof_max_parallel_candidates` but never truncates the post-identification candidate list; Phase A agent/model work runs concurrently across candidates while actual Lean 4 subprocess verification queues one-at-a-time through `Lean4Client`, and Phase B (novelty / `add_proof` / dependency extraction / brainstorm+paper `append_proofs_section` / novel/known broadcasts / `record_failed_candidate`) remains strictly serialized in Phase-A completion order so intra-batch MOTO dependencies and per-source proof appending stay coherent
+10. Candidate identification (`build_proof_identification_prompt`) is a user-prompt relevance gate first and a novelty/non-triviality gate second — it rejects off-prompt curiosities, trivial identities, textbook restatements, and single-tactic-closable results, then returns every prompt-relevant candidate ordered by direct usefulness to the user prompt. Every candidate that passes this gate is attempted — Phase A is bounded by `proof_max_parallel_candidates` but never truncates the post-identification candidate list; Phase A agent/model work runs concurrently across candidates while actual Lean 4 subprocess verification queues one-at-a-time through `Lean4Client`, and Phase B (novelty / `add_proof` / dependency extraction / brainstorm+paper `append_proofs_section` / novel/known broadcasts / `record_failed_candidate`) remains strictly serialized in Phase-A completion order so intra-batch MOTO dependencies and per-source proof appending stay coherent
 11. Each Phase-A task owns its own `ProofIdentificationAgent` / `MathlibLemmaSearchAgent` / `ProofFormalizationAgent` instance to keep per-agent `task_sequence` counters collision-free; any Phase-A exception (including `FreeModelExhaustedError`) must cancel all sibling tasks and re-raise so the coordinator's recovery path runs without orphaned background API calls
 12. `should_stop` propagates into Phase A and is re-checked before each Phase-B pass so stop-requests short-circuit without leaking tasks or partially-applied Phase-B writes
-13. Compiler rigor mode (`submit_rigor_lean_theorem`, `_rigor_loop`) is NOT parallelized — rigor cycles discover, verify, and place one theorem per cycle so each verified theorem lands in the paper before the next discovery; the parallel candidate pipeline lives only in `ProofVerificationStage`
+13. Compiler rigor mode (`submit_rigor_lean_theorem`, `_rigor_loop`) is NOT parallelized — rigor cycles discover, verify, and route one theorem per cycle (inline for eligible existing-paper claims, appendix-only for extension-derived theorems or placement fallback) so each verified theorem lands in the paper before the next discovery; the parallel candidate pipeline lives only in `ProofVerificationStage`
+14. Post-Lean integrity scanning rejects newly introduced `axiom`, `constant`, and `opaque` declarations even when the declaration name appears on following lines. Generated source text is not an authorization baseline unless explicitly passed as an allowed baseline.
 
 ---
 
@@ -1324,6 +1296,8 @@ Contains abstract only.
 
 Contains complete brainstorm database that sourced this paper.
 
+**Pruned Papers**: `auto_papers/pruned/pruned_paper_{paper_id}.txt` (or session `papers/pruned/`) preserves papers removed from model context. The raw file begins with a `PRUNED PAPER - REMOVED FROM MODEL CONTEXT` banner and is for user review/download only. Companion metadata/abstract/outline files use the same `pruned_` prefix. Brainstorms do not use this soft-prune preservation feature.
+
 ### Research Metadata File
 
 **File**: `auto_research_metadata.json` under the active instance data root (default desktop path: `backend/data/auto_research_metadata.json`)
@@ -1334,26 +1308,32 @@ Contains complete brainstorm database that sourced this paper.
 
 **File**: `auto_workflow_state.json` under the active instance data root (default desktop path: `backend/data/auto_workflow_state.json`)
 
-This file persists the current workflow state to enable **automatic resume** after program restart or crash. The system automatically saves this state at key checkpoints:
+This file persists the current workflow state to enable **automatic resume** after program restart, crash, or user stop. The system automatically saves this state at key checkpoints:
 
 - After topic selection (starting brainstorm aggregation)
 - Periodically during brainstorm aggregation (every 5 acceptances)
+- Before and after brainstorm proof verification (`paper_phase="brainstorm_proof_verification"` / `pre_paper_compilation`)
 - When transitioning to paper compilation
-- During paper writing phases
+- During paper writing phases (`body`, `conclusion`, `introduction`, `abstract`)
+- Before completed-paper proof verification (`paper_phase="paper_proof_verification"`)
 - **During Tier 3 final answer generation phases**
 
-On **clean stop** (user-initiated via stop button), this file is automatically cleared.
+On **clean stop** (user-initiated via stop button), this file is preserved for pause/resume. Only `clear_all_data()` should clear workflow state. `_save_workflow_state()` must preserve the previous `paper_phase` when called without an explicit phase, and only clear the phase when passed `phase=None` intentionally after successful completion.
 
-On **restart/crash recovery**, if this file exists with `is_running: true`, the system detects an interrupted workflow and:
+On **restart/crash recovery**, if this file exists with a resumable tier/topic/paper (regardless of `is_running`), the system detects an interrupted workflow and:
 1. Restores internal state (topic ID, acceptance counts, model config, etc.)
-2. Automatically resumes from the last known phase
-3. Broadcasts `auto_research_resumed` WebSocket event
+2. Recovers stale acceptance counts from brainstorm metadata/database files when workflow state says `0`
+3. Automatically resumes from the last known phase; completed brainstorms never re-enter aggregation and instead resume at proof/paper handoff
+4. Detects completed papers paused before proof verification and resumes `paper_proof_verification` before moving on
+5. Broadcasts `auto_research_resumed` WebSocket event
+
+If `workflow_state.json` is stale, idle, or missing, session recovery must conservatively synthesize a resume point from durable `session_stats.json`, brainstorm metadata/database files, and in-progress paper metadata/content. This includes scanning `papers/*_metadata.json` for `status="in_progress"` when stats lost `current_paper_id`; the resume phase is detected from saved paper content rather than defaulting to body.
 
 
 **Important Notes:**
 - The user research prompt is saved in `auto_research_metadata.json`, not the workflow state
 - Model configuration is saved to allow resuming with the same model settings
-- If the workflow state file is corrupted or missing, the system starts fresh
+- If the workflow state file is corrupted or missing, first try durable session-file recovery; start fresh only if no current topic, in-progress paper, completed unpapered brainstorm, completed papers, or active Tier 3 state can be recovered
 - The `clear_all_data` API endpoint clears the workflow state along with all other data
 
 ---
@@ -1501,7 +1481,7 @@ Paper library component:
 Persistent popup notification component for high-scoring paper critiques:
 - **Fixed position**: Bottom-right corner with z-index 999999
 - **Max 3 notifications**: FIFO queue (oldest removed when 4th arrives)
-- **Trigger condition**: Paper completed with validator critique avg rating ≥ 7.0
+- **Trigger condition**: Paper has validator critique avg rating ≥ 6.25
 - **Each notification displays**:
   - Paper title (truncated to 2 lines)
   - Average rating with color coding (green ≥8, blue ≥7)
@@ -1511,9 +1491,9 @@ Persistent popup notification component for high-scoring paper critiques:
 - **Interactions**:
   - Click anywhere (except X) → opens `PaperCritiqueModal` with full critique
   - Click X → dismisses notification with slide-out animation
-- **Persistence**: Stays visible across all screens until dismissed (not saved to localStorage)
+- **Persistence**: Stays visible across screens until dismissed; dismissed/clicked high-score popup keys are stored in localStorage so missed WebSocket events can be replayed once from saved paper critique ratings without repeating forever
 - **Styling**: Purple gradient, compact design (~250px × ~80px), smooth animations
-- **WebSocket Integration**: Listens to `high_score_critique` event from backend
+- **WebSocket Integration**: Listens to `high_score_critique` event from backend and de-duplicates against recovered paper-list notifications
 
 **State Management** (in App.jsx):
 - `critiqueNotifications` array stores active notifications
@@ -1535,7 +1515,7 @@ Settings integrated into main Settings panel:
 Metrics and logging component:
 - Real-time metrics:
   - Total brainstorms (complete / in-progress)
-  - Total papers (complete / archived)
+  - Total papers (complete / pruned)
   - Acceptance/rejection rates (brainstorm vs paper compilation)
   - Average submissions per brainstorm
   - Average words per paper
@@ -1613,9 +1593,10 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
   - Selective non-use of brainstorm/database material is allowed when the resulting paper is stronger, rigorous, and aligned with the prompt
 
 ### Running Modes
-- **Part 1, Part 2, and Part 3 remain user-selectable modes**
-- **Only ONE workflow mode may be active at a time** — Aggregator, Compiler, and Autonomous Research are mutually exclusive at runtime (applies identically in both default and generic deployment)
+- **Part 1, Part 2, Part 3, and LeanOJ Proof Solver remain user-selectable modes**
+- **Only ONE workflow mode may be active at a time** — Aggregator, Compiler, Autonomous Research, and LeanOJ Proof Solver are mutually exclusive at runtime (applies identically in both default and generic deployment)
 - **Part 3 internally controls Part 1 and Part 2 components** during autonomous execution
+- **LeanOJ is proof-only and separate from Part 3** — it does not write papers, does not mutate autonomous brainstorm/paper memory, and stores resumable run-local state under the active `leanoj_sessions` data root until explicit clear
 - Starting any mode while another mode is running must be blocked until the active mode is stopped
 - In generic mode, all API routes and WebSocket events are identical — the only difference is provider availability (OpenRouter-only, FastEmbed embeddings, no PDF download)
 
@@ -1710,9 +1691,9 @@ Tier 3 Final Answer display component (separate tab for completed/overall final
 21. **Same model = single author** - Model used in multiple instances counts as ONE author entry, but all API calls tallied
 22. **Paper redundancy is DISABLED during Tier 3** - `_tier3_active` flag prevents redundancy checks from purging papers being used in the final volume
 23. **Brainstorm hard limit is 30 acceptances** - After 30 acceptances, paper writing is forced (no completion review)
-24. **Maximum 1 completed rewrite per paper** - Rewrite counts as "completed" only after first successful body acceptance; prevents infinite loops from failed rewrite attempts
-25. **Partial revision option available** - Allows targeted edits without full body rewrite
-26. **Total rewrite is last resort** - Only for catastrophic issues that can't be fixed with targeted edits
+24. **Critiques append as self-review, never rewrite** - Post-body critique runs 3 total attempts and appends validator-accepted critiques as `AI Self-Review and Limitations`; no partial or total body rewrites are allowed
+25. **Self-review follows proofs/conclusion** - The self-review section is placed after compiler/appended proof material when present, otherwise after conclusion, and later proof appends must stay before it
+26. **Critique declines remain valid** - If no critiques are accepted after the 3 attempts, the workflow proceeds to conclusion without adding a self-review section
 27. **Rejection hard limit is 10 consecutive rejections (with 5+ acceptances)** - Prevents infinite rejection loops
 28. **Retroactive brainstorm corrections during Tier 2 paper compilation** - Submitter sees unified paper+brainstorm workspace; operations validated independently by validator (paper-only context for paper ops, brainstorm-only context for brainstorm ops); each operation must stand alone without requiring the other for correctness
 29. **Max 3 papers per brainstorm** - hard limit, continuation decision skipped after 3rd paper
@@ -1779,4 +1760,5 @@ Out-of-order paper writing: The sequential paper writing order (body → conclus
 - Handles reasoning tokens (`<think>...</think>`), markdown wrappers, control tokens
 - Extracts first complete JSON object when multiple present
 - Handles LaTeX escape sequences comprehensively: fixes invalid `\u{word}` patterns, fixes invalid `\uXXXX` non-hex escapes, **pre-escapes dangerous LaTeX commands BEFORE any json.loads() attempt** using `(?<!\\)` negative lookbehind (prevents `\to` becoming tab+o, `\text` becoming tab+ext, etc., while also preserving already-escaped `\\begin` from being double-corrupted) - dangerous commands include `\to`, `\text`, `\textbf`, `\times`, `\top`, `\tau`, `\theta`, `\triangle`, `\frac`, `\forall`, `\beta`, `\bar`, `\big*`, `\begin`, `\nu`, `\nabla`, `\neq`, `\not*`, `\rho`, `\right*`, `\rightarrow`, `\Rightarrow`, `\upsilon`, `\underline`, `\uparrow`
+- Retry/context hygiene uses `sanitize_model_output_for_retry_context()` before any failed model output is replayed or stored as reusable feedback. It removes known private thought/channel/control tokens while preserving visible malformed JSON and Lean/math syntax such as `<|`; retry-facing parser exceptions must not include raw response excerpts.
 - Agent-level array handling for models that return arrays instead of objects
diff --git a/.cursor/rules/program-directory-and-file-definitions.mdc b/.cursor/rules/program-directory-and-file-definitions.mdc
index ff05a19..773840b 100644
--- a/.cursor/rules/program-directory-and-file-definitions.mdc
+++ b/.cursor/rules/program-directory-and-file-definitions.mdc
@@ -13,6 +13,7 @@ LM Studio and its pre-loaded models can be reached at "http://127.0.0.1:1234" (o
 - The active backend instance may override mutable roots with `MOTO_DATA_ROOT` and `MOTO_LOG_ROOT`
 - Secret persistence may be isolated per instance with `MOTO_SECRET_NAMESPACE`
 - Frontend browser persistence may be isolated on shared origins with `MOTO_FRONTEND_STORAGE_PREFIX` / `VITE_MOTO_STORAGE_PREFIX`
+- Hosted protected request size may be capped with `MOTO_GENERIC_MAX_REQUEST_BYTES` / `GENERIC_MAX_REQUEST_BYTES` (default 16 MiB)
 - Additional local launches may create generated instance folders such as `.moto_instances/{instance_id}/data` and `.moto_instances/{instance_id}/logs`
 
 ## Complete Project Directory Structure and File Descriptions
@@ -28,17 +29,19 @@ project-root/
 │   ├── shared/                          # SHARED RESOURCES
 │   │   ├── __init__.py                  # Package initialization
 │   │   ├── config.py                    # RAGConfig, SystemConfig (instance runtime contract, ports, data/log roots, secret namespace, generic_mode)
-│   │   ├── models.py                    # Pydantic models (includes ModelConfig, BoostConfig, WorkflowTask)
-│   │   ├── lm_studio_client.py          # LM Studio HTTP API client
+│   │   ├── models.py                    # Pydantic models (includes ModelConfig with per-role supercharge_enabled, BoostConfig, WorkflowTask)
+│   │   ├── lm_studio_client.py          # LM Studio HTTP API client + same-base numeric :# instance sharing
 │   │   ├── openrouter_client.py         # OpenRouter HTTP API client (credit exhaustion detection + model/endpoint metadata)
-│   │   ├── api_client_manager.py        # Unified API router (OpenRouter/LM Studio fallback + boost)
-│   │   ├── boost_manager.py             # Singleton boost manager (tracks boost modes: next-count, always-prefer, category)
-│   │   ├── boost_logger.py              # Boost API call logger (persists to boost_api_log.txt)
+│   │   ├── api_client_manager.py        # Unified API router (Supercharge wrapper + OpenRouter/LM Studio fallback + boost)
+│   │   ├── boost_manager.py             # Singleton boost manager (tracks boost modes: next-count, always-prefer, category; aliases the absorbed LeanOJ path-decision tasks to the Final Solver boost category)
+│   │   ├── boost_logger.py              # Boost API call logger (persists redacted/default-safe entries to boost_api_log.txt)
 │   │   ├── workflow_predictor.py        # Predicts next 20 API calls (mode-specific algorithms)
+│   │   ├── workflow_start_guard.py       # Process-wide async guard for atomic mutually-exclusive workflow starts
 │   │   ├── free_model_manager.py        # Free model rotation/cooldown singleton (looping + auto-selector backup)
+│   │   ├── model_error_utils.py         # Shared helpers for non-retryable provider/config failures that should pause workflows
 │   │   ├── rag_lock.py                  # Global RAG operation lock (prevents Aggregator/Compiler collision)
 │   │   ├── token_tracker.py             # Cumulative input/output token tracker singleton with per-model breakdown and research timer
-│   │   ├── wolfram_alpha_client.py      # Wolfram Alpha API client
+│   │   ├── wolfram_alpha_client.py      # Wolfram Alpha API client (logs redacted metadata, not raw query/result text)
 │   │   ├── utils.py                     # Common utilities
 │   │   ├── json_parser.py               # JSON parsing with sanitization for LLM quirks
 │   │   ├── critique_memory.py           # Paper critique persistence (saves up to 10 validator critiques per paper)
@@ -47,13 +50,15 @@ project-root/
 │   │   ├── build_info.py                # Build identity resolver (loads version/build_commit/update_channel/api_contract_version from moto-update-manifest.json + env overrides)
 │   │   ├── path_safety.py               # Safe path resolution helpers (realpath/normpath containment checks)
 │   │   ├── fastembed_provider.py         # FastEmbed embedding wrapper (generic mode only, lazy-imported; ~30 lines)
-│   │   ├── lean4_client.py              # Lean 4 proof checker client (subprocess + optional LSP persistent mode; gated on `lean4_enabled` / `lean4_lsp_enabled`)
+│   │   ├── lean4_client.py              # Lean 4 proof checker client (subprocess + optional LSP persistent mode; gated on `lean4_enabled` / `lean4_lsp_enabled`; offloads temp/workspace filesystem operations from the FastAPI event loop)
+│   │   ├── lean_proof_integrity.py       # Shared post-Lean integrity gate (rejects fake axiom/constant/opaque devices and validates theorem-statement alignment)
+│   │   ├── brainstorm_proof_gate.py      # Shared Lean 4 gate for optional brainstorm proof candidates before normal validation
 │   │   └── smt_client.py                # Z3/SMT launcher-managed subprocess wrapper (gated on `smt_enabled`; never authoritative on its own)
 │   ├── aggregator/                      # AGGREGATOR 
 │   │   ├── __init__.py
 │   │   ├── core/
 │   │   │   ├── __init__.py
-│   │   │   ├── rag_manager.py           # 4-stage RAG pipeline orchestrator
+│   │   │   ├── rag_manager.py           # 4-stage RAG pipeline orchestrator (ChromaDB calls and heavy retrieval scoring are offloaded/snapshot-based to keep GUI/API routes responsive)
 │   │   │   ├── coordinator.py           # Manages 1-10 submitters + 1 validator (default 3, configurable per-submitter)
 │   │   │   ├── queue_manager.py         # Submission queue. Monitors queue size to trigger submitter pause when ≥10 submissions.
 │   │   │   └── context_allocator.py     # Direct injection vs RAG routing (tries direct first, offloads to RAG only when doesn't fit). Includes allocate_cleanup_review_context() which NEVER skips due to size - uses RAG when database too large.
@@ -115,7 +120,8 @@ project-root/
 │   │   │   ├── __init__.py              # Package initialization
 │   │   │   ├── autonomous_coordinator.py # Orchestrates the Tier 1 → Tier 2 → Tier 3 autonomous workflow (invokes proof verification checkpoint after brainstorm/paper completion when `lean4_enabled`)
 │   │   │   ├── autonomous_rag_manager.py # Autonomous-specific RAG wrapper
-│   │   │   ├── proof_verification_stage.py # Orchestrates proof identification → Lean 4 attempts (5-try loop) → novelty check → proof storage; optional SMT early-exit + Mathlib lemma search; per-source reservation lock
+│   │   │   ├── proof_verification_stage.py # Orchestrates proof identification → Lean 4 attempts (5-try loop) → shared integrity gate → novelty check → proof storage; optional SMT early-exit + Mathlib lemma search; per-source reservation lock
+│   │   │   ├── proof_registration.py     # Shared registration helper for verified Lean proofs from autonomous, compiler, aggregator, and LeanOJ flows
 │   │   │   └── proof_dependency_extractor.py # Parses verified Lean 4 code to extract `ProofDependency` records (imports, Mathlib lemmas, MOTO-origin refs)
 │   │   ├── agents/
 │   │   │   ├── __init__.py              # Package initialization
@@ -145,7 +151,7 @@ project-root/
 │   │   │   ├── paper_title_prompts.py   # Paper title selection prompts
 │   │   │   ├── paper_redundancy_prompts.py # Paper redundancy review prompts
 │   │   │   ├── paper_continuation_prompts.py # Brainstorm multi-paper continuation decision prompts
-│   │   │   ├── proof_prompts.py         # Proof identification/formalization/novelty prompts + failure-hint direct injection helper
+│   │   │   ├── proof_prompts.py         # Proof identification/formalization/statement-alignment/novelty prompts + failure-hint direct injection helper
 │   │   │   └── final_answer_prompts.py  # TIER 3 - Final answer assessment/selection/volume prompts
 │   │   └── memory/
 │   │       ├── __init__.py              # Package initialization
@@ -160,24 +166,34 @@ project-root/
 │   │       ├── final_answer_memory.py   # TIER 3 - Final answer state & volume management
 │   │       └── session_manager.py       # Prompt-based session folder organization
 │   │
+│   ├── leanoj/                          # LEANOJ PROOF SOLVER (proof-only top-level mode; no paper writing)
+│   │   ├── __init__.py
+│   │   ├── prompts.py                   # LeanOJ topic/batched-topic/brainstorm/prune/path/subproof/final-solver JSON prompts; brainstorm validation assigns final-context roles; prune review conservatively asks whether outdated/redundant memory should be removed or updated; final solver edits single-route durable master proofs and reviews Lean-accepted final code before stop
+│   │   └── core/
+│   │       ├── __init__.py
+│   │       ├── leanoj_context.py         # LeanOJ full artifact persistence, direct-first allocation, final-context routing (verified helpers + active plans direct; refuted constructions separated as compact warnings), session-scoped RAG indexing/retrieval, final-cycle packets, and clear/resume cleanup
+│   │       └── leanoj_coordinator.py     # Parallel topic + brainstorm submitters, batch validators, resumable persistence, partial proof capture, context-role classification, single-route durable master_proof.lean editing, watchdog, final Lean verification, and semantic final-solver review
+│   │
 │   ├── scripts/                         # Temporary utility scripts
 │   │   └── cache_openrouter_models.py   # (Auto-deleted after use) Caches OpenRouter models with mapping display_name -> api_id
 │   │
 │   ├── api/
 │   │   ├── __init__.py
-│   │   ├── main.py                      # FastAPI app entry point (lifespan reads generic_mode from env, fail-closes hosted startup when proxy auth env is missing, skips LM Studio test in generic mode)
-│   │   ├── middleware.py                # CORS, error handling, proxy auth validation (X-Moto-* headers in generic mode)
-│   │   ├── proxy_auth.py                # Shared generic-mode proxy auth helpers (allowlist + HMAC signature validation for REST/WebSocket)
+│   │   ├── main.py                      # FastAPI app entry point (lifespan reads generic_mode, fail-closes hosted auth env, ensures desktop API token, skips LM Studio test in generic mode)
+│   │   ├── middleware.py                # CORS, error handling, desktop token/origin checks, proxy auth validation, hosted body-size cap + actual-body hash check
+│   │   ├── proxy_auth.py                # Shared generic-mode proxy auth helpers (allowlist + HMAC over method/path/query/verified body hash for REST/WebSocket)
 │   │   └── routes/
 │   │       ├── __init__.py
 │   │       ├── aggregator.py            # Aggregator API endpoints (includes /events)
 │   │       ├── compiler.py              # Compiler API endpoints
 │   │       ├── autonomous.py            # Autonomous Research API endpoints
+│   │       ├── leanoj.py                # LeanOJ Proof Solver API endpoints (`/api/leanoj/*`: start/resume, stop, status, master-proof draft/edit summaries, proofs/library, skip-brainstorm, force-brainstorm, clear)
 │   │       ├── boost.py                 # Boost API endpoints (enable/disable/toggle/status + OpenRouter provider endpoint metadata)
 │   │       ├── workflow.py              # Workflow API endpoints (predictions/history)
-│   │       ├── download.py              # PDF generation endpoint via Playwright (POST /api/download/pdf); returns 501 in generic mode
-│   │       ├── openrouter.py            # OpenRouter API endpoints (global key, models, providers + endpoint metadata, LM Studio availability, **GET /api/model-cache** for model ID caching, **POST /api/openrouter/reset-exhaustion** to reset credit exhaustion mid-session)
-│   │       ├── websocket.py             # WebSocket for real-time updates (proxy auth validation in generic mode before accept)
+│   │       ├── update.py                # Update/check endpoints for launcher/updater state
+│   │       ├── download.py              # PDF generation endpoint via Playwright (desktop only; sanitize/block external requests; returns 501 in generic mode)
+│   │       ├── openrouter.py            # OpenRouter API endpoints (global key, models/providers via header/body keys only, LM Studio availability, model cache, reset exhaustion)
+│   │       ├── websocket.py             # WebSocket for real-time updates (generic proxy auth or desktop one-time tickets before accept)
 │   │       ├── features.py              # GET /api/features — shared build identity plus stable capability flags (`generic_mode`, `lm_studio_enabled`, `pdf_download_available`)
 │   │       ├── proofs.py                # Proof database + Lean 4/SMT runtime + manual proof-check + certificate export + dependency graph routes; listing proofs (`GET /`, `/novel`, `/known`, `/library*`) and certificate/lean downloads (`/{id}/certificate`, `/{id}/certificate.lean`) are always available regardless of `lean4_enabled`; dependency/graph routes and `/check` are gated on `lean4_enabled`; `/status` uses short timeouts so it never blocks the UI
 │   │       └── health.py                # GET /api/health — readiness/liveness probe with instance/build metadata
@@ -205,7 +221,10 @@ project-root/
 │   │   │   ├── paper_{paper_id}_abstract.txt              # Abstract only
 │   │   │   ├── paper_{paper_id}_source_brainstorm.txt     # Cached brainstorm database
 │   │   │   ├── paper_{paper_id}_last_10_rejections.txt    # Compiler rejections for this paper
-│   │   │   └── archive/                                   # Archived (redundant) papers
+│   │   │   ├── pruned/                                    # Pruned papers preserved for user download, excluded from model context
+│   │   │   │   ├── pruned_paper_{paper_id}.txt            # Pruned full paper with top-of-file PRUNED PAPER banner
+│   │   │   │   └── pruned_paper_{paper_id}_metadata.json  # Pruned metadata/reason
+│   │   │   └── archive/                                   # Legacy archived (redundant) papers, treated as pruned history
 │   │   │       └── paper_{paper_id}.txt
 │   │   ├── auto_final_answer/           # Autonomous Research - Tier 3 (LEGACY - replaced by auto_sessions)
 │   │   │   ├── final_answer_state.json                    # Tier 3 state (crash recovery)
@@ -217,13 +236,15 @@ project-root/
 │   │   ├── auto_sessions/               # Autonomous Research - Session-based folder organization
 │   │   │   └── {sanitized_prompt}_{timestamp}/            # Per-session folder
 │   │   │       ├── brainstorms/                           # Tier 1 brainstorm databases
-│   │   │       ├── papers/                                # Tier 2 completed papers
+│   │   │       ├── papers/                                # Tier 2 completed papers, plus a pruned/ subfolder of preserved papers that are excluded from model context
 │   │   │       ├── final_answer/                          # Tier 3 final answer data
 │   │   │       ├── proofs/                                # Lean 4 verified-proof records (proofs_index.json, proof_<id>.json, proof_<id>_lean.lean)
 │   │   │       ├── session_metadata.json                  # Session info (prompt, created_at, status)
 │   │   │       ├── session_stats.json                     # Session statistics
 │   │   │       └── workflow_state.json                    # Workflow state for crash recovery
 │   │   ├── proofs/                      # Legacy (non-session) Lean 4 proof storage (mirrors per-session proofs/ layout)
+│   │   ├── leanoj_sessions/             # LeanOJ run state (state.json, master_proof.lean, master_proof_edits.jsonl, master_proof_snapshots.jsonl, phase counters, subproofs, attempts, verified final Lean code; a stopped or crashed run resumes from this state unless cleared)
+│   │   ├── leanoj_artifacts/            # LeanOJ full-memory artifact logs (accepted ideas with context_role metadata, recursive topics, verified/partial/failed subproofs, final attempts, final-cycle packets) used for direct-first RAG allocation
 │   │   ├── auto_research_metadata.json  # Autonomous Research metadata (LEGACY - now in session folders)
 │   │   ├── auto_research_stats.json     # Autonomous Research statistics (LEGACY - now in session folders)
 │   │   ├── auto_workflow_state.json     # Autonomous Research workflow state (LEGACY - now in session folders)
@@ -247,7 +268,7 @@ project-root/
 │   │   │   │   ├── CompilerLogs.jsx         # Metrics: construction vs rigor, miniscule edits
 │   │   │   │   └── LivePaper.jsx            # Real-time paper viewing, save draft, word count
 │   │   │   │
-│   │   │   └── autonomous/              # AUTONOMOUS RESEARCH
+│   │   │   ├── autonomous/              # AUTONOMOUS RESEARCH
 │   │   │       ├── AutonomousResearchInterface.jsx  # Main control: research prompt, start/stop, current tier
 │   │   │       ├── AutonomousResearch.css     # Autonomous research styles
 │   │   │       ├── BrainstormList.jsx       # List all brainstorm topics with status
@@ -271,6 +292,17 @@ project-root/
 │   │   │       ├── Stage2PaperHistory.jsx   # Tier 2 paper history list (grouped per research run; sub-tab inside CompletedWorksLibrary)
 │   │   │       └── Stage2PaperHistory.css   # Tier 2 paper history styles
 │   │   │
+│   │   │   └── leanoj/                  # LEANOJ PROOF SOLVER UI
+│   │   │       ├── LeanOJInterface.jsx  # Prompt/template input, start/resume, stop, skip/force brainstorm, clear progress, live status, verified Lean output
+│   │   │       ├── LeanOJSettings.jsx   # LeanOJ-specific model profiles/settings; grouped UI controls map to underlying role keys (Submitter 1 also sets topic_generator, Validator sets both validators, Brainstorm Proof Solver sets subproof identifier+solver, Final Proof Solver also owns path/final-readiness decisions)
+│   │   │       ├── LeanOJBrainstorms.jsx # LeanOJ accepted ideas/recursive brainstorm memory viewer
+│   │   │       ├── LeanOJLogs.jsx       # LeanOJ topics, subproofs, failed feedback, event stream
+│   │   │       ├── LeanOJMasterProof.jsx # Master proof draft tab (on-demand draft, metadata, edit history, download)
+│   │   │       ├── LeanOJMasterProof.css # Master proof draft tab styles
+│   │   │       ├── LeanOJMathematicalProofs.jsx # Current-run verified LeanOJ proof/subproof viewer
+│   │   │       ├── LeanOJProofLibrary.jsx # Cross-session completed LeanOJ proof-work library
+│   │   │       └── index.js             # LeanOJ component exports
+│   │   │
 │   │   ├── StartupProviderSetupModal.jsx # Post-disclaimer startup chooser for OpenRouter vs LM Studio setup (OpenRouter-only in generic mode)
 │   │   ├── OpenRouterApiKeyModal.jsx    # Modal for global OpenRouter API key configuration with mode-aware persistence messaging
 │   │   ├── PaperCritiqueModal.jsx       # Modal for displaying validator paper critiques (ratings, feedback, history)
@@ -285,11 +317,12 @@ project-root/
 │   │   ├── TextFileUploader.css         # File uploader styles
 │   │   ├── OpenRouterPrivacyWarningModal.jsx # Privacy policy error modal (OpenRouter data sharing, capability-aware alternatives)
 │   │   ├── HelpTooltip.jsx              # Shared portal-based help tooltip component (used across settings/interfaces)
+│   │   ├── ProofStrengthBadge.jsx       # Shared PS badge/tooltip for highlighted proof-strength models and primary proof-creation roles
 │   │   ├── settings-common.css          # Shared settings panel styles
 │   │   ├── critique-modal.css           # Paper critique modal styles
 │   │   │
 │   │   ├── services/
-│   │   │   ├── api.js                   # Backend API calls (includes openRouterAPI, `/api/features` capability bootstrap helper, proof routes under `/api/proofs/*`, and cross-session proof library routes `getProofLibrary` / `getLibraryProof` under `/api/proofs/library`)
+│   │   │   ├── api.js                   # Backend API calls (includes openRouterAPI, `/api/features`, proof routes, LeanOJ API, and cross-session proof library helpers)
 │   │   │   └── websocket.js             # WebSocket connection 
 │   │   │
 │   │   ├── hooks/
@@ -300,11 +333,12 @@ project-root/
 │   │   │   ├── modelCache.js            # Frontend model cache utilities (display_name → api_id lookup)
 │   │   │   ├── openRouterSelection.js   # Shared OpenRouter selector auto-fill helpers (context/output from model + host metadata)
 │   │   │   ├── autonomousProfiles.js    # Shared autonomous recommended-profile definitions and persistence helpers
+│   │   │   ├── leanojProfiles.js        # LeanOJ-specific recommended/user profile definitions, persistence helpers, and request builder (topic generation uses all submitters; legacy topic_generator/selector is sourced from Brainstorm Submitter 1; legacy path_decider request field is derived from Final Proof Solver)
 │   │   │   ├── runtimeConfig.js         # Frontend runtime helpers (instance storage prefix, active data-root display, instance ID)
 │   │   │   ├── researchRunHistory.js    # Groups Tier 2 papers + final answers into per-run history entries for Stage2PaperHistory/FinalAnswerLibrary
 │   │   │   └── disclaimerHelper.js      # Frontend-only disclaimer injection for brainstorm/paper views
 │   │   │
-│   │   ├── App.jsx                      # Main app shell with top-level mode switch, `/api/features` capability bootstrap, and capability propagation into settings/interfaces/modals
+│   │   ├── App.jsx                      # Main app shell with top-level mode switch, `/api/features` capability bootstrap, capability propagation, and developer-mode raw-settings shortcut
 │   │   ├── index.css                    # Styles
 │   │   └── index.jsx                    # React entry point
 │   │
@@ -321,7 +355,7 @@ project-root/
 ├── moto-update-manifest.json            # Build 0 updater/build identity manifest committed on main
 ├── SECURITY.md                          # Security policy and private vulnerability reporting
 ├── Click To Launch MOTO.bat             # The authoritative Windows launcher entrypoint (thin wrapper that delegates to moto_launcher.py)
-├── Launch MOTO.sh                       # Linux/Ubuntu launcher entrypoint (thin bash wrapper that delegates to moto_launcher.py)
+├── linux-ubuntu-launcher.sh             # Linux/Ubuntu launcher entrypoint (thin bash wrapper that delegates to moto_launcher.py)
 ├── moto_launcher.py                     # Internal Python launcher orchestration (update check, runtime resolution, dependency install, service startup)
 ├── moto_updater.py                      # Build 1 updater helper (manifest fetch, install classification, ZIP/git apply flow, launcher state tracking)
 └── .moto_launcher_state.json            # Gitignored local launcher state (tracks active service-window PIDs and runtime roots to block unsafe update-apply)
@@ -331,7 +365,7 @@ project-root/
 ### Launcher and Updater
 
 - `Click To Launch MOTO.bat`: The only Windows consumer entrypoint. It stays thin and always delegates to the Python launcher.
-- `Launch MOTO.sh`: The Linux/Ubuntu consumer entrypoint. Same thin-wrapper contract as the `.bat`; delegates to `moto_launcher.py`.
+- `linux-ubuntu-launcher.sh`: The Linux/Ubuntu consumer entrypoint. Same thin-wrapper contract as the `.bat`; delegates to `moto_launcher.py`.
 - `moto_launcher.py`: Orchestrates the launcher flow in order: update check, runtime resolution, dependency install, LM Studio detection, detached backend/frontend startup, and browser launch.
 - `moto_updater.py`: Owns Build 1 updater behavior, including GitHub `main` manifest fetch, install-state classification, clean-git fast-forward apply, ZIP overlay apply, rollback-aware relaunch, and launcher-managed instance safety checks.
 - `.moto_launcher_state.json`: Local-only state written by the launcher so future launches can detect still-open backend/frontend windows from the same install and skip update-apply until those windows are closed.
@@ -345,19 +379,21 @@ project-root/
 ### Shared Resources
 
 - `config.py`: RAGConfig, SystemConfig (context windows, chunk sizes, max output tokens, `generic_mode` flag)
-- `models.py`: Pydantic models (ModelConfig, BoostConfig, WorkflowTask, ModelUsageTracker, FinalAnswerState)
-- `lm_studio_client.py`: LM Studio HTTP client (completions, embeddings, model listing); unused in generic mode
+- `models.py`: Pydantic models (ModelConfig with per-role `supercharge_enabled`, BoostConfig, WorkflowTask, ModelUsageTracker, FinalAnswerState)
+- `lm_studio_client.py`: LM Studio HTTP client (completions, embeddings, model listing, same-base numeric `:#` instance sharing for independent calls); unused in generic mode
 - `openrouter_client.py`: OpenRouter HTTP client (credit exhaustion detection, fallback, model/provider endpoint metadata)
-- `api_client_manager.py`: Unified API router (OpenRouter/LM Studio fallback + boost + model tracking); generic mode early-returns FastEmbed for embeddings
-- `boost_manager.py`: Singleton boost manager (three modes: Boost Next X Calls, Always Prefer Boost, Category Boost; broadcasts events)
+- `api_client_manager.py`: Unified API router (optional per-role Supercharge wrapper, OpenRouter/LM Studio fallback, boost, and model tracking); generic mode early-returns FastEmbed for embeddings
+- `boost_manager.py`: Singleton boost manager (next-count, always-prefer, category, and per-task boost routing; broadcasts events)
 - `boost_logger.py`: Boost API call logger (persists boost-routed calls for the combined API log view)
 - `workflow_predictor.py`: Predicts next 20 API calls for internal boost routing (not displayed in UI)
 - `free_model_manager.py`: Free model rotation/cooldown singleton (looping, auto-selector `openrouter/free`, account exhaustion detection)
-- `wolfram_alpha_client.py`: Wolfram Alpha API client. Exposed to the HighContextSubmitter.submit_construction loop as the `wolfram_alpha_query` tool (up to 20 calls per construction submission).
+- `model_error_utils.py`: Shared non-retryable provider/config error detection; callers must pause/resume rather than convert those errors into proof or validation failures.
+- `brainstorm_proof_gate.py`: Shared Lean 4 gate for optional proof-candidate brainstorm submissions before normal brainstorm validation.
+- `wolfram_alpha_client.py`: Wolfram Alpha API client. Exposed to the HighContextSubmitter.submit_construction loop as the `wolfram_alpha_query` tool (up to 20 calls per construction submission); logs/broadcasts must redact raw query/result text.
 - `rag_lock.py`: Global RAG operation lock (prevents collision, retry logic for reads); embedding lock skip in generic mode (FastEmbed is in-process/thread-safe)
 - `token_tracker.py`: Cumulative input/output token tracker singleton with per-model breakdown and research timer. Reset on session start, timer start/stop tied to coordinator lifecycle. Stats broadcast via `token_usage_updated` WebSocket event after each successful LLM call.
 - `utils.py`: Token counting, text compression, file I/O
-- `json_parser.py`: JSON parsing with sanitization for LLM responses; sanitizes reasoning tokens, markdown blocks, control tokens, LaTeX escapes, control characters; **rejects truncated JSON** (raises ValueError with diagnostics) to prevent corrupted content from passing validation
+- `json_parser.py`: JSON parsing with sanitization for LLM responses; sanitizes reasoning tokens, markdown blocks, control tokens, LaTeX escapes, control characters; **rejects truncated JSON** (raises ValueError with diagnostics) to prevent corrupted content from passing validation; also provides `sanitize_model_output_for_retry_context()` so retries/memory/RAG can preserve visible failed-output excerpts without replaying known private thought/channel/control tokens or corrupting visible Lean/math syntax such as `<|`; retry-facing parser exceptions must not include raw response excerpts
 - `critique_memory.py`: Paper critique persistence (ratings, feedback, history, session-aware)
 - `critique_prompts.py`: Default critique prompt and builder function
 - `secret_store.py`: Secure API key persistence via OS keyring; bypassed in generic mode (keys are env-injected/in-memory only)
@@ -381,7 +417,8 @@ project-root/
 
 - `autonomous_coordinator.py`: Three-tier workflow orchestrator (Tier 1→2→3, triggers, crash recovery, invokes `ProofVerificationStage` after brainstorm/paper completion when `lean4_enabled`)
 - `autonomous_rag_manager.py`: Autonomous RAG wrapper
-- `proof_verification_stage.py`: Proof pipeline orchestrator — candidate identification → per-candidate Phase A (Mathlib lemma search → optional SMT early-exit → Lean 4 formalization attempts, 5 retries per candidate) runs concurrently across all identified candidates bounded by `proof_max_parallel_candidates` (default 6) → Phase B (novelty check → `add_proof` → `ProofDependency` extraction → brainstorm/paper `append_proofs_section`) remains strictly serialized in Phase-A completion order. Per-source reservation lock prevents duplicate concurrent checks for the same `{source_type}:{source_id}`; `FreeModelExhaustedError` (or any Phase-A exception) cancels sibling tasks before the coordinator's recovery path runs.
+- `proof_verification_stage.py`: Proof pipeline orchestrator — prompt-relevant candidate identification → per-candidate Phase A (Mathlib lemma search → optional SMT early-exit → Lean 4 formalization attempts, 5 retries per candidate) runs concurrently across all identified candidates bounded by `proof_max_parallel_candidates` (default 6) → Phase B (novelty check → `add_proof` → `ProofDependency` extraction → brainstorm/paper `append_proofs_section`) remains strictly serialized in Phase-A completion order. Per-source reservation lock prevents duplicate concurrent checks for the same `{source_type}:{source_id}`; `FreeModelExhaustedError` (or any Phase-A exception) cancels sibling tasks before the coordinator's recovery path runs.
+- `proof_registration.py`: Shared verified-proof registration helper used by autonomous, compiler, aggregator, and LeanOJ proof flows.
 - `proof_dependency_extractor.py`: Parses verified Lean 4 code into `ProofDependency` records (imports, Mathlib lemmas, MOTO-origin proof ancestry).
 - Agents: `topic_selector.py`, `topic_validator.py`, `completion_reviewer.py`, `reference_selector.py`, `paper_title_selector.py`, `proof_identification_agent.py`, `proof_formalization_agent.py`, `lemma_search_agent.py`
 - Tier 3 Agents: `certainty_assessor.py`, `answer_format_selector.py`, `volume_organizer.py`
@@ -389,18 +426,26 @@ project-root/
 - Prompts: `topic_prompts.py`, `topic_exploration_prompts.py`, `completion_prompts.py`, `paper_reference_prompts.py`, `paper_title_exploration_prompts.py`, `paper_title_prompts.py`, `paper_redundancy_prompts.py`, `paper_continuation_prompts.py`, `proof_prompts.py`, `final_answer_prompts.py`
 - Memory: `brainstorm_memory.py`, `paper_library.py`, `research_metadata.py` (also stores the proof runtime config snapshot), `session_manager.py`, `autonomous_rejection_logs.py`, `topic_exploration_memory.py` (in-memory candidate DB), `paper_model_tracker.py` (per-paper model usage tracking and author attribution), `autonomous_api_logger.py` (API call logging singleton), `proof_database.py` (session-aware Lean 4 proof storage + novelty index + reverse Mathlib index + cross-session library access), `final_answer_memory.py` (model tracking, archival)
 
+### LeanOJ Components
+
+- `leanoj_coordinator.py`: Runs the proof-only LeanOJ state machine. It uses parallel submitters plus batch validators for broad initial foundation topics and brainstorms; classifies accepted brainstorm context as `active_plan`, `verified_hint`, `refuted_construction`, or `scratch`; keeps ordinary partial `sorry` scaffolds and failed final attempts out of master-proof seeding unless explicitly elevated; persists accepted-idea `context_role` and chronological occurrence metadata; stores full proof memory independently from trimmed UI/status lists; rejects fake proof devices; persists final-cycle failure packets; emits LeanOJ progress events; routes prompt memory through allocated context blocks; passes the most recent 5 final attempts as compact final-solver execution feedback; and requires Final Proof Solver semantic review before a Lean-passing final proof stops as verified.
+- `leanoj_context.py`: Owns LeanOJ artifact JSONL persistence under the active data root, direct-first allocation, final-solver context routing (verified subproofs + `active_plan` notes direct, refuted constructions only as compact warnings, ordinary partial scaffolds excluded from final direct proof context), source-name generation, RAG indexing, session-scoped retrieval with `include_source_prefixes`, direct-source exclusion, resume reload support, and Clear Progress cleanup for LeanOJ RAG sources.
+- `prompts.py`: LeanOJ prompt builders for topic, brainstorm, prune review, path, subproof, final-solver editing, and final semantic review roles. These consume prepared context blocks (`direct_proof_context`, `rag_evidence_context`, `refuted_construction_warnings`, `capped_rejection_feedback`, `current_final_cycle_packet`) instead of owning persistence or truncation policy; prune prompts must conservatively ask whether any outdated/redundant memory should be removed or updated without forcing deletion; final-solver prompts must keep `master_proof.lean` to the current chosen proof route, include only compact recent-attempt execution feedback, and avoid accumulating explored/refuted routes.
+
 ### API Routes
 
 - `compiler.py`: Compiler control (start/stop/status), paper/outline access, critique management
 - `autonomous.py`: Autonomous research control (start/stop/clear/status), brainstorm/paper access, Tier 3 endpoints
 - `proofs.py`: Proof database listing (`GET /`, `/novel`, `/known`) and `/status` runtime readiness — always available, never gated. `/{id}/certificate` and `/{id}/certificate.lean` — always available (data is stored on disk; Lean version info populated only when Lean is enabled). `/status` uses `asyncio.wait_for` timeouts (5s Lean, 3s Z3) so the endpoint never hangs. `POST /settings` runtime flag updates. `POST /check` manual proof check, `/{id}/dependencies`, `/graph`, `/mathlib/{lemma}/dependents` graph/lineage queries — gated on `lean4_enabled`. `GET /library` + `GET /library/{session_id}/{proof_id}` cross-session proof library endpoints — always available.
+- `leanoj.py`: LeanOJ proof-solver routes for start/resume, stop, status, clear, skip-brainstorm, force-brainstorm, current proof listing/library, plus read-only `GET /api/leanoj/master-proof` and `/api/leanoj/master-proof/edits` for the durable master proof draft and compact edit-history summaries.
 
 ### Frontend Components
 
-- `App.jsx`: Top-level GUI shell. Default mode is `Autonomous ASI S.T.E.M.` for Part 3 screens; `Advanced Manual ASI S.T.E.M.` contains the manual Part 1 Aggregator + Part 2 Compiler workspace. Shared utility controls (Boost, OpenRouter, WorkflowPanel) remain global, and Build 3C bootstraps `/api/features` here so hosted mode can hide LM Studio-only UI and copy. **Tab persistence**: `autonomousActiveTab` → `localStorage['autonomousActiveTab']`; `completedWorksSubTab` → `localStorage['completedWorksSubTab']`; `manualActiveTab` → `localStorage['manualActiveTab']`. **Autonomous tab groups**: main tabs (interface, brainstorms, papers, proofs, optional final-answer) + settings group (Your Completed Works Library, API Call Logs, Settings). The "Your Completed Works Library" tab hosts three sub-tabs rendered inside its content area: Stage 2 Papers History, Stage 3 Final Answers History, and Proof Library.
+- `App.jsx`: Top-level GUI shell. Default mode is `Autonomous ASI S.T.E.M.` for Part 3 screens; `Advanced Manual ASI S.T.E.M.` contains the manual Part 1 Aggregator + Part 2 Compiler workspace; `LeanOJ Proof Solver` is a developer-mode-only proof mode. Shared utility controls (Boost, OpenRouter, WorkflowPanel) remain global, and Build 3C bootstraps `/api/features` here so hosted mode can hide LM Studio-only UI and copy. Shift + Z + X toggles persisted developer-mode settings, LeanOJ mode, raw JSON editors, and Supercharge controls. Supercharge request payloads must be forced off unless developer mode is active. **Tab persistence**: `autonomousActiveTab` → `localStorage['autonomousActiveTab']`; `completedWorksSubTab` → `localStorage['completedWorksSubTab']`; `manualActiveTab` → `localStorage['manualActiveTab']`; `leanojActiveTab` → `localStorage['leanojActiveTab']`. **Autonomous tab groups**: main tabs (interface, brainstorms, papers, proofs, optional final-answer) + settings group (Your Completed Works Library, API Call Logs, Settings). The "Your Completed Works Library" tab hosts three sub-tabs rendered inside its content area: Stage 2 Papers History, Stage 3 Final Answers History, and Proof Library.
 - **Aggregator**: `AggregatorInterface.jsx`, `AggregatorSettings.jsx`, `AggregatorLogs.jsx`, `LiveResults.jsx`
 - **Compiler**: `CompilerInterface.jsx`, `CompilerSettings.jsx`, `CompilerLogs.jsx`, `LivePaper.jsx`
 - **Autonomous**: `AutonomousResearchInterface.jsx`, `BrainstormList.jsx`, `PaperLibrary.jsx`, `AutonomousResearchSettings.jsx`, `AutonomousResearchLogs.jsx`, `LivePaperProgress.jsx`, `LiveTier3Progress.jsx`, `FinalAnswerView.jsx`, `FinalAnswerLibrary.jsx` (Stage 3 history sub-tab), `ArchiveViewerModal.jsx`, `MathematicalProofs.jsx` (live-session proof tab), `ProofGraph.jsx` (dependency graph), `ProofNotificationStack.jsx` (novel-proof popups), `ProofLibrary.jsx` (cross-session proof library sub-tab), `Stage2PaperHistory.jsx` (Stage 2 history sub-tab)
+- **LeanOJ**: `LeanOJInterface.jsx`, `LeanOJBrainstorms.jsx`, `LeanOJLogs.jsx`, `LeanOJMasterProof.jsx`, `LeanOJMathematicalProofs.jsx`, `LeanOJProofLibrary.jsx`, `LeanOJSettings.jsx`
 - **Shared**: `StartupProviderSetupModal.jsx`, `OpenRouterApiKeyModal.jsx`, `PaperCritiqueModal.jsx`, `CritiqueNotificationStack.jsx`, `CreditExhaustionNotificationStack.jsx`, `HungConnectionNotificationStack.jsx`, `BoostControlModal.jsx`, `WorkflowPanel.jsx`, `TextFileUploader.jsx`, `OpenRouterPrivacyWarningModal.jsx`, `LatexRenderer.jsx` (dual view, KaTeX, theorem parsing), `LatexRenderer.css`
 - **Hooks**: `useProofCheckRuntime.js` (reads `/api/proofs/status` + runtime config so UI can enable/disable manual proof-check controls)
 - **Utils**: `downloadHelpers.js` (PDF/raw download), `modelCache.js` (display_name → api_id lookup), `openRouterSelection.js` (shared OpenRouter selector auto-fill helpers using model context and provider endpoint caps), `autonomousProfiles.js` (shared recommended-profile definitions + persistence helpers; when editing a preset, anchor to the exact profile block and exact nested role such as `validator` or `highContext`, never to a shared literal alone, then verify the diff only touched that intended profile/role), `disclaimerHelper.js` (frontend-only disclaimer injection), `api.js`, `websocket.js`
diff --git a/.cursor/rules/rag-design-for-overall-program.mdc b/.cursor/rules/rag-design-for-overall-program.mdc
index 6057269..6b79c5a 100644
--- a/.cursor/rules/rag-design-for-overall-program.mdc
+++ b/.cursor/rules/rag-design-for-overall-program.mdc
@@ -9,11 +9,31 @@ The RAG system in this program is very advanced, be certain that any changes you
 
 DIRECT INJECTION FIRST, RAG SECOND IF DIRECT INJECTION DOESN'T FIT.
 
+Some inputs are **mandatory direct-inject** and must never be RAG'd, summarized, compressed, truncated, excerpted, or replaced by partial views. If mandatory direct-inject context does not fit the configured model context, halt with an explicit context-overflow error and tell the user which mandatory context overflowed.
+
 If an item is direct injected, its RAG counterpart must NOT also be included.
 
-**RAG Offload Priority — Submitter:** Shared Training DB → Local Submitter DB → Rejection Log → User Upload Files
+### Paper-Writing RAG Modes
+
+These priorities apply to the Aggregator/Compiler/Autonomous paper-writing workflows. They do **not** describe LeanOJ proof-only memory ordering.
+
+**RAG Offload Priority — Paper-Writing Submitter:** Shared Training DB → Local Submitter DB → Rejection Log → User Upload Files
+
+**RAG Offload Priority — Paper-Writing Validator:** Shared Training DB → User Upload Files (submission under review is always direct injected)
+
+### LeanOJ Proof-Only RAG Mode
+
+These priorities apply only to the LeanOJ proof solver. LeanOJ stores proof artifacts under session-scoped sources such as `leanoj_{session_id}_accepted_ideas` and retrieves with `include_source_prefixes=[f"leanoj_{session_id}_"]`. Do not apply these orders to paper-writing prompts.
+
+**RAG Offload Priority — LeanOJ Final Solver:** Verified Subproofs → Partial Proof Scaffolds → Accepted Proof Memory Notes. Final-solver proof memory must not include recursive topics, historical final-cycle packets, failed-attempt counts, or phase-transition/path vocabulary. It is an edit-only mode. The prompt may separately include the most recent 5 final attempts as compact execution feedback for edit selection only; this is not proof evidence and must not seed `master_proof.lean`.
 
-**RAG Offload Priority — Validator:** Shared Training DB → User Upload Files (submission under review is always direct injected)
+**RAG Offload Priority — LeanOJ Proofstorm/Subproof Solver:** Current Final-Cycle Failure Packet (always direct if active) → Verified Subproofs → Relevant Partial Proof Scaffolds → Accepted Brainstorm Ideas → Historical Failed Attempts For Related Obstacles
+
+**RAG Offload Priority — LeanOJ Brainstorm After Final-Loop Failure:** Current final-attempt-cycle failure packet (always direct) → Accepted Brainstorm Ideas → Partial Proof Scaffolds → Verified Subproofs → Older Historical Final Failures (RAG only)
+
+**LeanOJ capped feedback rule:** Same-subproof prior attempt errors and rejection/failure summaries may stay capped as direct feedback. The final solver may receive compact execution feedback from the most recent 5 final attempts after filtering or rewriting path-transition vocabulary and final-cycle attempt-count summaries. Validator feedback rejecting non-progressive `master_proof.lean` shortening edits is allowed as direct final-solver feedback. The cap applies only to direct rejection/execution feedback, not to total persisted LeanOJ memory.
+
+**LeanOJ mandatory direct-inject inputs:** User problem, Lean template, JSON/schema/task instructions, and the canonical `master_proof.lean` during the final proof-editing loop are mandatory direct-inject context. The master proof is the active proof attempt and must be injected in full. It must never be RAG offloaded, summarized, compressed, truncated, chunk-windowed, or replaced by an excerpt. If the full master proof cannot fit with the other mandatory prompt context, LeanOJ must stop with a hard mandatory direct-context overflow error.
 
 ## Further RAG Specifications
 
@@ -62,6 +82,9 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 - **Generic mode lock skip**: FastEmbed is in-process and thread-safe — embedding calls skip the global RAG lock. ChromaDB write locking remains in both modes.
 - **Read retry**: Vector search auto-retries with exponential backoff (0.5s → 1s → 2s, max 3 attempts) on HNSW index errors during concurrent writes
 - **Embedding rate limiting**: Semaphore limits concurrent embedding requests to 2 (default mode only; generic mode uses in-process FastEmbed)
+- **FastAPI event-loop safety**: `rag_manager` must not run synchronous ChromaDB calls or CPU-heavy scoring directly on the event loop. Use `asyncio.to_thread()` for ChromaDB `add/query/get/delete` and for large in-memory vector/BM25 scoring.
+- **Retrieval snapshots**: Take a stable chunk snapshot before threaded scoring so concurrent add/remove operations cannot mutate the iterable being scored. Worker-thread BM25/vector scoring should use local snapshot state and must not mutate shared caches such as `self.bm25_index`.
+- **GUI responsiveness invariant**: RAG work runs inside long-lived research/proof tasks; it must never starve `/api/health`, `/api/features`, status polling, OpenRouter key-status, or WebSocket handling.
 
 ---
 
@@ -69,12 +92,14 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Stage A — Query Rewriting**: Expands to 3-6 semantic variants; filters queries < 3 words; embeddings cached (500-entry LRU); variants batched into single embedding API call.
 
-**Stage B — Hybrid Recall**: BM25 (exact terms) + ANN Cosine (semantic); top 120 from each, deduped by chunk_id.
+**Stage B — Hybrid Recall**: BM25 (exact terms) + ANN Cosine (semantic); top 120 from each, deduped by chunk_id. Optional `include_sources` / `include_source_prefixes` scopes recall to named source files or source-name prefixes before reranking. Recall operates on a chunk snapshot; scoped in-memory vector fallback and BM25 scoring must run off-loop.
 
 **Stage C — Reranking + MMR**: Blend vector (60%) + BM25 (40%); MMR λ=0.8 (80% relevance, 20% diversity); removes near-duplicates (similarity > 0.85); hard cap at context budget.
 
 **Stage D — Packing**: Assembles evidence with headers; priority: document → section → relevance. Packs chunks incrementally until budget is reached (no compression — disabled as unreliable). Skips chunks from `exclude_sources` (content already direct-injected in prompt). Returns `ContextPack` with evidence tracking.
 
+**Scoped retrieval**: `rag_manager.retrieve()` may receive `include_sources` and/or `include_source_prefixes` to restrict recall to a namespaced source set before reranking/packing. Use this for mode-specific memory namespaces such as LeanOJ so proof-solver artifacts cannot leak into unrelated paper-writing or compiler retrieval. `exclude_sources` still applies afterward for anti-duplication when a scoped source was direct-injected.
+
 ---
 
 ## Multi-Configuration Chunk Storage
@@ -103,6 +128,8 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Always direct injected**: User prompt/goal, JSON output format specs, system prompts.
 
+**Mandatory direct-inject overflow**: Mandatory direct-inject inputs are not eligible for RAG fallback or compression. If they exceed available prompt context, halt with an explicit overflow error. Examples include the LeanOJ final-loop `master_proof.lean`, validator submissions under review, active Lean source/proof attempts, and proof-verification candidate theorem/formalization inputs.
+
 **Token budget formula**: `available_input = context_window - output_reserve - buffer(500)`
 
 **Context allocation algorithm**:
@@ -113,10 +140,12 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Key Invariant**: Context allocator returns content parts only. Prompt builder adds template parts (system prompt, JSON, user prompt). Both must be counted to avoid overflow.
 
-**Overflow handling**: User prompt always direct injected; if exceeds `context_window - minimum_RAG_allocation`: HALT with error. Content too large: offload to RAG. Still doesn't fit: compress (NEVER truncate).
+**Overflow handling**: User prompt always direct injected; if exceeds `context_window - minimum_RAG_allocation`: HALT with error. Mandatory direct-inject content that does not fit: HALT with explicit context-overflow error. Non-mandatory content too large: offload to RAG. Still doesn't fit: compress only when the mode explicitly allows compression (NEVER truncate).
 
 **Source Exclusion (anti-duplication)**: `rag_manager.retrieve(exclude_sources=[...])` filters chunks from named sources during Stage D packing. Callers pass source names of content already direct-injected so RAG budget goes entirely to non-duplicated content.
 
+**Source Scoping (anti-leakage)**: `rag_manager.retrieve(include_sources=[...], include_source_prefixes=[...])` restricts recall to explicit sources before reranking/packing. Use this whenever a mode stores specialized memory in the shared Chroma collections and must prevent cross-mode retrieval. LeanOJ uses session-prefixed sources such as `leanoj_{session_id}_accepted_ideas` and retrieves with `include_source_prefixes=[f"leanoj_{session_id}_"]`.
+
 | Mode | Excluded Sources | Reason |
 |---|---|---|
 | Compiler construction | `compiler_outline.txt`, `compiler_paper.txt`, brainstorm source (when direct-injected) | All three always direct-injected in construction prompts |
@@ -124,6 +153,7 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 | Compiler rigor | `compiler_outline.txt` | Outline always direct-injected; paper intentionally RAG'd (smaller context) |
 | Aggregator submitter/validator | Direct-injected user file names + direct-injected shared-training sources (current training file + `rag_shared_training_update_*`) | Prevents RAG returning chunks already in direct context when only some content is offloaded |
 | Aggregator cleanup review | Same as above, when full submissions DB is direct-injected | Prevents cleanup RAG evidence from repeating already-injected submissions |
+| LeanOJ proof solver | Direct-injected LeanOJ source names, scoped to `leanoj_{session_id}_*` sources | Keeps useful proof memory session-scoped and prevents cross-mode retrieval pollution |
 
 ---
 
@@ -162,6 +192,8 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 **Proof Verification Stage (optional, gated on `lean4_enabled`)**: Proof identification, formalization, and lemma search agents operate outside the RAG pipeline. Verified `ProofRecord` summaries and `FailedProofCandidate` hints (from `proof_prompts.format_failure_hints_for_injection`) are **highest-priority direct injections** into subsequent brainstorm/paper submitter prompts when present — never RAG'd. Lean source files under the session `proofs/` directory are not indexed into Chroma.
 
+**LeanOJ Proof Solver**: LeanOJ useful proof memory uses the existing RAG pipeline through `backend/leanoj/core/leanoj_context.py`, not a separate/simple retriever. Mandatory prompt inputs (user problem, Lean template, role task, JSON schema) stay direct. Useful artifacts (accepted ideas, recursive topics, verified subproofs, partial proof scaffolds, historical final attempts, final-cycle packets, failed subproof context) are persisted in full, direct-injected if they fit, otherwise indexed under session-scoped `leanoj_{session_id}_*` sources and retrieved with source scoping. Direct-injected LeanOJ sources must be excluded from RAG evidence. Current final-cycle failure packets are direct context for the next brainstorm/proofstorm phase; older final-cycle packets remain available through scoped RAG only. Recent rejection/error summaries remain capped direct feedback. During final proof-editing, allocation is narrower: no recursive topics, no historical final-cycle packets, no failed-attempt counts, and no phase-transition/path vocabulary; the prompt may still include the most recent 5 final attempts as capped execution feedback so the solver does not repeat stale edits or ignored Lean errors. Validator feedback from rejected non-progressive master-proof shortening edits may be direct feedback because it tells the next final solver what proof progress to restore. The canonical LeanOJ master proof draft (`master_proof.lean`) is file-backed working state, not a RAG artifact: during the final proof-editing loop it is mandatory direct-inject context and must be shown fully or the program must halt with a mandatory direct-context overflow error. Edits always apply to the full persisted proof.
+
 **Embedding provider routing**: See dual-contract table above. Default mode uses LM Studio with OpenRouter fallback. Generic mode uses in-process FastEmbed. Both modes produce compatible vector dimensions for the same ChromaDB collections.
 
 **Training DB files**: `rag_shared_training.txt` and `Summary_Of_Last_5_Validator_Rejections_For_Submitter_{num}.txt` live under the active instance data root (default desktop paths: `backend/data/rag_shared_training.txt` and `backend/data/Summary_Of_Last_5_Validator_Rejections_For_Submitter_{num}.txt`).
@@ -170,11 +202,11 @@ User-uploaded files: pre-generate ALL 4 configurations. Dynamic files (training
 
 ## Agents Intentionally Without RAG
 
-These agents use ONLY direct injection (no RAG fallback) by design. Each operates on compact metadata summaries where RAG is unnecessary. Documented in each file's module docstring.
+These agents use ONLY direct injection for their compact metadata decision steps. If a listed agent has a later full-content expansion step, that expansion may use the normal direct-first/RAG fallback documented in its module docstring.
 
 | Agent | Inputs | Why No RAG |
 |---|---|---|
-| Topic selector | Brainstorm metadata, paper titles/abstracts | Strategic "what to work on" decision — summaries suffice; abstracts truncated as overflow fallback |
+| Topic selector | Brainstorm metadata, paper titles/abstracts | Strategic "what to work on" decision — bounded metadata summaries suffice |
 | Topic validator | Same as topic selector | Validates strategic decision, same compact metadata |
 | Paper title selector | Brainstorm summary, existing paper titles/abstracts | Title selection needs topic overview, not full content |
 | Paper redundancy checker | Paper titles/abstracts | Redundancy detected at abstract level, not full-content comparison |
@@ -184,7 +216,7 @@ These agents use ONLY direct injection (no RAG fallback) by design. Each operate
 | Brainstorm continuation | Brainstorm summary, prior paper titles/abstracts | "Write another or move on" uses summary, not full DB |
 | Proof identification / formalization / lemma search | Candidate theorem text, Lean error output, targeted Mathlib lemma metadata | Operates on compact Lean source + structured hints; proof agents consume `ProofRecord` direct-injection summaries and do not route through the RAG pipeline |
 
-**Known oversight**: Certainty assessor Step 2 drops expanded papers when they don't fit instead of RAG'ing them. Should use RAG fallback like reference_selector does.
+**Certainty assessor overflow handling**: Certainty assessor Step 1 remains abstract/outline-only. Step 2 uses RAG fallback for requested expanded papers when full direct injection does not fit.
 
 ---
 
@@ -195,7 +227,7 @@ These agents use ONLY direct injection (no RAG fallback) by design. Each operate
 3. User files pre-generate 4 configs — no re-chunking during session
 4. Dynamic files re-chunked on update — single config
 5. Submitter cycling is independent — each maintains own cycle state
-6. No truncation fallback — fails cleanly, uses RAG or compresses
+6. No truncation fallback — mandatory direct-inject context fails cleanly; non-mandatory oversized content uses RAG or mode-approved compression
 7. Evidence tracking mandatory — all facts map to source spans
 8. User files protected from eviction — permanent cache
 9. Contradiction check pre-acceptance
@@ -205,3 +237,7 @@ These agents use ONLY direct injection (no RAG fallback) by design. Each operate
 13. Per-size chunk cap (`max_chunks_per_size`) enforced after every add — prevents unbounded in-memory embedding growth
 14. Agents that use only metadata summaries (topic selector, title selector, redundancy checker, etc.) intentionally skip RAG — see "Agents Intentionally Without RAG" table above
 15. If content is already direct-injected, it must NOT also appear in RAG retrieval results — no duplication
+16. Shared Chroma retrieval must use source scoping for mode/session-specific memory such as LeanOJ proof artifacts — no cross-mode memory leakage
+17. LeanOJ `master_proof.lean` is mandatory full direct-inject context during the final proof-editing loop. Never RAG, summarize, compress, truncate, or window it. If it does not fit, halt with a mandatory direct-context overflow error.
+18. Synchronous ChromaDB operations and heavy RAG scoring must be offloaded from the FastAPI event loop.
+19. Threaded RAG scoring must use local snapshots and must not mutate shared retrieval indexes/caches.
diff --git a/.dockerignore b/.dockerignore
index 765032d..8e3b315 100644
--- a/.dockerignore
+++ b/.dockerignore
@@ -31,7 +31,7 @@ commits_pending.txt
 proof-integration-build*-plan.md
 
 Click To Launch MOTO.bat
-Launch MOTO.sh
+linux-ubuntu-launcher.sh
 moto_launcher.py
 moto_updater.py
 
diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 0000000..3bdebe0
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,16 @@
+* text=auto
+
+*.py text eol=lf
+*.js text eol=lf
+*.jsx text eol=lf
+*.json text eol=lf
+*.md text eol=lf
+*.mdc text eol=lf
+*.css text eol=lf
+*.yml text eol=lf
+*.yaml text eol=lf
+
+.gitignore text eol=lf
+.gitattributes text eol=lf
+
+*.sh text eol=lf
diff --git a/.gitignore b/.gitignore
index 50261b8..cc9881a 100644
--- a/.gitignore
+++ b/.gitignore
@@ -71,6 +71,8 @@ backend/data/auto_final_answer/*
 !backend/data/auto_final_answer/.gitkeep
 
 backend/data/auto_sessions/
+backend/data/leanoj_sessions/
+backend/data/leanoj_artifacts/
 
 # Proof verification artifacts (Lean 4 / Z3 hybrid mode)
 backend/data/proofs/*
@@ -123,4 +125,6 @@ htmlcov/
 final_volume.txt
 RANDOM LOG.txt
 randomlog.txt
+randomlog*.txt
+leanoj_master_proof_*.lean.txt
 commits_pending.txt
diff --git a/HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md b/HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md
new file mode 100644
index 0000000..ba9a15b
--- /dev/null
+++ b/HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md
@@ -0,0 +1,400 @@
+# HardOJ AWS Outline: User-Donated Lean Verification and Karma
+
+## Purpose
+
+HardOJ is an advanced Lean proof challenge platform where users can submit theorem templates, vote on templates, solve templates, and optionally donate their own compute to verify Lean proofs safely.
+
+The core product goal is to create a public problem marketplace for hard formalization targets, including advanced theorem templates such as unsolved Lean 100-style problems, while keeping verification trustworthy, reproducible, and resistant to compute abuse.
+
+## Core User Flows
+
+### Template Submission
+
+Users can submit Lean theorem templates as public challenge problems.
+
+A template includes:
+
+- A title and informal mathematical statement
+- The Lean theorem statement
+- Required imports
+- A pinned Lean version and Mathlib revision
+- Optional explanatory notes, references, and difficulty tags
+- Optional helper lemmas or staged subproblem templates
+- A starter file ending in `sorry`
+
+Example template shape:
+
+```lean
+import Mathlib
+
+/-!
+Informal statement:
+This section explains the intended mathematical theorem.
+
+Rules:
+- The final proof must not use `axiom`, `constant`, `opaque`, or unrelated imported shortcuts.
+- The theorem statement must remain unchanged.
+- The proof must compile under the pinned Lean and Mathlib versions.
+-/
+
+theorem hardoj_target_theorem
+    (/- variables -/)
+    (/- hypotheses -/) :
+    /- formal claim -/ := by
+  sorry
+```
+
+Before a submitted template becomes public, HardOJ validates that:
+
+- The Lean file parses and typechecks with `sorry` allowed
+- Imports are on the allowlist or approved by moderation
+- The theorem statement is not empty, trivial, or already solved in the submitted file
+- The template does not introduce fake proof devices such as `axiom`, `constant`, `opaque`, or unsafe escape hatches
+- The informal statement reasonably matches the formal Lean target
+
+### Template Voting
+
+Users can upvote or downvote templates.
+
+Voting is used to surface important, interesting, difficult, and well-scoped theorem challenges. A template's visible score works like a Reddit-style post score: upvotes increase the score, downvotes decrease it, and ranking can use time decay, controversy, and anti-abuse filtering.
+
+Templates with high scores become more valuable to solve because successful solvers receive karma based on the template's current score.
+
+### Proof Submission
+
+Users submit a completed Lean proof for a public template.
+
+A proof submission includes:
+
+- The unchanged template theorem statement
+- The user's proof replacing `sorry`
+- A proof hash
+- The Lean and Mathlib version used
+- Local verifier logs if available
+- Optional explanation of the proof strategy
+
+HardOJ accepts the solution only if the proof compiles in the pinned environment and passes integrity checks.
+
+### Karma Rewards
+
+Karma works like Reddit-style karma for platform reputation.
+
+Users gain karma when other users upvote their submitted templates, comments, explanations, and accepted solutions. Users lose karma from downvotes, subject to anti-abuse controls.
+
+Special HardOJ rule:
+
+- If a user solves a template, the solver receives solution karma equal to the template's current positive score at the time the solution is accepted.
+- If someone else solves a user's template, the template creator receives a creator bonus equal to 25% of that same positive score snapshot.
+
+Example:
+
+- A template has score `87`
+- A user submits the first accepted proof
+- The solver receives `87` solution karma
+- The template creator receives `21.75` creator-bonus karma, rounded according to the platform's configured karma precision
+
+If a template has a score below zero, the solution reward should floor at zero unless the platform later chooses to allow negative challenge rewards.
+
+## Compute Donation Model
+
+HardOJ should start with a safe model: users donate compute to verify their own submissions locally. Public volunteer verification can be added later with stronger controls.
+
+### Local User-Owned Verification
+
+The user runs a HardOJ verifier agent on their own machine.
+
+The verifier:
+
+1. Downloads the selected template package
+2. Uses the pinned Lean and Mathlib versions
+3. Inserts the user's submitted proof
+4. Runs Lean in a sandbox
+5. Returns verification metadata to HardOJ
+
+Returned metadata includes:
+
+- Template ID
+- Submission ID
+- Proof hash
+- Lean version
+- Mathlib revision
+- Success or failure
+- Lean errors if verification fails
+- Runtime, memory use, and timeout status
+
+Local verification helps users avoid wasting server resources and gives fast feedback. However, local verification should not be the sole source of official acceptance because a malicious client can fake success.
+
+### Official Acceptance
+
+For official karma, leaderboard placement, and "solved" status, HardOJ should use one of these trust paths:
+
+1. **Trusted AWS verification**: HardOJ re-verifies the final proof on AWS before accepting it.
+2. **Volunteer quorum plus spot check**: Multiple independent volunteer verifiers return matching success for the same proof hash, with HardOJ spot-checking high-value solves.
+3. **Attested verifier later**: Use stronger attestation if a reliable cross-platform proof-verifier attestation path becomes available.
+
+The recommended MVP is local pre-verification plus AWS official verification.
+
+## Anti-Exploitation Rules for Donated Compute
+
+User-donated compute must not become a free arbitrary job runner.
+
+Every donated verification job must be constrained:
+
+- Verify only a specific HardOJ template ID
+- Use only the pinned Lean and Mathlib revision
+- Use an immutable template package
+- Use a proof file whose hash is known before execution
+- Disable network access during Lean execution
+- Run in a container, VM, or OS sandbox
+- Enforce wall-time, CPU, RAM, process, and file-size limits
+- Use a read-only project root and a temporary write directory
+- Reject unauthorized imports or local file access
+- Never expose user secrets, API keys, cookies, or filesystem paths to the sandbox
+- Allow the user to cancel jobs at any time
+
+For MVP, donated compute should verify only the user's own proofs. Public volunteer verification should be opt-in and off by default.
+
+## AWS Architecture
+
+### Frontend
+
+Use one of:
+
+- S3 + CloudFront for a static web frontend
+- AWS Amplify for managed frontend deployment
+- A separate web app stack if HardOJ shares infrastructure with another website
+
+Frontend responsibilities:
+
+- Browse templates
+- Submit templates
+- Vote on templates
+- Submit proofs
+- Show verification status
+- Show karma, leaderboards, and user profiles
+- Connect to the local verifier agent when installed
+
+### API Layer
+
+Use API Gateway or an Application Load Balancer in front of backend services.
+
+Backend services can run on:
+
+- ECS Fargate for containerized API services
+- EKS if Kubernetes is already used
+- Lambda for small event-driven tasks
+
+Primary backend responsibilities:
+
+- Authentication and user sessions
+- Template submission and moderation
+- Voting and karma accounting
+- Proof submission lifecycle
+- Verification queue management
+- Leaderboards and notifications
+
+### Database
+
+Use PostgreSQL on Amazon RDS for relational data.
+
+Recommended tables:
+
+- `users`
+- `templates`
+- `template_versions`
+- `template_votes`
+- `proof_submissions`
+- `verification_jobs`
+- `verification_results`
+- `karma_events`
+- `comments`
+- `comment_votes`
+- `moderation_events`
+
+Use immutable event rows for karma changes so reputation can be audited and recomputed.
+
+### Object Storage
+
+Use S3 for immutable artifacts:
+
+- Template packages
+- Lean source files
+- Submitted proofs
+- Verification logs
+- Generated problem bundles
+- Public downloadable archives
+
+Every stored artifact should include a content hash.
+
+### Verification Queue
+
+Use SQS for verification jobs.
+
+Job payload:
+
+- Job ID
+- Template ID
+- Template version hash
+- Proof submission ID
+- Proof hash
+- Lean toolchain version
+- Mathlib revision
+- Resource limits
+
+AWS official verifiers and optional volunteer verifiers both consume jobs, but they should use different queues and trust levels.
+
+### Official AWS Verifier Workers
+
+Run official verifier workers on ECS Fargate, AWS Batch, or EC2 autoscaling groups.
+
+Each verifier worker:
+
+- Pulls one job from SQS
+- Downloads immutable artifacts from S3
+- Builds or reuses the pinned Lean environment
+- Runs Lean in a locked sandbox
+- Uploads logs and result metadata
+- Writes the result to the backend
+
+For hard theorem templates, AWS Batch or EC2 workers may be more practical than Lambda because Lean and Mathlib verification can be CPU-heavy and long-running.
+
+## Local Verifier Agent
+
+The local verifier agent is a small desktop service or CLI installed by the user.
+
+Responsibilities:
+
+- Authenticate with HardOJ
+- Receive only user-approved jobs
+- Download immutable template packages
+- Run Lean in a sandbox
+- Stream local logs to the browser
+- Submit signed result metadata
+
+The browser can connect to the local verifier through:
+
+- `localhost` HTTP/WebSocket with a one-time pairing token
+- A CLI command that verifies a downloaded package
+- A desktop app wrapper
+
+The local verifier should never accept remote arbitrary commands. It should expose only a narrow API:
+
+- `GET /status`
+- `POST /verify-template-proof`
+- `POST /cancel-job`
+
+## Template Ranking
+
+Template ranking can use Reddit-style concepts:
+
+- Net score: upvotes minus downvotes
+- Hot ranking: score adjusted by age
+- Top ranking: highest score over a time window
+- New ranking: recent submissions
+- Controversial ranking: high activity with mixed votes
+
+HardOJ-specific ranking signals:
+
+- Number of failed serious attempts
+- Whether the template has a verified solution
+- Difficulty tag
+- Formalization quality score
+- Moderator approval level
+- Number of staged helper templates
+
+## Karma System
+
+Karma should be event-sourced.
+
+Each karma change is stored as a `karma_event`:
+
+- User ID
+- Event type
+- Source object type
+- Source object ID
+- Delta
+- Timestamp
+- Reason
+
+Event types:
+
+- Template upvote received
+- Template downvote received
+- Comment upvote received
+- Comment downvote received
+- Solution accepted
+- Template solved creator bonus
+- Solution upvote received
+- Moderator adjustment
+- Abuse rollback
+
+Template solve reward:
+
+- On accepted solution, compute `reward = max(template_score_at_acceptance, 0)`
+- Compute `creator_bonus = reward * 0.25` for the template author when the solver is not the same user as the template author
+- Add a `solution_accepted` karma event for the solver
+- Add a `template_solved_creator_bonus` karma event for the template creator when the solver is not the template author
+- Store the score snapshot used for the reward
+- Do not retroactively change the solver's reward or creator bonus if the template later gains or loses votes, unless the platform later adds a bounty mechanism
+
+This keeps rewards predictable and prevents old solves from constantly changing user karma.
+
+## Abuse Controls
+
+HardOJ needs anti-abuse protections because votes and karma create incentives.
+
+Recommended controls:
+
+- One vote per user per object
+- Rate limits on voting, posting, and proof submissions
+- New-account vote weighting or trust thresholds
+- Bot and sockpuppet detection
+- Vote-ring detection
+- Moderator review for high-value solve rewards
+- Karma rollback events for abuse
+- Shadow filtering for suspicious votes until reviewed
+- No unlimited verification retries on shared AWS compute
+
+## MVP Scope
+
+The first version should implement:
+
+- User accounts
+- Template submission
+- Template upvotes/downvotes
+- Reddit-style template score
+- Proof submission
+- Local user-owned verifier for pre-checking
+- AWS official verifier for accepted solves
+- Karma events
+- Solver receives karma equal to template score at acceptance
+- Template creator receives a 25% karma bonus when another user solves their template
+- Basic leaderboards
+
+Public donated verification for other users should wait until after the local verifier and AWS verifier are stable.
+
+## Later Extensions
+
+Possible future additions:
+
+- Volunteer verifier pool for public proofs
+- Quorum-based verification
+- Template bounties separate from karma
+- AI-generated Lean template proposals
+- AI semantic review for informal/formal theorem match
+- Staged theorem packs for major open formalization targets
+- Team solving
+- Private templates before publication
+- Proof explanation rewards
+- HardOJ API for external theorem-proving agents
+
+## Critical Invariants
+
+1. A template can be public only if it typechecks with `sorry` in the pinned Lean environment.
+2. A proof can be officially accepted only after trusted verification or an approved trust policy.
+3. User-donated compute must never run arbitrary unscoped jobs.
+4. Verification jobs must be sandboxed, resource-limited, and network-isolated.
+5. Karma must be auditable through immutable karma events.
+6. Solver karma from a template solve is based on the template score snapshot at acceptance.
+7. Template creator solve bonuses are 25% of the same acceptance-time score snapshot.
+8. Lean acceptance is necessary but not always semantically sufficient; high-value templates need informal/formal review.
diff --git a/LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md b/LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md
new file mode 100644
index 0000000..4e934bb
--- /dev/null
+++ b/LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md
@@ -0,0 +1,25 @@
+# LeanOJ Master Proof Writer Remainder
+
+## Audit Result
+The master-proof edit loop, persistent `master_proof.lean`, edit history log, resume metadata, stuck-to-brainstorm signal, and focused coordinator tests are implemented.
+
+## Fixed After Audit
+### Mandatory Full Proof Direct Injection
+The final-solver prompt now directly injects the full `master_proof.lean` as mandatory context. The proof attempt is never truncated, summarized, windowed, or RAG-substituted. If the full master proof cannot fit alongside the other mandatory prompt context, LeanOJ raises a hard mandatory direct-context overflow error and stops instead of continuing with partial proof context.
+
+Implemented:
+1. Full master proof direct injection.
+2. Hard overflow error when the mandatory full proof cannot fit.
+3. Token counting before prompt assembly.
+4. Test coverage for mandatory context overflow.
+
+## Completed Follow-Ups
+1. Added read-only API access for retrieving the current master proof draft on demand, without broadcasting it in normal status payloads.
+2. Added compact edit-history summaries for debugging.
+3. Added snapshot compaction for large `master_proof_edits.jsonl` logs.
+4. Added a conservative progress watchdog for repeated `needs_more_time: true` edits that do not make meaningful progress.
+5. Added focused coordinator/API route tests for the follow-up behavior.
+6. Added a UI viewer tab for the master proof draft and edit history.
+
+## Remaining Optional Follow-Ups
+- None currently known.
diff --git a/LEANOJ_PROBLEM_11_PROMPT.md b/LEANOJ_PROBLEM_11_PROMPT.md
new file mode 100644
index 0000000..73cea60
--- /dev/null
+++ b/LEANOJ_PROBLEM_11_PROMPT.md
@@ -0,0 +1,34 @@
+# LeanOJ Problem 11 Prompt
+
+Source: [LeanOJ Problem 11](https://leanoj.org/index.php?action=view_problem&id=11)
+
+# User Prompt
+
+Solve the LeanOJ problem "RMM 2023 Shortlist N1" completely in Lean 4.
+
+Problem statement:
+
+Let `n` be a positive integer. Let `S` be a set of ordered pairs `(x, y)` such that `1 <= x <= n` and `0 <= y <= n` in each pair, and there are no pairs `(a, b)` and `(c, d)` of different elements in `S` such that `a^2 + b^2` divides both `ac + bd` and `ad - bc`. In terms of `n`, determine the size of the largest possible set `S`.
+
+Your task is to replace every `sorry` in the LeanOJ template with a complete Lean 4 proof accepted by the LeanOJ checker. Preserve the imports, definitions, theorem statement, and overall template structure unless a change is strictly necessary for Lean 4 verification. Do not use `sorry`, `admit`, fake axioms, or placeholder proof devices.
+
+Mathlib version used by the checker: `v4.29.0`.
+
+The final answer must be a complete Lean 4 file suitable for direct LeanOJ submission.
+
+# LeanOJ Template
+
+```lean
+import Mathlib.Data.Finset.Card
+import Mathlib.Order.Bounds.Defs
+
+def answer (n : ℕ) : ℕ := sorry
+
+def S (n : ℕ) : Set ℕ := { a : ℕ | ∃ S : Finset (ℕ × ℕ), S.card = a ∧
+    (∀ p ∈ S, 1 ≤ p.1 ∧ p.1 ≤ n ∧ 0 ≤ p.2 ∧ p.2 ≤ n) ∧
+    (∀ u ∈ S, ∀ v ∈ S, u ≠ v → ¬(
+      (u.1 ^ 2 + u.2 ^ 2) ∣ (u.1 * v.1 + u.2 * v.2) ∧
+      (u.1 ^ 2 + u.2 ^ 2) ∣ (u.1 * v.2 - u.2 * v.1))) }
+
+theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := sorry
+```
diff --git a/README.md b/README.md
index 3da2ffb..a4aead6 100644
--- a/README.md
+++ b/README.md
@@ -1,12 +1,12 @@
 # MOTO Autonomous ASI
-## An Autonomous Prototype Superintelligence - Automated Theorem Generation with Lean 4 Mathematics Proof Verification
-**Version: 1.0.7**
+## Autonomous Prototype Superintelligence - Automated Theorem Generation with Lean 4 Math Proof Verification
+**Version: 1.0.8**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
 [![Node.js 16+](https://img.shields.io/badge/node-16+-green.svg)](https://nodejs.org/)
 
-**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers — and the machine-checked theorem proving programming language Lean 4 proofs alongside them for definitive mathematical confirmation of correctness. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assists in deciphering how we explore AI weights, a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. Additionally, MOTO ships an optional automated theorem generation pipeline that formalizes candidate theorems and lemmas in Lean 4 (with optional Z3/SMT hinting and Mathlib lemma search) and only stores proofs that Lean 4 accepts as genuinely verified. This exact version of MOTO is customized to be useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
+**A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers — and machine-checked proofs in the Lean 4 theorem-proving language alongside them for definitive mathematical confirmation of correctness. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assists in deciphering how we explore AI weights: a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. Additionally, MOTO has optional automated theorem generation capabilities that formalize candidate theorems and lemmas in Lean 4 (with optional Z3/SMT hinting and Mathlib lemma search) and only store proofs that Lean 4 accepts as genuinely mathematically verified. Lean 4 automation means the user gets guaranteed verification of the mathematical results produced. This exact version of MOTO is customized to be useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, researchers, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
 
 ### The Core Discovery: Top-P Exploration 
 
@@ -22,7 +22,7 @@ MOTO may produce many brilliant papers as it runs; these intermediate papers are
 
 ### Secondary Feature: Automated Theorem Generation with Lean 4 Verification
 
-Paired with Top-P Exploration — and secondary to it — MOTO ships an **optional automated theorem generation pipeline** that turns the autonomous brainstorm and paper stream into **machine-checked Lean 4 proofs**. When `lean4_enabled` is on, the coordinator first runs a one-shot *proof-framing gate* to decide whether the user's prompt is proof-amenable; if it is, every subsequent brainstorm and paper becomes a candidate source for formalization. After each completed brainstorm (Tier 1) and each completed paper (Tier 2 / Tier 3 chapter), a dedicated proof stage runs:
+Paired with Top-P Exploration — and secondary to it — MOTO has an **optional automated theorem generation pipeline** that turns the autonomous brainstorm and paper stream into **machine-checked Lean 4 proofs**. When `lean4_enabled` is on, the coordinator first runs a one-shot *proof-framing gate* to decide whether the user's prompt is proof-amenable; if it is, every subsequent brainstorm and paper becomes a candidate source for formalization. After each completed brainstorm (Tier 1) and each completed paper (Tier 2 / Tier 3 chapter), a dedicated proof stage runs:
 
 1. **Candidate identification** — an LLM agent extracts theorem/lemma candidates from the brainstorm or paper.
 2. **Mathlib lemma search** — a second agent surfaces relevant existing Mathlib lemmas and threads them into the formalization prompt.
@@ -33,7 +33,7 @@ Paired with Top-P Exploration — and secondary to it — MOTO ships an **option
 
 **Lean 4 is authoritative.** SMT results are hints only — they never substitute for Lean verification, and any proof that would compile only because of a `sorry` or `admit` is rejected. The pipeline is entirely silent and skipped when `lean4_enabled=False`, so it never blocks brainstorm or paper completion; the default hosted image stays Lean-free and Z3-free. A manual-check endpoint (`POST /api/proofs/check`) also lets you re-run the pipeline on any stored brainstorm or paper after the fact, and the compiler's "rigor mode" reuses the same Lean 4 checker to upgrade lemmas inside a paper as it's being written.
 
-Give the program a try — MOTO is as cool as it sounds. Windows has a one-click launcher and Ubuntu 24.04 now has a repo-root launcher too. Use the two links below to download Python and Node.js, they should automatically install in seconds. Once those are downloaded, click the green "< > Code" drop-down menu on the top right of this GitHub page and download the zip file. On Windows, extract it to your desktop and double-click `Click To Launch MOTO.bat`. On Ubuntu 24.04, extract it and run `bash "Launch MOTO.sh"`. Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance), select your agents in the settings profile - if desired and you are unsure you may use the preselected "fastest" profile.
+Give the program a try — MOTO is as cool as it sounds. Windows has a one-click launcher and Ubuntu 24.04 now has a repo-root launcher too. Use the two links below to download Python and Node.js; they should install automatically in seconds. Once those are downloaded, click the green "< > Code" drop-down menu on the top right of this GitHub page and download the zip file. On Windows, extract it to your desktop and double-click `Click To Launch MOTO.bat`. On Ubuntu 24.04, extract it and run `bash linux-ubuntu-launcher.sh`. Put in your OpenRouter.AI API key (or optionally connect LM Studio for faster performance) and select your agents in the settings profile; if you are unsure, you may use the preselected "fastest" profile.
 
 ***Now you are set up and every time you press launch your home lab is ready for your prompt!*** **Give MOTO the toughest question you can think of and press start to begin YOUR creations!**
 
@@ -69,6 +69,16 @@ Before installation, you need:
 4. **If using cloud AI - Get an OpenRouter API key**: Sign up at OpenRouter.ai and get a paid or free API key to use the most powerful cloud models available from your favorite providers. OpenRouter may also offer a certain amount of free API calls per day with your account key. When you download MOTO Autonomous ASI, you can see which models are free by checking the "show only free models" check box(es) in the MOTO app settings.
 5. **On first startup, pick your provider path**: After you acknowledge the disclaimer, MOTO will prompt you to either enter an OpenRouter key or confirm that LM Studio is running. If you save an OpenRouter key there, the recommended default autonomous profile is applied immediately so you can open Settings and see it already selected.
 
+#### Optional Lean 4 / SMT Proof Verification Requirements
+
+Lean 4 proof verification is optional. The launcher prepares it when available, but normal brainstorming and paper generation still run when Lean 4 is disabled or unavailable.
+
+- **Lean 4 / elan / lake**: Required only when `lean4_enabled` is turned on. The launcher attempts a one-time `elan` install and expects both `lean` and `lake` to be available afterward.
+- **Git and internet access**: Required for the first Lean 4 workspace setup because Mathlib is fetched through Lake.
+- **Mathlib storage**: Plan on several additional GB for the repo-local Lean workspace, Mathlib sources, and prebuilt `.olean` cache. First setup can take a while.
+- **Z3 / SMT**: Optional. When `smt_enabled` is turned on, MOTO uses Z3 only for conservative hints; Lean 4 remains authoritative. The launcher attempts to find or download Z3, and advanced users can provide a path through the proof settings or `MOTO_Z3_PATH`.
+- **Linux note**: On Ubuntu 24.04, make sure `python3`, `python3-venv`, `bash`, `curl`, `git`, Node.js, and npm are available. A desktop keyring backend is recommended if you want provider keys saved securely.
+
 ### Installation
 
 #### Windows (One-Click Launcher)
@@ -98,7 +108,7 @@ Before installation, you need:
 3. From the repo root, run:
 
 ```bash
-bash "Launch MOTO.sh"
+bash linux-ubuntu-launcher.sh
 ```
 
 4. The Ubuntu launcher will:
@@ -112,13 +122,15 @@ bash "Launch MOTO.sh"
 
 **Ubuntu note:** If Playwright or the desktop keyring is unavailable, the launcher stays runnable and explains the limitation. Saved provider keys will only persist when a Linux desktop keyring backend is available.
 
+**Linux support note:** Ubuntu 24.04 is the tested Linux launcher target. Other Linux distributions may work through the manual installation flow if they provide compatible Python, Node.js/npm, shell, keyring, Lean 4/elan, and browser dependencies, but they are best-effort unless explicitly tested.
+
 ### Build Identity and Update Contract
 
 - `moto-update-manifest.json` is the authoritative Build 0 updater/build identity manifest for the `main` branch.
 - `GET /api/features` exposes the public build-comparison fields `version`, `build_commit`, `update_channel`, and `api_contract_version`.
 - Official update comparisons target GitHub `main`, not GitHub Releases.
 - `Click To Launch MOTO.bat` is the authoritative Windows launcher entrypoint and delegates to `moto_launcher.py`.
-- `Launch MOTO.sh` is the authoritative Ubuntu 24.04 launcher entrypoint; it bootstraps the repo-local `.venv`, delegates to `moto_launcher.py`, and is used again for relaunch after an update when MOTO was started from that wrapper.
+- `linux-ubuntu-launcher.sh` is the authoritative Ubuntu 24.04 launcher entrypoint; it bootstraps the repo-local `.venv`, delegates to `moto_launcher.py`, and is used again for relaunch after an update when MOTO was started from that wrapper.
 - Clean extracted ZIP installs and clean `main`-tracking git clones are the supported automatic update-apply targets.
 - Dirty or locally mutated repos remain runnable, but they are update-detection-only and are not eligible for automatic update-apply behavior.
 - If launcher-managed backend/frontend services from this install are still running, the updater warns and skips update-apply until those services are closed.
@@ -207,6 +219,7 @@ moto-math-variant/
 ├── .cursor/
 │   └── rules/               # AI agent design specifications (full system documentation)
 ├── Click To Launch MOTO.bat  # One-click Windows launcher
+├── linux-ubuntu-launcher.sh  # Ubuntu 24.04 launcher
 ├── moto_launcher.py          # Internal Python launcher orchestration
 ├── moto_updater.py           # Build 1 updater helper and launcher state manager
 ├── requirements.txt         # Python dependencies
@@ -323,7 +336,7 @@ All configurable per role:
 
 #### Manual Installation (All Platforms)
 
-If you want the consumer launcher experience on Ubuntu 24.04, prefer `bash "Launch MOTO.sh"` instead of the manual steps below. The manual flow remains the fallback path when you intentionally want full terminal-level control.
+If you want the consumer launcher experience on Ubuntu 24.04, prefer `bash linux-ubuntu-launcher.sh` instead of the manual steps below. The manual flow remains the fallback path when you intentionally want full terminal-level control.
 
 ```bash
 # Clone the repository
@@ -427,9 +440,9 @@ All content generated by this system is for informational purposes only. Papers
 
 Best if you want to run local models in LM Studio, especially models above 20B parameters or larger MoE-style models.
 
-- **OS**: Windows 10+, macOS 12+, Linux
+- **OS**: Windows 10+, macOS 12+, Linux; Ubuntu 24.04 is the tested Linux launcher target
 - **RAM**: 32GB+ recommended
-- **Storage**: 50GB+ free space for models and project data
+- **Storage**: 50GB+ free space for models and project data; add several GB more if Lean 4 / Mathlib proof verification is enabled
 - **GPU**: 16GB+ VRAM recommended for practical local inference on 20B+ class models
 - **Internet**: Required for installation; optional afterward if staying local-only
 
@@ -437,13 +450,13 @@ Best if you want to run local models in LM Studio, especially models above 20B p
 
 Best if you want the lightest local hardware requirements and are comfortable running inference in the cloud through OpenRouter.
 
-- **OS**: Windows, macOS, Linux, or Raspberry Pi OS
+- **OS**: Windows, macOS, Linux, or Raspberry Pi OS; Ubuntu 24.04 is the tested Linux launcher target
 - **RAM**: 4GB minimum, 8GB recommended
-- **Storage**: 5GB+ free space
+- **Storage**: 5GB+ free space for base MOTO; use 15GB+ if enabling Lean 4 / Mathlib proof verification
 - **GPU**: Not required
 - **Internet**: Required
 
-Because the heavy model inference happens on OpenRouter, MOTO can run on very modest local hardware in this mode, including a Raspberry Pi, as long as it can run Python, Node.js, and maintain a stable internet connection.
+Because the heavy model inference happens on OpenRouter, MOTO can run on very modest local hardware in this mode, including a Raspberry Pi, as long as it can run Python, Node.js, and maintain a stable internet connection. Lean 4 proof verification adds a local toolchain and Mathlib workspace requirement even in OpenRouter-only mode.
 
 ---
 
diff --git a/backend/aggregator/agents/submitter.py b/backend/aggregator/agents/submitter.py
index 0ca5646..0072d9f 100644
--- a/backend/aggregator/agents/submitter.py
+++ b/backend/aggregator/agents/submitter.py
@@ -13,8 +13,9 @@
 from backend.shared.models import Submission, SubmitterState
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.api_client_manager import api_client_manager
+from backend.shared.brainstorm_proof_gate import is_lean_proof_submission, verify_brainstorm_proof_candidate
 from backend.shared.openrouter_client import FreeModelExhaustedError
-from backend.shared.json_parser import parse_json
+from backend.shared.json_parser import parse_json, sanitize_model_output_for_retry_context
 from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.core.context_allocator import context_allocator
 from backend.aggregator.core.queue_manager import queue_manager
@@ -89,6 +90,12 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
         return f"agg_sub{self.submitter_id}_{self.task_sequence:03d}"
+
+    def _generation_temperature(self) -> float:
+        """Return this submitter's parallel-lane temperature when a coordinator is attached and not in single-model mode; otherwise 0.0."""
+        if self.coordinator and not getattr(self.coordinator, "single_model_mode", False):
+            return api_client_manager.parallel_brainstorm_submitter_temperature(self.submitter_id)
+        return 0.0
     
     async def start(self) -> None:
         """Start the submitter agent."""
@@ -250,7 +257,7 @@ async def _generate_submission(self) -> Optional[Submission]:
                         role_id=self.role_id,
                         model=self.model_name,
                         messages=[{"role": "user", "content": prompt}],
-                        temperature=0.0,  # Deterministic generation - evolving context provides diversity
+                        temperature=self._generation_temperature(),
                         max_tokens=self.max_output_tokens  # Per-submitter max output tokens
                     )
                     call_metadata = api_client_manager.extract_call_metadata(response)
@@ -349,13 +356,13 @@ async def _generate_submission(self) -> Optional[Submission]:
                 )
                 
                 try:
-                    # CRITICAL FIX: Don't include full failed output - it can be 90K+ tokens!
-                    # Truncate to prevent context overflow during retry
+                    # Keep conversational retry context, but never replay private
+                    # model thought/channel/control tokens as an assistant turn.
                     max_failed_output_chars = 2000  # ~500 tokens - enough to show error context
-                    if len(llm_output) > max_failed_output_chars:
-                        failed_output_preview = llm_output[:max_failed_output_chars] + "\n[...output truncated for retry...]"
-                    else:
-                        failed_output_preview = llm_output
+                    failed_output_preview = sanitize_model_output_for_retry_context(
+                        llm_output,
+                        max_chars=max_failed_output_chars,
+                    )
                     
                     # Calculate if conversation fits in context window
                     prompt_tokens = count_tokens(prompt)
@@ -426,11 +433,10 @@ async def _generate_submission(self) -> Optional[Submission]:
                             )
                             
                             try:
-                                # Truncate retry output for second stage as well
-                                if len(retry_output_1) > max_failed_output_chars:
-                                    retry_output_1_preview = retry_output_1[:max_failed_output_chars] + "\n[...truncated...]"
-                                else:
-                                    retry_output_1_preview = retry_output_1
+                                retry_output_1_preview = sanitize_model_output_for_retry_context(
+                                    retry_output_1,
+                                    max_chars=max_failed_output_chars,
+                                )
                                 
                                 # Check if second retry conversation fits
                                 retry2_tokens = (prompt_tokens + preview_tokens + retry_prompt_tokens + 
@@ -516,7 +522,7 @@ async def _generate_submission(self) -> Optional[Submission]:
                     # Record as rejection in local memory
                     await self.local_memory.add_rejection(
                         error_feedback,
-                        llm_output[:750]
+                        sanitize_model_output_for_retry_context(llm_output, max_chars=750)
                     )
                     self._increment_rejection()
                     # Notify task completed (failed but still completed)
@@ -524,6 +530,83 @@ async def _generate_submission(self) -> Optional[Submission]:
                         self.task_tracking_callback("completed", task_id)
                     return None
             
+            proof_metadata = {}
+            if is_lean_proof_submission(parsed):
+                if not system_config.lean4_enabled:
+                    await self.local_memory.add_rejection(
+                        "Lean proof candidate rejected before validation because Lean 4 verification is disabled. "
+                        "Submit a normal brainstorm idea or enable Lean 4 before choosing `submission_type: lean_proof`.",
+                        str(parsed)[:750]
+                    )
+                    self._increment_rejection()
+                    if self.task_tracking_callback:
+                        self.task_tracking_callback("completed", task_id)
+                    return None
+
+                validator_model = getattr(self.coordinator, "validator_model", self.model_name) if self.coordinator else self.model_name
+                validator_context = getattr(context_allocator, "validator_context_window", rag_config.validator_context_window)
+                validator_max_tokens = getattr(rag_config, "validator_max_output_tokens", self.max_output_tokens)
+                source_context = "\n\n".join(
+                    part
+                    for part in [
+                        allocation.get("direct", ""),
+                        rag_evidence,
+                        shared_training_content,
+                    ]
+                    if part
+                )
+                gate_result = await verify_brainstorm_proof_candidate(
+                    parsed=parsed,
+                    user_prompt=self.user_prompt,
+                    source_context=source_context,
+                    model_id=self.model_name,
+                    role_id=self.role_id,
+                    task_id_prefix=f"{task_id}_lean",
+                    max_tokens=self.max_output_tokens,
+                    validator_model=validator_model,
+                    validator_context=validator_context,
+                    validator_max_tokens=validator_max_tokens,
+                    validator_role_id="aggregator_validator",
+                    max_attempts=5,
+                )
+                if not gate_result.accepted:
+                    await self.local_memory.add_rejection(
+                        gate_result.failure_feedback,
+                        str(parsed.get("lean_code") or parsed.get("submission") or parsed)[:750],
+                    )
+                    self._increment_rejection()
+                    if self.task_tracking_callback:
+                        self.task_tracking_callback("completed", task_id)
+                    return None
+
+                parsed["submission"] = gate_result.submission_content
+                parsed["reasoning"] = gate_result.reasoning or parsed.get("reasoning", "")
+                proof_metadata = {
+                    "brainstorm_lean_proof": {
+                        "theorem_statement": gate_result.theorem_statement,
+                        "theorem_name": gate_result.theorem_name,
+                        "formal_sketch": gate_result.formal_sketch,
+                        "lean_code": gate_result.lean_code,
+                        "lean_feedback": gate_result.lean_feedback,
+                        "reasoning": gate_result.reasoning,
+                        "attempts": [
+                            attempt.model_dump(mode="json")
+                            for attempt in (gate_result.attempts or [])
+                        ],
+                        "attempt_count": len(gate_result.attempts or []),
+                    }
+                }
+
+            if "submission" not in parsed or "reasoning" not in parsed:
+                await self.local_memory.add_rejection(
+                    "Submission JSON missing required `submission` or `reasoning` fields after proof gating.",
+                    str(parsed)[:750],
+                )
+                self._increment_rejection()
+                if self.task_tracking_callback:
+                    self.task_tracking_callback("completed", task_id)
+                return None
+
             # Create submission
             submission = Submission(
                 submission_id=str(uuid.uuid4()),
@@ -535,6 +618,7 @@ async def _generate_submission(self) -> Optional[Submission]:
                     "chunk_size": chunk_size,
                     "rag_used": bool(allocation["rag_context"]),
                     "llm_call": call_metadata,
+                    **proof_metadata,
                 }
             )
             
diff --git a/backend/aggregator/agents/validator.py b/backend/aggregator/agents/validator.py
index 5551f25..6ce0dee 100644
--- a/backend/aggregator/agents/validator.py
+++ b/backend/aggregator/agents/validator.py
@@ -12,7 +12,7 @@
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
-from backend.shared.json_parser import parse_json
+from backend.shared.json_parser import parse_json, sanitize_model_output_for_retry_context
 from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.core.context_allocator import context_allocator
 from backend.aggregator.memory.shared_training import shared_training_memory
@@ -326,12 +326,13 @@ async def _assess_quality(self, submission: Submission) -> ValidationResult:
                 )
                 
                 try:
-                    # CRITICAL FIX: Truncate failed output to prevent context overflow during retry
+                    # Keep conversational retry context, but never replay private
+                    # model thought/channel/control tokens as an assistant turn.
                     max_failed_output_chars = 2000  # ~500 tokens - enough for error context
-                    if len(llm_output) > max_failed_output_chars:
-                        failed_output_preview = llm_output[:max_failed_output_chars] + "\n[...output truncated for retry...]"
-                    else:
-                        failed_output_preview = llm_output
+                    failed_output_preview = sanitize_model_output_for_retry_context(
+                        llm_output,
+                        max_chars=max_failed_output_chars,
+                    )
                     
                     # Calculate if conversation fits in context window
                     prompt_tokens = count_tokens(prompt)
@@ -817,12 +818,13 @@ async def _retry_batch_json_parse(
         
         try:
             call_metadata = {}
-            # CRITICAL FIX: Truncate failed output to prevent context overflow during retry
+            # Keep conversational retry context, but never replay private
+            # model thought/channel/control tokens as an assistant turn.
             max_failed_output_chars = 2000  # ~500 tokens - enough for error context
-            if len(failed_output) > max_failed_output_chars:
-                failed_output_preview = failed_output[:max_failed_output_chars] + "\n[...output truncated for retry...]"
-            else:
-                failed_output_preview = failed_output
+            failed_output_preview = sanitize_model_output_for_retry_context(
+                failed_output,
+                max_chars=max_failed_output_chars,
+            )
             
             # Calculate if conversation fits in context window
             from backend.shared.utils import count_tokens
diff --git a/backend/aggregator/core/coordinator.py b/backend/aggregator/core/coordinator.py
index 3b89d3a..d192614 100644
--- a/backend/aggregator/core/coordinator.py
+++ b/backend/aggregator/core/coordinator.py
@@ -12,13 +12,14 @@
 import aiofiles
 
 from backend.shared.config import system_config, rag_config
-from backend.shared.models import SystemStatus, Submission, ValidationResult, SubmitterConfig, WorkflowTask, ModelConfig
+from backend.shared.models import SystemStatus, Submission, ValidationResult, SubmitterConfig, WorkflowTask, ModelConfig, ProofAttemptFeedback
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.rag_lock import rag_operation_lock
 from backend.shared.workflow_predictor import workflow_predictor
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.free_model_manager import free_model_manager
+from backend.shared.path_safety import resolve_path_within_root, validate_single_path_component
 from backend.aggregator.agents.submitter import SubmitterAgent
 from backend.aggregator.agents.validator import ValidatorAgent
 from backend.aggregator.core.queue_manager import queue_manager
@@ -29,6 +30,42 @@
 logger = logging.getLogger(__name__)
 
 
+def _resolve_uploaded_user_file(file_ref: str, *, allow_trusted_context_files: bool = False) -> Optional[Path]:
+    """Resolve an upload reference to a path under a trusted root; return None when it is empty or rejected."""
+    raw_ref = str(file_ref or "").strip()  # None and other falsy refs collapse to "" here
+    if not raw_ref:
+        return None
+
+    uploads_root = Path(system_config.user_uploads_dir).resolve()
+    data_root = Path(system_config.data_dir).resolve()
+    candidate = Path(raw_ref)
+    # Absolute references are accepted only if their resolved form lies under a trusted root.
+    if candidate.is_absolute():
+        resolved_candidate = candidate.resolve()
+        try:
+            resolved_candidate.relative_to(uploads_root)  # raises ValueError when not under uploads_root
+            return resolved_candidate
+        except ValueError:
+            pass  # not under the uploads root; fall through to the optional data-root check
+        # The data root counts as an additional trusted root only when the caller opts in.
+        if allow_trusted_context_files:
+            try:
+                resolved_candidate.relative_to(data_root)
+                return resolved_candidate
+            except ValueError:
+                pass  # not under the data root either; rejected below
+        # Only the final path component is logged, not the full rejected path.
+        logger.warning("Rejected uploaded file path outside trusted context roots: %s", candidate.name)
+        return None
+    # Non-absolute references go through the path-safety helpers; a ValueError from them means rejection.
+    try:
+        safe_filename = validate_single_path_component(raw_ref, "uploaded filename")
+        return resolve_path_within_root(uploads_root, safe_filename)
+    except ValueError as exc:
+        logger.warning("Rejected unsafe uploaded file reference: %s", exc)
+        return None
+
+
 class Coordinator:
     """
     Coordinates the entire aggregator system.
@@ -72,6 +109,7 @@ def __init__(self):
         self.single_model_mode = False
         self.submitter_configs: List[SubmitterConfig] = []
         self.validator_model = ""
+        self.validator_provider = "lm_studio"
         
         # Workflow tracking
         self.workflow_tasks: List[WorkflowTask] = []
@@ -84,6 +122,12 @@ def __init__(self):
         
         # Cleanup review toggle (disabled for short-lived mini-brainstorm phases)
         self.enable_cleanup_review = True
+
+        # Optional source-level hard cap used by autonomous brainstorm mode.
+        self.max_total_acceptances: Optional[int] = None
+        self.acceptance_count_offset: int = 0
+        self.acceptance_cap_callback: Optional[Callable[[int], Any]] = None
+        self._acceptance_cap_reached = False
     
     async def _load_stats(self) -> None:
         """Load persisted stats from file."""
@@ -120,6 +164,43 @@ async def _save_stats(self) -> None:
             logger.debug("Saved stats to file")
         except Exception as e:
             logger.error(f"Failed to save stats: {e}")
+
+    def _should_use_single_model_mode(
+        self,
+        submitter_configs: List[SubmitterConfig],
+        validator_model: str,
+        validator_provider: str,
+        loaded_models: List[str],
+    ) -> bool:
+        """
+        Decide whether same-model aggregator roles must run sequentially.
+
+        Returns False when the configured model IDs differ, or when every role
+        uses LM Studio and more than one same-base instance of the model is
+        reported as loaded (submitter fan-out); returns True in all other cases.
+        """
+        all_models = [sc.model_id for sc in submitter_configs] + [validator_model]
+        if len(set(all_models)) != 1:
+            return False
+        # From here on, every submitter and the validator are configured with the same model ID.
+        all_lm_studio = (
+            validator_provider == "lm_studio"
+            and all(sc.provider == "lm_studio" for sc in submitter_configs)
+        )
+        if not all_lm_studio:
+            return True  # same model ID, but at least one role is not on LM Studio
+        # NOTE(review): the helper is expected to count loaded same-base instances — confirm in lm_studio_client.
+        sibling_count = lm_studio_client.count_sibling_instances_from_loaded(validator_model, loaded_models)
+        if sibling_count > 1:
+            logger.info(
+                "Single configured LM Studio model '%s' has %s loaded same-base instances; "
+                "using parallel submitter workflow with instance sharing.",
+                validator_model,
+                sibling_count,
+            )
+            return False
+        # At most one matching instance was reported, so the roles run sequentially.
+        return True
     
     async def initialize(
         self,
@@ -132,8 +213,14 @@ async def initialize(
         validator_max_tokens: Optional[int] = None,
         validator_provider: str = "lm_studio",
         validator_openrouter_provider: Optional[str] = None,
+        validator_openrouter_reasoning_effort: str = "auto",
         validator_lm_studio_fallback: Optional[str] = None,
-        enable_cleanup_review: bool = True
+        validator_supercharge_enabled: bool = False,
+        enable_cleanup_review: bool = True,
+        max_total_acceptances: Optional[int] = None,
+        acceptance_count_offset: int = 0,
+        acceptance_cap_callback: Optional[Callable[[int], Any]] = None,
+        allow_trusted_context_files: bool = False,
     ) -> None:
         """
         Initialize the coordinator with configuration.
@@ -148,12 +235,22 @@ async def initialize(
             validator_max_tokens: Optional max output tokens override for validator
             validator_provider: Provider for validator ("lm_studio" or "openrouter")
             validator_openrouter_provider: OpenRouter host provider for validator (e.g., "Anthropic")
+            validator_openrouter_reasoning_effort: OpenRouter reasoning effort for validator
             validator_lm_studio_fallback: LM Studio fallback model for validator when using OpenRouter
+            validator_supercharge_enabled: Whether validator answers should use Supercharge
+            max_total_acceptances: Optional hard cap for accepted submissions, including offset
+            acceptance_count_offset: Existing acceptances before this coordinator run
+            acceptance_cap_callback: Async callback fired when the cap is reached
+            allow_trusted_context_files: Allow internal callers to pass data-root files as context
         """
         logger.info("Initializing coordinator...")
         
         # Store cleanup review toggle
         self.enable_cleanup_review = enable_cleanup_review
+        self.max_total_acceptances = max_total_acceptances
+        self.acceptance_count_offset = max(0, acceptance_count_offset)
+        self.acceptance_cap_callback = acceptance_cap_callback
+        self._acceptance_cap_reached = False
         
         # Validate submitter count
         num_submitters = len(submitter_configs)
@@ -189,13 +286,21 @@ async def initialize(
         final_validator_max_output = validator_max_tokens if validator_max_tokens is not None else rag_config.validator_max_output_tokens
         context_allocator.set_context_windows(final_submitter_context, final_validator_context, final_submitter_max_output, final_validator_max_output)
         
-        # CRITICAL: Detect single-model mode ONLY based on configured model IDs
+        # Log currently loaded models for diagnostics and same-base instance scheduling.
+        loaded_models = await lm_studio_client.get_loaded_models()
+        logger.info(f"Currently loaded models: {loaded_models}")
+
+        # CRITICAL: Detect single-model mode based on configured model IDs, with
+        # an LM Studio sibling-instance exception for safe submitter fan-out.
         # Boost routing is INDEPENDENT of this decision and does NOT affect concurrency
         # Single-model mode prevents queue overflow when all agents share the same LM Studio server
         # Boost can route calls to OpenRouter even in single-model mode (if enabled)
-        all_models = [sc.model_id for sc in submitter_configs] + [validator_model]
-        unique_models = set(all_models)
-        self.single_model_mode = len(unique_models) == 1
+        self.single_model_mode = self._should_use_single_model_mode(
+            submitter_configs,
+            validator_model,
+            validator_provider,
+            loaded_models,
+        )
         
         if self.single_model_mode:
             logger.info(
@@ -217,10 +322,6 @@ async def initialize(
                 f"This does NOT affect parallel execution mode."
             )
         
-        # Log currently loaded models for diagnostics
-        loaded_models = await lm_studio_client.get_loaded_models()
-        logger.info(f"Currently loaded models: {loaded_models}")
-        
         # CRITICAL: Warn user about potential context mismatches
         # LM Studio may not load models with requested context - this causes silent failures
         context_info = "\n".join([
@@ -260,17 +361,22 @@ async def initialize(
         
         # Load user files into RAG system
         user_files_content = {}
-        for file_path in user_files:
-            path = Path(file_path)
+        for file_ref in user_files:
+            path = _resolve_uploaded_user_file(
+                file_ref,
+                allow_trusted_context_files=allow_trusted_context_files,
+            )
+            if path is None:
+                continue
             if path.exists():
                 # Add to RAG system with all 4 chunk configs
                 await rag_manager.add_document(
-                    file_path,
+                    str(path),
                     chunk_sizes=rag_config.submitter_chunk_intervals,
                     is_user_file=True
                 )
                 # Also load content for potential direct injection (async to avoid blocking)
-                async with aiofiles.open(file_path, 'r', encoding='utf-8') as f:
+                async with aiofiles.open(path, 'r', encoding='utf-8') as f:
                     user_files_content[path.name] = await f.read()
                 logger.info(f"Loaded user file: {path.name}")
         
@@ -301,9 +407,11 @@ async def initialize(
                     provider=config.provider,
                     model_id=config.model_id,
                     openrouter_provider=config.openrouter_provider,
+                    openrouter_reasoning_effort=config.openrouter_reasoning_effort,
                     lm_studio_fallback_id=config.lm_studio_fallback_id,
                     context_window=config.context_window,
-                    max_output_tokens=config.max_output_tokens
+                    max_output_tokens=config.max_output_tokens,
+                    supercharge_enabled=config.supercharge_enabled
                 )
             )
             logger.info(f"Created Submitter {config.submitter_id}: model={config.model_id}, provider={config.provider}, context={config.context_window}")
@@ -326,9 +434,11 @@ async def initialize(
                 provider=validator_provider,
                 model_id=validator_model,
                 openrouter_provider=validator_openrouter_provider,
+                openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=validator_lm_studio_fallback,
                 context_window=final_validator_context,
-                max_output_tokens=final_validator_max_output
+                max_output_tokens=final_validator_max_output,
+                supercharge_enabled=validator_supercharge_enabled
             )
         )
         logger.info(f"Created Validator: model={validator_model}, provider={validator_provider}")
@@ -627,6 +737,8 @@ async def _validator_loop(self) -> None:
                 for submission, result in zip(submissions, results):
                     if result.decision == "accept":
                         await self._handle_acceptance(submission, result)
+                        if self._acceptance_cap_reached:
+                            break
                     else:
                         await self._handle_rejection(submission, result)
                 
@@ -721,6 +833,8 @@ async def _single_model_workflow(self) -> None:
                     for submission, result in zip(submissions, results):
                         if result.decision == "accept":
                             await self._handle_acceptance(submission, result)
+                            if self._acceptance_cap_reached:
+                                break
                         else:
                             await self._handle_rejection(submission, result)
                 
@@ -755,10 +869,22 @@ async def _single_model_workflow(self) -> None:
     
     async def _handle_acceptance(self, submission: Submission, result: ValidationResult) -> None:
         """Handle accepted submission."""
+        next_total_acceptances = self.acceptance_count_offset + self.total_acceptances + 1
+        if (
+            self.max_total_acceptances is not None
+            and next_total_acceptances > self.max_total_acceptances
+        ):
+            await self._handle_acceptance_cap_reached(
+                self.acceptance_count_offset + self.total_acceptances
+            )
+            return
+
         self.total_acceptances += 1
+        total_acceptances_with_offset = self.acceptance_count_offset + self.total_acceptances
         
         # Add to shared training
         await shared_training_memory.add_accepted_submission(submission.content)
+        await self._register_accepted_brainstorm_proof(submission)
         
         # Notify submitter
         submitter = next((s for s in self.submitters if s.submitter_id == submission.submitter_id), None)
@@ -812,6 +938,115 @@ async def _handle_acceptance(self, submission: Submission, result: ValidationRes
         # Trigger cleanup review every 7 acceptances
         if self.enable_cleanup_review and self.total_acceptances % 7 == 0 and self.total_acceptances > 0:
             await self._perform_cleanup_review()
+
+        if (
+            self.max_total_acceptances is not None
+            and total_acceptances_with_offset >= self.max_total_acceptances
+        ):
+            await self._handle_acceptance_cap_reached(total_acceptances_with_offset)
+
+    async def _handle_acceptance_cap_reached(self, total_acceptances: int) -> None:
+        """Stop accepting new work once an optional source-level cap is reached."""
+        if self._acceptance_cap_reached:
+            return
+
+        self._acceptance_cap_reached = True
+        self.is_running = False
+
+        logger.info(
+            "Acceptance cap reached at %s total acceptances; stopping aggregator at source",
+            total_acceptances,
+        )
+
+        await self._broadcast("acceptance_cap_reached", {
+            "total_acceptances": total_acceptances,
+            "max_total_acceptances": self.max_total_acceptances,
+        })
+
+        if self.acceptance_cap_callback:
+            try:
+                await self.acceptance_cap_callback(total_acceptances)
+            except Exception as e:
+                logger.error("Acceptance cap callback failed: %s", e, exc_info=True)
+
+        current_task = asyncio.current_task()
+        for submitter in self.submitters:
+            try:
+                await submitter.stop()
+            except Exception as e:
+                logger.warning("Error stopping submitter after acceptance cap: %s", e)
+
+        if self._main_task and self._main_task is not current_task and not self._main_task.done():
+            self._main_task.cancel()
+
+    def _brainstorm_proof_source_id(self) -> str:
+        """Derive a stable proof source id from the active brainstorm database path."""
+        try:
+            stem = Path(shared_training_memory.file_path).stem
+            if stem.startswith("brainstorm_"):
+                return stem[len("brainstorm_"):] or stem
+            return stem or "manual_aggregator"
+        except Exception:
+            return "manual_aggregator"
+
+    async def _register_accepted_brainstorm_proof(self, submission: Submission) -> None:
+        """Store validator-accepted Lean-verified brainstorm proofs in the proof database."""
+        proof_payload = (submission.metadata or {}).get("brainstorm_lean_proof")
+        if not isinstance(proof_payload, dict):
+            return
+
+        theorem_statement = str(proof_payload.get("theorem_statement") or "").strip()
+        lean_code = str(proof_payload.get("lean_code") or "").strip()
+        if not theorem_statement or not lean_code:
+            return
+
+        try:
+            from backend.autonomous.core.proof_registration import register_verified_lean_proof
+            from backend.autonomous.memory.proof_database import proof_database
+
+            attempts = [
+                item if isinstance(item, ProofAttemptFeedback) else ProofAttemptFeedback.model_validate(item)
+                for item in (proof_payload.get("attempts") or [])
+            ]
+            source_id = self._brainstorm_proof_source_id()
+            source_title = (self.validator.user_prompt if self.validator else "")[:300]
+            registration = await register_verified_lean_proof(
+                proof_database=proof_database,
+                user_prompt=self.validator.user_prompt if self.validator else "",
+                theorem_statement=theorem_statement,
+                lean_code=lean_code,
+                validator_model=self.validator_model,
+                validator_context=rag_config.validator_context_window,
+                validator_max_tokens=rag_config.validator_max_output_tokens,
+                task_id=f"agg_proof_novelty_{self.total_acceptances:03d}",
+                role_id="aggregator_validator",
+                source_type="brainstorm",
+                source_id=source_id,
+                source_title=source_title,
+                theorem_id=f"brainstorm_submission_{self.total_acceptances}",
+                theorem_name=str(proof_payload.get("theorem_name") or ""),
+                formal_sketch=str(proof_payload.get("formal_sketch") or ""),
+                verification_notes="Lean 4 accepted this brainstorm proof before validator acceptance.",
+                attempt_count=int(proof_payload.get("attempt_count") or len(attempts)),
+                attempts=attempts,
+                broadcast_fn=self._broadcast,
+                base_event={
+                    "source_type": "brainstorm",
+                    "source_id": source_id,
+                    "submission_id": submission.submission_id,
+                    "submitter_id": submission.submitter_id,
+                    "trigger": "brainstorm_inline",
+                },
+                proof_label=f"Brainstorm submission {self.total_acceptances}",
+            )
+            submission.metadata["proof_id"] = registration.record.proof_id
+        except Exception as exc:
+            logger.warning(
+                "Accepted Lean brainstorm proof registration failed for submission %s: %s",
+                submission.submission_id,
+                exc,
+                exc_info=True,
+            )
     
     async def _handle_rejection(self, submission: Submission, result: ValidationResult) -> None:
         """Handle rejected submission."""
diff --git a/backend/aggregator/core/queue_manager.py b/backend/aggregator/core/queue_manager.py
index e7a7b50..4c5de1d 100644
--- a/backend/aggregator/core/queue_manager.py
+++ b/backend/aggregator/core/queue_manager.py
@@ -1,9 +1,9 @@
 """
 Submission queue manager.
-Handles queue with special logic: if 10+ submissions waiting, skip to latest.
+The coordinator handles overflow by pausing submitters; queued submissions stay FIFO.
 """
 import asyncio
-from typing import Optional, List
+from typing import List, Optional
 from collections import deque
 import logging
 
@@ -15,56 +15,20 @@
 
 class QueueManager:
     """
-    Thread-safe submission queue.
-    If queue >= 10 on next dequeue, jump to latest and clear rest.
+    FIFO submission queue guarded by an asyncio.Lock (safe across coroutines, not OS threads).
     """
     
     def __init__(self):
         self.queue: deque[Submission] = deque()
         self._lock = asyncio.Lock()
-        self._not_empty = asyncio.Event()
         self.overflow_threshold = system_config.queue_overflow_threshold
     
     async def enqueue(self, submission: Submission) -> None:
         """Add submission to queue."""
         async with self._lock:
             self.queue.append(submission)
-            self._not_empty.set()
             logger.debug(f"Enqueued submission {submission.submission_id}. Queue size: {len(self.queue)}")
     
-    async def dequeue(self) -> Optional[Submission]:
-        """
-        Dequeue next submission.
-        If queue >= overflow_threshold, skip to latest and clear rest.
-        """
-        # Wait for queue to have items
-        while True:
-            async with self._lock:
-                if self.queue:
-                    break
-                self._not_empty.clear()
-            
-            await self._not_empty.wait()
-        
-        async with self._lock:
-            # Check for overflow
-            if len(self.queue) >= self.overflow_threshold:
-                # Get latest submission
-                latest = self.queue[-1]
-                # Clear all others
-                cleared_count = len(self.queue) - 1
-                self.queue.clear()
-                
-                logger.warning(
-                    f"Queue overflow ({cleared_count + 1} submissions). "
-                    f"Cleared {cleared_count} old submissions, processing latest."
-                )
-                
-                return latest
-            else:
-                # Normal dequeue
-                return self.queue.popleft()
-    
     async def size(self) -> int:
         """Get current queue size."""
         async with self._lock:
@@ -79,7 +43,6 @@ async def clear(self) -> None:
         """Clear the queue."""
         async with self._lock:
             self.queue.clear()
-            self._not_empty.clear()
             logger.info("Queue cleared")
     
     async def peek(self) -> Optional[Submission]:
diff --git a/backend/aggregator/core/rag_manager.py b/backend/aggregator/core/rag_manager.py
index 4e1e35c..54305e2 100644
--- a/backend/aggregator/core/rag_manager.py
+++ b/backend/aggregator/core/rag_manager.py
@@ -166,7 +166,9 @@ async def retrieve(
         query: str,
         chunk_size: int = 512,
         max_tokens: int = None,
-        exclude_sources: Optional[List[str]] = None
+        exclude_sources: Optional[List[str]] = None,
+        include_sources: Optional[List[str]] = None,
+        include_source_prefixes: Optional[List[str]] = None
     ) -> ContextPack:
         """
         4-stage retrieval pipeline.
@@ -176,6 +178,8 @@ async def retrieve(
             chunk_size: Chunk size to retrieve from
             max_tokens: Maximum tokens in result
             exclude_sources: Source names to skip during packing (already direct-injected)
+            include_sources: Optional source allowlist for scoped retrieval
+            include_source_prefixes: Optional source-name prefixes for scoped retrieval
         
         Returns:
             ContextPack with retrieved context
@@ -189,7 +193,18 @@ async def retrieve(
         
         # Stage B: Hybrid Recall (BM25 + Vector)
         logger.debug(f"RAG Stage 2/4: Hybrid recall (BM25 + Vector) with chunk_size={chunk_size}")
-        candidates = await self._hybrid_recall(queries, chunk_size)
+        if include_sources or include_source_prefixes:
+            logger.info(
+                "RAG Stage 2/4: Restricting retrieval scope to sources=%s prefixes=%s",
+                include_sources or [],
+                include_source_prefixes or [],
+            )
+        candidates = await self._hybrid_recall(
+            queries,
+            chunk_size,
+            include_sources=include_sources,
+            include_source_prefixes=include_source_prefixes,
+        )
         logger.debug(f"RAG Stage 2/4 complete: Retrieved {len(candidates)} candidate chunks")
         
         # Stage C: Reranking + MMR
@@ -213,14 +228,19 @@ async def _add_chunks(self, chunks: List[DocumentChunk], chunk_size: int) -> Non
         
         texts = [chunk.text for chunk in chunks]
 
+        embeddings = None
+        lock_acquired = False
         if system_config.generic_mode:
             embeddings = await api_client_manager.get_embeddings(texts)
             await rag_operation_lock.acquire(f"RAGManager add_chunks write (size={chunk_size})")
+            lock_acquired = True
         else:
             await rag_operation_lock.acquire(f"RAGManager add_chunks (size={chunk_size})")
-            embeddings = await api_client_manager.get_embeddings(texts)
-
+            lock_acquired = True
         try:
+            if embeddings is None:
+                embeddings = await api_client_manager.get_embeddings(texts)
+
             # Update chunks with embeddings and tokens
             for chunk, embedding in zip(chunks, embeddings):
                 chunk.embedding = embedding
@@ -229,7 +249,8 @@ async def _add_chunks(self, chunks: List[DocumentChunk], chunk_size: int) -> Non
             # ChromaDB writes stay under the global RAG lock in both modes.
             collection = self.collections[chunk_size]
             try:
-                collection.add(
+                await asyncio.to_thread(
+                    collection.add,
                     ids=[chunk.chunk_id for chunk in chunks],
                     embeddings=embeddings,
                     documents=texts,
@@ -247,7 +268,8 @@ async def _add_chunks(self, chunks: List[DocumentChunk], chunk_size: int) -> Non
             # Invalidate BM25 index for this size
             self.bm25_index[chunk_size] = None
         finally:
-            rag_operation_lock.release()
+            if lock_acquired:
+                rag_operation_lock.release()
     
     async def _rewrite_query(self, query: str) -> List[str]:
         """Stage A: Expand query into semantic variants."""
@@ -283,18 +305,31 @@ async def _rewrite_query(self, query: str) -> List[str]:
     async def _hybrid_recall(
         self,
         queries: List[str],
-        chunk_size: int
+        chunk_size: int,
+        include_sources: Optional[List[str]] = None,
+        include_source_prefixes: Optional[List[str]] = None
     ) -> List[Tuple[DocumentChunk, float]]:
         """Stage B: Hybrid BM25 + Vector search."""
-        chunks = self.chunks_by_size[chunk_size]
+        # Work from a stable snapshot so threaded scoring does not race with
+        # concurrent RAG add/remove operations mutating the live chunk lists.
+        chunks = list(self._filter_chunks_by_source_scope(
+            self.chunks_by_size[chunk_size],
+            include_sources=include_sources,
+            include_source_prefixes=include_source_prefixes,
+        ))
         if not chunks:
             return []
         
         # Vector search
-        vector_results = await self._vector_search(queries, chunk_size)
+        vector_results = await self._vector_search(queries, chunk_size, candidate_chunks=chunks)
         
         # BM25 search
-        bm25_results = self._bm25_search(queries, chunk_size)
+        bm25_results = await asyncio.to_thread(
+            self._bm25_search,
+            queries,
+            chunk_size,
+            chunks,
+        )
         
         # Combine and deduplicate
         combined = {}
@@ -315,17 +350,26 @@ async def _hybrid_recall(
     async def _vector_search(
         self,
         queries: List[str],
-        chunk_size: int
+        chunk_size: int,
+        candidate_chunks: Optional[List[DocumentChunk]] = None
     ) -> List[Tuple[DocumentChunk, float]]:
         """Vector similarity search with retry logic for HNSW index race conditions."""
         collection = self.collections[chunk_size]
-        chunks = self.chunks_by_size[chunk_size]
+        chunks = candidate_chunks if candidate_chunks is not None else self.chunks_by_size[chunk_size]
         
         if not chunks:
             return []
         
         query_embeddings = await api_client_manager.get_embeddings(queries)
+        if candidate_chunks is not None and len(candidate_chunks) != len(self.chunks_by_size[chunk_size]):
+            return await asyncio.to_thread(
+                self._score_vector_candidates,
+                query_embeddings,
+                chunks,
+            )
+
         all_results = []
+        chunk_by_id = {chunk.chunk_id: chunk for chunk in chunks}
         for query_embedding in query_embeddings:
             # Search with retry logic for transient HNSW errors during concurrent writes
             max_retries = 3
@@ -334,7 +378,8 @@ async def _vector_search(
             
             for attempt in range(max_retries):
                 try:
-                    results = collection.query(
+                    results = await asyncio.to_thread(
+                        collection.query,
                         query_embeddings=[query_embedding],
                         n_results=min(rag_config.hybrid_recall_top_k, len(chunks))
                     )
@@ -359,7 +404,7 @@ async def _vector_search(
             
             # Map back to chunks
             for chunk_id, distance in zip(results['ids'][0], results['distances'][0]):
-                chunk = next((c for c in chunks if c.chunk_id == chunk_id), None)
+                chunk = chunk_by_id.get(chunk_id)
                 if chunk:
                     # Convert distance to similarity (cosine distance -> similarity)
                     similarity = 1.0 - distance
@@ -374,23 +419,43 @@ async def _vector_search(
                 unique_results.append((chunk, score))
         
         return unique_results[:rag_config.hybrid_recall_top_k]
+
+    def _score_vector_candidates(
+        self,
+        query_embeddings: List[List[float]],
+        chunks: List[DocumentChunk],
+    ) -> List[Tuple[DocumentChunk, float]]:
+        """Score a scoped chunk snapshot in memory; synchronous, so the caller offloads it via asyncio.to_thread."""
+        scored: List[Tuple[DocumentChunk, float]] = []
+        for query_embedding in query_embeddings:
+            for chunk in chunks:
+                if not chunk.embedding:
+                    continue
+                scored.append((chunk, self._cosine_similarity(query_embedding, chunk.embedding)))
+
+        seen = set()
+        unique_results = []
+        for chunk, score in sorted(scored, key=lambda x: x[1], reverse=True):
+            if chunk.chunk_id in seen:
+                continue
+            seen.add(chunk.chunk_id)
+            unique_results.append((chunk, score))
+        return unique_results[:rag_config.hybrid_recall_top_k]
     
     def _bm25_search(
         self,
         queries: List[str],
-        chunk_size: int
+        chunk_size: int,
+        candidate_chunks: Optional[List[DocumentChunk]] = None
     ) -> List[Tuple[DocumentChunk, float]]:
         """BM25 lexical search."""
-        chunks = self.chunks_by_size[chunk_size]
+        chunks = list(candidate_chunks) if candidate_chunks is not None else list(self.chunks_by_size[chunk_size])
         if not chunks:
             return []
         
-        # Build or get BM25 index
-        if self.bm25_index[chunk_size] is None:
-            corpus = [chunk.tokens for chunk in chunks]
-            self.bm25_index[chunk_size] = BM25Okapi(corpus)
-        
-        bm25 = self.bm25_index[chunk_size]
+        # Build a local index for the snapshot. This runs in a worker thread
+        # and intentionally does not mutate self.bm25_index across threads.
+        bm25 = BM25Okapi([chunk.tokens for chunk in chunks])
         
         all_scores = np.zeros(len(chunks))
         for query in queries:
@@ -407,6 +472,25 @@ def _bm25_search(
         results = [(chunks[i], float(all_scores[i])) for i in top_indices if all_scores[i] > 0]
         
         return results
+
+    @staticmethod
+    def _filter_chunks_by_source_scope(
+        chunks: List[DocumentChunk],
+        *,
+        include_sources: Optional[List[str]] = None,
+        include_source_prefixes: Optional[List[str]] = None
+    ) -> List[DocumentChunk]:
+        """Limit chunks to an explicit source allowlist and/or source prefixes."""
+        include_set = {source for source in (include_sources or []) if source}
+        prefixes = tuple(prefix for prefix in (include_source_prefixes or []) if prefix)
+        if not include_set and not prefixes:
+            return chunks
+
+        scoped = []
+        for chunk in chunks:
+            if chunk.source_file in include_set or (prefixes and chunk.source_file.startswith(prefixes)):
+                scoped.append(chunk)
+        return scoped
     
     def _rerank_and_diversify(
         self,
@@ -610,7 +694,7 @@ async def _enforce_chunk_cap(self) -> None:
             if evict_ids:
                 collection = self.collections[chunk_size]
                 try:
-                    collection.delete(ids=evict_ids)
+                    await asyncio.to_thread(collection.delete, ids=evict_ids)
                 except Exception as e:
                     logger.error(f"ChromaDB delete during chunk cap enforcement (size={chunk_size}): {e}")
 
@@ -659,9 +743,9 @@ async def remove_document(self, source_name: str) -> None:
             # Remove from ChromaDB
             collection = self.collections[chunk_size]
             # Get IDs for this source
-            results = collection.get(where={"source_file": source_name})
+            results = await asyncio.to_thread(collection.get, where={"source_file": source_name})
             if results['ids']:
-                collection.delete(ids=results['ids'])
+                await asyncio.to_thread(collection.delete, ids=results['ids'])
             
             # Invalidate BM25
             self.bm25_index[chunk_size] = None
diff --git a/backend/aggregator/memory/local_training.py b/backend/aggregator/memory/local_training.py
index 9ac8a23..a501a8b 100644
--- a/backend/aggregator/memory/local_training.py
+++ b/backend/aggregator/memory/local_training.py
@@ -9,7 +9,10 @@
 import logging
 
 from backend.shared.config import system_config, rag_config
-from backend.shared.utils import truncate_with_ellipsis
+from backend.shared.json_parser import (
+    RETRY_CONTEXT_EMPTY_PLACEHOLDER,
+    sanitize_model_output_for_retry_context,
+)
 
 logger = logging.getLogger(__name__)
 
@@ -69,9 +72,14 @@ async def add_rejection(
             submission_content: Original submission (first 750 chars)
         """
         async with self._lock:
-            # Truncate to limits
-            summary = truncate_with_ellipsis(validator_summary, 750)
-            preview = truncate_with_ellipsis(submission_content, 750)
+            # This log is reused as submitter context, so sanitize at the memory
+            # boundary rather than persisting raw provider/model transcript text.
+            summary = sanitize_model_output_for_retry_context(validator_summary, max_chars=750)
+            preview = sanitize_model_output_for_retry_context(submission_content, max_chars=750)
+            if summary == RETRY_CONTEXT_EMPTY_PLACEHOLDER:
+                summary = "Validator rejection summary unavailable after retry-context sanitization."
+            if preview == RETRY_CONTEXT_EMPTY_PLACEHOLDER:
+                preview = "Rejected submission preview unavailable after retry-context sanitization."
             
             # Add rejection
             self.rejections.append({
diff --git a/backend/aggregator/prompts/submitter_prompts.py b/backend/aggregator/prompts/submitter_prompts.py
index 5bb1fbf..dd55ee4 100644
--- a/backend/aggregator/prompts/submitter_prompts.py
+++ b/backend/aggregator/prompts/submitter_prompts.py
@@ -21,7 +21,7 @@ def get_submitter_system_prompt() -> str:
 1. Analyze the user's prompt and provided context carefully
 2. Build upon the shared training database (accepted submissions from other agents)
 3. Learn from your rejection history to avoid repeating mistakes
-4. Generate novel, valuable mathematical insights that advance the solution
+4. Generate novel, valuable mathematical progress that advances the solution
 
 ⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
 
@@ -43,13 +43,25 @@ def get_submitter_system_prompt() -> str:
 ---
 
 YOUR TASK:
-Generate a novel mathematical insight that advances the user's goal.
+Generate the strongest rigorous mathematical contribution you can toward the user's goal, preferring direct solutions, direct partial solutions, impossibility results, exact reductions, or sharp constraints whenever they are justified.
 
 PROGRESSIVE SYSTEM: You will be called MANY times throughout this brainstorming process. Each call should produce ONE deep, well-developed mathematical insight. Do not try to cover everything at once — focus on thoroughly developing a single avenue per submission with full rigor. You will have many more opportunities to explore other avenues in future submissions.
 
-Focus on mathematical concepts, theorems, techniques, and proofs that may provide an avenue towards solving or understanding the mathematical problem in the prompt. Use all available resources including web search if available.
+DIRECT-SOLUTION PREFERENCE:
+- If you can directly solve the user's problem, a clearly necessary subproblem, or prove a meaningful impossibility/limitation result, do that FIRST
+- Prefer contributions that close the problem, partially close it, or sharply reduce what remains
+- Use indirect background, exploratory framing, or supportive observations ONLY when a stronger direct step is not yet justified
+
+META-PHASE EXCEPTION:
+If the USER PROMPT explicitly says TOPIC EXPLORATION PHASE or PAPER TITLE EXPLORATION PHASE, follow that requested output format exactly:
+- For TOPIC EXPLORATION PHASE, propose one candidate brainstorm question optimized for producing a future direct answer
+- For PAPER TITLE EXPLORATION PHASE, propose one candidate paper title optimized for communicating the paper's direct answer-bearing content
+- In these meta-phases, do NOT solve the mathematical problem or write the paper unless the user prompt explicitly asks for that; the direct-solution preference means the candidate should point toward or communicate direct resolution
+
+Focus on mathematical concepts, theorems, techniques, and proofs that solve, partially solve, refute, or sharply characterize the mathematical problem in the prompt whenever possible. Use all available resources including web search if available.
 
 WHAT MAKES A VALUABLE SUBMISSION - Consider:
+- Does it directly answer, partially answer, or sharply constrain the user's problem or a necessary subproblem?
 - Does it add genuinely new information or perspectives beyond what is already in the training database?
 - Does it connect existing mathematical concepts in novel ways?
 - Does it provide concrete methods, theorems, proofs, or mathematical techniques?
@@ -59,6 +71,7 @@ def get_submitter_system_prompt() -> str:
 
 CRITICAL REQUIREMENTS - CONTENT:
 - ALL submissions must be rooted in sound mathematical reasoning - NO unfounded claims or logical fallacies
+- Prefer directly resolving the user's problem or a clearly necessary subproblem over auxiliary exposition
 - Focus on mathematical concepts, theorems, and techniques that are verifiable and established
 - Be specific and actionable, not vague or generic
 - Avoid redundancy with existing accepted submissions
@@ -67,17 +80,36 @@ def get_submitter_system_prompt() -> str:
 - Unsupported empirical or artifact claims must be framed as proposals, hypotheses, or future work rather than as completed results
 
 Your submission will be validated against these criteria:
+- Does it provide the strongest direct progress currently justified?
 - Does it meaningfully advance the solution space?
 - Is it based on sound mathematical principles?
 - Does it avoid contradictions?
 - Is it non-redundant with existing knowledge?
 - Is it mathematically rigorous?
 
-Output your response ONLY as JSON in this exact format:
+OPTIONAL LEAN 4 PROOF ROUTE:
+If Lean 4 proof verification is enabled and you can produce a complete Lean 4 proof that would be useful brainstorm progress, you may choose the `lean_proof` submission type. A Lean proof candidate is NOT added directly to the knowledge base: the system first runs Lean 4, gives you up to 5 repair attempts with Lean/integrity feedback, and only then sends the Lean-verified proof to the normal brainstorm validator for usefulness and redundancy review.
+
+Use `lean_proof` only for complete proof code you genuinely expect Lean 4 to accept. Do not use `sorry`, `admit`, or fake `axiom`/`constant`/`opaque` devices.
+
+Output your response ONLY as JSON in one of these exact formats:
+
+Normal brainstorm idea:
 {
+  "submission_type": "idea",
   "submission": "Your detailed mathematical submission describing concepts, theorems, proofs, and approaches based on established mathematical principles.",
   "reasoning": "Brief explanation of why this submission is valuable"
 }
+
+Lean proof candidate:
+{
+  "submission_type": "lean_proof",
+  "theorem_statement": "Natural-language statement of the theorem or lemma proved by the Lean code.",
+  "formal_sketch": "Brief note about assumptions, formalization choices, and why this proof helps the brainstorm.",
+  "theorem_name": "Optional Lean declaration name",
+  "lean_code": "Complete Lean 4 code expected to verify.",
+  "reasoning": "Why this verified proof would be a useful brainstorm addition"
+}
 """
 
 
@@ -85,11 +117,23 @@ def get_submitter_json_schema() -> str:
     """Get JSON schema specification for submitter."""
     return """
 REQUIRED JSON FORMAT:
+Normal brainstorm idea:
 {
+  "submission_type": "idea",
   "submission": "string - your detailed mathematical submission with theorems, proofs, and techniques",
   "reasoning": "string - explanation of submission value"
 }
 
+Lean proof candidate, only when Lean 4 is enabled and you can provide complete code:
+{
+  "submission_type": "lean_proof",
+  "theorem_statement": "string - natural-language statement proved",
+  "formal_sketch": "string - formalization notes",
+  "theorem_name": "string - optional Lean declaration name",
+  "lean_code": "string - complete Lean 4 source code",
+  "reasoning": "string - why the verified proof would help the brainstorm"
+}
+
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
    - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
@@ -103,15 +147,27 @@ def get_submitter_json_schema() -> str:
 
 Example (mathematical proof):
 {
+  "submission_type": "idea",
   "submission": "The problem of squaring the circle is equivalent to constructing a line segment of length \\\\sqrt{\\\\pi} using only compass and straightedge. By the Lindemann-Weierstrass theorem (1882), \\\\pi is transcendental, meaning it is not the root of any polynomial with rational coefficients. Since compass and straightedge constructions can only produce algebraic numbers (roots of polynomials with rational coefficients), and \\\\sqrt{\\\\pi} would require \\\\pi to be algebraic, the construction is impossible.",
   "reasoning": "This submission provides the rigorous mathematical foundation for why squaring the circle is impossible, connecting transcendental number theory to geometric constructibility."
 }
 
 GOOD Example (technique application):
 {
+  "submission_type": "idea",
   "submission": "For problems involving irrational approximations, continued fractions provide optimal rational approximations. The continued fraction expansion of \\\\pi = [3; 7, 15, 1, 292, ...] shows that 22/7 and 355/113 are best rational approximants within their denominator ranges. This technique generalizes: for any irrational \\\\alpha, its convergents p_n/q_n satisfy |\\\\alpha - p_n/q_n| < 1/(q_n * q_{n+1}), providing provably good approximations.",
   "reasoning": "Leverages established number theory techniques for understanding irrational approximations relevant to the mathematical problem."
 }
+
+GOOD Example (Lean proof candidate):
+{
+  "submission_type": "lean_proof",
+  "theorem_statement": "For every natural number n, n + 0 = n.",
+  "formal_sketch": "A minimal sanity-check example; in real brainstorms prefer non-trivial proofs.",
+  "theorem_name": "moto_nat_add_zero",
+  "lean_code": "import Mathlib\\n\\ntheorem moto_nat_add_zero (n : Nat) : n + 0 = n := by\\n  simpa using Nat.add_zero n",
+  "reasoning": "Demonstrates the Lean proof-candidate format."
+}
 """
 
 
diff --git a/backend/aggregator/prompts/validator_prompts.py b/backend/aggregator/prompts/validator_prompts.py
index 52822de..0b694c1 100644
--- a/backend/aggregator/prompts/validator_prompts.py
+++ b/backend/aggregator/prompts/validator_prompts.py
@@ -13,6 +13,12 @@
 - If a submission offers an unsupported benchmark-style idea that is still useful, it must be framed as a proposed experiment, hypothesis, expected benefit, or future-work direction rather than as a completed result.
 - NEVER accept invented citations, fabricated experiments, fake benchmark numbers, or nonexistent code artifacts."""
 
+LEAN_VERIFIED_SUBMISSION_RULES = """LEAN 4 VERIFIED SUBMISSION RULES:
+- A submission containing [LEAN 4 VERIFIED BRAINSTORM PROOF] has already passed Lean 4 and MOTO integrity/statement-alignment checks before this validator call.
+- Do NOT reject such a submission by re-litigating Lean syntax or proof-checker correctness.
+- Still judge whether the verified theorem/proof is useful, non-redundant, relevant to the user's goal, and strong enough to add to the brainstorm database.
+- Reject Lean-verified proofs that are trivial, irrelevant, already covered, or not a useful brainstorm addition despite being formally verified."""  # concatenated into the validator system prompts after EMPIRICAL_PROVENANCE_VALIDATION_RULES
+
 
 def get_validator_system_prompt() -> str:
     """Get system prompt for validator agent."""
@@ -29,7 +35,7 @@ def get_validator_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + "\n\n" + LEAN_VERIFIED_SUBMISSION_RULES + """
 
  The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
  
@@ -38,13 +44,25 @@ def get_validator_system_prompt() -> str:
 ---
 
 YOUR TASK:
-Tell me if the addition of the new submission increases potential solution availability in a significant way and/or provides a valuable solution space-constraint that narrows where we need to search in a significant way.
+Decide whether this submission provides the strongest rigorous progress currently justified toward solving the user's problem, with highest priority given to direct solutions, direct partial solutions, impossibility results, exact reductions, or sharp constraints.
+
+Essentially, you are evaluating whether the knowledge base becomes more useful toward directly answering the user's mathematical prompt with this submission added than it was without it.
 
-Essentially, you are evaluating whether the knowledge base becomes more useful toward finding mathematical solutions with this submission added than it was without it.
+CRITICAL: You are NOT generating solutions yourself. You are judging whether this submission directly solves, partially solves, refutes, or materially enables the user's problem better than the current knowledge base does.
 
-CRITICAL: You are NOT generating solutions yourself - you are assessing if there are new solutions POTENTIALLY available if we add this submission to the knowledge base, or if the solution space becomes stronger in any way.
+DIRECT-SOLUTION PREFERENCE:
+- If the submission directly resolves the user's problem or a clearly necessary subproblem, or proves a meaningful impossibility/limitation result, that is the strongest kind of acceptance case
+- If no direct resolution is available, accept supportive material only when it materially increases the chance of a later direct answer
+- Do not reward breadth, novelty, or interesting side observations over a stronger direct result
+
+META-PHASE EXCEPTION:
+If the USER PROMPT explicitly says TOPIC EXPLORATION PHASE or PAPER TITLE EXPLORATION PHASE, evaluate the submission as the requested candidate artifact, not as a direct solution:
+- TOPIC EXPLORATION PHASE: accept a candidate brainstorm question if it is specific, distinct, relevant, grounded, and aimed at a strong direct-answer path
+- PAPER TITLE EXPLORATION PHASE: accept a candidate title if it is accurate, specific, distinct, professional, and foregrounds direct answer-bearing content when justified
+- Do NOT reject these meta-phase submissions merely because they are questions or titles rather than mathematical solutions
 
 EVALUATION CRITERIA - Consider:
+- Does the submission directly answer, partially answer, refute, or sharply constrain the user's problem or a necessary subproblem?
 - Does the submission add genuinely new information or perspectives beyond what is already accepted?
 - Does the submission connect existing mathematical concepts in novel ways?
 - Does the submission provide concrete methods, theorems, proofs, or mathematical techniques?
@@ -57,9 +75,9 @@ def get_validator_system_prompt() -> str:
 
 VALIDATION DECISION RULES:
 A submission should be ACCEPTED if it:
-1. Increases potential solution availability in a significant way, OR
-2. Provides valuable solution space constraints that narrow where to search, OR
-3. Offers novel mathematical insights not present in existing accepted submissions, OR
+1. Directly solves, partially solves, or proves a meaningful impossibility/limitation result for the user's problem or a necessary subproblem, OR
+2. Provides valuable solution space constraints that sharply narrow where a direct answer can lie, OR
+3. Offers rigorous enabling insights not present in existing accepted submissions when a stronger direct step is not yet available, OR
 4. Presents rigorous mathematical arguments based on established principles
 
 A submission should be REJECTED if it:
@@ -71,8 +89,9 @@ def get_validator_system_prompt() -> str:
 6. Contains logical fallacies or mathematically unsound reasoning
 7. Presents claims as proven without proper mathematical justification
 8. Presents unsupported empirical, benchmark, hardware, or artifact claims as established fact
+9. Is merely tangential or exploratory when a more direct, rigorous contribution was available from the same content
 
-Ask yourself: "Does adding this submission to our knowledge base make us more capable of solving the user's mathematical prompt than we were without it?"
+Ask yourself: "Does adding this submission make us more capable of directly answering the user's mathematical prompt than we were without it, and is this the strongest justified kind of progress?"
 
 REJECTION FEEDBACK FORMAT:
 If rejecting, your "summary" field must provide CONCRETE, ACTIONABLE guidance using this structure:
@@ -199,7 +218,7 @@ def get_validator_dual_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + "\n\n" + LEAN_VERIFIED_SUBMISSION_RULES + """
 
  The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
  
@@ -211,11 +230,23 @@ def get_validator_dual_system_prompt() -> str:
 Evaluate EACH submission INDEPENDENTLY to determine if it would make a valuable cumulative addition to the shared knowledge base.
 
 CRITICAL - INDEPENDENT ASSESSMENT:
-For EACH submission, ask: "Does THIS submission increase potential solution availability or provide valuable constraints, considering ONLY the existing database (not the other submission in this batch)?"
+For EACH submission, ask: "Does THIS submission provide the strongest rigorous direct progress currently justified toward the user's problem, considering ONLY the existing database (not the other submission in this batch)?"
+
+Essentially, you are evaluating whether the training database becomes more useful toward directly answering the user's mathematical prompt with each submission added than it was without it.
 
-Essentially, you are evaluating whether the training database becomes more useful toward finding mathematical solutions with each submission added than it was without it.
+DIRECT-SOLUTION PREFERENCE:
+- Prefer submissions that directly solve, partially solve, refute, or sharply constrain the problem
+- Accept supportive material only when it materially enables a later direct answer and no stronger direct step is currently justified
+- Do not prefer broader or more novel side ideas over a stronger direct result
+
+META-PHASE EXCEPTION:
+If the USER PROMPT explicitly says TOPIC EXPLORATION PHASE or PAPER TITLE EXPLORATION PHASE, evaluate each submission as the requested candidate artifact, not as a direct solution:
+- TOPIC EXPLORATION PHASE: accept a candidate brainstorm question if it is specific, distinct, relevant, grounded, and aimed at a strong direct-answer path
+- PAPER TITLE EXPLORATION PHASE: accept a candidate title if it is accurate, specific, distinct, professional, and foregrounds direct answer-bearing content when justified
+- Do NOT reject these meta-phase submissions merely because they are questions or titles rather than mathematical solutions
 
 EVALUATION CRITERIA (Apply to EACH submission independently):
+- Does the submission directly answer, partially answer, refute, or sharply constrain the user's problem or a necessary subproblem?
 - Does the submission add genuinely new information or perspectives beyond what is already accepted?
 - Does the submission connect existing mathematical concepts in novel ways?
 - Does the submission provide concrete methods, theorems, proofs, or mathematical techniques?
@@ -227,9 +258,9 @@ def get_validator_dual_system_prompt() -> str:
 
 VALIDATION DECISION RULES (for each submission):
 A submission should be ACCEPTED if it:
-1. Increases potential solution availability in a significant way, OR
-2. Provides valuable solution space constraints that narrow where to search, OR
-3. Offers novel mathematical insights not present in existing accepted submissions, OR
+1. Directly solves, partially solves, or proves a meaningful impossibility/limitation result for the user's problem or a necessary subproblem, OR
+2. Provides valuable solution space constraints that sharply narrow where a direct answer can lie, OR
+3. Offers rigorous enabling insights not present in existing accepted submissions when a stronger direct step is not yet available, OR
 4. Presents rigorous mathematical arguments based on established principles
 
 A submission should be REJECTED if it:
@@ -239,6 +270,7 @@ def get_validator_dual_system_prompt() -> str:
 4. Is too vague or generic to be actionable
 5. Contains logical fallacies or mathematically unsound reasoning
 6. Presents unsupported empirical, benchmark, hardware, or artifact claims as established fact
+7. Is merely tangential or exploratory when a more direct, rigorous contribution was available from the same content
 
 CRITICAL - INTRA-BATCH REDUNDANCY PREVENTION:
 You must make TWO SEPARATE, INDEPENDENT decisions first - one for each submission.
@@ -422,7 +454,7 @@ def get_validator_triple_system_prompt() -> str:
 - NEVER cite internal documents as authoritative or established sources
 - Question and validate every assertion, even if it appears in validated content
 
-""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + """
+""" + EMPIRICAL_PROVENANCE_VALIDATION_RULES + "\n\n" + LEAN_VERIFIED_SUBMISSION_RULES + """
 
  The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous, verifiable mathematical content. Use internal context as exploration history and your base knowledge for reasoning and verification.
  
@@ -434,11 +466,23 @@ def get_validator_triple_system_prompt() -> str:
 Evaluate EACH submission INDEPENDENTLY to determine if it would make a valuable cumulative addition to the shared knowledge base.
 
 CRITICAL - INDEPENDENT ASSESSMENT:
-For EACH of the three submissions, ask: "Does THIS submission increase potential solution availability or provide valuable constraints, considering ONLY the existing database (not the other submissions in this batch)?"
+For EACH of the three submissions, ask: "Does THIS submission provide the strongest rigorous direct progress currently justified toward the user's problem, considering ONLY the existing database (not the other submissions in this batch)?"
+
+Essentially, you are evaluating whether the training database becomes more useful toward directly answering the user's mathematical prompt with each submission added than it was without it.
 
-Essentially, you are evaluating whether the training database becomes more useful toward finding mathematical solutions with each submission added than it was without it.
+DIRECT-SOLUTION PREFERENCE:
+- Prefer submissions that directly solve, partially solve, refute, or sharply constrain the problem
+- Accept supportive material only when it materially enables a later direct answer and no stronger direct step is currently justified
+- Do not prefer broader or more novel side ideas over a stronger direct result
+
+META-PHASE EXCEPTION:
+If the USER PROMPT explicitly says TOPIC EXPLORATION PHASE or PAPER TITLE EXPLORATION PHASE, evaluate each submission as the requested candidate artifact, not as a direct solution:
+- TOPIC EXPLORATION PHASE: accept a candidate brainstorm question if it is specific, distinct, relevant, grounded, and aimed at a strong direct-answer path
+- PAPER TITLE EXPLORATION PHASE: accept a candidate title if it is accurate, specific, distinct, professional, and foregrounds direct answer-bearing content when justified
+- Do NOT reject these meta-phase submissions merely because they are questions or titles rather than mathematical solutions
 
 EVALUATION CRITERIA (Apply to EACH submission independently):
+- Does the submission directly answer, partially answer, refute, or sharply constrain the user's problem or a necessary subproblem?
 - Does the submission add genuinely new information or perspectives beyond what is already accepted?
 - Does the submission connect existing mathematical concepts in novel ways?
 - Does the submission provide concrete methods, theorems, proofs, or mathematical techniques?
@@ -450,9 +494,9 @@ def get_validator_triple_system_prompt() -> str:
 
 VALIDATION DECISION RULES (for each submission):
 A submission should be ACCEPTED if it:
-1. Increases potential solution availability in a significant way, OR
-2. Provides valuable solution space constraints that narrow where to search, OR
-3. Offers novel mathematical insights not present in existing accepted submissions, OR
+1. Directly solves, partially solves, or proves a meaningful impossibility/limitation result for the user's problem or a necessary subproblem, OR
+2. Provides valuable solution space constraints that sharply narrow where a direct answer can lie, OR
+3. Offers rigorous enabling insights not present in existing accepted submissions when a stronger direct step is not yet available, OR
 4. Presents rigorous mathematical arguments based on established principles
 
 A submission should be REJECTED if it:
@@ -462,6 +506,7 @@ def get_validator_triple_system_prompt() -> str:
 4. Is too vague or generic to be actionable
 5. Contains logical fallacies or mathematically unsound reasoning
 6. Presents unsupported empirical, benchmark, hardware, or artifact claims as established fact
+7. Is merely tangential or exploratory when a more direct, rigorous contribution was available from the same content
 
 CRITICAL - INTRA-BATCH REDUNDANCY PREVENTION:
 You must make THREE SEPARATE, INDEPENDENT decisions first - one for each submission.
@@ -708,10 +753,11 @@ def get_cleanup_review_system_prompt() -> str:
 6. Contains unsupported empirical or artifact claims presented as established fact
 
 REASONS TO KEEP - A submission should be kept if it:
-1. Provides ANY unique information not covered elsewhere
-2. Offers a different perspective or approach even if related to other content
-3. Contains specific mathematical details, proofs, or techniques
-4. Contributes to solution diversity in any meaningful way
+1. Directly answers, partially answers, refutes, or sharply constrains the user's problem better than alternatives
+2. Provides ANY unique information not covered elsewhere
+3. Offers a different perspective or approach even if related to other content
+4. Contains specific mathematical details, proofs, or techniques
+5. Contributes to solution diversity in any meaningful way
 
 CONSERVATIVE APPROACH:
 - When in doubt, DO NOT recommend removal
@@ -721,6 +767,9 @@ def get_cleanup_review_system_prompt() -> str:
 CRITICAL SELECTION RULE:
 When multiple submissions are redundant with each other, you MUST select the WEAKEST one for removal - the one that provides the LEAST unique value. NEVER remove a more complete submission in favor of keeping a less complete one.
 
+DIRECT-SOLUTION PRIORITY:
+If overlapping submissions differ in how directly they answer the user's problem, keep the one that provides the strongest rigorous direct resolution or sharpest justified constraint. Remove the more indirect auxiliary submission first when all else is equal.
+
 Output your decision ONLY as JSON in this exact format:
 {
   "should_remove": true or false,
@@ -850,12 +899,14 @@ def get_removal_validation_system_prompt() -> str:
 2. The reasoning for removal is sound and well-justified
 3. The database would be objectively better without this submission
 4. The unique value claimed by the submission is truly covered elsewhere
+5. Any more direct or stronger resolution in the database is preserved while the weaker, more auxiliary submission is the one being removed
 
 REJECT REMOVAL (decision: "reject") if:
 1. The submission provides ANY unique value not covered elsewhere
 2. The reasoning for removal is weak or unconvincing
 3. There is ANY doubt about whether the content is truly redundant
 4. Removing would reduce solution diversity or coverage
+5. The proposed removal would discard a more direct answer, stronger impossibility result, or sharper constraint than the alternatives being kept
 
 CONSERVATIVE DEFAULT:
 - If uncertain, REJECT the removal (keep the submission)
diff --git a/backend/api/main.py b/backend/api/main.py
index bc1c77b..281138b 100644
--- a/backend/api/main.py
+++ b/backend/api/main.py
@@ -3,6 +3,7 @@
 """
 import asyncio
 import os
+import secrets
 from pathlib import Path
 from typing import Optional
 from fastapi import FastAPI
@@ -23,6 +24,7 @@
     health,
     proofs,
     update,
+    leanoj,
 )
 from backend.shared.build_info import get_build_info
 from backend.shared.lm_studio_client import lm_studio_client
@@ -31,6 +33,7 @@
 from backend.aggregator.core.coordinator import coordinator
 from backend.compiler.core.compiler_coordinator import compiler_coordinator
 from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
+from backend.leanoj.core.leanoj_coordinator import leanoj_coordinator
 
 # Setup logging with millisecond precision for log correlation
 logging.basicConfig(
@@ -79,6 +82,19 @@ def _validate_generic_mode_startup_env() -> None:
         )
 
 
+def _ensure_desktop_api_token() -> None:
+    """Ensure default-mode HTTP/WebSocket routes have an instance token, generating a random one if unset."""
+    if system_config.generic_mode:
+        return  # the desktop token is only provisioned outside generic mode
+
+    if not system_config.desktop_api_token:
+        system_config.desktop_api_token = secrets.token_urlsafe(32)  # 32 random bytes, URL-safe text
+        logger.warning(
+            "Generated a runtime desktop API token because MOTO_DESKTOP_API_TOKEN was not provided. "
+            "Launch through moto_launcher.py so the frontend receives the same token."
+        )
+
+
 def _apply_generic_mode_openrouter_env(api_client_manager) -> None:
     """Load the hosted OpenRouter key from env without using the desktop keyring."""
     api_key = os.environ.get("OPENROUTER_API_KEY", "").strip()
@@ -149,6 +165,7 @@ async def lifespan(app: FastAPI):
     """Lifespan events for the FastAPI app."""
     _apply_generic_mode_from_env()
     _validate_generic_mode_startup_env()
+    _ensure_desktop_api_token()
 
     # Startup
     logger.info(
@@ -218,6 +235,7 @@ async def lifespan(app: FastAPI):
     coordinator.set_websocket_broadcaster(websocket.broadcast_event)
     compiler_coordinator.set_websocket_broadcaster(websocket.broadcast_event)
     autonomous_coordinator.set_broadcast_callback(websocket.broadcast_event)
+    leanoj_coordinator.set_broadcast_callback(websocket.broadcast_event)
     
     # Set boost manager broadcaster
     from backend.shared.boost_manager import boost_manager
@@ -226,6 +244,16 @@ async def lifespan(app: FastAPI):
     # Set API client manager broadcaster (token tracking, rate limits, fallbacks)
     api_client_manager.set_broadcast_callback(websocket.broadcast_event)
 
+    try:
+        # Restore saved LeanOJ state for the UI, but only launch model work when
+        # explicitly requested. Lean 4 being enabled is not enough to imply that
+        # LM Studio/OpenRouter models are loaded and ready at backend startup.
+        await leanoj_coordinator.restore_latest_session(
+            auto_resume=system_config.lean4_enabled and system_config.leanoj_auto_resume_enabled
+        )
+    except Exception as exc:
+        logger.warning("Failed to restore LeanOJ session state on startup: %s", exc)
+
     # Lean 4 warm start must NEVER block the FastAPI lifespan. A cold Mathlib
     # workspace can spend many minutes inside `lake update` / `lake exe cache
     # get`, during which the backend would otherwise refuse every HTTP request
@@ -264,6 +292,7 @@ async def _warm_start_lean4() -> None:
     await coordinator.stop()
     await compiler_coordinator.stop()
     await autonomous_coordinator.stop()
+    await leanoj_coordinator.stop()
     await close_lean4_client()
     clear_lean4_client()
     await lm_studio_client.close()
@@ -293,6 +322,7 @@ async def _warm_start_lean4() -> None:
 app.include_router(openrouter.router)
 app.include_router(download.router)
 app.include_router(update.router)
+app.include_router(leanoj.router)
 app.include_router(websocket.router)
 
 
diff --git a/backend/api/middleware.py b/backend/api/middleware.py
index 357f160..1099165 100644
--- a/backend/api/middleware.py
+++ b/backend/api/middleware.py
@@ -1,13 +1,23 @@
 """
 Middleware for CORS and error handling.
 """
+import hmac
 import os
+from urllib.parse import urlparse
 from fastapi import FastAPI, Request
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.responses import JSONResponse
+from starlette import status
 import logging
 
-from backend.api.proxy_auth import ProxyAuthError, validate_proxy_headers
+from backend.api.proxy_auth import (
+    EMPTY_BODY_SHA256,
+    PROXY_BODY_SHA256_HEADER,
+    ProxyAuthError,
+    hash_proxy_body,
+    is_proxy_auth_allowlisted,
+    validate_proxy_headers,
+)
 from backend.shared.config import system_config
 
 logger = logging.getLogger(__name__)
@@ -19,6 +29,85 @@
     f"http://localhost:{system_config.backend_port}",
     f"http://127.0.0.1:{system_config.backend_port}",
 ]
+DESKTOP_API_TOKEN_HEADER = "X-Moto-Desktop-Token"
+UNSAFE_HTTP_METHODS = {"POST", "PUT", "PATCH", "DELETE"}
+
+
+def _origin_from_url(value: str) -> str:
+    """Return scheme://host[:port] for an Origin/Referer-like value, or an empty string if scheme or netloc is missing."""
+    parsed = urlparse(value or "")  # a falsy value (None, "") is parsed as the empty string
+    if not parsed.scheme or not parsed.netloc:
+        return ""
+    return f"{parsed.scheme}://{parsed.netloc}"
+
+
+def _validate_desktop_token(request: Request, allowed_origins: list[str]) -> None:
+    """Require the launcher-provided desktop API token outside public routes; raises ProxyAuthError (503/401/403)."""
+    if is_proxy_auth_allowlisted(request.method, request.url.path):
+        return
+
+    expected = (system_config.desktop_api_token or "").strip()
+    if not expected:
+        raise ProxyAuthError(
+            "Desktop API token is not configured for this runtime.",
+            status.HTTP_503_SERVICE_UNAVAILABLE,
+        )
+
+    provided = (request.headers.get(DESKTOP_API_TOKEN_HEADER) or "").strip()
+    if not provided or not hmac.compare_digest(provided.encode("utf-8"), expected.encode("utf-8")):  # bytes: compare_digest raises TypeError on non-ASCII str
+        raise ProxyAuthError(
+            "Missing or invalid desktop API token.",
+            status.HTTP_401_UNAUTHORIZED,
+        )
+
+    if request.method.upper() in UNSAFE_HTTP_METHODS:
+        origin = (request.headers.get("origin") or "").strip()
+        referer = _origin_from_url(request.headers.get("referer") or "")
+        candidate = origin or referer  # Origin header wins; the Referer's origin is the fallback
+        if candidate and candidate not in allowed_origins:  # a request carrying neither header passes this check
+            raise ProxyAuthError(
+                "Unsafe request origin is not allowed for this desktop runtime.",
+                status.HTTP_403_FORBIDDEN,
+            )
+
+
+def _validate_generic_content_length(request: Request) -> None:
+    """Reject oversized hosted requests before route handlers parse the body; raises ProxyAuthError (400/413)."""
+    raw_content_length = (request.headers.get("content-length") or "").strip()
+    if not raw_content_length:
+        return  # no Content-Length header: this check does not apply
+
+    try:
+        content_length = int(raw_content_length)
+    except ValueError as exc:
+        raise ProxyAuthError(
+            "Invalid Content-Length header.",
+            status.HTTP_400_BAD_REQUEST,
+        ) from exc
+
+    max_bytes = max(int(system_config.generic_max_request_bytes or 0), 1)  # unset, zero or negative limit is clamped to 1 byte
+    if content_length > max_bytes:
+        raise ProxyAuthError(
+            f"Request body exceeds hosted limit of {max_bytes} bytes.",
+            status.HTTP_413_CONTENT_TOO_LARGE,
+        )
+
+
+async def _validate_generic_body_hash(request: Request, expected_hash: str) -> str:
+    """Verify the signed body hash against the actual request body; returns the computed hash or raises ProxyAuthError (403)."""
+    body = await request.body()
+    actual_hash = hash_proxy_body(body)
+    if not hmac.compare_digest(expected_hash.encode("utf-8"), actual_hash.encode("utf-8")):  # bytes: compare_digest raises TypeError on non-ASCII str
+        raise ProxyAuthError(
+            "X-Moto body hash does not match the received request body.",
+            status.HTTP_403_FORBIDDEN,
+        )
+
+    async def receive():
+        return {"type": "http.request", "body": body, "more_body": False}  # replays the full body as one final chunk
+
+    request._receive = receive  # swap in the replaying receive so the already-read body can be read again
+    return actual_hash
 
 
 def setup_middleware(app: FastAPI) -> None:
@@ -44,20 +133,47 @@ def setup_middleware(app: FastAPI) -> None:
     )
 
     @app.middleware("http")
-    async def generic_mode_proxy_auth(request: Request, call_next):
-        """Require signed internal proxy headers for protected hosted routes."""
+    async def moto_request_auth(request: Request, call_next):
+        """Require hosted proxy auth or desktop instance tokens for protected routes."""
         if system_config.generic_mode:
             try:
+                if not is_proxy_auth_allowlisted(request.method, request.url.path):
+                    _validate_generic_content_length(request)
+
+                body_hash = request.headers.get(PROXY_BODY_SHA256_HEADER)
+                verified_body_hash = EMPTY_BODY_SHA256
+                if (
+                    not is_proxy_auth_allowlisted(request.method, request.url.path)
+                    and request.method.upper() not in {"GET", "HEAD"}
+                    and not body_hash
+                ):
+                    raise ProxyAuthError(
+                        "Missing required X-Moto body hash header.",
+                        status.HTTP_401_UNAUTHORIZED,
+                    )
+                if (
+                    not is_proxy_auth_allowlisted(request.method, request.url.path)
+                    and request.method.upper() not in {"GET", "HEAD"}
+                ):
+                    verified_body_hash = await _validate_generic_body_hash(request, body_hash or "")
                 validate_proxy_headers(
                     request.headers,
                     method=request.method,
                     path=request.url.path,
+                    query_string=request.url.query,
+                    body_hash=verified_body_hash,
                     expected_instance_id=system_config.instance_id,
                     shared_secret=system_config.internal_proxy_secret or "",
                 )
             except ProxyAuthError as exc:
                 logger.warning("Rejected generic-mode request %s %s: %s", request.method, request.url.path, exc.detail)
                 return JSONResponse(status_code=exc.status_code, content={"detail": exc.detail})
+        else:
+            try:
+                _validate_desktop_token(request, origins)
+            except ProxyAuthError as exc:
+                logger.warning("Rejected desktop request %s %s: %s", request.method, request.url.path, exc.detail)
+                return JSONResponse(status_code=exc.status_code, content={"detail": exc.detail})
 
         return await call_next(request)
     
diff --git a/backend/api/proxy_auth.py b/backend/api/proxy_auth.py
index f1577c2..f85ecd6 100644
--- a/backend/api/proxy_auth.py
+++ b/backend/api/proxy_auth.py
@@ -13,12 +13,16 @@
 PROXY_INSTANCE_HEADER = "X-Moto-Instance-Id"
 PROXY_TIMESTAMP_HEADER = "X-Moto-Proxy-Timestamp"
 PROXY_SIGNATURE_HEADER = "X-Moto-Proxy-Signature"
+PROXY_BODY_SHA256_HEADER = "X-Moto-Body-SHA256"
 PROXY_AUTH_MAX_SKEW_SECONDS = 60
+PROXY_REPLAY_CACHE_MAX_ENTRIES = 4096
+EMPTY_BODY_SHA256 = hashlib.sha256(b"").hexdigest()
 PROXY_AUTH_ALLOWLIST = {
     ("GET", "/health"),
     ("GET", "/api/health"),
     ("GET", "/api/features"),
 }
+_SEEN_PROXY_SIGNATURES: dict[str, int] = {}
 
 
 class ProxyAuthError(RuntimeError):
@@ -36,6 +40,51 @@ def normalize_proxy_path(path: str) -> str:
     return normalized or "/"
 
 
+def normalize_proxy_query(query_string: str | bytes | None) -> str:
+    """Return the query as trimmed text with one leading "?" dropped; bytes are UTF-8 decoded, None gives ""."""
+    text = query_string.decode("utf-8", errors="surrogatepass") if isinstance(query_string, bytes) else query_string
+    trimmed = text.strip() if text else ""
+    has_marker = trimmed[:1] == "?"
+    return trimmed[1:] if has_marker else trimmed
+
+
+def hash_proxy_body(body: bytes | str | None) -> str:
+    """Return the hex SHA-256 of *body*; text is UTF-8 encoded first and None hashes as empty bytes."""
+    if isinstance(body, bytes):
+        payload = body
+    elif body is None:
+        payload = b""
+    else:
+        payload = body.encode("utf-8")  # any other input must provide .encode()
+    return hashlib.sha256(payload).hexdigest()
+
+
+def _remember_proxy_signature(signature: str, timestamp_value: int, current_time: int) -> None:
+    """Record a verified signature, raising ProxyAuthError (401) when it is already in the seen-cache."""
+    # Forget entries whose timestamp is older than the skew window before checking for a replay.
+    oldest_allowed = current_time - PROXY_AUTH_MAX_SKEW_SECONDS
+    expired = [
+        key for key, seen_at in _SEEN_PROXY_SIGNATURES.items()
+        if seen_at < oldest_allowed
+    ]
+    for key in expired:
+        del _SEEN_PROXY_SIGNATURES[key]
+
+    if signature in _SEEN_PROXY_SIGNATURES:
+        raise ProxyAuthError(
+            "Replayed X-Moto-Proxy-Signature was rejected.",
+            status.HTTP_401_UNAUTHORIZED,
+        )
+    _SEEN_PROXY_SIGNATURES[signature] = timestamp_value
+
+    # Cap the cache size: drop the entries with the smallest timestamps until it fits again.
+    overflow = len(_SEEN_PROXY_SIGNATURES) - PROXY_REPLAY_CACHE_MAX_ENTRIES
+    if overflow > 0:
+        by_age = sorted(_SEEN_PROXY_SIGNATURES.items(), key=lambda item: item[1])
+        for key, _ in by_age[:overflow]:
+            _SEEN_PROXY_SIGNATURES.pop(key, None)
+
+
 def is_proxy_auth_allowlisted(method: str, path: str) -> bool:
     """Return True when a route is intentionally public in generic mode."""
     normalized_method = (method or "").upper()
@@ -45,9 +94,26 @@ def is_proxy_auth_allowlisted(method: str, path: str) -> bool:
     return (normalized_method, normalized_path) in PROXY_AUTH_ALLOWLIST
 
 
-def build_proxy_signature(secret: str, instance_id: str, timestamp: str, method: str, path: str) -> str:
+def build_proxy_signature(
+    secret: str,
+    instance_id: str,
+    timestamp: str,
+    method: str,
+    path: str,
+    query_string: str | bytes | None = "",
+    body_hash: str | None = EMPTY_BODY_SHA256,
+) -> str:
     """Build the expected HMAC signature for a proxied request."""
-    payload = f"{instance_id}:{timestamp}:{(method or '').upper()}:{normalize_proxy_path(path)}"
+    payload = "\n".join(
+        (
+            instance_id,
+            timestamp,
+            (method or "").upper(),
+            normalize_proxy_path(path),
+            normalize_proxy_query(query_string),
+            body_hash or EMPTY_BODY_SHA256,
+        )
+    )
     return hmac.new(secret.encode("utf-8"), payload.encode("utf-8"), hashlib.sha256).hexdigest()
 
 
@@ -56,6 +122,9 @@ def validate_proxy_headers(
     *,
     method: str,
     path: str,
+    query_string: str | bytes | None = "",
+    body: bytes | str | None = b"",
+    body_hash: str | None = None,
     expected_instance_id: str,
     shared_secret: str,
     now: int | None = None,
@@ -107,9 +176,13 @@ def validate_proxy_headers(
         timestamp=timestamp_raw,
         method=method,
         path=path,
+        query_string=query_string,
+        body_hash=body_hash or hash_proxy_body(body),
     )
     if not hmac.compare_digest(signature, expected_signature):
         raise ProxyAuthError(
             "Invalid X-Moto-Proxy-Signature for the requested path.",
             status.HTTP_403_FORBIDDEN,
         )
+
+    _remember_proxy_signature(signature, timestamp_value, current_time)
diff --git a/backend/api/routes/__init__.py b/backend/api/routes/__init__.py
index 512b263..9183649 100644
--- a/backend/api/routes/__init__.py
+++ b/backend/api/routes/__init__.py
@@ -1,4 +1,4 @@
 """API routes"""
-from . import aggregator, compiler, autonomous, websocket, boost, workflow, features, health, proofs, update
+from . import aggregator, compiler, autonomous, websocket, boost, workflow, features, health, proofs, update, leanoj
 
-__all__ = ['aggregator', 'compiler', 'autonomous', 'websocket', 'boost', 'workflow', 'features', 'health', 'proofs', 'update']
+__all__ = ['aggregator', 'compiler', 'autonomous', 'websocket', 'boost', 'workflow', 'features', 'health', 'proofs', 'update', 'leanoj']
diff --git a/backend/api/routes/aggregator.py b/backend/api/routes/aggregator.py
index 54bb5ce..6ae150e 100644
--- a/backend/api/routes/aggregator.py
+++ b/backend/api/routes/aggregator.py
@@ -12,16 +12,20 @@
 from backend.shared.config import system_config, rag_config
 from backend.shared.token_tracker import token_tracker
 from backend.shared.path_safety import resolve_path_within_root, validate_single_path_component
+from backend.shared.workflow_start_guard import workflow_start_guard
 from backend.aggregator.core.coordinator import coordinator
 from backend.aggregator.core.context_allocator import context_allocator
 from backend.aggregator.memory.event_log import event_log
 from backend.compiler.core.compiler_coordinator import compiler_coordinator
 from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
+from backend.leanoj.core.leanoj_coordinator import leanoj_coordinator
 
 logger = logging.getLogger(__name__)
 
 router = APIRouter(prefix="/api/aggregator", tags=["aggregator"])
 
+MAX_UPLOAD_BYTES = 5 * 1024 * 1024
+
 
 def _get_start_conflict() -> Optional[str]:
     """Return a user-facing conflict message if another workflow is active."""
@@ -32,9 +36,12 @@ def _get_start_conflict() -> Optional[str]:
         return "Cannot start Aggregator while Compiler is running. Stop Compiler first."
 
     autonomous_state = autonomous_coordinator.get_state()
-    if autonomous_state.is_running:
+    if autonomous_state.is_running or autonomous_coordinator.is_active:
         return "Cannot start Aggregator while Autonomous Research is running. Stop Autonomous Research first."
 
+    if leanoj_coordinator.is_active:
+        return "Cannot start Aggregator while Proof Solver is running. Stop Proof Solver first."
+
     return None
 
 
@@ -42,71 +49,76 @@ def _get_start_conflict() -> Optional[str]:
 async def start_aggregator(request: AggregatorStartRequest):
     """Start the aggregator system."""
     try:
-        conflict = _get_start_conflict()
-        if conflict:
-            raise HTTPException(status_code=400, detail=conflict)
-
-        # Validate submitter configs
-        num_submitters = len(request.submitter_configs)
-        if not (system_config.min_submitters <= num_submitters <= system_config.max_submitters):
-            raise HTTPException(
-                status_code=400,
-                detail=f"Number of submitters must be {system_config.min_submitters}-{system_config.max_submitters}, got {num_submitters}"
-            )
-        
-        # Update validator context window configuration
-        rag_config.validator_context_window = request.validator_context_size
-        rag_config.validator_max_output_tokens = request.validator_max_output_tokens
-        
-        # Use first submitter's context for context_allocator (for compatibility)
-        if request.submitter_configs:
-            first_submitter = request.submitter_configs[0]
-            rag_config.submitter_context_window = first_submitter.context_window
-            rag_config.submitter_max_output_tokens = first_submitter.max_output_tokens
-            context_allocator.set_context_windows(
-                first_submitter.context_window,
-                request.validator_context_size,
-                first_submitter.max_output_tokens,
-                request.validator_max_output_tokens
-            )
-        
-        # Log submitter configurations
-        for config in request.submitter_configs:
-            label = "(Main Submitter)" if config.submitter_id == 1 else ""
+        async with workflow_start_guard.reserve():
+            conflict = _get_start_conflict()
+            if conflict:
+                raise HTTPException(status_code=400, detail=conflict)
+
+            # Validate submitter configs
+            num_submitters = len(request.submitter_configs)
+            if not (system_config.min_submitters <= num_submitters <= system_config.max_submitters):
+                raise HTTPException(
+                    status_code=400,
+                    detail=f"Number of submitters must be {system_config.min_submitters}-{system_config.max_submitters}, got {num_submitters}"
+                )
+
+            # Update validator context window configuration
+            rag_config.validator_context_window = request.validator_context_size
+            rag_config.validator_max_output_tokens = request.validator_max_output_tokens
+
+            # Use first submitter's context for context_allocator (for compatibility)
+            if request.submitter_configs:
+                first_submitter = request.submitter_configs[0]
+                rag_config.submitter_context_window = first_submitter.context_window
+                rag_config.submitter_max_output_tokens = first_submitter.max_output_tokens
+                context_allocator.set_context_windows(
+                    first_submitter.context_window,
+                    request.validator_context_size,
+                    first_submitter.max_output_tokens,
+                    request.validator_max_output_tokens
+                )
+
+            # Log submitter configurations
+            for config in request.submitter_configs:
+                label = "(Main Submitter)" if config.submitter_id == 1 else ""
+                logger.info(
+                    f"Submitter {config.submitter_id} {label}: model={config.model_id}, "
+                    f"context={config.context_window}, max_tokens={config.max_output_tokens}"
+                )
             logger.info(
-                f"Submitter {config.submitter_id} {label}: model={config.model_id}, "
-                f"context={config.context_window}, max_tokens={config.max_output_tokens}"
+                f"Validator: model={request.validator_model}, "
+                f"context={request.validator_context_size}, max_tokens={request.validator_max_output_tokens}"
             )
-        logger.info(
-            f"Validator: model={request.validator_model}, "
-            f"context={request.validator_context_size}, max_tokens={request.validator_max_output_tokens}"
-        )
-        
-        # Initialize coordinator with per-submitter configs (includes OpenRouter provider fields)
-        await coordinator.initialize(
-            user_prompt=request.user_prompt,
-            submitter_configs=request.submitter_configs,
-            validator_model=request.validator_model,
-            user_files=request.uploaded_files,
-            validator_context_window=request.validator_context_size,
-            validator_max_tokens=request.validator_max_output_tokens,
-            # Pass OpenRouter provider config for validator
-            validator_provider=request.validator_provider,
-            validator_openrouter_provider=request.validator_openrouter_provider,
-            validator_lm_studio_fallback=request.validator_lm_studio_fallback
-        )
-        
-        # Start coordinator
-        token_tracker.reset()
-        token_tracker.start_timer()
-        await coordinator.start()
-        
-        return {
-            "status": "started",
-            "message": f"Aggregator system started with {num_submitters} submitters",
-            "num_submitters": num_submitters
-        }
-    
+
+            # Initialize coordinator with per-submitter configs (includes OpenRouter provider fields)
+            await coordinator.initialize(
+                user_prompt=request.user_prompt,
+                submitter_configs=request.submitter_configs,
+                validator_model=request.validator_model,
+                user_files=request.uploaded_files,
+                validator_context_window=request.validator_context_size,
+                validator_max_tokens=request.validator_max_output_tokens,
+                # Pass OpenRouter provider config for validator
+                validator_provider=request.validator_provider,
+                validator_openrouter_provider=request.validator_openrouter_provider,
+                validator_openrouter_reasoning_effort=request.validator_openrouter_reasoning_effort,
+                validator_lm_studio_fallback=request.validator_lm_studio_fallback,
+                validator_supercharge_enabled=request.validator_supercharge_enabled
+            )
+
+            # Start coordinator
+            token_tracker.reset()
+            token_tracker.start_timer()
+            await coordinator.start()
+
+            return {
+                "status": "started",
+                "message": f"Aggregator system started with {num_submitters} submitters",
+                "num_submitters": num_submitters
+            }
+
+    except HTTPException:
+        raise
     except ValueError as e:
         # Model compatibility errors
         logger.error(f"Model compatibility error: {e}", exc_info=True)
@@ -169,8 +181,8 @@ async def save_results():
         
         return {
             "status": "saved",
-            "path": str(output_path),
-            "message": f"Results saved to {output_path}"
+            "path": output_path.name,
+            "message": f"Results saved to {output_path.name}"
         }
     except Exception as e:
         logger.error(f"Failed to save results: {e}")
@@ -197,19 +209,30 @@ async def upload_file(file: UploadFile = File(...)):
     """Upload a user file."""
     try:
         safe_filename = validate_single_path_component(file.filename, "filename")
+        if not safe_filename.lower().endswith(".txt"):
+            raise HTTPException(status_code=400, detail="Only .txt uploads are supported")
+
+        content = await file.read(MAX_UPLOAD_BYTES + 1)
+        if len(content) > MAX_UPLOAD_BYTES:
+            raise HTTPException(status_code=413, detail="Upload exceeds 5 MB limit")
+
         uploads_dir = Path(system_config.user_uploads_dir)
         uploads_dir.mkdir(parents=True, exist_ok=True)
         file_path = resolve_path_within_root(uploads_dir, safe_filename)
         
         async with aiofiles.open(file_path, 'wb') as f:
-            content = await file.read()
             await f.write(content)
         
         return {
             "status": "uploaded",
             "filename": safe_filename,
-            "path": str(file_path)
+            "path": safe_filename
         }
+    except HTTPException:
+        raise
+    except ValueError as e:
+        logger.warning("Rejected unsafe upload filename: %s", e)
+        raise HTTPException(status_code=400, detail=str(e))
     except Exception as e:
         logger.error(f"Failed to upload file: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
diff --git a/backend/api/routes/autonomous.py b/backend/api/routes/autonomous.py
index 8f6fb79..2cb7a7c 100644
--- a/backend/api/routes/autonomous.py
+++ b/backend/api/routes/autonomous.py
@@ -3,6 +3,7 @@
 Includes Tier 1 (Brainstorm), Tier 2 (Paper Writing), and Tier 3 (Final Answer) endpoints.
 """
 import logging
+import hashlib
 from datetime import datetime
 from pathlib import Path
 from typing import Optional, Any, Dict, List
@@ -21,8 +22,11 @@
 from backend.autonomous.memory.session_manager import session_manager
 from backend.autonomous.memory.autonomous_api_logger import autonomous_api_logger
 from backend.aggregator.core.coordinator import coordinator
+from backend.aggregator.memory.shared_training import shared_training_memory
 from backend.compiler.core.compiler_coordinator import compiler_coordinator
+from backend.leanoj.core.leanoj_coordinator import leanoj_coordinator
 from backend.shared.boost_logger import boost_logger
+from backend.shared.workflow_start_guard import workflow_start_guard
 
 logger = logging.getLogger(__name__)
 
@@ -51,6 +55,19 @@ def _parse_api_log_timestamp(timestamp: Optional[str]) -> datetime:
         return datetime.min
 
 
+def _infer_api_log_workflow(entry: Dict[str, Any]) -> str:
+    """Return the entry's workflow tag, inferring one from its ids when the tag is missing or blank."""
+    explicit = str(entry.get("workflow") or "").strip().lower()
+    if explicit:
+        # An explicit tag always wins, normalized to trimmed lower case.
+        return explicit
+
+    # Untagged entries: a "leanoj_" prefix on either id selects "leanoj"; anything else is "autonomous".
+    ids = [str(entry.get(field) or "") for field in ("role_id", "task_id")]
+    is_leanoj = any(identifier.startswith("leanoj_") for identifier in ids)
+    return "leanoj" if is_leanoj else "autonomous"
+
+
 def _normalize_autonomous_api_log(entry: Dict[str, Any]) -> Dict[str, Any]:
     """Normalize autonomous log entries into the combined API log shape."""
     return {
@@ -60,10 +77,11 @@ def _normalize_autonomous_api_log(entry: Dict[str, Any]) -> Dict[str, Any]:
         "boost_mode": entry.get("boost_mode"),
         "provider": entry.get("provider") or "unknown",
         "phase": entry.get("phase") or "unknown",
+        "workflow": _infer_api_log_workflow(entry),
         "prompt_preview": entry.get("prompt_preview") or "",
-        "prompt_full": entry.get("prompt_full") or entry.get("prompt_preview") or "",
+        "prompt_full": entry.get("prompt_full") or "",
         "response_preview": entry.get("response_preview") or "",
-        "response_full": entry.get("response_full") or entry.get("response_preview") or "",
+        "response_full": entry.get("response_full") or "",
     }
 
 
@@ -71,7 +89,7 @@ def _normalize_boost_api_log(entry: Dict[str, Any]) -> Dict[str, Any]:
     """Normalize boost log entries so they can be shown in the main API log view."""
     prompt_preview = entry.get("prompt_preview") or ""
     response_preview = entry.get("response_preview") or ""
-    response_full = entry.get("response_full") or response_preview
+    response_full = entry.get("response_full") or ""
 
     return {
         **entry,
@@ -79,8 +97,9 @@ def _normalize_boost_api_log(entry: Dict[str, Any]) -> Dict[str, Any]:
         "boosted": True,
         "provider": entry.get("provider") or "openrouter",
         "phase": entry.get("phase") or "boost",
+        "workflow": _infer_api_log_workflow(entry),
         "prompt_preview": prompt_preview,
-        "prompt_full": entry.get("prompt_full") or prompt_preview,
+        "prompt_full": entry.get("prompt_full") or "",
         "response_preview": response_preview,
         "response_full": response_full,
     }
@@ -214,20 +233,73 @@ def _build_combined_api_stats(logs: List[Dict[str, Any]]) -> Dict[str, Any]:
     }
 
 
-async def _get_combined_api_logs(limit: int = 100) -> Dict[str, Any]:
+def _normalize_api_log_workflow_filter(workflow: Optional[str]) -> Optional[str]:
+    """Canonicalize an optional workflow filter; None or a blank string means "no filter" (None).
+
+    Raises HTTPException (400) for any non-blank value other than "autonomous" or "leanoj".
+    """
+    candidate = "" if workflow is None else workflow.strip().lower()
+    # Matching ignores case and surrounding whitespace.
+    if candidate and candidate not in ("autonomous", "leanoj"):
+        raise HTTPException(status_code=400, detail="Invalid workflow filter")
+    return candidate or None
+
+
+def _get_api_log_key(entry: Dict[str, Any]) -> str:
+    """Derive a 24-hex-character key from the entry's identifying fields.
+
+    Entries whose six identifying fields stringify identically share the same key.
+    """
+    identifying_fields = ("timestamp", "task_id", "role_id", "model", "source", "boost_mode")
+    # Falsy values collapse to "" and the unit separator (0x1F) keeps adjacent fields apart.
+    fingerprint = "\x1f".join(str(entry.get(field) or "") for field in identifying_fields)
+    digest = hashlib.sha256(fingerprint.encode("utf-8")).hexdigest()
+    # Only the first 24 hex characters are kept as the key.
+    return digest[:24]
+
+
+def _summarize_api_log_entry(entry: Dict[str, Any]) -> Dict[str, Any]:
+    """Copy *entry* for list views: full bodies blanked, sizes and has-full flags filled in, log_key added."""
+    prompt_text = str(entry.get("prompt_full") or "")
+    response_text = str(entry.get("response_full") or "")
+    # A recorded (truthy) size wins; otherwise fall back to the length of the body text held here.
+    prompt_size = int(entry.get("prompt_size") or len(prompt_text))
+    response_size = int(entry.get("response_size") or len(response_text))
+
+    trimmed = dict(entry)
+    trimmed["log_key"] = _get_api_log_key(entry)
+    trimmed["prompt_full"] = ""
+    trimmed["response_full"] = ""
+    trimmed["prompt_size"] = prompt_size
+    trimmed["response_size"] = response_size
+    trimmed["has_full_prompt"] = bool(entry.get("has_full_prompt", bool(prompt_text)))
+    trimmed["has_full_response"] = bool(entry.get("has_full_response", bool(response_text)))
+    return trimmed
+
+
+async def _get_combined_api_logs(
+    limit: int = 100,
+    workflow: Optional[str] = None,
+    include_full: bool = True,
+) -> Dict[str, Any]:
     """Fetch, deduplicate, and summarize the combined autonomous + boost API logs."""
     fetch_limit = max(limit * 3, 300)
-    autonomous_logs = await autonomous_api_logger.get_logs(limit=fetch_limit)
-    boost_logs = await boost_logger.get_logs(limit=fetch_limit)
-    combined_logs = _merge_combined_api_logs(autonomous_logs, boost_logs, limit=limit)
-    combined_stats = _build_combined_api_stats(
-        _merge_combined_api_logs(
-            autonomous_logs,
-            boost_logs,
-            limit=max(fetch_limit, len(autonomous_logs) + len(boost_logs)),
-        )
+    autonomous_logs = await autonomous_api_logger.get_logs(limit=fetch_limit, include_full=include_full)
+    boost_logs = await boost_logger.get_logs(limit=fetch_limit, include_full=include_full)
+    all_combined_logs = _merge_combined_api_logs(
+        autonomous_logs,
+        boost_logs,
+        limit=max(fetch_limit, len(autonomous_logs) + len(boost_logs)),
     )
-    return {"logs": combined_logs, "stats": combined_stats}
+    if workflow:
+        all_combined_logs = [
+            log for log in all_combined_logs
+            if log.get("workflow") == workflow
+        ]
+    return {
+        "logs": all_combined_logs[:limit],
+        "stats": _build_combined_api_stats(all_combined_logs),
+    }
 
     if session_id == "legacy":
         return
@@ -250,6 +322,9 @@ def _get_start_conflict() -> Optional[str]:
     if compiler_coordinator.is_running:
         return "Cannot start Autonomous Research while Compiler is running. Stop Compiler first."
 
+    if leanoj_coordinator.is_active:
+        return "Cannot start Autonomous Research while Proof Solver is running. Stop Proof Solver first."
+
     return None
 
 
@@ -379,16 +454,20 @@ def _resolve_validator_config(request: Optional[CritiqueRequest]) -> Dict[str, A
     validator_max_tokens = None
     validator_provider = None
     validator_openrouter_provider = None
+    validator_openrouter_reasoning_effort = "auto"
+    validator_supercharge_enabled = False
     custom_prompt = None
 
     if request:
         custom_prompt = request.custom_prompt
+        validator_supercharge_enabled = bool(request.validator_supercharge_enabled)
         if request.validator_model:
             validator_model = request.validator_model
             validator_context_window = request.validator_context_window or 131072
             validator_max_tokens = request.validator_max_tokens or 25000
             validator_provider = request.validator_provider or "lm_studio"
             validator_openrouter_provider = request.validator_openrouter_provider
+            validator_openrouter_reasoning_effort = request.validator_openrouter_reasoning_effort
 
     if not validator_model:
         coordinator_config = autonomous_coordinator.get_validator_config()
@@ -398,6 +477,8 @@ def _resolve_validator_config(request: Optional[CritiqueRequest]) -> Dict[str, A
             validator_max_tokens = coordinator_config["validator_max_tokens"]
             validator_provider = coordinator_config["validator_provider"]
             validator_openrouter_provider = coordinator_config.get("validator_openrouter_provider")
+            validator_openrouter_reasoning_effort = coordinator_config.get("validator_openrouter_reasoning_effort", "auto")
+            validator_supercharge_enabled = bool(coordinator_config.get("validator_supercharge_enabled", False))
 
     if not validator_model:
         raise HTTPException(
@@ -412,6 +493,8 @@ def _resolve_validator_config(request: Optional[CritiqueRequest]) -> Dict[str, A
         "validator_max_tokens": validator_max_tokens,
         "validator_provider": validator_provider,
         "validator_openrouter_provider": validator_openrouter_provider,
+        "validator_openrouter_reasoning_effort": validator_openrouter_reasoning_effort,
+        "validator_supercharge_enabled": validator_supercharge_enabled,
     }
 
 
@@ -465,9 +548,11 @@ async def _generate_autonomous_paper_critique(
             model_id=config["validator_model"],
             openrouter_model_id=config["validator_model"] if config["validator_provider"] == "openrouter" else None,
             openrouter_provider=config["validator_openrouter_provider"],
+            openrouter_reasoning_effort=config["validator_openrouter_reasoning_effort"],
             lm_studio_fallback_id=None,
             context_window=config["validator_context_window"],
             max_output_tokens=config["validator_max_tokens"],
+            supercharge_enabled=bool(config.get("validator_supercharge_enabled", False)),
         )
     )
 
@@ -544,9 +629,7 @@ async def _delete_autonomous_paper_from_scope(
     scoped_research_metadata: ResearchMetadata,
     paper_id: str,
 ) -> Dict[str, Any]:
-    """Delete a Stage 2 paper and clean its related metadata/critique state."""
-    from backend.shared.critique_memory import clear_critiques
-
+    """Soft-prune a Stage 2 paper and remove it from future model context."""
     state = autonomous_coordinator.get_state()
     active_session_id = _get_active_autonomous_session_id()
     if (
@@ -564,18 +647,25 @@ async def _delete_autonomous_paper_from_scope(
     if not metadata:
         raise HTTPException(status_code=404, detail=f"Paper not found: {paper_id}")
 
-    paper_path = scoped_paper_library.get_paper_path(paper_id)
-    base_dir = Path(paper_path).parent
     source_brainstorms = metadata.source_brainstorm_ids or []
 
-    success = await scoped_paper_library.delete_paper(paper_id)
+    prune_reason = "The user removed this paper from model context accumulation."
+    success = await scoped_paper_library.prune_paper(
+        paper_id,
+        reason=prune_reason,
+        pruned_by="user",
+    )
     if not success:
         raise HTTPException(
             status_code=500,
-            detail=f"Failed to delete paper files for {paper_id}"
+            detail=f"Failed to prune paper files for {paper_id}"
         )
 
-    await scoped_research_metadata.delete_paper(paper_id)
+    await scoped_research_metadata.prune_paper(
+        paper_id,
+        reason=prune_reason,
+        pruned_by="user",
+    )
 
     for topic_id in source_brainstorms:
         try:
@@ -586,22 +676,23 @@ async def _delete_autonomous_paper_from_scope(
             )
 
     try:
-        await clear_critiques("autonomous_paper", paper_id, base_dir)
-        logger.info(f"Cleared critiques for deleted paper {paper_id}")
+        from backend.autonomous.core.autonomous_rag_manager import autonomous_rag_manager
+        await autonomous_rag_manager.remove_paper_from_rag(paper_id)
     except Exception as e:
-        logger.warning(f"Failed to clear critiques for paper {paper_id}: {e}")
+        logger.warning(f"Failed to remove pruned paper {paper_id} from RAG: {e}")
 
     logger.info(
-        f"Deleted paper {paper_id} from session {session_id} "
+        f"Pruned paper {paper_id} from session {session_id} "
         f"(from brainstorms: {', '.join(source_brainstorms)})"
     )
 
     return {
         "success": True,
-        "message": f"Paper {paper_id} deleted successfully",
+        "message": f"Paper {paper_id} was pruned from model context and preserved for download",
         "paper_id": paper_id,
         "session_id": session_id,
         "source_brainstorms": source_brainstorms,
+        "pruned": True,
     }
 
 
@@ -611,71 +702,80 @@ async def start_autonomous_research(request: AutonomousResearchStartRequest):
     try:
         from backend.shared.config import system_config
 
-        conflict = _get_start_conflict()
-        if conflict:
-            raise HTTPException(status_code=400, detail=conflict)
-        
-        # Validate submitter configs
-        num_submitters = len(request.submitter_configs)
-        if not (system_config.min_submitters <= num_submitters <= system_config.max_submitters):
-            raise HTTPException(
-                status_code=400,
-                detail=f"Number of submitters must be {system_config.min_submitters}-{system_config.max_submitters}, got {num_submitters}"
-            )
-        
-        # Log submitter configurations
-        for config in request.submitter_configs:
-            label = "(Main Submitter)" if config.submitter_id == 1 else ""
+        async with workflow_start_guard.reserve():
+            conflict = _get_start_conflict()
+            if conflict:
+                raise HTTPException(status_code=400, detail=conflict)
+
+            # Validate submitter configs
+            num_submitters = len(request.submitter_configs)
+            if not (system_config.min_submitters <= num_submitters <= system_config.max_submitters):
+                raise HTTPException(
+                    status_code=400,
+                    detail=f"Number of submitters must be {system_config.min_submitters}-{system_config.max_submitters}, got {num_submitters}"
+                )
+
+            # Log submitter configurations
+            for config in request.submitter_configs:
+                label = "(Main Submitter)" if config.submitter_id == 1 else ""
+                logger.info(
+                    f"Brainstorm Submitter {config.submitter_id} {label}: model={config.model_id}, "
+                    f"context={config.context_window}, max_tokens={config.max_output_tokens}"
+                )
             logger.info(
-                f"Brainstorm Submitter {config.submitter_id} {label}: model={config.model_id}, "
-                f"context={config.context_window}, max_tokens={config.max_output_tokens}"
+                f"Validator: model={request.validator_model}, "
+                f"context={request.validator_context_window}, max_tokens={request.validator_max_tokens}"
             )
-        logger.info(
-            f"Validator: model={request.validator_model}, "
-            f"context={request.validator_context_window}, max_tokens={request.validator_max_tokens}"
-        )
-        
-        # Initialize coordinator
-        await autonomous_coordinator.initialize(
-            user_research_prompt=request.user_research_prompt,
-            submitter_configs=request.submitter_configs,
-            validator_model=request.validator_model,
-            validator_context_window=request.validator_context_window,
-            validator_max_tokens=request.validator_max_tokens,
-            high_context_model=request.high_context_model,
-            high_context_context_window=request.high_context_context_window,
-            high_context_max_tokens=request.high_context_max_tokens,
-            high_param_model=request.high_param_model,
-            high_param_context_window=request.high_param_context_window,
-            high_param_max_tokens=request.high_param_max_tokens,
-            critique_submitter_model=request.critique_submitter_model,
-            critique_submitter_context_window=request.critique_submitter_context_window,
-            critique_submitter_max_tokens=request.critique_submitter_max_tokens,
-            # OpenRouter provider configs for each role
-            validator_provider=request.validator_provider,
-            validator_openrouter_provider=request.validator_openrouter_provider,
-            validator_lm_studio_fallback=request.validator_lm_studio_fallback,
-            high_context_provider=request.high_context_provider,
-            high_context_openrouter_provider=request.high_context_openrouter_provider,
-            high_context_lm_studio_fallback=request.high_context_lm_studio_fallback,
-            high_param_provider=request.high_param_provider,
-            high_param_openrouter_provider=request.high_param_openrouter_provider,
-            high_param_lm_studio_fallback=request.high_param_lm_studio_fallback,
-            critique_submitter_provider=request.critique_submitter_provider,
-            critique_submitter_openrouter_provider=request.critique_submitter_openrouter_provider,
-            critique_submitter_lm_studio_fallback=request.critique_submitter_lm_studio_fallback,
-            tier3_enabled=request.tier3_enabled
-        )
-        
-        # Start in background with a retained task handle so Stop can cancel it.
-        if not autonomous_coordinator.start_in_background():
-            raise HTTPException(status_code=400, detail="Autonomous research is already running")
-        
-        return {
-            "success": True,
-            "message": f"Autonomous research started with {num_submitters} brainstorm submitters",
-            "num_submitters": num_submitters
-        }
+
+            # Initialize coordinator
+            await autonomous_coordinator.initialize(
+                user_research_prompt=request.user_research_prompt,
+                submitter_configs=request.submitter_configs,
+                validator_model=request.validator_model,
+                validator_context_window=request.validator_context_window,
+                validator_max_tokens=request.validator_max_tokens,
+                high_context_model=request.high_context_model,
+                high_context_context_window=request.high_context_context_window,
+                high_context_max_tokens=request.high_context_max_tokens,
+                high_param_model=request.high_param_model,
+                high_param_context_window=request.high_param_context_window,
+                high_param_max_tokens=request.high_param_max_tokens,
+                critique_submitter_model=request.critique_submitter_model,
+                critique_submitter_context_window=request.critique_submitter_context_window,
+                critique_submitter_max_tokens=request.critique_submitter_max_tokens,
+                # OpenRouter provider configs for each role
+                validator_provider=request.validator_provider,
+                validator_openrouter_provider=request.validator_openrouter_provider,
+                validator_openrouter_reasoning_effort=request.validator_openrouter_reasoning_effort,
+                validator_lm_studio_fallback=request.validator_lm_studio_fallback,
+                high_context_provider=request.high_context_provider,
+                high_context_openrouter_provider=request.high_context_openrouter_provider,
+                high_context_openrouter_reasoning_effort=request.high_context_openrouter_reasoning_effort,
+                high_context_lm_studio_fallback=request.high_context_lm_studio_fallback,
+                high_param_provider=request.high_param_provider,
+                high_param_openrouter_provider=request.high_param_openrouter_provider,
+                high_param_openrouter_reasoning_effort=request.high_param_openrouter_reasoning_effort,
+                high_param_lm_studio_fallback=request.high_param_lm_studio_fallback,
+                critique_submitter_provider=request.critique_submitter_provider,
+                critique_submitter_openrouter_provider=request.critique_submitter_openrouter_provider,
+                critique_submitter_openrouter_reasoning_effort=request.critique_submitter_openrouter_reasoning_effort,
+                critique_submitter_lm_studio_fallback=request.critique_submitter_lm_studio_fallback,
+                tier3_enabled=request.tier3_enabled,
+                validator_supercharge_enabled=request.validator_supercharge_enabled,
+                high_context_supercharge_enabled=request.high_context_supercharge_enabled,
+                high_param_supercharge_enabled=request.high_param_supercharge_enabled,
+                critique_submitter_supercharge_enabled=request.critique_submitter_supercharge_enabled
+            )
+
+            # Start in background with a retained task handle so Stop can cancel it.
+            if not autonomous_coordinator.start_in_background():
+                raise HTTPException(status_code=400, detail="Autonomous research is already running")
+
+            return {
+                "success": True,
+                "message": f"Autonomous research started with {num_submitters} brainstorm submitters",
+                "num_submitters": num_submitters
+            }
         
     except HTTPException:
         raise
@@ -791,14 +891,28 @@ async def get_autonomous_status():
                 
                 # Try to get aggregator queue size
                 if autonomous_coordinator._brainstorm_aggregator:
-                    from backend.aggregator.core.queue_manager import queue_manager
                     try:
-                        queue_size = await queue_manager.size()
+                        aggregator_status = await autonomous_coordinator._brainstorm_aggregator.get_status()
+                        queue_size = aggregator_status.queue_size
+                        aggregator_offset = autonomous_coordinator._brainstorm_aggregator.acceptance_count_offset
+                        acceptance_count = max(
+                            acceptance_count,
+                            aggregator_offset + aggregator_status.total_acceptances,
+                            aggregator_status.shared_training_size,
+                        )
                     except Exception:
-                        pass
+                        from backend.aggregator.core.queue_manager import queue_manager
+                        try:
+                            queue_size = await queue_manager.size()
+                        except Exception:
+                            pass
                 
                 # Get counts from autonomous coordinator internal state
-                acceptance_count = autonomous_coordinator._acceptance_count
+                acceptance_count = max(
+                    acceptance_count,
+                    autonomous_coordinator._acceptance_count,
+                    metadata.submission_count or 0,
+                )
                 rejection_count = autonomous_coordinator._rejection_count
                 cleanup_removals = autonomous_coordinator._cleanup_removals
                 
@@ -1013,6 +1127,75 @@ async def get_paper_history():
         raise HTTPException(status_code=500, detail="Internal server error")
 
 
+@router.get("/paper-history/pruned")
+async def get_pruned_paper_history():
+    """List every pruned Stage 2 paper from legacy and session history, together with a total count."""
+    try:
+        papers = await paper_library.list_pruned_history_papers()
+        return {
+            "success": True,
+            "papers": papers,
+            "total_count": len(papers)
+        }
+    except Exception as e:  # any failure is logged below and reported to the client as a generic 500
+        logger.error(f"Failed to get pruned Stage 2 paper history: {e}")
+        raise HTTPException(status_code=500, detail="Internal server error")
+
+
+@router.get("/paper-history/pruned/{session_id}/{paper_id}")
+async def get_pruned_history_paper(session_id: str, paper_id: str):
+    """Get one pruned Stage 2 paper from legacy/session history; raises 404 if missing, 500 on other errors."""
+    try:
+        paper = await paper_library.get_pruned_history_paper(session_id, paper_id)
+        if not paper:  # a falsy lookup result is treated as "not found"
+            raise HTTPException(
+                status_code=404,
+                detail=f"Pruned paper not found in history: session={session_id}, paper={paper_id}"
+            )
+
+        return {
+            "success": True,
+            **paper  # unpack the paper's own fields into the top level of the response
+        }
+    except HTTPException:  # re-raise the 404 above instead of converting it into a 500
+        raise
+    except Exception as e:
+        logger.error(f"Failed to get pruned history paper {session_id}/{paper_id}: {e}")
+        raise HTTPException(status_code=500, detail="Internal server error")
+
+
+@router.delete("/paper-history/pruned/{session_id}")
+async def delete_pruned_history_papers(session_id: str, confirm: bool = False):
+    """Permanently delete all pruned Stage 2 paper files in one legacy/session scope (requires confirm=true)."""
+    try:
+        if not confirm:  # safety check: refuse with 400 unless the caller passed confirm=true
+            raise HTTPException(
+                status_code=400,
+                detail="Must confirm deletion with confirm=true"
+            )
+        paths = _resolve_history_session_paths(session_id)
+        scoped_paper_library = _build_scoped_paper_library(paths)
+        scoped_research_metadata = await _build_scoped_research_metadata(paths)
+        pruned_papers = await scoped_paper_library._list_pruned_history_papers_from_directory(
+            paths["papers_dir"],
+            session_id,
+        )  # listed before the deletion so the paper IDs remain available for the metadata cleanup below
+        deleted_count = await scoped_paper_library.delete_all_pruned_papers()
+        for paper in pruned_papers:  # drop the scoped metadata entry of each paper listed above
+            await scoped_research_metadata.delete_paper(paper["paper_id"])
+        return {
+            "success": True,
+            "session_id": session_id,
+            "deleted_count": deleted_count,
+            "message": f"Deleted {deleted_count} pruned paper records"
+        }
+    except HTTPException:  # let the 400 above pass through unchanged
+        raise
+    except Exception as e:
+        logger.error(f"Failed to delete pruned history papers for {session_id}: {e}")
+        raise HTTPException(status_code=500, detail="Internal server error")
+
+
 @router.get("/paper-history/{session_id}/{paper_id}")
 async def get_history_paper(session_id: str, paper_id: str):
     """Get one completed, non-archived Stage 2 paper from legacy/session history."""
@@ -1179,7 +1362,7 @@ async def get_current_session():
         return {
             "is_active": True,
             "session_id": session_manager.session_id,
-            "path": str(session_manager.session_path) if session_manager.session_path else None
+            "path": session_manager.session_id
         }
         
     except Exception as e:
@@ -1523,15 +1706,23 @@ async def delete_brainstorm(topic_id: str, confirm: bool = False):
                 detail="Must confirm deletion with confirm=true"
             )
         
-        # Check if running
-        state = autonomous_coordinator.get_state()
-        if state.is_running and state.current_tier == "tier1_aggregation":
-            # Check if this is the active brainstorm
-            if autonomous_coordinator._current_topic_id == topic_id:
-                raise HTTPException(
-                    status_code=400,
-                    detail="Cannot delete active brainstorm while it's being aggregated. Stop autonomous research first."
-                )
+        # Check if this brainstorm is still owned by the running coordinator.
+        # The live aggregator keeps a direct file handle path through shared_training_memory;
+        # deleting it while active can recreate an unlisted "invisible" brainstorm DB.
+        active_topic_id = autonomous_coordinator._current_topic_id
+        active_aggregator = autonomous_coordinator._brainstorm_aggregator
+        aggregator_running = bool(active_aggregator and active_aggregator.is_running)
+        target_db_path = Path(brainstorm_memory.get_database_path(topic_id)).resolve()
+        active_shared_path = Path(shared_training_memory.file_path).resolve()
+        active_shared_path_matches = active_shared_path == target_db_path
+        if (
+            (active_topic_id == topic_id or active_shared_path_matches)
+            and (autonomous_coordinator.is_active or aggregator_running)
+        ):
+            raise HTTPException(
+                status_code=400,
+                detail="Cannot delete the active brainstorm while autonomous research is running. Stop autonomous research first."
+            )
         
         # Get brainstorm metadata
         metadata = await brainstorm_memory.get_metadata(topic_id)
@@ -1554,6 +1745,15 @@ async def delete_brainstorm(topic_id: str, confirm: bool = False):
         
         # Remove from central metadata
         await research_metadata.delete_brainstorm(topic_id)
+        if active_topic_id == topic_id:
+            await autonomous_coordinator.clear_deleted_brainstorm_reference(
+                topic_id,
+                "brainstorm deleted through API while coordinator was stopped"
+            )
+        else:
+            stats = await research_metadata.get_stats()
+            if stats.get("current_brainstorm_id") == topic_id:
+                await research_metadata.set_current_brainstorm(None)
         
         logger.info(f"Deleted brainstorm {topic_id} (had {len(associated_papers)} associated papers)")
         
@@ -1574,7 +1774,7 @@ async def delete_brainstorm(topic_id: str, confirm: bool = False):
 @router.delete("/paper/{paper_id}")
 async def delete_paper(paper_id: str, confirm: bool = False):
     """
-    Delete a paper and optionally its source brainstorm.
+    Prune a paper from model context while preserving it for user download.
     
     Query params:
         confirm: Must be True to execute deletion (safety check)
@@ -1600,9 +1800,39 @@ async def delete_paper(paper_id: str, confirm: bool = False):
         raise HTTPException(status_code=500, detail="Internal server error")
 
 
+@router.delete("/pruned-papers")
+async def delete_current_pruned_papers(confirm: bool = False):
+    """Permanently delete all pruned papers in the active autonomous paper scope (requires confirm=true)."""
+    try:
+        if not confirm:  # safety check: refuse with 400 unless the caller passed confirm=true
+            raise HTTPException(
+                status_code=400,
+                detail="Must confirm deletion with confirm=true"
+            )
+
+        pruned_papers = await paper_library._list_pruned_history_papers_from_directory(
+            paper_library._base_dir,
+            _get_active_autonomous_session_id(),
+        )  # listed before the deletion so the paper IDs remain available for the metadata cleanup below
+        deleted_count = await paper_library.delete_all_pruned_papers()
+        for paper in pruned_papers:  # drop the metadata entry of each paper listed above
+            await research_metadata.delete_paper(paper["paper_id"])
+        return {
+            "success": True,
+            "session_id": _get_active_autonomous_session_id(),  # NOTE(review): resolved a second time here, separately from the listing call above
+            "deleted_count": deleted_count,
+            "message": f"Deleted {deleted_count} pruned paper records"
+        }
+    except HTTPException:  # let the 400 above pass through unchanged
+        raise
+    except Exception as e:
+        logger.error(f"Failed to delete current pruned papers: {e}")
+        raise HTTPException(status_code=500, detail="Internal server error")
+
+
 @router.delete("/paper-history/{session_id}/{paper_id}")
 async def delete_history_paper(session_id: str, paper_id: str, confirm: bool = False):
-    """Delete a completed Stage 2 history paper from a specific legacy/session scope."""
+    """Prune a completed Stage 2 history paper from a specific legacy/session scope."""
     try:
         if not confirm:
             raise HTTPException(
@@ -1994,6 +2224,10 @@ async def get_final_answer_archived_papers(answer_id: str):
         memory = _build_scoped_final_answer_memory(answer_id)
         papers = await memory.get_archived_papers_list()
         return {"papers": papers}
+    except HTTPException:
+        raise
+    except ValueError as e:
+        raise HTTPException(status_code=400, detail=str(e))
     except Exception as e:
         logger.error(f"Failed to get archived papers for {answer_id}: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
@@ -2020,6 +2254,8 @@ async def get_final_answer_archived_paper(answer_id: str, paper_id: str):
         return paper
     except HTTPException:
         raise
+    except ValueError as e:
+        raise HTTPException(status_code=400, detail=str(e))
     except Exception as e:
         logger.error(f"Failed to get archived paper {paper_id} for {answer_id}: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
@@ -2040,6 +2276,10 @@ async def get_final_answer_archived_brainstorms(answer_id: str):
         memory = _build_scoped_final_answer_memory(answer_id)
         brainstorms = await memory.get_archived_brainstorms_list()
         return {"brainstorms": brainstorms}
+    except HTTPException:
+        raise
+    except ValueError as e:
+        raise HTTPException(status_code=400, detail=str(e))
     except Exception as e:
         logger.error(f"Failed to get archived brainstorms for {answer_id}: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
@@ -2066,6 +2306,8 @@ async def get_final_answer_archived_brainstorm(answer_id: str, topic_id: str):
         return brainstorm
     except HTTPException:
         raise
+    except ValueError as e:
+        raise HTTPException(status_code=400, detail=str(e))
     except Exception as e:
         logger.error(f"Failed to get archived brainstorm {topic_id} for {answer_id}: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
@@ -2315,10 +2557,13 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
         validator_max_tokens = None
         validator_provider = None
         validator_openrouter_provider = None
+        validator_openrouter_reasoning_effort = "auto"
+        validator_supercharge_enabled = False
         custom_prompt = None
         
         if request:
             custom_prompt = request.custom_prompt
+            validator_supercharge_enabled = bool(request.validator_supercharge_enabled)
             # Check if request provides validator config
             if request.validator_model:
                 validator_model = request.validator_model
@@ -2326,6 +2571,7 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
                 validator_max_tokens = request.validator_max_tokens or 25000
                 validator_provider = request.validator_provider or "lm_studio"
                 validator_openrouter_provider = request.validator_openrouter_provider
+                validator_openrouter_reasoning_effort = request.validator_openrouter_reasoning_effort
         
         # If no validator config from request, try coordinator
         if not validator_model:
@@ -2336,6 +2582,8 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
                 validator_max_tokens = coordinator_config["validator_max_tokens"]
                 validator_provider = coordinator_config["validator_provider"]
                 validator_openrouter_provider = coordinator_config.get("validator_openrouter_provider")
+                validator_openrouter_reasoning_effort = coordinator_config.get("validator_openrouter_reasoning_effort", "auto")
+                validator_supercharge_enabled = bool(coordinator_config.get("validator_supercharge_enabled", False))
         
         # If still no config, error
         if not validator_model:
@@ -2386,9 +2634,11 @@ async def request_final_answer_critique(answer_id: str, request: CritiqueRequest
                 model_id=validator_model,
                 openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
                 openrouter_provider=validator_openrouter_provider,
+                openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=None,  # No fallback for direct critique calls
                 context_window=validator_context_window,
-                max_output_tokens=validator_max_tokens
+                max_output_tokens=validator_max_tokens,
+                supercharge_enabled=validator_supercharge_enabled
             )
         )
         
@@ -2559,7 +2809,7 @@ async def get_default_critique_prompt():
 # ============================================================================
 
 @router.get("/api-logs")
-async def get_autonomous_api_logs(limit: int = 100):
+async def get_autonomous_api_logs(limit: int = 100, workflow: Optional[str] = None):
     """
     Get autonomous research API call logs.
     
@@ -2570,20 +2820,57 @@ async def get_autonomous_api_logs(limit: int = 100):
         Dict with logs and statistics
     """
     try:
-        combined = await _get_combined_api_logs(limit=limit)
+        safe_limit = max(1, min(limit, 100))
+        workflow_filter = _normalize_api_log_workflow_filter(workflow)
+        combined = await _get_combined_api_logs(
+            limit=safe_limit,
+            workflow=workflow_filter,
+            include_full=False,
+        )
         
         return {
             "success": True,
-            "logs": combined["logs"],
+            "logs": [_summarize_api_log_entry(log) for log in combined["logs"]],
             "stats": combined["stats"],
         }
+    except HTTPException:
+        raise
     except Exception as e:
         logger.error(f"Failed to get autonomous API logs: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
 
 
+@router.get("/api-logs/detail/{log_key}")
+async def get_autonomous_api_log_detail(log_key: str, workflow: Optional[str] = None):
+    """Get one full API log entry by key for explicit user inspection/copy; 400 on a bad key, 404 if not found."""
+    try:
+        if not log_key or len(log_key) > 128:  # reject empty keys and keys longer than 128 characters
+            raise HTTPException(status_code=400, detail="Invalid API log key")
+
+        workflow_filter = _normalize_api_log_workflow_filter(workflow)
+        combined = await _get_combined_api_logs(limit=1000, workflow=workflow_filter)  # only the entries returned by this call are searched
+        for log in combined["logs"]:
+            if _get_api_log_key(log) == log_key:  # the first entry whose derived key matches is returned
+                return {
+                    "success": True,
+                    "log": {
+                        **log,
+                        "log_key": log_key,
+                        "prompt_size": len(str(log.get("prompt_full") or "")),  # 0 when prompt_full is missing or empty
+                        "response_size": len(str(log.get("response_full") or "")),  # 0 when response_full is missing or empty
+                    },
+                }
+
+        raise HTTPException(status_code=404, detail="API log entry not found")
+    except HTTPException:  # let the 400/404 above pass through unchanged
+        raise
+    except Exception as e:
+        logger.error(f"Failed to get autonomous API log detail: {e}")
+        raise HTTPException(status_code=500, detail="Internal server error")
+
+
 @router.post("/api-logs/clear")
-async def clear_autonomous_api_logs():
+async def clear_autonomous_api_logs(workflow: Optional[str] = None):
     """
     Clear all autonomous API logs.
     
@@ -2591,20 +2878,23 @@ async def clear_autonomous_api_logs():
         Success status
     """
     try:
-        await autonomous_api_logger.clear_logs()
-        await boost_logger.clear_logs()
+        workflow_filter = _normalize_api_log_workflow_filter(workflow)
+        await autonomous_api_logger.clear_logs(workflow=workflow_filter)
+        await boost_logger.clear_logs(workflow=workflow_filter)
         
         return {
             "success": True,
             "message": "Combined API logs cleared successfully"
         }
+    except HTTPException:
+        raise
     except Exception as e:
         logger.error(f"Failed to clear autonomous API logs: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
 
 
 @router.get("/api-logs/stats")
-async def get_autonomous_api_stats():
+async def get_autonomous_api_stats(workflow: Optional[str] = None):
     """
     Get statistics about autonomous API calls.
     
@@ -2612,12 +2902,19 @@ async def get_autonomous_api_stats():
         Statistics dict (total calls, by phase, by model, success rate, etc.)
     """
     try:
-        combined = await _get_combined_api_logs(limit=1000)
+        workflow_filter = _normalize_api_log_workflow_filter(workflow)
+        combined = await _get_combined_api_logs(
+            limit=1000,
+            workflow=workflow_filter,
+            include_full=False,
+        )
         
         return {
             "success": True,
             "stats": combined["stats"]
         }
+    except HTTPException:
+        raise
     except Exception as e:
         logger.error(f"Failed to get autonomous API stats: {e}")
         raise HTTPException(status_code=500, detail="Internal server error")
\ No newline at end of file
diff --git a/backend/api/routes/boost.py b/backend/api/routes/boost.py
index 2838296..8d87f6b 100644
--- a/backend/api/routes/boost.py
+++ b/backend/api/routes/boost.py
@@ -13,7 +13,7 @@
 from typing import Dict, Any, Optional
 import logging
 
-from backend.shared.config import rag_config
+from backend.shared.config import rag_config, system_config
 from backend.shared.models import BoostConfig
 from backend.shared.boost_manager import boost_manager
 from backend.shared.boost_logger import boost_logger
@@ -28,12 +28,17 @@ class BoostNextCountRequest(BaseModel):
     count: int
 
 
-def _resolve_boost_api_key(api_key: Optional[str]) -> str:
-    """Use the explicit boost key when provided, otherwise fall back to the active global key."""
+def _resolve_boost_api_key(api_key: Optional[str], *, allow_current_override: bool = False) -> str:
+    """Use an explicit/current boost key when provided, otherwise fall back to the active global key."""
     explicit_key = (api_key or "").strip()
     if explicit_key:
         return explicit_key
 
+    if allow_current_override and boost_manager.boost_config:
+        current_key = (boost_manager.boost_config.openrouter_api_key or "").strip()
+        if current_key:
+            return current_key
+
     global_key = (rag_config.openrouter_api_key or "").strip()
     if global_key:
         return global_key
@@ -56,7 +61,8 @@ async def enable_boost(config: BoostConfig) -> Dict[str, Any]:
         Status and boost configuration
     """
     try:
-        effective_api_key = _resolve_boost_api_key(config.openrouter_api_key)
+        explicit_api_key = (config.openrouter_api_key or "").strip()
+        effective_api_key = _resolve_boost_api_key(explicit_api_key)
         
         client = OpenRouterClient(effective_api_key)
         try:
@@ -70,7 +76,9 @@ async def enable_boost(config: BoostConfig) -> Dict[str, Any]:
         finally:
             await client.close()
 
-        config.openrouter_api_key = effective_api_key
+        # Keep explicit boost override keys in process memory only. When the
+        # user relies on the global OpenRouter key, Boost stores no key at all.
+        config.openrouter_api_key = explicit_api_key
         
         # Enable boost
         await boost_manager.set_boost_config(config)
@@ -84,6 +92,7 @@ async def enable_boost(config: BoostConfig) -> Dict[str, Any]:
             "config": {
                 "model_id": config.boost_model_id,
                 "provider": config.boost_provider,
+                "reasoning_effort": config.boost_reasoning_effort,
                 "context_window": config.boost_context_window,
                 "max_output_tokens": config.boost_max_output_tokens
             }
@@ -119,7 +128,11 @@ async def update_boost_model(config: BoostConfig) -> Dict[str, Any]:
                 detail="Boost must be enabled first. Use /api/boost/enable to enable boost."
             )
         
-        effective_api_key = _resolve_boost_api_key(config.openrouter_api_key)
+        explicit_api_key = (config.openrouter_api_key or "").strip()
+        effective_api_key = _resolve_boost_api_key(
+            explicit_api_key,
+            allow_current_override=True,
+        )
         
         client = OpenRouterClient(effective_api_key)
         try:
@@ -133,7 +146,12 @@ async def update_boost_model(config: BoostConfig) -> Dict[str, Any]:
         finally:
             await client.close()
 
-        config.openrouter_api_key = effective_api_key
+        if explicit_api_key:
+            config.openrouter_api_key = explicit_api_key
+        elif boost_manager.boost_config and boost_manager.boost_config.openrouter_api_key:
+            config.openrouter_api_key = boost_manager.boost_config.openrouter_api_key
+        else:
+            config.openrouter_api_key = ""
         
         # Store current boost state before update
         old_boost_next_count = boost_manager.boost_next_count
@@ -158,6 +176,7 @@ async def update_boost_model(config: BoostConfig) -> Dict[str, Any]:
             "config": {
                 "model_id": config.boost_model_id,
                 "provider": config.boost_provider,
+                "reasoning_effort": config.boost_reasoning_effort,
                 "context_window": config.boost_context_window,
                 "max_output_tokens": config.boost_max_output_tokens
             },
@@ -467,7 +486,7 @@ async def get_boost_logs(limit: int = 100) -> Dict[str, Any]:
         List of log entries (most recent first)
     """
     try:
-        logs = await boost_logger.get_logs(limit)
+        logs = await boost_logger.get_logs(limit, include_full=False)
         stats = await boost_logger.get_stats()
         
         return {
@@ -493,7 +512,7 @@ async def get_boost_log_entry(index: int) -> Dict[str, Any]:
         Full log entry including complete response
     """
     try:
-        entry = await boost_logger.get_log_entry(index)
+        entry = await boost_logger.get_log_entry(index, include_full=system_config.api_log_store_full_payloads)
         
         if not entry:
             raise HTTPException(status_code=404, detail="Log entry not found")
diff --git a/backend/api/routes/compiler.py b/backend/api/routes/compiler.py
index 4561369..4c431a7 100644
--- a/backend/api/routes/compiler.py
+++ b/backend/api/routes/compiler.py
@@ -1,25 +1,106 @@
 """
 Compiler API routes.
 """
+import asyncio
+import hashlib
 from fastapi import APIRouter, HTTPException
 import logging
 from pathlib import Path
 import aiofiles
 
-from backend.shared.models import CompilerStartRequest, CompilerState, CritiqueRequest
+from backend.api.routes import websocket
+from backend.shared.models import CompilerStartRequest, CompilerState, CritiqueRequest, ModelConfig
 from backend.shared.config import system_config
 from backend.shared.token_tracker import token_tracker
-from backend.compiler.core.compiler_coordinator import compiler_coordinator
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.workflow_start_guard import workflow_start_guard
+from backend.compiler.core.compiler_coordinator import CRITIQUE_ATTEMPT_TARGET, compiler_coordinator
 from backend.compiler.memory.outline_memory import outline_memory
 from backend.compiler.memory.paper_memory import paper_memory
 from backend.aggregator.core.coordinator import coordinator
 from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
+from backend.autonomous.core.proof_verification_stage import ProofVerificationStage
+from backend.autonomous.memory.proof_database import proof_database
+from backend.leanoj.core.leanoj_coordinator import leanoj_coordinator
 
 logger = logging.getLogger(__name__)
 
 router = APIRouter(prefix="/api/compiler", tags=["compiler"])
 
 
+async def _run_saved_compiler_paper_proof_check(
+    full_content: str,
+    source_title: str,
+    proof_config: dict,
+) -> None:
+    """Run autonomous proof extraction/tiering for a saved manual compiler paper (no-op unless Lean 4 and both models are set)."""
+    if not proof_config.get("lean4_enabled"):
+        logger.info("Skipping saved compiler paper proof check: Lean 4 disabled")
+        return
+    if not full_content.strip():  # empty or whitespace-only paper: nothing to check
+        return
+    submitter_model = str(proof_config.get("submitter_model") or "")
+    validator_model = str(proof_config.get("validator_model") or "")
+    if not submitter_model:
+        logger.warning("Skipping saved compiler paper proof check: high-context model is unavailable")
+        return
+    if not validator_model:
+        logger.warning("Skipping saved compiler paper proof check: validator model is unavailable")
+        return
+
+    source_hash = hashlib.sha256(full_content.encode("utf-8")).hexdigest()[:16]  # first 16 hex chars of the content's SHA-256
+    source_id = f"compiler_manual_{source_hash}"  # identical paper text always yields the same source id
+    role_suffix = "compiler_manual_paper"
+
+    submitter_config = ModelConfig(
+        provider=str(proof_config.get("submitter_provider") or "lm_studio"),
+        model_id=submitter_model,
+        openrouter_provider=proof_config.get("submitter_openrouter_provider"),
+        openrouter_reasoning_effort=proof_config.get("submitter_openrouter_reasoning_effort", "auto"),
+        lm_studio_fallback_id=proof_config.get("submitter_lm_studio_fallback"),
+        context_window=int(proof_config.get("submitter_context") or system_config.compiler_high_context_context_window),
+        max_output_tokens=int(proof_config.get("submitter_max_tokens") or system_config.compiler_high_context_max_output_tokens),
+        supercharge_enabled=bool(proof_config.get("submitter_supercharge_enabled", False)),
+    )
+    validator_config = ModelConfig(
+        provider=str(proof_config.get("validator_provider") or "lm_studio"),
+        model_id=validator_model,
+        openrouter_provider=proof_config.get("validator_openrouter_provider"),
+        openrouter_reasoning_effort=proof_config.get("validator_openrouter_reasoning_effort", "auto"),
+        lm_studio_fallback_id=proof_config.get("validator_lm_studio_fallback"),
+        context_window=int(proof_config.get("validator_context") or system_config.compiler_validator_context_window),
+        max_output_tokens=int(proof_config.get("validator_max_tokens") or system_config.compiler_validator_max_output_tokens),
+        supercharge_enabled=bool(proof_config.get("validator_supercharge_enabled", False)),
+    )
+    for role_id in (  # these three suffixed proof roles all use the submitter configuration
+        f"autonomous_proof_identification_{role_suffix}",
+        f"autonomous_proof_lemma_search_{role_suffix}",
+        f"autonomous_proof_formalization_{role_suffix}",
+    ):
+        api_client_manager.configure_role(role_id, submitter_config)
+    api_client_manager.configure_role("autonomous_proof_novelty", validator_config)  # NOTE(review): role id has no suffix, so it may be shared with other workflows - confirm
+
+    stage = ProofVerificationStage()
+    await stage.run(
+        content=full_content,
+        source_type="paper",
+        source_id=source_id,
+        user_prompt=str(proof_config.get("user_prompt") or ""),
+        submitter_model=submitter_model,
+        submitter_context=submitter_config.context_window,
+        submitter_max_tokens=submitter_config.max_output_tokens,
+        validator_model=validator_model,
+        validator_context=validator_config.context_window,
+        validator_max_tokens=validator_config.max_output_tokens,
+        broadcast_fn=websocket.broadcast_event,
+        novel_proofs_db=proof_database,
+        source_title=source_title,
+        role_suffix_override=role_suffix,
+        trigger="manual_compiler_save",
+        append_to_source=False,
+    )
+
+
 def _get_start_conflict() -> str | None:
     """Return a user-facing conflict message if another workflow is active."""
     if compiler_coordinator.is_running:
@@ -29,71 +110,94 @@ def _get_start_conflict() -> str | None:
         return "Cannot start Compiler while Aggregator is running. Stop Aggregator first."
 
     autonomous_state = autonomous_coordinator.get_state()
-    if autonomous_state.is_running:
+    if autonomous_state.is_running or autonomous_coordinator.is_active:
         return "Cannot start Compiler while Autonomous Research is running. Stop Autonomous Research first."
 
+    if leanoj_coordinator.is_active:
+        return "Cannot start Compiler while Proof Solver is running. Stop Proof Solver first."
+
     return None
 
 
+def _log_background_task_failure(task: asyncio.Task) -> None:  # task done-callback: logs the outcome, never raises for Exception subclasses
+    try:
+        task.result()  # re-raises whatever the finished task raised, if anything
+    except asyncio.CancelledError:
+        logger.info("Saved compiler paper proof check was cancelled")
+    except Exception:
+        logger.exception("Saved compiler paper proof check failed")  # logged with traceback
+
+
 @router.post("/start")
 async def start_compiler(request: CompilerStartRequest):
     """Start the compiler system."""
     try:
-        conflict = _get_start_conflict()
-        if conflict:
-            raise HTTPException(status_code=400, detail=conflict)
-
-        # Update system config with user-provided context sizes
-        system_config.compiler_validator_context_window = request.validator_context_size
-        system_config.compiler_high_context_context_window = request.high_context_context_size
-        system_config.compiler_high_param_context_window = request.high_param_context_size
-        system_config.compiler_critique_submitter_context_window = request.critique_submitter_context_window
-        
-        # Update max output token configurations
-        system_config.compiler_validator_max_output_tokens = request.validator_max_output_tokens
-        system_config.compiler_high_context_max_output_tokens = request.high_context_max_output_tokens
-        system_config.compiler_high_param_max_output_tokens = request.high_param_max_output_tokens
-        system_config.compiler_critique_submitter_max_tokens = request.critique_submitter_max_tokens
-        
-        # Store critique submitter model
-        system_config.compiler_critique_submitter_model = request.critique_submitter_model
-        
-        logger.info(
-            f"Compiler max output tokens - "
-            f"Validator: {request.validator_max_output_tokens}, "
-            f"High-context: {request.high_context_max_output_tokens}, "
-            f"High-param: {request.high_param_max_output_tokens}"
-        )
-        
-        # Initialize coordinator with OpenRouter provider configurations
-        await compiler_coordinator.initialize(
-            compiler_prompt=request.compiler_prompt,
-            validator_model=request.validator_model,
-            high_context_model=request.high_context_model,
-            high_param_model=request.high_param_model,
-            critique_submitter_model=request.critique_submitter_model,
-            # OpenRouter provider configs for each role
-            validator_provider=request.validator_provider,
-            validator_openrouter_provider=request.validator_openrouter_provider,
-            validator_lm_studio_fallback=request.validator_lm_studio_fallback,
-            high_context_provider=request.high_context_provider,
-            high_context_openrouter_provider=request.high_context_openrouter_provider,
-            high_context_lm_studio_fallback=request.high_context_lm_studio_fallback,
-            high_param_provider=request.high_param_provider,
-            high_param_openrouter_provider=request.high_param_openrouter_provider,
-            high_param_lm_studio_fallback=request.high_param_lm_studio_fallback,
-            critique_submitter_provider=request.critique_submitter_provider,
-            critique_submitter_openrouter_provider=request.critique_submitter_openrouter_provider,
-            critique_submitter_lm_studio_fallback=request.critique_submitter_lm_studio_fallback
-        )
-        
-        # Start coordinator
-        token_tracker.reset()
-        token_tracker.start_timer()
-        await compiler_coordinator.start()
-        
-        return {"status": "started", "message": "Compiler started successfully"}
+        async with workflow_start_guard.reserve():
+            conflict = _get_start_conflict()
+            if conflict:
+                raise HTTPException(status_code=400, detail=conflict)
+
+            # Update system config with user-provided context sizes
+            system_config.compiler_validator_context_window = request.validator_context_size
+            system_config.compiler_high_context_context_window = request.high_context_context_size
+            system_config.compiler_high_param_context_window = request.high_param_context_size
+            system_config.compiler_critique_submitter_context_window = request.critique_submitter_context_window
+
+            # Update max output token configurations
+            system_config.compiler_validator_max_output_tokens = request.validator_max_output_tokens
+            system_config.compiler_high_context_max_output_tokens = request.high_context_max_output_tokens
+            system_config.compiler_high_param_max_output_tokens = request.high_param_max_output_tokens
+            system_config.compiler_critique_submitter_max_tokens = request.critique_submitter_max_tokens
+
+            # Store critique submitter model
+            system_config.compiler_critique_submitter_model = request.critique_submitter_model
+
+            logger.info(
+                f"Compiler max output tokens - "
+                f"Validator: {request.validator_max_output_tokens}, "
+                f"High-context: {request.high_context_max_output_tokens}, "
+                f"High-param: {request.high_param_max_output_tokens}"
+            )
+
+            # Initialize coordinator with OpenRouter provider configurations
+            await compiler_coordinator.initialize(
+                compiler_prompt=request.compiler_prompt,
+                validator_model=request.validator_model,
+                high_context_model=request.high_context_model,
+                high_param_model=request.high_param_model,
+                critique_submitter_model=request.critique_submitter_model,
+                # OpenRouter provider configs for each role
+                validator_provider=request.validator_provider,
+                validator_openrouter_provider=request.validator_openrouter_provider,
+                validator_openrouter_reasoning_effort=request.validator_openrouter_reasoning_effort,
+                validator_lm_studio_fallback=request.validator_lm_studio_fallback,
+                high_context_provider=request.high_context_provider,
+                high_context_openrouter_provider=request.high_context_openrouter_provider,
+                high_context_openrouter_reasoning_effort=request.high_context_openrouter_reasoning_effort,
+                high_context_lm_studio_fallback=request.high_context_lm_studio_fallback,
+                high_param_provider=request.high_param_provider,
+                high_param_openrouter_provider=request.high_param_openrouter_provider,
+                high_param_openrouter_reasoning_effort=request.high_param_openrouter_reasoning_effort,
+                high_param_lm_studio_fallback=request.high_param_lm_studio_fallback,
+                critique_submitter_provider=request.critique_submitter_provider,
+                critique_submitter_openrouter_provider=request.critique_submitter_openrouter_provider,
+                critique_submitter_openrouter_reasoning_effort=request.critique_submitter_openrouter_reasoning_effort,
+                critique_submitter_lm_studio_fallback=request.critique_submitter_lm_studio_fallback,
+                validator_supercharge_enabled=request.validator_supercharge_enabled,
+                high_context_supercharge_enabled=request.high_context_supercharge_enabled,
+                high_param_supercharge_enabled=request.high_param_supercharge_enabled,
+                critique_submitter_supercharge_enabled=request.critique_submitter_supercharge_enabled
+            )
+
+            # Start coordinator
+            token_tracker.reset()
+            token_tracker.start_timer()
+            await compiler_coordinator.start()
+
+            return {"status": "started", "message": "Compiler started successfully"}
     
+    except HTTPException:
+        raise
     except ValueError as e:
         # Model compatibility errors - provide structured error response
         error_msg = str(e)
@@ -336,13 +440,47 @@ async def save_paper():
         
         async with aiofiles.open(output_path, 'w', encoding='utf-8') as f:
             await f.write(full_content)
+
+        high_context = compiler_coordinator.high_context_submitter
+        proof_check_scheduled = bool(
+            system_config.lean4_enabled
+            and full_content.strip()
+            and high_context is not None
+            and getattr(high_context, "model_name", "")
+            and compiler_coordinator.validator_model
+        )
+        if proof_check_scheduled:
+            source_title = compiler_coordinator.paper_title or compiler_coordinator.user_prompt or "Compiler Paper"
+            proof_config = {
+                "lean4_enabled": system_config.lean4_enabled,
+                "user_prompt": compiler_coordinator.user_prompt,
+                "submitter_model": high_context.model_name,
+                "submitter_provider": compiler_coordinator.high_context_provider,
+                "submitter_openrouter_provider": compiler_coordinator.high_context_openrouter_provider,
+                "submitter_openrouter_reasoning_effort": compiler_coordinator.high_context_openrouter_reasoning_effort,
+                "submitter_lm_studio_fallback": compiler_coordinator.high_context_lm_studio_fallback,
+                "submitter_context": system_config.compiler_high_context_context_window,
+                "submitter_max_tokens": system_config.compiler_high_context_max_output_tokens,
+                "submitter_supercharge_enabled": getattr(compiler_coordinator, "high_context_supercharge_enabled", False),
+                "validator_model": compiler_coordinator.validator_model,
+                "validator_provider": compiler_coordinator.validator_provider,
+                "validator_openrouter_provider": compiler_coordinator.validator_openrouter_provider,
+                "validator_openrouter_reasoning_effort": compiler_coordinator.validator_openrouter_reasoning_effort,
+                "validator_lm_studio_fallback": compiler_coordinator.validator_lm_studio_fallback,
+                "validator_context": compiler_coordinator.validator_context_window,
+                "validator_max_tokens": compiler_coordinator.validator_max_tokens,
+                "validator_supercharge_enabled": getattr(compiler_coordinator, "validator_supercharge_enabled", False),
+            }
+            task = asyncio.create_task(_run_saved_compiler_paper_proof_check(full_content, source_title, proof_config))
+            task.add_done_callback(_log_background_task_failure)
         
         return {
             "status": "saved",
-            "path": str(output_path),
+            "path": output_path.name,
             "word_count": word_count,
-            "message": f"Paper saved to {output_path} ({word_count} words)",
-            "has_attribution": bool(attribution_section)
+            "message": f"Paper saved to {output_path.name} ({word_count} words)",
+            "has_attribution": bool(attribution_section),
+            "proof_check_scheduled": proof_check_scheduled
         }
     except Exception as e:
         logger.error(f"Failed to save paper: {e}")
@@ -441,7 +579,7 @@ async def get_critique_status():
             "in_critique_phase": compiler_coordinator.in_critique_phase,
             "critique_acceptances": compiler_coordinator.critique_acceptances,
             "paper_version": compiler_coordinator.paper_version,
-            "target_critiques": 5
+            "target_critiques": CRITIQUE_ATTEMPT_TARGET
         }
     except Exception as e:
         logger.error(f"Failed to get critique status: {e}")
@@ -512,6 +650,8 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
         validator_max_tokens = critique_request.validator_max_tokens
         validator_provider = critique_request.validator_provider
         validator_openrouter_provider = critique_request.validator_openrouter_provider
+        validator_openrouter_reasoning_effort = critique_request.validator_openrouter_reasoning_effort
+        validator_supercharge_enabled = bool(critique_request.validator_supercharge_enabled)
         
         # If validator config not provided in request, fall back to coordinator config
         if not validator_model:
@@ -520,6 +660,8 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
             validator_max_tokens = system_config.compiler_validator_max_output_tokens
             validator_provider = getattr(compiler_coordinator, 'validator_provider', 'lm_studio')
             validator_openrouter_provider = getattr(compiler_coordinator, 'validator_openrouter_provider', None)
+            validator_openrouter_reasoning_effort = getattr(compiler_coordinator, 'validator_openrouter_reasoning_effort', 'auto')
+            validator_supercharge_enabled = bool(getattr(compiler_coordinator, 'validator_supercharge_enabled', False))
         
         if not validator_model:
             raise HTTPException(
@@ -576,9 +718,11 @@ async def request_compiler_critique(critique_request: CritiqueRequest = None):
                 model_id=validator_model,
                 openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
                 openrouter_provider=validator_openrouter_provider,
+                openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=None,  # No fallback for direct critique calls
                 context_window=validator_context_window,
-                max_output_tokens=validator_max_tokens
+                max_output_tokens=validator_max_tokens,
+                supercharge_enabled=validator_supercharge_enabled
             )
         )
         
diff --git a/backend/api/routes/download.py b/backend/api/routes/download.py
index 07cdf7f..dfe44dc 100644
--- a/backend/api/routes/download.py
+++ b/backend/api/routes/download.py
@@ -3,6 +3,8 @@
 Runs in a thread pool so the FastAPI event loop is never blocked.
 """
 import asyncio
+from html import escape
+from html.parser import HTMLParser
 import logging
 from pathlib import Path
 from fastapi import APIRouter, HTTPException
@@ -46,6 +48,140 @@ class PDFRequest(BaseModel):
     filename: str = "document"
 
 
+_ALLOWED_PDF_TAGS = {  # lowercase tag names the PDF sanitizer re-emits (layout, MathML, basic SVG); all other tags are stripped
+    "div", "span", "p", "br", "hr",
+    "strong", "b", "em", "i", "u", "s", "sub", "sup", "small",
+    "h1", "h2", "h3", "h4", "h5", "h6",
+    "ul", "ol", "li", "dl", "dt", "dd",
+    "table", "thead", "tbody", "tr", "th", "td",
+    "math", "semantics", "mrow", "mi", "mo", "mn", "msup", "msub",
+    "mfrac", "mroot", "msqrt", "mtext", "mspace", "mtable", "mtr", "mtd",
+    "annotation", "annotation-xml",
+    "svg", "path", "line", "rect", "circle", "g", "use", "defs", "clippath",
+}
+_VOID_PDF_TAGS = {"br", "hr", "path", "line", "rect", "circle", "use"}  # tags for which the sanitizer never emits an end tag
+_DROP_CONTENT_TAGS = {"script", "style", "iframe", "object", "embed", "form", "textarea", "select"}  # tags whose enclosed text is discarded too
+_ALLOWED_PDF_ATTRS = {  # lowercase attribute names kept on emitted tags (values are still checked for style/href)
+    "class", "id", "title", "style",
+    "mathvariant", "encoding", "xmlns", "displaystyle", "scriptlevel",
+    "columnalign", "rowalign", "columnspacing", "rowspacing", "stretchy",
+    "symmetric", "fence", "separator", "lspace", "rspace", "accent",
+    "accentunder", "movablelimits", "minsize", "maxsize", "width", "height",
+    "d", "viewbox", "preserveaspectratio", "fill", "stroke", "stroke-width",
+    "transform", "x", "y", "dx", "dy", "x1", "y1", "x2", "y2", "r", "cx", "cy",
+    "href", "xlink:href", "clip-path",
+}
+_FORBIDDEN_STYLE_TOKENS = ("url(", "expression", "@import", "behavior:")  # a style attribute containing any of these (case-insensitive) is dropped
+
+
+class _PdfHtmlSanitizer(HTMLParser):
+    """Allowlist sanitizer for already-rendered LaTeX/KaTeX HTML: unknown tags/attributes are dropped, text is escaped."""
+
+    def __init__(self) -> None:
+        super().__init__(convert_charrefs=True)  # character references arrive decoded through handle_data
+        self._parts: list[str] = []  # sanitized output fragments, joined by get_html()
+        self._drop_content_depth = 0  # > 0 while inside a _DROP_CONTENT_TAGS element
+
+    @staticmethod
+    def _is_safe_attr(name: str, value: str) -> bool:
+        attr = name.lower()
+        if attr not in _ALLOWED_PDF_ATTRS or attr.startswith("on"):
+            return False
+        lowered_value = (value or "").strip().lower()
+        if attr == "style":
+            return not any(token in lowered_value for token in _FORBIDDEN_STYLE_TOKENS)
+        if attr in {"href", "xlink:href"}:  # only same-document fragments and inline images
+            return lowered_value.startswith("#") or lowered_value.startswith("data:image/")
+        return True
+
+    def _append_start_tag(self, tag: str, attrs, *, self_closing: bool = False) -> None:
+        """Emit ``tag`` with its safe attributes, or begin dropping text for a drop-content tag."""
+        normalized_tag = tag.lower()
+        if normalized_tag not in _ALLOWED_PDF_TAGS:
+            if normalized_tag in _DROP_CONTENT_TAGS and not self_closing:
+                self._drop_content_depth += 1
+            return
+
+        rendered_attrs = []
+        for name, value in attrs:
+            attr_name = (name or "").lower()
+            attr_value = "" if value is None else str(value)
+            if self._is_safe_attr(attr_name, attr_value):
+                rendered_attrs.append(f'{attr_name}="{escape(attr_value, quote=True)}"')
+
+        # End tags of void tags are never re-emitted, so they must be closed here:
+        # an unclosed <path>/<rect>/... inside <svg> would swallow its later siblings.
+        suffix = " /" if self_closing or normalized_tag in _VOID_PDF_TAGS else ""
+        attr_text = f" {' '.join(rendered_attrs)}" if rendered_attrs else ""
+        self._parts.append(f"<{normalized_tag}{attr_text}{suffix}>")
+
+    def handle_starttag(self, tag, attrs) -> None:
+        self._append_start_tag(tag, attrs)
+
+    def handle_startendtag(self, tag, attrs) -> None:
+        self._append_start_tag(tag, attrs, self_closing=True)
+
+    def handle_endtag(self, tag) -> None:
+        normalized_tag = tag.lower()
+        if normalized_tag in _DROP_CONTENT_TAGS and self._drop_content_depth > 0:
+            self._drop_content_depth -= 1
+            return
+        if normalized_tag in _ALLOWED_PDF_TAGS and normalized_tag not in _VOID_PDF_TAGS:
+            self._parts.append(f"</{normalized_tag}>")
+
+    def handle_data(self, data) -> None:
+        if self._drop_content_depth == 0:  # text inside dropped elements is discarded
+            self._parts.append(escape(data or ""))
+
+    def handle_entityref(self, name) -> None:
+        if self._drop_content_depth == 0:  # only reached if convert_charrefs is turned off
+            self._parts.append(f"&{name};")
+
+    def handle_charref(self, name) -> None:
+        if self._drop_content_depth == 0:  # only reached if convert_charrefs is turned off
+            self._parts.append(f"&#{name};")
+
+    def get_html(self) -> str:
+        return "".join(self._parts)
+
+
+def _sanitize_pdf_html(html_body: str) -> str:  # returns the allowlist-filtered HTML; None/empty input yields ""
+    sanitizer = _PdfHtmlSanitizer()
+    sanitizer.feed(html_body or "")
+    sanitizer.close()  # make the parser process anything it is still buffering
+    return sanitizer.get_html()
+
+
+def _encoded_size(value: Optional[str]) -> int:
+    return len((value or "").encode("utf-8"))  # size in UTF-8 bytes, not characters; None counts as 0
+
+
+def _validate_pdf_request_size(req: PDFRequest) -> None:  # raises HTTPException(413) for the first part found over its configured byte limit
+    html_size = _encoded_size(req.html_body)
+    if html_size > system_config.pdf_max_html_bytes:
+        raise HTTPException(
+            status_code=413,
+            detail=f"html_body exceeds PDF limit of {system_config.pdf_max_html_bytes} bytes",
+        )
+
+    outline_size = _encoded_size(req.outline)
+    if outline_size > system_config.pdf_max_outline_bytes:
+        raise HTTPException(
+            status_code=413,
+            detail=f"outline exceeds PDF limit of {system_config.pdf_max_outline_bytes} bytes",
+        )
+
+    metadata_size = sum(  # title, date, models and filename are measured together against one limit
+        _encoded_size(value)
+        for value in (req.title, req.date, req.models, req.filename)
+    )
+    if metadata_size > system_config.pdf_max_metadata_bytes:
+        raise HTTPException(
+            status_code=413,
+            detail=f"PDF metadata exceeds limit of {system_config.pdf_max_metadata_bytes} bytes",
+        )
+
+
 def _build_html_document(req: PDFRequest) -> str:
     """
     Wrap the rendered HTML body in a complete standalone HTML document
@@ -56,9 +192,9 @@ def _build_html_document(req: PDFRequest) -> str:
     if req.word_count:
         meta_parts.append(f"Word Count: {req.word_count:,}")
     if req.date:
-        meta_parts.append(f"Generated: {req.date}")
+        meta_parts.append(f"Generated: {_escape_html(req.date)}")
     if req.models:
-        meta_parts.append(f"AI Models: {req.models}")
+        meta_parts.append(f"AI Models: {_escape_html(req.models)}")
     meta_line = " &nbsp;|&nbsp; ".join(meta_parts) if meta_parts else ""
 
     outline_section = ""
@@ -293,10 +429,18 @@ def _generate_pdf_sync(html: str) -> bytes:
     with sync_playwright() as pw:
         browser = pw.chromium.launch(
             headless=True,
-            args=["--no-sandbox", "--disable-setuid-sandbox", "--disable-dev-shm-usage"]
+            args=["--disable-dev-shm-usage"]
         )
+        context = None
         try:
-            page = browser.new_page()
+            context = browser.new_context(java_script_enabled=False)
+            page = context.new_page()
+            page.route(
+                "**/*",
+                lambda route: route.continue_()
+                if route.request.url.startswith(("data:", "blob:", "about:"))
+                else route.abort(),
+            )
             page.set_content(html, wait_until="load", timeout=60000)
             pdf_bytes = page.pdf(
                 format="A4",
@@ -305,6 +449,11 @@ def _generate_pdf_sync(html: str) -> bytes:
             )
             return pdf_bytes
         finally:
+            if context is not None:
+                try:
+                    context.close()
+                except Exception:
+                    pass
             browser.close()
 
 
@@ -329,7 +478,10 @@ async def generate_pdf(req: PDFRequest):
         raise HTTPException(status_code=400, detail="html_body is required and cannot be empty")
 
     try:
-        html_document = _build_html_document(req)
+        _validate_pdf_request_size(req)
+        sanitized_body = _sanitize_pdf_html(req.html_body)
+        sanitized_request = req.model_copy(update={"html_body": sanitized_body})
+        html_document = _build_html_document(sanitized_request)
 
         loop = asyncio.get_running_loop()
         pdf_bytes = await loop.run_in_executor(None, _generate_pdf_sync, html_document)
diff --git a/backend/api/routes/leanoj.py b/backend/api/routes/leanoj.py
new file mode 100644
index 0000000..851d88c
--- /dev/null
+++ b/backend/api/routes/leanoj.py
@@ -0,0 +1,392 @@
+"""Proof Solver API routes backed by the LeanOJ workflow."""
+from __future__ import annotations
+
+import json
+import logging
+from pathlib import Path
+from typing import Any, Optional
+
+from fastapi import APIRouter, HTTPException
+
+from backend.aggregator.core.coordinator import coordinator
+from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
+from backend.compiler.core.compiler_coordinator import compiler_coordinator
+from backend.leanoj.core.leanoj_coordinator import leanoj_coordinator
+from backend.shared.config import system_config
+from backend.shared.models import LeanOJStartRequest
+from backend.shared.workflow_start_guard import workflow_start_guard
+
+logger = logging.getLogger(__name__)
+
+router = APIRouter(prefix="/api/leanoj", tags=["leanoj"])
+
+
+def _leanoj_sessions_base_dir() -> Path:  # Directory that is scanned for saved Proof Solver session folders.
+    return Path(system_config.data_dir) / "leanoj_sessions"  # Resolves to <data_dir>/leanoj_sessions.
+
+
+def _read_leanoj_state_file(path: Path) -> dict[str, Any] | None:  # Load one state file; None when unreadable or not a JSON object.
+    try:
+        payload = json.loads(path.read_text(encoding="utf-8"))
+    except Exception as exc:  # Best-effort: any read or parse failure is logged and the file is skipped.
+        logger.warning("Failed to read LeanOJ state file %s: %s", path, exc)
+        return None
+
+    if not isinstance(payload, dict):  # Valid JSON that is not an object is rejected silently.
+        return None
+    payload.setdefault("session_id", path.parent.name)  # Fall back to the containing folder name as the session id.
+    return payload
+
+
+def _iter_leanoj_state_payloads() -> list[dict[str, Any]]:  # Collect every readable <session>/state.json payload.
+    base_dir = _leanoj_sessions_base_dir()
+    if not base_dir.exists():  # No sessions directory means there is nothing to list.
+        return []
+
+    payloads: list[dict[str, Any]] = []
+    for state_file in base_dir.glob("*/state.json"):  # Matches state.json exactly one directory below base_dir.
+        if not state_file.is_file():
+            continue
+        payload = _read_leanoj_state_file(state_file)
+        if payload is not None:  # Unreadable or non-object files were already skipped by the reader.
+            payload["_state_file_mtime"] = state_file.stat().st_mtime  # NOTE(review): no reader of this key is visible in this module.
+            payloads.append(payload)
+
+    return payloads
+
+
+def _leanoj_request_payload(payload: dict[str, Any]) -> dict[str, Any]:  # The payload's "request" mapping, or {} when absent.
+    request_payload = payload.get("request")
+    return request_payload if isinstance(request_payload, dict) else {}  # Any non-dict value is treated as missing.
+
+
+def _leanoj_prompt(payload: dict[str, Any]) -> str:  # Display prompt for a session, never empty.
+    request_payload = _leanoj_request_payload(payload)
+    return (
+        str(request_payload.get("user_prompt") or "").strip()  # First choice: the prompt stored in the request.
+        or str(payload.get("selected_topic") or "").strip()  # Second choice: the session's selected topic.
+        or "Proof Solver problem"  # Last resort: a fixed placeholder label.
+    )
+
+
+def _leanoj_created_at(payload: dict[str, Any], fallback: str = "") -> str:  # Timestamp string used for display and sorting.
+    return (
+        str(payload.get("updated_at") or "").strip()  # Despite the function name, the value read is "updated_at".
+        or fallback  # Caller-supplied value used when the payload has no usable timestamp.
+        or ""  # Always return a string, even when the fallback is falsy.
+    )
+
+
+def _leanoj_library_id(session_id: str, proof_id: str) -> str:  # Compose the library key for one proof of one session.
+    return f"{session_id}:{proof_id}"  # Format is "<session_id>:<proof_id>".
+
+
+def _build_leanoj_final_proof(payload: dict[str, Any]) -> dict[str, Any] | None:  # Library record for the final solution, or None.
+    final_solution = str(payload.get("final_solution") or "").strip()
+    if not final_solution:  # A missing or blank final_solution means there is no final proof to list.
+        return None
+
+    session_id = str(payload.get("session_id") or "latest")  # "latest" stands in when the payload carries no id.
+    prompt = _leanoj_prompt(payload)
+    request_payload = _leanoj_request_payload(payload)
+    proof_id = "final_solution"  # Fixed id, so a session exposes at most one final proof.
+    shared_proof_id = str(payload.get("final_proof_id") or "").strip()
+    return {
+        "library_id": _leanoj_library_id(session_id, proof_id),
+        "proof_id": proof_id,
+        "shared_proof_id": shared_proof_id,
+        "session_id": session_id,
+        "proof_kind": "final",  # Counted as "final" by the session summary and /proofs counts.
+        "theorem_name": "Final Proof Solver Submission",
+        "theorem_statement": prompt,
+        "source_type": "leanoj_final",
+        "source_id": session_id,
+        "source_title": str(payload.get("selected_topic") or "").strip() or prompt,  # Topic first, prompt as fallback.
+        "user_prompt": prompt,
+        "lean_template": str(request_payload.get("lean_template") or ""),
+        "lean_code": final_solution,
+        "solver": "Proof Solver",
+        "attempt_count": int(payload.get("final_attempt_count") or 0),
+        "verified": True,  # Hard-coded. NOTE(review): presumably final_solution is only stored once verified - confirm.
+        "novel": bool(payload.get("final_novel")),
+        "novelty_tier": str(payload.get("final_novelty_tier") or "not_novel"),
+        "novelty_reasoning": str(payload.get("final_novelty_reasoning") or ""),
+        "created_at": _leanoj_created_at(payload),
+        "phase": str(payload.get("phase") or ""),
+    }
+
+
+def _build_leanoj_subproofs(payload: dict[str, Any]) -> list[dict[str, Any]]:  # Library records for a session's verified subproofs.
+    session_id = str(payload.get("session_id") or "latest")
+    prompt = _leanoj_prompt(payload)
+    request_payload = _leanoj_request_payload(payload)
+    created_at_fallback = _leanoj_created_at(payload)  # Session timestamp used when a subproof has none of its own.
+    subproofs = payload.get("verified_subproofs") or []
+    if not isinstance(subproofs, list):  # A malformed (non-list) value yields no subproofs.
+        return []
+
+    proofs: list[dict[str, Any]] = []
+    for index, subproof in enumerate(subproofs, start=1):  # index follows the original list position, skipped entries included.
+        if not isinstance(subproof, dict) or subproof.get("verified") is False:  # Only an explicit False excludes; a missing key passes.
+            continue
+        lean_code = str(subproof.get("lean_code") or "").strip()
+        if not lean_code:  # Entries without Lean source are not listed.
+            continue
+
+        proof_id = str(subproof.get("subproof_id") or f"subproof_{index:03d}")  # Positional id when none is stored.
+        shared_proof_id = str(subproof.get("proof_id") or "").strip()
+        request_text = str(subproof.get("request") or "").strip()
+        theorem_or_lemma = str(subproof.get("theorem_or_lemma") or "").strip()
+        return_title = theorem_or_lemma or request_text or proof_id  # Most specific available label wins.
+        proofs.append(
+            {
+                "library_id": _leanoj_library_id(session_id, proof_id),
+                "proof_id": proof_id,
+                "shared_proof_id": shared_proof_id,
+                "session_id": session_id,
+                "proof_kind": "subproof",  # Counted as "subproof" by the session summary and /proofs counts.
+                "theorem_name": return_title,
+                "theorem_statement": theorem_or_lemma or request_text or "Verified Proof Solver subproof",
+                "source_type": "leanoj_subproof",
+                "source_id": session_id,
+                "source_title": request_text or prompt,
+                "user_prompt": prompt,
+                "lean_template": str(request_payload.get("lean_template") or ""),
+                "lean_code": lean_code,
+                "lean_feedback": str(subproof.get("lean_feedback") or ""),
+                "verification_notes": str(subproof.get("lean_feedback") or ""),  # Same source field as "lean_feedback".
+                "solver": "Proof Solver",
+                "attempt_count": int(subproof.get("attempts_used") or 0),
+                "verified": True,  # Entries explicitly marked unverified were skipped above.
+                "novel": bool(subproof.get("novel")),
+                "novelty_tier": str(subproof.get("novelty_tier") or "not_novel"),
+                "novelty_reasoning": str(subproof.get("novelty_reasoning") or ""),
+                "role": str(subproof.get("role") or ""),
+                "created_at": str(subproof.get("created_at") or "") or created_at_fallback,
+                "phase": str(payload.get("phase") or ""),  # Phase of the whole session, not of the subproof.
+            }
+        )
+    return proofs
+
+
+def _extract_leanoj_proofs(payload: dict[str, Any], *, include_subproofs: bool = True) -> list[dict[str, Any]]:  # All proof records of one session.
+    proofs: list[dict[str, Any]] = []
+    final_proof = _build_leanoj_final_proof(payload)
+    if final_proof is not None:  # The final proof, when present, is listed first.
+        proofs.append(final_proof)
+    if include_subproofs:  # Subproofs are optional so callers can request final proofs only.
+        proofs.extend(_build_leanoj_subproofs(payload))
+    return proofs
+
+
+def _build_leanoj_session_summary(payload: dict[str, Any], proofs: list[dict[str, Any]]) -> dict[str, Any]:  # Per-session row for the library.
+    session_id = str(payload.get("session_id") or "latest")
+    prompt = _leanoj_prompt(payload)
+    final_count = sum(1 for proof in proofs if proof.get("proof_kind") == "final")
+    subproof_count = sum(1 for proof in proofs if proof.get("proof_kind") == "subproof")
+    return {
+        "session_id": session_id,
+        "user_prompt": prompt,
+        "selected_topic": str(payload.get("selected_topic") or ""),
+        "created_at": _leanoj_created_at(payload),  # Same value as "updated_at": both come from the payload's updated_at.
+        "updated_at": _leanoj_created_at(payload),
+        "phase": str(payload.get("phase") or ""),
+        "proof_count": len(proofs),  # Counts exactly the proofs passed in by the caller.
+        "final_count": final_count,
+        "subproof_count": subproof_count,
+        "is_current": session_id == leanoj_coordinator.get_state().session_id,  # True for the session the coordinator holds now.
+    }
+
+
+def _sort_leanoj_proofs(proofs: list[dict[str, Any]]) -> list[dict[str, Any]]:  # New list ordered newest-first; input is not mutated.
+    return sorted(
+        proofs,
+        key=lambda proof: str(proof.get("created_at") or ""),  # Plain string comparison; NOTE(review): assumes sortable timestamps.
+        reverse=True,  # Largest created_at string first.
+    )
+
+
+def _get_start_conflict() -> Optional[str]:  # Reason a new run must be refused, or None when starting is allowed.
+    if leanoj_coordinator.is_active:  # Checked first so a duplicate start gets the most specific message.
+        return "Proof Solver is already running"
+    if coordinator.is_running:  # "coordinator" is the Aggregator coordinator imported at module top.
+        return "Cannot start Proof Solver while Aggregator is running. Stop Aggregator first."
+    if compiler_coordinator.is_running:
+        return "Cannot start Proof Solver while Compiler is running. Stop Compiler first."
+    autonomous_state = autonomous_coordinator.get_state()
+    if autonomous_state.is_running or autonomous_coordinator.is_active:  # Either flag counts as a running autonomous workflow.
+        return "Cannot start Proof Solver while Autonomous Research is running. Stop Autonomous Research first."
+    return None
+
+
+@router.post("/start")
+async def start_leanoj(request: LeanOJStartRequest):
+    """Start a Proof Solver run."""
+    try:
+        async with workflow_start_guard.reserve():  # Conflict check and launch both happen while the start guard is held.
+            conflict = _get_start_conflict()
+            if conflict:
+                raise HTTPException(status_code=400, detail=conflict)
+            if not system_config.lean4_enabled:
+                raise HTTPException(status_code=400, detail="Lean 4 is disabled. Enable Lean 4 proof verification before starting Proof Solver.")
+            resumed = await leanoj_coordinator.resume_or_initialize(request)  # Truthy result selects the "resumed" message.
+            if not leanoj_coordinator.start_in_background():  # A falsy result is reported as "already running".
+                raise HTTPException(status_code=400, detail="Proof Solver is already running")
+            return {
+                "success": True,
+                "message": "Proof Solver resumed" if resumed else "Proof Solver started",
+                "resumed": resumed,
+                "session_id": leanoj_coordinator.get_state().session_id,
+            }
+    except HTTPException:  # Deliberate 4xx responses raised above pass through unchanged.
+        raise
+    except ValueError as exc:  # ValueError from the block above is reported to the client as a 400.
+        raise HTTPException(status_code=400, detail=str(exc)) from exc  # Chain so the original error stays on __cause__.
+    except Exception as exc:
+        logger.exception("Failed to start Proof Solver")
+        raise HTTPException(status_code=500, detail=str(exc)) from exc  # Chain the unexpected failure explicitly.
+
+
+@router.post("/stop")
+async def stop_leanoj():
+    """Stop the active Proof Solver run."""
+    try:
+        await leanoj_coordinator.stop()  # No is_active check here: stop() is called unconditionally.
+        return {
+            "success": True,
+            "message": "Proof Solver stopped",
+            "status": leanoj_coordinator.get_status(),  # Status is read after the stop call returns.
+        }
+    except Exception as exc:
+        logger.exception("Failed to stop Proof Solver")
+        raise HTTPException(status_code=500, detail=str(exc)) from exc  # Chain so the original error stays on __cause__.
+
+
+@router.post("/clear")
+async def clear_leanoj(confirm: bool = False):
+    """Clear saved Proof Solver progress."""
+    if not confirm:  # Destructive action: refuse unless the caller opts in explicitly.
+        raise HTTPException(status_code=400, detail="Confirmation required. Use ?confirm=true to clear Proof Solver progress.")
+    try:
+        await leanoj_coordinator.clear()
+        return {
+            "success": True,
+            "message": "Proof Solver progress cleared",
+            "status": leanoj_coordinator.get_status(),  # Status is read after the clear call returns.
+        }
+    except Exception as exc:
+        logger.exception("Failed to clear Proof Solver progress")
+        raise HTTPException(status_code=500, detail=str(exc)) from exc  # Chain so the original error stays on __cause__.
+
+
+@router.get("/status")
+async def get_leanoj_status():
+    """Return the current Proof Solver state."""
+    return leanoj_coordinator.get_status()  # Returned as-is; no filtering is applied in this route.
+
+
+@router.get("/master-proof")
+async def get_leanoj_master_proof():
+    """Return the current Proof Solver master proof draft on demand."""
+    return await leanoj_coordinator.get_master_proof_draft()  # Coordinator result is returned unchanged.
+
+
+@router.get("/master-proof/edits")
+async def get_leanoj_master_proof_edits(limit: int = 50):
+    """Return compact summaries of recent Proof Solver master proof edits."""
+    return await leanoj_coordinator.get_master_proof_edit_summaries(limit=limit)  # limit is forwarded as-is; no bounds are enforced here.
+
+
+@router.get("/proofs")
+async def get_leanoj_proofs():
+    """Return verified proofs from the currently loaded LeanOJ run."""
+    status = leanoj_coordinator.get_status()  # Live coordinator status only; saved sessions on disk are not read.
+    proofs = _extract_leanoj_proofs(status)
+    return {
+        "proofs": _sort_leanoj_proofs(proofs),  # Newest first by created_at string.
+        "status": status,  # The full status payload is echoed back alongside the proofs.
+        "counts": {
+            "total": len(proofs),
+            "final": sum(1 for proof in proofs if proof.get("proof_kind") == "final"),
+            "subproof": sum(1 for proof in proofs if proof.get("proof_kind") == "subproof"),
+        },
+    }
+
+
+@router.get("/library")
+async def get_leanoj_library(include_subproofs: bool = True):
+    """Return completed Proof Solver proof works across saved sessions."""
+    payloads_by_session: dict[str, dict[str, Any]] = {  # On-disk payloads keyed by session id; later duplicates overwrite earlier ones.
+        str(payload.get("session_id") or ""): payload
+        for payload in _iter_leanoj_state_payloads()
+        if payload.get("session_id")
+    }
+
+    current_status = leanoj_coordinator.get_status()
+    current_session_id = str(current_status.get("session_id") or "")
+    if current_session_id:  # The live status replaces the on-disk payload of the same session.
+        payloads_by_session[current_session_id] = current_status
+
+    proofs: list[dict[str, Any]] = []
+    sessions: list[dict[str, Any]] = []
+    for payload in payloads_by_session.values():
+        session_proofs = _extract_leanoj_proofs(payload, include_subproofs=include_subproofs)
+        if not session_proofs:  # Sessions without any listed proof are left out of both result lists.
+            continue
+        proofs.extend(session_proofs)
+        sessions.append(_build_leanoj_session_summary(payload, session_proofs))
+
+    return {
+        "proofs": _sort_leanoj_proofs(proofs),  # Newest first by created_at string.
+        "sessions": sorted(
+            sessions,
+            key=lambda session: str(session.get("updated_at") or ""),  # Plain string comparison of the timestamp.
+            reverse=True,
+        ),
+    }
+
+
+@router.get("/library/{session_id}/{proof_id}")
+async def get_leanoj_library_proof(session_id: str, proof_id: str):
+    """Return one completed Proof Solver proof work with full Lean source."""
+    current_status = leanoj_coordinator.get_status()
+    if str(current_status.get("session_id") or "") == session_id:  # Prefer the live session over its saved copy.
+        for proof in _extract_leanoj_proofs(current_status):
+            if proof.get("proof_id") == proof_id:
+                return proof
+
+    for payload in _iter_leanoj_state_payloads():  # session_id is only compared, never used to build a file path.
+        if str(payload.get("session_id") or "") != session_id:
+            continue
+        for proof in _extract_leanoj_proofs(payload):
+            if proof.get("proof_id") == proof_id:
+                return proof
+        break  # Only the first saved payload with a matching session id is searched.
+
+    raise HTTPException(status_code=404, detail="Proof Solver proof work not found")
+
+
+@router.post("/skip-brainstorm")
+async def skip_leanoj_brainstorm():
+    """Request immediate exit from Proof Solver brainstorming into final proof solving."""
+    if not leanoj_coordinator.is_active:  # Only meaningful while a run is active; otherwise respond 400.
+        raise HTTPException(status_code=400, detail="Proof Solver is not running")
+    await leanoj_coordinator.skip_brainstorm()
+    return {
+        "success": True,
+        "message": "Proof Solver brainstorming will be skipped and final proof solving will start",
+        "status": leanoj_coordinator.get_status(),  # Status is read after the skip request was issued.
+    }
+
+
+@router.post("/force-brainstorm")
+async def force_leanoj_brainstorm():
+    """Request a return to recursive Proof Solver brainstorming without clearing proof progress."""
+    if not leanoj_coordinator.is_active:  # Only meaningful while a run is active; otherwise respond 400.
+        raise HTTPException(status_code=400, detail="Proof Solver is not running")
+    await leanoj_coordinator.force_brainstorm()
+    return {
+        "success": True,
+        "message": "Proof Solver will return to recursive brainstorming with the current proof preserved",
+        "status": leanoj_coordinator.get_status(),  # Status is read after the force request was issued.
+    }
diff --git a/backend/api/routes/openrouter.py b/backend/api/routes/openrouter.py
index 5289f2c..8ae6294 100644
--- a/backend/api/routes/openrouter.py
+++ b/backend/api/routes/openrouter.py
@@ -10,7 +10,7 @@
 Note: Boost routes can reuse the active global key by default, while still allowing
 an explicit boost-only override key when the user provides one.
 """
-from fastapi import APIRouter, HTTPException, Header
+from fastapi import APIRouter, HTTPException, Header, Request
 from pydantic import BaseModel
 from typing import Dict, Any, Optional
 import logging
@@ -242,21 +242,27 @@ async def get_api_key_status() -> Dict[str, Any]:
 
 
 @router.get("/api/openrouter/models")
-async def get_models(api_key: Optional[str] = None, free_only: bool = False) -> Dict[str, Any]:
+async def get_models(request: Request, free_only: bool = False, authorization: Optional[str] = Header(None)) -> Dict[str, Any]:
     """
     Fetch available OpenRouter models.
     
-    If api_key is provided, uses that key. Otherwise uses the stored global key.
+    If Authorization is provided, uses that key. Otherwise uses the stored global key.
     
     Args:
-        api_key: Optional API key to use instead of stored key (query parameter)
         free_only: If True, only return models with $0 pricing (query parameter)
+        authorization: Optional API key via Authorization header (Bearer token)
         
     Returns:
         List of available models with their details
     """
     try:
-        # Use provided key or fall back to stored key
+        if "api_key" in request.query_params:
+            raise HTTPException(
+                status_code=400,
+                detail="OpenRouter API keys must be supplied via Authorization header, not URL query parameters.",
+            )
+
+        api_key = authorization.replace("Bearer ", "") if authorization and authorization.startswith("Bearer ") else authorization
         key_to_use = api_key or rag_config.openrouter_api_key
         
         if not key_to_use:
diff --git a/backend/api/routes/proofs.py b/backend/api/routes/proofs.py
index 9dff94b..f46333d 100644
--- a/backend/api/routes/proofs.py
+++ b/backend/api/routes/proofs.py
@@ -5,9 +5,10 @@
 
 import asyncio
 import logging
+from pathlib import Path
 from typing import Optional, Tuple
 
-from fastapi import APIRouter, BackgroundTasks, HTTPException
+from fastapi import APIRouter, BackgroundTasks, HTTPException, Query
 from fastapi.responses import JSONResponse, PlainTextResponse
 
 from backend.api.routes import websocket
@@ -39,19 +40,50 @@
 router = APIRouter(prefix="/api/proofs", tags=["proofs"])
 
 
+def _safe_path_label(path_value: str) -> str:
+    """Return a display-safe basename instead of an absolute local path."""
+    text = str(path_value or "").strip()
+    if not text:  # Unset or blank paths are reported as an empty label.
+        return ""
+    try:
+        return Path(text).name or "[configured]"  # An empty final component (e.g. a root path) yields the placeholder.
+    except Exception:  # Any failure while parsing the path also yields the placeholder.
+        return "[configured]"
+
+
 def _build_model_config(role: ProofRoleConfigSnapshot) -> ModelConfig:
     return ModelConfig(
         provider=role.provider,
         model_id=role.model_id,
         openrouter_model_id=role.model_id if role.provider == "openrouter" else None,
         openrouter_provider=role.openrouter_provider,
+        openrouter_reasoning_effort=role.openrouter_reasoning_effort,
         lm_studio_fallback_id=role.lm_studio_fallback_id,
         context_window=role.context_window,
         max_output_tokens=role.max_output_tokens,
+        supercharge_enabled=role.supercharge_enabled,
     )
 
 
-async def _get_runtime_snapshot() -> Optional[ProofRuntimeConfigSnapshot]:
+def _get_request_runtime_snapshot(request: Optional[ProofCheckRequest]) -> Optional[ProofRuntimeConfigSnapshot]:  # Snapshot from the request body, if any.
+    if not request or not request.proof_runtime_config:  # No request or no inline config: the caller falls back to other sources.
+        return None
+
+    try:
+        return ProofRuntimeConfigSnapshot(**request.proof_runtime_config)  # The config mapping is expanded into keyword arguments.
+    except Exception as exc:
+        logger.error("Manual proof runtime config from request is invalid: %s", exc)  # Details go to the log only.
+        raise HTTPException(
+            status_code=400,
+            detail="Manual proof runtime model configuration is invalid.",  # Generic message; the cause is not echoed to the client.
+        ) from exc
+
+
+async def _get_runtime_snapshot(request: Optional[ProofCheckRequest] = None) -> Optional[ProofRuntimeConfigSnapshot]:
+    request_snapshot = _get_request_runtime_snapshot(request)
+    if request_snapshot is not None:
+        return request_snapshot
+
     snapshot_dict = autonomous_coordinator.get_proof_runtime_config()
     if not snapshot_dict:
         snapshot_dict = await research_metadata.get_proof_runtime_config()
@@ -134,7 +166,7 @@ async def _resolve_manual_source(request: ProofCheckRequest) -> Tuple[str, str]:
 async def _run_manual_proof_check(request: ProofCheckRequest) -> None:
     try:
         source_content, source_title = await _resolve_manual_source(request)
-        snapshot = await _get_runtime_snapshot()
+        snapshot = await _get_runtime_snapshot(request)
         if snapshot is None:
             raise RuntimeError("No proof runtime model configuration is available yet.")
 
@@ -287,15 +319,38 @@ def _clean_content(content: str, proof_header: str) -> tuple[str, int]:
 
 
 @router.post("/cleanup-known-from-files")
-async def cleanup_known_proofs_from_files():
+async def cleanup_known_proofs_from_files(confirm: bool = Query(default=False)):
     """One-time cleanup: strip non-novel proof entries from brainstorm/paper files.
 
     Non-novel proofs are stored in ProofDatabase (no data loss).  This endpoint
     removes their raw Lean 4 code from brainstorm and paper .txt files so that
     compiler and RAG context is no longer polluted by standard known results.
 
-    Safe to call on a running session.  Novel proof entries are preserved.
+    Requires explicit confirmation because it mutates brainstorm/paper files.
+    Novel proof entries are preserved.
     """
+    if system_config.generic_mode:
+        raise HTTPException(
+            status_code=501,
+            detail={
+                "lean4_enabled": False,
+                "message": "Proof file cleanup is unavailable in hosted mode.",
+            },
+        )
+    if not system_config.lean4_enabled:
+        raise HTTPException(
+            status_code=501,
+            detail={
+                "lean4_enabled": False,
+                "message": "Proof file cleanup is unavailable while Lean 4 is disabled.",
+            },
+        )
+    if not confirm:
+        raise HTTPException(
+            status_code=400,
+            detail="Pass ?confirm=true to strip known proof entries from brainstorm and paper files.",
+        )
+
     result = await _strip_known_proofs_from_files()
     return result
 
@@ -335,8 +390,11 @@ async def get_proofs_status():
     return {
         "lean4_enabled": system_config.lean4_enabled,
         "lean4_lsp_enabled": system_config.lean4_lsp_enabled,
-        "lean4_path": system_config.lean4_path,
-        "lean4_workspace_dir": system_config.lean4_workspace_dir,
+        "lean4_path": _safe_path_label(system_config.lean4_path),
+        "lean4_path_configured": bool(system_config.lean4_path),
+        "lean4_workspace_dir": _safe_path_label(system_config.lean4_workspace_dir),
+        "lean4_workspace_configured": bool(system_config.lean4_workspace_dir),
+        "runtime_paths_redacted": True,
         "lean_version": version,
         "lean4_version": version,
         "lean4_proof_timeout": system_config.lean4_proof_timeout,
@@ -347,7 +405,8 @@ async def get_proofs_status():
         "mathlib_commit": mathlib_commit,
         "smt_enabled": system_config.smt_enabled,
         "smt_available": smt_available,
-        "z3_path": system_config.z3_path,
+        "z3_path": _safe_path_label(system_config.z3_path),
+        "z3_path_configured": bool(system_config.z3_path),
         "smt_timeout": system_config.smt_timeout,
         "z3_version": z3_version,
         "manual_check_ready": manual_check_ready,
@@ -371,7 +430,6 @@ async def update_proof_settings(request: ProofSettingsUpdateRequest):
     )
     previous_smt_settings = (
         system_config.smt_enabled,
-        system_config.z3_path,
         system_config.smt_timeout,
     )
 
@@ -383,8 +441,6 @@ async def update_proof_settings(request: ProofSettingsUpdateRequest):
         system_config.lean4_lsp_idle_timeout = int(request.lean4_lsp_idle_timeout)
     if request.smt_enabled is not None:
         system_config.smt_enabled = bool(request.smt_enabled)
-    if request.z3_path is not None:
-        system_config.z3_path = str(request.z3_path or "").strip()
     if request.smt_timeout is not None:
         system_config.smt_timeout = int(request.smt_timeout)
 
@@ -397,7 +453,6 @@ async def update_proof_settings(request: ProofSettingsUpdateRequest):
     )
     smt_settings_changed = previous_smt_settings != (
         system_config.smt_enabled,
-        system_config.z3_path,
         system_config.smt_timeout,
     )
 
@@ -421,7 +476,7 @@ async def run_manual_proof_check(request: ProofCheckRequest, background_tasks: B
     if not system_config.lean4_enabled:
         raise HTTPException(status_code=501, detail={"lean4_enabled": False, "message": "Lean 4 proof checks are disabled."})
 
-    snapshot = await _get_runtime_snapshot()
+    snapshot = await _get_runtime_snapshot(request)
     if snapshot is None:
         raise HTTPException(
             status_code=409,
@@ -431,7 +486,7 @@ async def run_manual_proof_check(request: ProofCheckRequest, background_tasks: B
     if not selected_role.model_id or not snapshot.validator.model_id:
         raise HTTPException(
             status_code=409,
-            detail="Proof runtime model configuration is incomplete. Start autonomous research again to refresh proof roles.",
+            detail="Proof runtime model configuration is incomplete. Select models for the proof role and validator, then try again.",
         )
 
     await _resolve_manual_source(request)
diff --git a/backend/api/routes/update.py b/backend/api/routes/update.py
index 1a23699..d6fc8bf 100644
--- a/backend/api/routes/update.py
+++ b/backend/api/routes/update.py
@@ -14,7 +14,9 @@
 from pathlib import Path
 from typing import Any, Dict, Tuple
 
-from fastapi import APIRouter
+from fastapi import APIRouter, HTTPException
+
+from backend.shared.config import system_config
 
 router = APIRouter(tags=["update"])
 logger = logging.getLogger(__name__)
@@ -30,7 +32,7 @@
 
 
 def _parse_semver(version_str: str) -> Tuple[int, ...]:
-    """Extract numeric version tuple from a semver string (e.g. '1.0.7' -> (1,0,7))."""
+    """Extract numeric version tuple from a semver string (e.g. '1.0.8' -> (1,0,8))."""
     parts = re.findall(r"\d+", version_str or "")
     return tuple(int(p) for p in parts) if parts else (0,)
 
@@ -215,6 +217,12 @@ async def _run_zip_update() -> None:
 @router.post("/api/update/pull")
 async def start_pull() -> Dict[str, Any]:
     """Kick off an update. Routes to git pull or ZIP overlay depending on install type."""
+    if system_config.generic_mode:
+        raise HTTPException(
+            status_code=501,
+            detail="Self-update is unavailable in hosted generic mode.",
+        )
+
     if _pull_state["status"] == "running":
         return {"started": False, "reason": "An update is already in progress."}
 
diff --git a/backend/api/routes/websocket.py b/backend/api/routes/websocket.py
index 02608e4..3ccce5a 100644
--- a/backend/api/routes/websocket.py
+++ b/backend/api/routes/websocket.py
@@ -1,12 +1,14 @@
 """
 WebSocket route for real-time updates.
 """
-from fastapi import APIRouter, WebSocket, WebSocketDisconnect, status
+from fastapi import APIRouter, HTTPException, WebSocket, WebSocketDisconnect, status
 from typing import List, Dict
 from datetime import datetime
 import asyncio
 import logging
 import json
+import secrets
+import time
 
 from backend.api.proxy_auth import ProxyAuthError, validate_proxy_headers
 from backend.shared.config import system_config
@@ -57,6 +59,34 @@ async def broadcast(self, event_type: str, data: Dict):
 
 # Global connection manager
 manager = ConnectionManager()
+_DESKTOP_WS_TICKET_TTL_SECONDS = 30
+_desktop_ws_tickets: Dict[str, float] = {}
+
+
+def _prune_expired_desktop_tickets(now: float) -> None:  # Drop every ticket whose expiry time is at or before "now".
+    expired = [  # Collected into a list first so the dict is not mutated while it is being iterated.
+        ticket
+        for ticket, expires_at in _desktop_ws_tickets.items()
+        if expires_at <= now
+    ]
+    for ticket in expired:
+        _desktop_ws_tickets.pop(ticket, None)  # The default avoids KeyError if the ticket is already gone.
+
+
+@router.post("/api/ws-ticket")
+async def create_desktop_websocket_ticket():
+    """Create a one-time desktop WebSocket ticket via token-authenticated HTTP."""
+    if system_config.generic_mode:  # Generic mode does not issue tickets; the route answers 501 instead.
+        raise HTTPException(
+            status_code=501,
+            detail="Desktop WebSocket tickets are not used in generic mode.",
+        )
+
+    now = time.time()
+    _prune_expired_desktop_tickets(now)  # Expired tickets are removed on every issuance.
+    ticket = secrets.token_urlsafe(32)  # Random URL-safe token generated from 32 random bytes.
+    _desktop_ws_tickets[ticket] = now + _DESKTOP_WS_TICKET_TTL_SECONDS  # Stored value is the absolute expiry time.
+    return {"ticket": ticket, "expires_in": _DESKTOP_WS_TICKET_TTL_SECONDS}
 
 
 @router.websocket("/ws")
@@ -68,6 +98,8 @@ async def websocket_endpoint(websocket: WebSocket):
                 websocket.headers,
                 method="GET",
                 path=websocket.url.path,
+                query_string=websocket.url.query,
+                body=b"",
                 expected_instance_id=system_config.instance_id,
                 shared_secret=system_config.internal_proxy_secret or "",
             )
@@ -78,6 +110,18 @@ async def websocket_endpoint(websocket: WebSocket):
                 reason=exc.detail,
             )
             return
+    else:
+        now = time.time()
+        _prune_expired_desktop_tickets(now)
+        ticket = (websocket.query_params.get("ticket") or "").strip()
+        expires_at = _desktop_ws_tickets.pop(ticket, None) if ticket else None
+        if not expires_at or expires_at <= now:
+            logger.warning("Rejected desktop websocket connection: missing or invalid ticket")
+            await websocket.close(
+                code=status.WS_1008_POLICY_VIOLATION,
+                reason="Missing or invalid desktop WebSocket ticket.",
+            )
+            return
 
     await manager.connect(websocket)
     
diff --git a/backend/api/routes/workflow.py b/backend/api/routes/workflow.py
index 8ccaa45..2f9c375 100644
--- a/backend/api/routes/workflow.py
+++ b/backend/api/routes/workflow.py
@@ -33,12 +33,17 @@ async def get_workflow_predictions() -> Dict[str, Any]:
         from backend.aggregator.core.coordinator import coordinator
         from backend.compiler.core.compiler_coordinator import compiler_coordinator
         from backend.autonomous.core.autonomous_coordinator import autonomous_coordinator
+        from backend.leanoj.core.leanoj_coordinator import leanoj_coordinator
         
         # Determine which coordinator is active and return its workflow
         tasks = []
         mode = "idle"
         
-        if autonomous_coordinator._running:
+        if leanoj_coordinator.is_active:
+            mode = "leanoj"
+            tasks = [task.model_dump(mode="json") for task in leanoj_coordinator.workflow_tasks]
+            logger.debug(f"Returning {len(tasks)} tasks from LeanOJ coordinator")
+        elif autonomous_coordinator._running:
             mode = "autonomous"
             # For autonomous mode, check which sub-coordinator is active
             if autonomous_coordinator._brainstorm_aggregator and autonomous_coordinator._brainstorm_aggregator.is_running:
diff --git a/backend/autonomous/agents/final_answer/certainty_assessor.py b/backend/autonomous/agents/final_answer/certainty_assessor.py
index 4c04b1e..e6f0961 100644
--- a/backend/autonomous/agents/final_answer/certainty_assessor.py
+++ b/backend/autonomous/agents/final_answer/certainty_assessor.py
@@ -9,8 +9,7 @@
 CRITICAL: Operates ONLY on Tier 2 papers, NOT on Tier 1 brainstorm databases.
 
 NO RAG FOR ABSTRACTS (by design): Step 1 browses abstracts/outlines which are small metadata.
-EXPANDED PAPERS OVERFLOW: Step 2 currently drops expanded papers if they don't fit.
-TODO: Should RAG expanded papers instead of dropping — see audit note in rag-design rule.
+EXPANDED PAPERS OVERFLOW: Step 2 uses RAG fallback for expanded papers when full direct injection does not fit.
 """
 import asyncio
 import json
diff --git a/backend/autonomous/agents/lemma_search_agent.py b/backend/autonomous/agents/lemma_search_agent.py
index d2e69a2..cd696f7 100644
--- a/backend/autonomous/agents/lemma_search_agent.py
+++ b/backend/autonomous/agents/lemma_search_agent.py
@@ -13,6 +13,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.json_parser import parse_json
 from backend.shared.lean4_client import get_lean4_client
+from backend.shared.model_error_utils import is_non_retryable_model_error
 from backend.shared.models import MathlibLemmaHint, ProofCandidate
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.utils import count_tokens
@@ -295,6 +296,8 @@ async def suggest_relevant_lemmas(
         except FreeModelExhaustedError:
             raise
         except Exception as exc:
+            if is_non_retryable_model_error(exc):
+                raise
             logger.warning(
                 "MathlibLemmaSearchAgent failed for theorem %s: %s",
                 theorem_candidate.theorem_id,
diff --git a/backend/autonomous/agents/paper_title_selector.py b/backend/autonomous/agents/paper_title_selector.py
index 6107b56..195c364 100644
--- a/backend/autonomous/agents/paper_title_selector.py
+++ b/backend/autonomous/agents/paper_title_selector.py
@@ -55,6 +55,10 @@ def set_task_tracking_callback(self, callback: Callable) -> None:
     def get_current_task_id(self) -> str:
         """Get the task ID for the current/next API call."""
         return f"agg_sub1_{self.task_sequence:03d}"
+
+    def get_current_validation_task_id(self) -> str:
+        """Get a validator-routed task ID ("agg_val_NNN") for title validation; does not advance task_sequence."""
+        return f"agg_val_{self.task_sequence:03d}"
     
     async def select_title(
         self,
@@ -232,7 +236,7 @@ async def _generate_title(
                 return None
 
             # Generate task ID for tracking
-            task_id = self.get_current_task_id()
+            task_id = self.get_current_validation_task_id()
             self.task_sequence += 1
             
             # Notify task started (for workflow panel)
@@ -326,7 +330,7 @@ async def _validate_title(
             
             response = await api_client_manager.generate_completion(
                 task_id=task_id,
-                role_id=self.role_id,  # Use same role_id for validation
+                role_id="autonomous_paper_title_validator",
                 model=self.validator_model_id,
                 messages=[{"role": "user", "content": prompt}],
                 max_tokens=15000,
diff --git a/backend/autonomous/agents/proof_formalization_agent.py b/backend/autonomous/agents/proof_formalization_agent.py
index aa589e3..e43c085 100644
--- a/backend/autonomous/agents/proof_formalization_agent.py
+++ b/backend/autonomous/agents/proof_formalization_agent.py
@@ -10,6 +10,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.json_parser import parse_json
 from backend.shared.lean4_client import get_lean4_client
+from backend.shared.model_error_utils import is_non_retryable_model_error
 from backend.shared.models import ProofAttemptFeedback, ProofCandidate, SmtHint
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.utils import count_tokens
@@ -266,6 +267,8 @@ async def _run_full_script_attempt(
         except FreeModelExhaustedError:
             raise
         except Exception as exc:
+            if is_non_retryable_model_error(exc):
+                raise
             is_parse_error = _is_json_parse_error(exc)
             feedback = ProofAttemptFeedback(
                 attempt=attempt_number,
@@ -558,6 +561,8 @@ async def prove_candidate_tactic_script(
             except FreeModelExhaustedError:
                 raise
             except Exception as exc:
+                if is_non_retryable_model_error(exc):
+                    raise
                 is_parse_error = _is_json_parse_error(exc)
                 feedback = ProofAttemptFeedback(
                     attempt=attempt_number,
diff --git a/backend/autonomous/agents/proof_identification_agent.py b/backend/autonomous/agents/proof_identification_agent.py
index 9fa7791..82bde54 100644
--- a/backend/autonomous/agents/proof_identification_agent.py
+++ b/backend/autonomous/agents/proof_identification_agent.py
@@ -6,6 +6,7 @@
 
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.json_parser import parse_json
+from backend.shared.model_error_utils import is_non_retryable_model_error
 from backend.shared.models import ProofCandidate
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.utils import count_tokens
@@ -104,6 +105,8 @@ async def translate_candidate_to_smt(
         except FreeModelExhaustedError:
             raise
         except Exception as exc:
+            if is_non_retryable_model_error(exc):
+                raise
             logger.debug(
                 "ProofIdentificationAgent SMT translation failed for theorem %s: %s",
                 theorem_candidate.theorem_id,
@@ -183,6 +186,8 @@ async def identify_candidates(
         except FreeModelExhaustedError:
             raise
         except Exception as exc:
+            if is_non_retryable_model_error(exc):
+                raise
             logger.error(
                 "ProofIdentificationAgent failed for %s %s: %s",
                 source_type,
diff --git a/backend/autonomous/core/autonomous_coordinator.py b/backend/autonomous/core/autonomous_coordinator.py
index 337e922..3805d1c 100644
--- a/backend/autonomous/core/autonomous_coordinator.py
+++ b/backend/autonomous/core/autonomous_coordinator.py
@@ -84,6 +84,10 @@
 
 logger = logging.getLogger(__name__)
 
+_PARENT_PHASE_SHUTDOWN_TIMEOUT_SECONDS = 60 * 60  # one hour; default timeout of _await_parent_phase_shutdown
+_WORKFLOW_PHASE_UNSET = object()  # unique sentinel object; use site is outside this hunk (TODO confirm intent)
+_BRAINSTORM_ACCEPTANCE_HARD_LIMIT = 30  # limit value reported in the hard-limit log and broadcast messages
+
 
 class AutonomousCoordinator:
     """
@@ -107,7 +111,9 @@ def __init__(self):
         self._validator_max_tokens: int = 15000
         self._validator_provider: str = "lm_studio"
         self._validator_openrouter_provider: Optional[str] = None
+        self._validator_openrouter_reasoning_effort: str = "auto"
         self._validator_lm_studio_fallback: Optional[str] = None
+        self._validator_supercharge_enabled: bool = False
         
         # Compiler models (separate from aggregator submitters)
         self._high_context_model: str = ""
@@ -116,6 +122,24 @@ def __init__(self):
         self._high_param_context: int = 10000
         self._high_context_max_tokens: int = 25000
         self._high_param_max_tokens: int = 15000
+        self._high_context_provider: str = "lm_studio"
+        self._high_context_openrouter_provider: Optional[str] = None
+        self._high_context_openrouter_reasoning_effort: str = "auto"
+        self._high_context_lm_studio_fallback: Optional[str] = None
+        self._high_context_supercharge_enabled: bool = False
+        self._high_param_provider: str = "lm_studio"
+        self._high_param_openrouter_provider: Optional[str] = None
+        self._high_param_openrouter_reasoning_effort: str = "auto"
+        self._high_param_lm_studio_fallback: Optional[str] = None
+        self._high_param_supercharge_enabled: bool = False
+        self._critique_submitter_model: str = ""
+        self._critique_submitter_context: int = 131072
+        self._critique_submitter_max_tokens: int = 25000
+        self._critique_submitter_provider: str = "lm_studio"
+        self._critique_submitter_openrouter_provider: Optional[str] = None
+        self._critique_submitter_openrouter_reasoning_effort: str = "auto"
+        self._critique_submitter_lm_studio_fallback: Optional[str] = None
+        self._critique_submitter_supercharge_enabled: bool = False
         
         # Agents (initialized during setup)
         self._topic_selector: Optional[TopicSelectorAgent] = None
@@ -133,6 +157,7 @@ def __init__(self):
         # Part 1 & 2 Integration
         self._brainstorm_aggregator: Optional[AggregatorCoordinator] = None
         self._paper_compiler: Optional[CompilerCoordinator] = None
+        self._active_child_aggregators: List[AggregatorCoordinator] = []
         
         # Callbacks
         self._broadcast_callback: Optional[Callable] = None
@@ -151,6 +176,7 @@ def __init__(self):
         self._last_redundancy_check_at: int = 0
         self._last_completion_review_at: int = 0  # Acceptance count at last completion review
         self._manual_paper_writing_triggered: bool = False
+        self._brainstorm_hard_limit_triggered: bool = False
         self._resume_paper_phase: Optional[str] = None  # Saved phase for resume (body/conclusion/intro/abstract)
         self._brainstorm_missing_during_paper: bool = False
         
@@ -190,6 +216,52 @@ async def _broadcast(self, event: str, data: Dict[str, Any] = None) -> None:
             # broadcast_event expects (event_type, data) as separate arguments
             await self._broadcast_callback(event, data or {})
 
+    def _track_child_aggregator(self, aggregator: AggregatorCoordinator) -> None:
+        """Track local child aggregators so parent phase changes can stop them."""
+        if aggregator not in self._active_child_aggregators:  # keep each aggregator listed at most once
+            self._active_child_aggregators.append(aggregator)
+
+    def _untrack_child_aggregator(self, aggregator: Optional[AggregatorCoordinator]) -> None:  # drop from the tracked list
+        if aggregator in self._active_child_aggregators:  # membership guard: None or an untracked value is a no-op
+            self._active_child_aggregators.remove(aggregator)
+
+    async def _await_parent_phase_shutdown(
+        self,
+        label: str,  # description of the awaited work; only used in the timeout warning
+        awaitable,  # scheduled via asyncio.create_task below
+        *,
+        timeout: float = _PARENT_PHASE_SHUTDOWN_TIMEOUT_SECONDS,  # seconds to wait before giving up
+    ) -> bool:  # True when the work finished within the timeout, False when it timed out
+        task = asyncio.create_task(awaitable)  # hold the task so it can be cancelled explicitly on timeout
+        try:
+            await asyncio.wait_for(task, timeout=timeout)
+            return True
+        except asyncio.TimeoutError:  # only the timeout is handled; other errors from the task propagate
+            logger.warning(
+                "Timed out waiting %.0fs for %s; cancelling so parent phase can continue",
+                timeout,
+                label,
+            )
+            task.cancel()
+            try:
+                await task  # wait for the cancellation to settle before returning
+            except asyncio.CancelledError:
+                pass
+            return False
+
+    async def _stop_active_child_aggregators(self, reason: str) -> None:  # reason only appears in log text
+        for aggregator in list(self._active_child_aggregators):  # iterate a copy; the finally below mutates the list
+            try:
+                if await self._await_parent_phase_shutdown(
+                    f"child aggregator shutdown for {reason}",
+                    aggregator.stop(),
+                ):
+                    logger.info("Stopped child aggregator for %s", reason)
+            except Exception as exc:  # one failing child must not block stopping the rest
+                logger.warning("Error stopping child aggregator for %s: %s", reason, exc)
+            finally:
+                self._untrack_child_aggregator(aggregator)  # untrack on success, timeout, or error alike
+
     def _append_proof_framing(self, prompt: str) -> str:
         """Append the persisted proof-framing context when active."""
         effective_prompt = prompt or ""
@@ -240,25 +312,31 @@ def _build_proof_runtime_config_snapshot(self) -> Dict[str, Any]:
             provider=first_submitter.provider if first_submitter else "lm_studio",
             model_id=first_submitter.model_id if first_submitter else self._high_context_model,
             openrouter_provider=first_submitter.openrouter_provider if first_submitter else self._high_context_openrouter_provider,
+            openrouter_reasoning_effort=first_submitter.openrouter_reasoning_effort if first_submitter else self._high_context_openrouter_reasoning_effort,
             lm_studio_fallback_id=first_submitter.lm_studio_fallback_id if first_submitter else self._high_context_lm_studio_fallback,
             context_window=first_submitter.context_window if first_submitter else self._high_context_context,
             max_output_tokens=first_submitter.max_output_tokens if first_submitter else self._high_context_max_tokens,
+            supercharge_enabled=first_submitter.supercharge_enabled if first_submitter else self._high_context_supercharge_enabled,
         )
         paper_config = ProofRoleConfigSnapshot(
             provider=self._high_context_provider,
             model_id=self._high_context_model,
             openrouter_provider=self._high_context_openrouter_provider,
+            openrouter_reasoning_effort=self._high_context_openrouter_reasoning_effort,
             lm_studio_fallback_id=self._high_context_lm_studio_fallback,
             context_window=self._high_context_context,
             max_output_tokens=self._high_context_max_tokens,
+            supercharge_enabled=self._high_context_supercharge_enabled,
         )
         validator_config = ProofRoleConfigSnapshot(
             provider=self._validator_provider,
             model_id=self._validator_model,
             openrouter_provider=self._validator_openrouter_provider,
+            openrouter_reasoning_effort=self._validator_openrouter_reasoning_effort,
             lm_studio_fallback_id=self._validator_lm_studio_fallback,
             context_window=self._validator_context,
             max_output_tokens=self._validator_max_tokens,
+            supercharge_enabled=self._validator_supercharge_enabled,
         )
         return ProofRuntimeConfigSnapshot(
             brainstorm=brainstorm_config,
@@ -373,6 +451,16 @@ async def _run_brainstorm_completion_proofs(self) -> None:
         if not self._current_topic_id:
             return
 
+        # Entering Lean proof verification is already past brainstorm aggregation.
+        # Persist that handoff before the potentially long proof stage so a restart
+        # cannot fall back to a fresh 0-count brainstorm loop.
+        self._state.current_tier = "tier2_paper_writing"
+        await self._recover_brainstorm_acceptance_count(self._current_topic_id)
+        await self._save_workflow_state(
+            tier="tier2_paper_writing",
+            phase="brainstorm_proof_verification",
+        )
+
         metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
         brainstorm_content = await brainstorm_memory.get_database_content(self._current_topic_id)
         await self._run_proof_verification(
@@ -381,6 +469,96 @@ async def _run_brainstorm_completion_proofs(self) -> None:
             self._current_topic_id,
             source_title=metadata.topic_prompt if metadata else "",
         )
+
+        if not self._stop_event.is_set():
+            await self._save_workflow_state(
+                tier="tier2_paper_writing",
+                phase="pre_paper_compilation",
+            )
+
+    async def _recover_brainstorm_acceptance_count(self, topic_id: Optional[str]) -> int:
+        """Recover a non-zero brainstorm acceptance count from durable files.
+
+        Older workflow states can be stale around the proof handoff.  Use the
+        current workflow count when present, but fall back to brainstorm metadata
+        and finally to the database file so resume/status never shows a completed
+        brainstorm as starting from zero.
+        """
+        if not topic_id:
+            return self._acceptance_count  # nothing to look up without a topic
+
+        recovered_count = max(0, int(self._acceptance_count or 0))  # start from the in-memory count, floored at 0
+        metadata = await brainstorm_memory.get_metadata(topic_id)
+        if metadata is not None:
+            recovered_count = max(recovered_count, int(metadata.submission_count or 0))
+
+        try:
+            content = await brainstorm_memory.get_database_content(topic_id, strip_proofs=True)
+            file_count = len(  # number of lines that begin with a "SUBMISSION #<digits> |" header
+                re.findall(r"^SUBMISSION\s+#\d+\s*\|", content or "", flags=re.MULTILINE)
+            )
+            recovered_count = max(recovered_count, file_count)
+        except Exception as exc:  # best effort: keep whatever count was gathered so far
+            logger.debug("Failed to recover brainstorm count for %s from file: %s", topic_id, exc)
+
+        if recovered_count > (self._acceptance_count or 0):  # the in-memory count is only ever raised here
+            logger.info(
+                "Recovered brainstorm acceptance count for %s: %s -> %s",
+                topic_id,
+                self._acceptance_count,
+                recovered_count,
+            )
+            self._acceptance_count = recovered_count
+
+        if metadata is not None and recovered_count > int(metadata.submission_count or 0):  # metadata lags behind
+            try:
+                await brainstorm_memory.update_metadata(topic_id, submission_count=recovered_count)
+            except Exception as exc:  # write-back failure is logged and otherwise ignored
+                logger.debug("Failed to update recovered brainstorm count for %s: %s", topic_id, exc)
+
+        return self._acceptance_count
+
+    async def _trigger_brainstorm_hard_limit(self, acceptance_count: int) -> None:
+        """Record the brainstorm hard-limit transition exactly once."""
+        self._acceptance_count = max(self._acceptance_count, int(acceptance_count or 0))  # never lower the count
+        if self._brainstorm_hard_limit_triggered:
+            return
+
+        self._brainstorm_hard_limit_triggered = True  # set before the first await so a repeated call returns early
+        logger.info(
+            "Hard limit of %s acceptances reached for %s. Forcing paper writing transition.",
+            _BRAINSTORM_ACCEPTANCE_HARD_LIMIT,
+            self._current_topic_id,
+        )
+
+        shared_training_size = 0
+        try:
+            shared_training_size = await shared_training_memory.get_insights_count()
+        except Exception as exc:  # best effort: a failed read leaves the size at 0
+            logger.debug("Failed to read live brainstorm size at hard limit: %s", exc)
+
+        if self._current_topic_id:  # metadata update, broadcast and completion marks all need a topic
+            try:
+                await brainstorm_memory.update_metadata(
+                    self._current_topic_id,
+                    submission_count=shared_training_size or self._acceptance_count,  # fall back when size is 0
+                )
+            except Exception as exc:
+                logger.debug("Failed to update hard-limit brainstorm metadata: %s", exc)
+
+            await self._broadcast("brainstorm_hard_limit_reached", {
+                "topic_id": self._current_topic_id,
+                "acceptance_count": self._acceptance_count,
+                "message": (
+                    f"Brainstorm hard limit of {_BRAINSTORM_ACCEPTANCE_HARD_LIMIT} "
+                    "acceptances reached. Forcing paper writing."
+                )
+            })
+
+            await brainstorm_memory.mark_complete(self._current_topic_id)  # not wrapped: errors here propagate
+            await research_metadata.mark_brainstorm_complete(self._current_topic_id)
+
+        await self._save_workflow_state(tier="tier1_aggregation")  # persisted even when no topic is set
     
     async def initialize(
         self,
@@ -401,21 +579,29 @@ async def initialize(
         # OpenRouter provider configs for validator
         validator_provider: str = "lm_studio",
         validator_openrouter_provider: Optional[str] = None,
+        validator_openrouter_reasoning_effort: str = "auto",
         validator_lm_studio_fallback: Optional[str] = None,
         # OpenRouter provider configs for high-context submitter
         high_context_provider: str = "lm_studio",
         high_context_openrouter_provider: Optional[str] = None,
+        high_context_openrouter_reasoning_effort: str = "auto",
         high_context_lm_studio_fallback: Optional[str] = None,
         # OpenRouter provider configs for high-param submitter
         high_param_provider: str = "lm_studio",
         high_param_openrouter_provider: Optional[str] = None,
+        high_param_openrouter_reasoning_effort: str = "auto",
         high_param_lm_studio_fallback: Optional[str] = None,
         # OpenRouter provider configs for critique submitter
         critique_submitter_provider: str = "lm_studio",
         critique_submitter_openrouter_provider: Optional[str] = None,
+        critique_submitter_openrouter_reasoning_effort: str = "auto",
         critique_submitter_lm_studio_fallback: Optional[str] = None,
         # Tier 3 Final Answer setting
-        tier3_enabled: bool = False
+        tier3_enabled: bool = False,
+        validator_supercharge_enabled: bool = False,
+        high_context_supercharge_enabled: bool = False,
+        high_param_supercharge_enabled: bool = False,
+        critique_submitter_supercharge_enabled: bool = False
     ) -> None:
         """Initialize the coordinator with configuration."""
         # Store configuration
@@ -447,17 +633,25 @@ async def initialize(
         # Store OpenRouter provider configs for all roles
         self._validator_provider = validator_provider
         self._validator_openrouter_provider = validator_openrouter_provider
+        self._validator_openrouter_reasoning_effort = validator_openrouter_reasoning_effort
         self._validator_lm_studio_fallback = validator_lm_studio_fallback
         self._high_context_provider = high_context_provider
         self._high_context_openrouter_provider = high_context_openrouter_provider
+        self._high_context_openrouter_reasoning_effort = high_context_openrouter_reasoning_effort
         self._high_context_lm_studio_fallback = high_context_lm_studio_fallback
         self._high_param_provider = high_param_provider
         self._high_param_openrouter_provider = high_param_openrouter_provider
+        self._high_param_openrouter_reasoning_effort = high_param_openrouter_reasoning_effort
         self._high_param_lm_studio_fallback = high_param_lm_studio_fallback
         self._critique_submitter_provider = critique_submitter_provider
         self._critique_submitter_openrouter_provider = critique_submitter_openrouter_provider
+        self._critique_submitter_openrouter_reasoning_effort = critique_submitter_openrouter_reasoning_effort
         self._critique_submitter_lm_studio_fallback = critique_submitter_lm_studio_fallback
         self._tier3_enabled = tier3_enabled
+        self._validator_supercharge_enabled = validator_supercharge_enabled
+        self._high_context_supercharge_enabled = high_context_supercharge_enabled
+        self._high_param_supercharge_enabled = high_param_supercharge_enabled
+        self._critique_submitter_supercharge_enabled = critique_submitter_supercharge_enabled
         
         logger.info(f"Autonomous coordinator initializing with {len(submitter_configs)} submitters")
         for config in submitter_configs:
@@ -613,6 +807,8 @@ async def initialize(
         # CRITICAL: Configure roles with api_client_manager so routing works correctly
         # Configure first submitter (used by topic selector, completion reviewer, reference selector, title selector)
         first_config = submitter_configs[0] if submitter_configs else SubmitterConfig(submitter_id=1, model_id=first_submitter_model)
+        first_supercharge_enabled = first_config.supercharge_enabled if hasattr(first_config, 'supercharge_enabled') else False
+        first_reasoning_effort = getattr(first_config, "openrouter_reasoning_effort", "auto")
         api_client_manager.configure_role(
             "autonomous_topic_selector",
             ModelConfig(
@@ -620,9 +816,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
         
@@ -633,9 +831,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
         
@@ -646,9 +846,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
         
@@ -659,9 +861,25 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
+            )
+        )
+        api_client_manager.configure_role(
+            "autonomous_paper_title_validator",
+            ModelConfig(
+                provider=validator_provider,
+                model_id=validator_model,
+                openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
+                openrouter_provider=validator_openrouter_provider,
+                openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
+                lm_studio_fallback_id=validator_lm_studio_fallback,
+                context_window=validator_context_window,
+                max_output_tokens=validator_max_tokens,
+                supercharge_enabled=validator_supercharge_enabled
             )
         )
         
@@ -673,9 +891,11 @@ async def initialize(
                 model_id=validator_model,
                 openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
                 openrouter_provider=validator_openrouter_provider,
+                openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=validator_lm_studio_fallback,
                 context_window=validator_context_window,
-                max_output_tokens=validator_max_tokens
+                max_output_tokens=validator_max_tokens,
+                supercharge_enabled=validator_supercharge_enabled
             )
         )
         
@@ -686,9 +906,11 @@ async def initialize(
                 model_id=validator_model,
                 openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
                 openrouter_provider=validator_openrouter_provider,
+                openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=validator_lm_studio_fallback,
                 context_window=validator_context_window,
-                max_output_tokens=validator_max_tokens
+                max_output_tokens=validator_max_tokens,
+                supercharge_enabled=validator_supercharge_enabled
             )
         )
 
@@ -699,9 +921,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
 
@@ -712,9 +936,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
 
@@ -725,9 +951,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
 
@@ -738,9 +966,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
 
@@ -751,9 +981,11 @@ async def initialize(
                 model_id=self._high_context_model,
                 openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
                 openrouter_provider=high_context_openrouter_provider,
+                openrouter_reasoning_effort=high_context_openrouter_reasoning_effort,
                 lm_studio_fallback_id=high_context_lm_studio_fallback,
                 context_window=self._high_context_context,
-                max_output_tokens=self._high_context_max_tokens
+                max_output_tokens=self._high_context_max_tokens,
+                supercharge_enabled=high_context_supercharge_enabled
             )
         )
 
@@ -764,9 +996,11 @@ async def initialize(
                 model_id=self._high_context_model,
                 openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
                 openrouter_provider=high_context_openrouter_provider,
+                openrouter_reasoning_effort=high_context_openrouter_reasoning_effort,
                 lm_studio_fallback_id=high_context_lm_studio_fallback,
                 context_window=self._high_context_context,
-                max_output_tokens=self._high_context_max_tokens
+                max_output_tokens=self._high_context_max_tokens,
+                supercharge_enabled=high_context_supercharge_enabled
             )
         )
 
@@ -777,9 +1011,11 @@ async def initialize(
                 model_id=self._high_context_model,
                 openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
                 openrouter_provider=high_context_openrouter_provider,
+                openrouter_reasoning_effort=high_context_openrouter_reasoning_effort,
                 lm_studio_fallback_id=high_context_lm_studio_fallback,
                 context_window=self._high_context_context,
-                max_output_tokens=self._high_context_max_tokens
+                max_output_tokens=self._high_context_max_tokens,
+                supercharge_enabled=high_context_supercharge_enabled
             )
         )
 
@@ -790,9 +1026,11 @@ async def initialize(
                 model_id=validator_model,
                 openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
                 openrouter_provider=validator_openrouter_provider,
+                openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=validator_lm_studio_fallback,
                 context_window=validator_context_window,
-                max_output_tokens=validator_max_tokens
+                max_output_tokens=validator_max_tokens,
+                supercharge_enabled=validator_supercharge_enabled
             )
         )
 
@@ -803,9 +1041,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
 
@@ -816,9 +1056,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
 
@@ -829,9 +1071,11 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
 
@@ -842,9 +1086,11 @@ async def initialize(
                 model_id=self._high_context_model,
                 openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
                 openrouter_provider=high_context_openrouter_provider,
+                openrouter_reasoning_effort=high_context_openrouter_reasoning_effort,
                 lm_studio_fallback_id=high_context_lm_studio_fallback,
                 context_window=self._high_context_context,
-                max_output_tokens=self._high_context_max_tokens
+                max_output_tokens=self._high_context_max_tokens,
+                supercharge_enabled=high_context_supercharge_enabled
             )
         )
 
@@ -855,9 +1101,11 @@ async def initialize(
                 model_id=self._high_context_model,
                 openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
                 openrouter_provider=high_context_openrouter_provider,
+                openrouter_reasoning_effort=high_context_openrouter_reasoning_effort,
                 lm_studio_fallback_id=high_context_lm_studio_fallback,
                 context_window=self._high_context_context,
-                max_output_tokens=self._high_context_max_tokens
+                max_output_tokens=self._high_context_max_tokens,
+                supercharge_enabled=high_context_supercharge_enabled
             )
         )
 
@@ -868,9 +1116,11 @@ async def initialize(
                 model_id=self._high_context_model,
                 openrouter_model_id=self._high_context_model if high_context_provider == "openrouter" else None,
                 openrouter_provider=high_context_openrouter_provider,
+                openrouter_reasoning_effort=high_context_openrouter_reasoning_effort,
                 lm_studio_fallback_id=high_context_lm_studio_fallback,
                 context_window=self._high_context_context,
-                max_output_tokens=self._high_context_max_tokens
+                max_output_tokens=self._high_context_max_tokens,
+                supercharge_enabled=high_context_supercharge_enabled
             )
         )
 
@@ -885,11 +1135,28 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
+        tier3_validator_config = ModelConfig(
+            provider=validator_provider,
+            model_id=validator_model,
+            openrouter_model_id=validator_model if validator_provider == "openrouter" else None,
+            openrouter_provider=validator_openrouter_provider,
+            openrouter_reasoning_effort=validator_openrouter_reasoning_effort,
+            lm_studio_fallback_id=validator_lm_studio_fallback,
+            context_window=validator_context_window,
+            max_output_tokens=validator_max_tokens,
+            supercharge_enabled=validator_supercharge_enabled,
+        )
+        api_client_manager.configure_role(
+            "autonomous_certainty_assessor_validator",
+            tier3_validator_config,
+        )
         
         api_client_manager.configure_role(
             "autonomous_format_selector",
@@ -898,11 +1165,17 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
+        api_client_manager.configure_role(
+            "autonomous_format_selector_validator",
+            tier3_validator_config,
+        )
         
         api_client_manager.configure_role(
             "autonomous_volume_organizer",
@@ -911,11 +1184,17 @@ async def initialize(
                 model_id=first_submitter_model,
                 openrouter_model_id=first_config.openrouter_model_id if hasattr(first_config, 'openrouter_model_id') else None,
                 openrouter_provider=first_config.openrouter_provider if hasattr(first_config, 'openrouter_provider') else None,
+                openrouter_reasoning_effort=first_reasoning_effort,
                 lm_studio_fallback_id=first_config.lm_studio_fallback_id if hasattr(first_config, 'lm_studio_fallback_id') else None,
                 context_window=first_submitter_context,
-                max_output_tokens=first_submitter_max_tokens
+                max_output_tokens=first_submitter_max_tokens,
+                supercharge_enabled=first_supercharge_enabled
             )
         )
+        api_client_manager.configure_role(
+            "autonomous_volume_organizer_validator",
+            tier3_validator_config,
+        )
         
         logger.info("Configured Tier 3 Final Answer agents with api_client_manager")
         
@@ -963,6 +1242,8 @@ async def _check_resume_state(self) -> None:
             self._current_reference_papers = workflow_state.get("reference_paper_ids", [])
             self._current_paper_title = workflow_state.get("current_paper_title")
             self._acceptance_count = workflow_state.get("acceptance_count", 0)
+            if self._current_topic_id:
+                await self._recover_brainstorm_acceptance_count(self._current_topic_id)
             self._rejection_count = workflow_state.get("rejection_count", 0)
             self._consecutive_rejections = workflow_state.get("consecutive_rejections", 0)
             self._exhaustion_signals = workflow_state.get("exhaustion_signals", 0)
@@ -1302,6 +1583,65 @@ async def _current_brainstorm_available_for_paper(self) -> bool:
 
         return True
 
+    async def clear_deleted_brainstorm_reference(self, topic_id: str, reason: str) -> None:
+        """Reset and persist coordinator state when the active brainstorm `topic_id` is deleted; no-op otherwise."""
+        if self._current_topic_id != topic_id:
+            return
+
+        logger.warning(
+            f"Clearing current brainstorm reference for {topic_id}: {reason}"
+        )
+        if self._current_paper_id:
+            await self._delete_stale_incomplete_paper(self._current_paper_id, topic_id, reason)
+        # Drop every pointer and counter tied to the deleted brainstorm before persisting.
+        self._current_topic_id = None
+        self._current_paper_id = None
+        self._current_paper_title = None
+        self._resume_paper_phase = None
+        self._acceptance_count = 0
+        self._rejection_count = 0
+        self._cleanup_removals = 0
+        self._consecutive_rejections = 0
+        self._exhaustion_signals = 0
+        self._brainstorm_hard_limit_triggered = False
+        self._current_reference_papers = []
+        self._brainstorm_paper_count = 0
+        self._current_brainstorm_paper_ids = []
+        self._last_completed_paper_id = None
+        await research_metadata.set_current_brainstorm(None)
+        # Pass phase=None explicitly: an omitted phase falls back to the previously saved paper_phase.
+        await self._save_workflow_state(tier="tier1_aggregation", phase=None)
+
+    async def _current_brainstorm_available_for_aggregation(self, db_path: Path) -> bool:
+        """Check that the active brainstorm still has metadata and a database; clean up and return False if not."""
+        if not self._current_topic_id:
+            return False
+
+        metadata = await brainstorm_memory.get_metadata(self._current_topic_id)
+        if metadata is not None and db_path.exists():
+            return True
+
+        logger.warning(
+            f"Stopping aggregation for missing brainstorm {self._current_topic_id}: "
+            f"metadata_exists={metadata is not None}, db_path={db_path}, "
+            f"db_exists={db_path.exists()}"
+        )
+        aggregator = self._brainstorm_aggregator
+        if aggregator and aggregator.is_running:
+            await aggregator.stop()
+        # A database file without metadata is an orphan; removal is best-effort.
+        if metadata is None and db_path.exists():
+            try:
+                db_path.unlink()
+                logger.info(f"Deleted orphaned brainstorm database: {db_path}")
+            except Exception as exc:
+                logger.warning(f"Failed to delete orphaned brainstorm database {db_path}: {exc}")
+        await self.clear_deleted_brainstorm_reference(
+            self._current_topic_id,
+            "brainstorm metadata or database disappeared during aggregation"
+        )
+        return False
+
     async def _preserve_failed_paper_state(self, paper_id: str, paper_title: str) -> None:
         """
         Preserve in-progress paper state after a compiler failure so retries resume.
@@ -1336,8 +1676,18 @@ async def _preserve_failed_paper_state(self, paper_id: str, paper_title: str) ->
             f"outline_chars={len(current_outline or '')}"
         )
     
-    async def _save_workflow_state(self, tier: str = None, phase: str = None) -> None:
+    async def _save_workflow_state(self, tier: str = None, phase: Any = _WORKFLOW_PHASE_UNSET) -> None:
         """Save current workflow state for crash recovery."""
+        if phase is _WORKFLOW_PHASE_UNSET:
+            phase_to_store = self._resume_paper_phase
+            try:
+                existing_state = await research_metadata.get_workflow_state()
+                phase_to_store = phase_to_store or existing_state.get("paper_phase")
+            except Exception:
+                phase_to_store = phase_to_store or None
+        else:
+            phase_to_store = phase
+
         # Serialize submitter configs for storage
         submitter_configs_data = [
             {
@@ -1359,7 +1709,7 @@ async def _save_workflow_state(self, tier: str = None, phase: str = None) -> Non
             "current_topic_id": self._current_topic_id,
             "current_paper_id": self._current_paper_id,
             "current_paper_title": self._current_paper_title,
-            "paper_phase": phase,
+            "paper_phase": phase_to_store,
             "reference_paper_ids": self._current_reference_papers,  # Persist reference papers across restarts
             "acceptance_count": self._acceptance_count,
             "rejection_count": self._rejection_count,
@@ -1546,24 +1896,90 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                         # CRITICAL: Restore paper_id so compilation workflow knows to resume
                         self._current_topic_id = resume_topic
                         self._current_paper_id = resume_paper  # FIX: Restore paper_id
+                        await self._recover_brainstorm_acceptance_count(resume_topic)
+
+                        if resume_paper and resume_state.get("paper_phase") != "paper_proof_verification":
+                            resume_paper_metadata = await paper_library.get_metadata(resume_paper)
+                            if resume_paper_metadata and resume_paper_metadata.status == "complete":
+                                if await paper_library.is_paper_complete(resume_paper):
+                                    logger.info(
+                                        "Recovered completed paper %s from stale Tier 2 resume state; "
+                                        "running paper proof checkpoint instead of recompiling.",
+                                        resume_paper,
+                                    )
+                                    resume_state["paper_phase"] = "paper_proof_verification"
+                            elif resume_paper and resume_paper_metadata is None:
+                                logger.warning(
+                                    "Ignoring stale current_paper_id %s during resume: metadata missing",
+                                    resume_paper,
+                                )
+                                self._current_paper_id = None
+                                resume_paper = None
+
+                        paper_resume_completed = False
+                        if resume_state.get("paper_phase") == "paper_proof_verification" and resume_paper:
+                            logger.info(
+                                "Resuming paper proof verification before continuing: %s",
+                                resume_paper,
+                            )
+                            paper_metadata = await paper_library.get_metadata(resume_paper)
+                            paper_content = await paper_library.get_paper_content(
+                                resume_paper,
+                                strip_proofs=True,
+                            )
+                            if paper_metadata and paper_content:
+                                self._current_paper_title = paper_metadata.title
+                                self._current_reference_papers = paper_metadata.referenced_papers or self._current_reference_papers
+                                await self._run_completed_paper_proof_checks(
+                                    paper_id=resume_paper,
+                                    title=paper_metadata.title,
+                                    content=paper_content,
+                                    source_brainstorm_ids=paper_metadata.source_brainstorm_ids,
+                                )
+                                if self._stop_event.is_set():
+                                    break
+                                self._last_completed_paper_id = resume_paper
+                                self._current_paper_id = None
+                                self._current_paper_title = None
+                                self._current_paper_tracker = None
+                                await self._save_workflow_state(tier=None, phase=None)
+                                paper_resume_completed = True
+                            else:
+                                logger.warning(
+                                    "Cannot resume paper proof verification for %s; saved paper metadata/content is missing",
+                                    resume_paper,
+                                )
+                                self._current_paper_id = None
+
+                        if resume_state.get("paper_phase") == "brainstorm_proof_verification":
+                            logger.info(
+                                "Resuming brainstorm proof verification before paper compilation: %s",
+                                resume_topic,
+                            )
+                            self._resume_paper_phase = None
+                            await self._run_brainstorm_completion_proofs()
+                            if self._stop_event.is_set():
+                                break
+
                         resume_state = None  # Clear resume state before retry loop
 
                         # A resumed brainstorm MUST produce a paper - retry until success or stop
                         _resume_paper_attempt = 0
-                        while not self._stop_event.is_set():
-                            _resume_paper_attempt += 1
-                            if _resume_paper_attempt > 1:
-                                logger.warning(
-                                    f"Resume paper compilation attempt {_resume_paper_attempt} "
-                                    f"for brainstorm {self._current_topic_id} - retrying..."
-                                )
-                                await asyncio.sleep(5)
-                            if await self._paper_compilation_workflow(
-                                emit_resume_event=(_resume_paper_attempt == 1)
-                            ):
-                                break
-                            if self._brainstorm_missing_during_paper:
-                                break
+                        if not paper_resume_completed:
+                            while not self._stop_event.is_set():
+                                _resume_paper_attempt += 1
+                                if _resume_paper_attempt > 1:
+                                    logger.warning(
+                                        f"Resume paper compilation attempt {_resume_paper_attempt} "
+                                        f"for brainstorm {self._current_topic_id} - retrying..."
+                                    )
+                                    await asyncio.sleep(5)
+                                if await self._paper_compilation_workflow(
+                                    emit_resume_event=(_resume_paper_attempt == 1)
+                                ):
+                                    break
+                                if self._brainstorm_missing_during_paper:
+                                    break
 
                         if self._brainstorm_missing_during_paper:
                             self._brainstorm_missing_during_paper = False
@@ -1704,6 +2120,24 @@ async def log_callback(task_id, role_id, model, provider, prompt, response,
                             await self._save_workflow_state(tier="tier1_aggregation")
                             resume_state = None
                             continue
+                        await self._recover_brainstorm_acceptance_count(resume_topic)
+                        if metadata.status == "complete":
+                            logger.info(
+                                "Recovered completed brainstorm %s from Tier 1 resume state; "
+                                "continuing at proof/paper handoff instead of aggregation.",
+                                resume_topic,
+                            )
+                            await self._save_workflow_state(
+                                tier="tier2_paper_writing",
+                                phase="brainstorm_proof_verification",
+                            )
+                            resume_state = {
+                                **resume_state,
+                                "current_tier": "tier2_paper_writing",
+                                "paper_phase": "brainstorm_proof_verification",
+                                "acceptance_count": self._acceptance_count,
+                            }
+                            continue
                         
                         write_paper = await self._brainstorm_aggregation_loop()
                         resume_state = None  # Clear resume state after handling
@@ -2018,7 +2452,88 @@ async def _get_resume_point(self) -> Optional[Dict[str, Any]]:
         """Get resume point if there's an interrupted workflow."""
         if research_metadata.has_interrupted_workflow():
             return await research_metadata.get_workflow_state()
+        recovered_state = await self._recover_resume_point_from_current_metadata()
+        if recovered_state:
+            await research_metadata.save_workflow_state(recovered_state)
+            logger.info(
+                "Recovered resume point from saved metadata: tier=%s topic=%s paper=%s",
+                recovered_state.get("current_tier"),
+                recovered_state.get("current_topic_id"),
+                recovered_state.get("current_paper_id"),
+            )
+            return recovered_state
         return None
+
+    async def _recover_resume_point_from_current_metadata(self) -> Optional[Dict[str, Any]]:
+        """Synthesize a resume point from durable stats/metadata when workflow state is stale; None if nothing to resume."""
+        try:
+            stats = await research_metadata.get_stats()
+            topic_id = stats.get("current_brainstorm_id")
+            paper_id = stats.get("current_paper_id")
+            if not topic_id and not paper_id:
+                return None
+
+            paper_title = None
+            reference_paper_ids: List[str] = []
+            paper_phase = None
+            if paper_id:
+                paper_metadata = await paper_library.get_metadata(paper_id)
+                if paper_metadata is None:
+                    logger.info("Ignoring stale current_paper_id %s during resume recovery: metadata missing", paper_id)
+                    paper_id = None
+                else:
+                    paper_is_complete = await paper_library.is_paper_complete(paper_id)
+                    paper_title = paper_metadata.title
+                    reference_paper_ids = paper_metadata.referenced_papers or []
+                    if not topic_id and paper_metadata.source_brainstorm_ids:
+                        topic_id = paper_metadata.source_brainstorm_ids[0]
+                    if paper_metadata.status == "in_progress" or not paper_is_complete:
+                        paper_content = await self._get_paper_content_for_resume(paper_id)
+                        paper_phase = self._detect_paper_phase(paper_content)
+                    else:
+                        logger.info(
+                            "Ignoring stale current_paper_id %s during resume recovery: paper is already complete",
+                            paper_id,
+                        )
+                        paper_id = None
+                        paper_title = None
+                        reference_paper_ids = []
+            # Bail out if the brainstorm metadata is gone, or if discarding a stale paper left nothing to resume.
+            metadata = await brainstorm_memory.get_metadata(topic_id) if topic_id else None
+            if metadata is None and (topic_id or not paper_id):
+                return None
+
+            current_tier = "tier2_paper_writing" if paper_id else "tier1_aggregation"
+            if (
+                metadata is not None
+                and metadata.status == "complete"
+                and not paper_id
+                and not (metadata.papers_generated or [])
+            ):
+                current_tier = "tier2_paper_writing"
+                paper_phase = "brainstorm_proof_verification"
+            elif metadata is not None and metadata.status == "complete" and not paper_id:
+                return None
+            acceptance_count = await self._recover_brainstorm_acceptance_count(topic_id)
+            workflow_state = await research_metadata.get_workflow_state()
+            workflow_state.update(
+                {
+                    "is_running": False,
+                    "current_tier": current_tier,
+                    "current_topic_id": topic_id,
+                    "current_paper_id": paper_id,
+                    "current_paper_title": paper_title,
+                    "paper_phase": paper_phase,
+                    "reference_paper_ids": reference_paper_ids,
+                    "acceptance_count": acceptance_count,
+                    "papers_completed_count": stats.get("total_papers_completed", 0),
+                }
+            )
+            return workflow_state
+        except Exception as exc:
+            # Recovery stays best-effort, but a lost resume point must be visible in logs (with traceback).
+            logger.warning("Failed to recover resume point from metadata: %s", exc, exc_info=True)
+            return None
     
     async def stop(self) -> None:
         """Stop the autonomous research gracefully.
@@ -2050,6 +2565,8 @@ async def _run_shutdown_step(label: str, awaitable, timeout: float = 5.0) -> boo
             return False
         
         # Stop any running aggregator or compiler to prevent orphan tasks
+        await self._stop_active_child_aggregators("autonomous stop")
+
         if self._brainstorm_aggregator:
             try:
                 if await _run_shutdown_step("brainstorm aggregator", self._brainstorm_aggregator.stop()):
@@ -2435,8 +2952,7 @@ def get_validator_config(self) -> Optional[Dict[str, Any]]:
         Returns None if not initialized.
         
         Returns:
-            Dict with validator_model, validator_context_window, validator_max_tokens,
-            validator_provider, and validator_openrouter_provider, or None if not initialized.
+            Dict with validator model/runtime settings, or None if not initialized.
         """
         if not self._validator_model:
             return None
@@ -2447,6 +2963,8 @@ def get_validator_config(self) -> Optional[Dict[str, Any]]:
             "validator_max_tokens": self._validator_max_tokens,
             "validator_provider": self._validator_provider,
             "validator_openrouter_provider": self._validator_openrouter_provider,
+            "validator_openrouter_reasoning_effort": self._validator_openrouter_reasoning_effort,
+            "validator_supercharge_enabled": self._validator_supercharge_enabled,
         }
 
     def get_proof_runtime_config(self) -> Optional[Dict[str, Any]]:
@@ -2530,6 +3048,7 @@ async def _topic_exploration_phase(self) -> str:
         
         try:
             exploration_aggregator = AggregatorCoordinator()
+            self._track_child_aggregator(exploration_aggregator)
             
             await exploration_aggregator.initialize(
                 user_prompt=exploration_prompt,
@@ -2541,7 +3060,9 @@ async def _topic_exploration_phase(self) -> str:
                 validator_max_tokens=self._validator_max_tokens,
                 validator_provider=self._validator_provider,
                 validator_openrouter_provider=self._validator_openrouter_provider,
+                validator_openrouter_reasoning_effort=self._validator_openrouter_reasoning_effort,
                 validator_lm_studio_fallback=self._validator_lm_studio_fallback,
+                validator_supercharge_enabled=self._validator_supercharge_enabled,
                 enable_cleanup_review=False
             )
             
@@ -2644,6 +3165,8 @@ async def _topic_exploration_phase(self) -> str:
                     pass
             return ""
         finally:
+            self._untrack_child_aggregator(exploration_aggregator)
+
             # Restore original shared training path
             system_config.shared_training_file = original_shared_path
             shared_training_memory.file_path = original_memory_path
@@ -3019,7 +3542,7 @@ async def _pre_brainstorm_reference_selection(self) -> List[str]:
         logger.info(f"Pre-brainstorm reference selection: selected {len(selected_ids)} papers")
         return selected_ids
     
-    def _get_reference_paper_paths(self) -> List[str]:
+    async def _get_reference_paper_paths(self) -> List[str]:
         """
         Get file paths for currently selected reference papers.
         Uses session-based paths if session manager is active.
@@ -3029,6 +3552,10 @@ def _get_reference_paper_paths(self) -> List[str]:
         """
         paths = []
         for paper_id in self._current_reference_papers:
+            metadata = await paper_library.get_metadata(paper_id)
+            if metadata and metadata.status != "complete":
+                logger.info(f"Skipping pruned/non-complete reference paper {paper_id}")
+                continue
             # Use paper_library to get session-aware path
             # paper_library handles both legacy flat structure and session-based paths
             paper_path = paper_library._get_paper_path(paper_id)
@@ -3052,6 +3579,9 @@ async def _get_reference_paper_details(
             if not metadata:
                 logger.warning(f"Reference paper metadata not found: {paper_id}")
                 continue
+            if metadata.status != "complete":
+                logger.info(f"Skipping non-complete reference paper metadata: {paper_id} ({metadata.status})")
+                continue
 
             reference_title_display = await paper_library.get_reference_title_display(
                 paper_id,
@@ -3089,6 +3619,8 @@ async def _brainstorm_aggregation_loop(self) -> bool:
         if metadata is None:
             logger.error(f"Cannot start aggregation: brainstorm {self._current_topic_id} not found")
             return False
+
+        self._brainstorm_hard_limit_triggered = False
         
         # Initialize per-paper model tracker for this brainstorm/paper cycle
         self._current_paper_tracker = PaperModelTracker(
@@ -3114,6 +3646,15 @@ async def paper_model_tracking_callback(model_id: str) -> None:
         # Override shared training memory path to brainstorm-specific
         # Use brainstorm_memory to get correct path (respects session manager)
         brainstorm_db_path = brainstorm_memory._get_database_path(self._current_topic_id)
+        if not brainstorm_db_path.exists():
+            logger.error(
+                f"Cannot start aggregation: brainstorm database not found at {brainstorm_db_path}"
+            )
+            await self.clear_deleted_brainstorm_reference(
+                self._current_topic_id,
+                "brainstorm database missing before aggregation start"
+            )
+            return False
         brainstorm_db_path.parent.mkdir(parents=True, exist_ok=True)
         
         # Temporarily override shared training path
@@ -3134,9 +3675,12 @@ async def paper_model_tracking_callback(model_id: str) -> None:
         try:
             # Get reference paper paths for brainstorm context
             # This enables compounding knowledge - brainstorm submitters can build on prior papers
-            reference_paper_paths = self._get_reference_paper_paths()
+            reference_paper_paths = await self._get_reference_paper_paths()
             if reference_paper_paths:
                 logger.info(f"Loading {len(reference_paper_paths)} reference papers for brainstorm aggregation")
+
+            async def hard_limit_callback(total_acceptances: int) -> None:
+                await self._trigger_brainstorm_hard_limit(total_acceptances)
             
             # Initialize aggregator with topic prompt
             # CRITICAL: skip_stats_load=True to prevent loading manual aggregator stats
@@ -3153,7 +3697,13 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                 # Pass OpenRouter provider configs for validator
                 validator_provider=self._validator_provider,
                 validator_openrouter_provider=self._validator_openrouter_provider,
-                validator_lm_studio_fallback=self._validator_lm_studio_fallback
+                validator_openrouter_reasoning_effort=self._validator_openrouter_reasoning_effort,
+                validator_lm_studio_fallback=self._validator_lm_studio_fallback,
+                validator_supercharge_enabled=self._validator_supercharge_enabled,
+                max_total_acceptances=_BRAINSTORM_ACCEPTANCE_HARD_LIMIT,
+                acceptance_count_offset=max(0, self._acceptance_count),
+                acceptance_cap_callback=hard_limit_callback,
+                allow_trusted_context_files=True,
             )
             
             # CRITICAL FIX: Re-ingest existing submissions into RAG after resume
@@ -3240,18 +3790,22 @@ async def paper_model_tracking_callback(model_id: str) -> None:
             # Safety check: if topic already at or past hard cap (e.g. resume of
             # already-complete brainstorm that slipped past the code guard), skip
             # aggregation entirely and go straight to paper writing.
-            if self._acceptance_count >= 30:
+            if self._acceptance_count >= _BRAINSTORM_ACCEPTANCE_HARD_LIMIT:
                 logger.info(
                     f"Topic {self._current_topic_id} already at {self._acceptance_count} "
-                    f"acceptances (>= 30 cap). Skipping aggregation, forcing paper writing."
+                    f"acceptances (>= {_BRAINSTORM_ACCEPTANCE_HARD_LIMIT} cap). "
+                    f"Skipping aggregation, forcing paper writing."
                 )
-                await brainstorm_memory.mark_complete(self._current_topic_id)
-                await research_metadata.mark_brainstorm_complete(self._current_topic_id)
+                await self._trigger_brainstorm_hard_limit(self._acceptance_count)
                 await self._brainstorm_aggregator.stop()
                 await self._run_brainstorm_completion_proofs()
                 return True
             
             while self._running and not self._stop_event.is_set():
+                if not await self._current_brainstorm_available_for_aggregation(brainstorm_db_path):
+                    await self._brainstorm_aggregator.stop()
+                    return False
+
                 # Get current aggregator stats
                 status = await self._brainstorm_aggregator.get_status()
                 current_acceptances = status.total_acceptances
@@ -3294,25 +3848,10 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                         await self._save_workflow_state(tier="tier1_aggregation")
                     
                     # Check for hard limit of 30 acceptances (FORCE paper writing, skip completion review)
-                    if self._acceptance_count >= 30:
-                        logger.info(f"Hard limit of 30 acceptances reached for {self._current_topic_id}. Forcing paper writing transition.")
-                        
-                        # Broadcast hard limit reached event
-                        await self._broadcast("brainstorm_hard_limit_reached", {
-                            "topic_id": self._current_topic_id,
-                            "acceptance_count": self._acceptance_count,
-                            "message": "Brainstorm hard limit of 30 acceptances reached. Forcing paper writing."
-                        })
-                        
-                        # Mark brainstorm complete
-                        await brainstorm_memory.mark_complete(self._current_topic_id)
-                        await research_metadata.mark_brainstorm_complete(self._current_topic_id)
-                        
-                        # Stop aggregator
+                    if self._acceptance_count >= _BRAINSTORM_ACCEPTANCE_HARD_LIMIT:
+                        await self._trigger_brainstorm_hard_limit(self._acceptance_count)
                         await self._brainstorm_aggregator.stop()
                         await self._run_brainstorm_completion_proofs()
-                        
-                        # Force transition to paper writing (skip completion review)
                         return True
                     
                     # Check for early completion triggers
@@ -3330,6 +3869,11 @@ async def paper_model_tracking_callback(model_id: str) -> None:
                             await self._brainstorm_aggregator.stop()
                             await self._run_brainstorm_completion_proofs()
                             return True
+
+                        if self._brainstorm_hard_limit_triggered:
+                            await self._brainstorm_aggregator.stop()
+                            await self._run_brainstorm_completion_proofs()
+                            return True
                 
                 # Check for manual override trigger (before checking stop event)
                 if self._manual_paper_writing_triggered:
@@ -3422,7 +3966,10 @@ async def _check_early_completion_triggers(self) -> bool:
         ]
         
         exhaustion_count = 0
-        for submitter_id in [1, 2, 3]:
+        configured_submitter_ids = sorted(
+            {config.submitter_id for config in self._submitter_configs if config.submitter_id}
+        ) or [1, 2, 3]
+        for submitter_id in configured_submitter_ids:
             rejections = await autonomous_rejection_logs.get_brainstorm_submitter_rejections(
                 self._current_topic_id,
                 submitter_id
@@ -3481,8 +4028,19 @@ async def force_paper_writing(self) -> bool:
             await brainstorm_memory.mark_complete(self._current_topic_id)
             await research_metadata.mark_brainstorm_complete(self._current_topic_id)
             
-            # Set flag to trigger paper writing on next loop iteration
+            # Parent/user action wins immediately: stop child aggregation now,
+            # then let the owning workflow loop transition into Tier 2.
             self._manual_paper_writing_triggered = True
+            self._state.current_tier = "tier2_paper_writing"
+            await self._save_workflow_state(tier="tier2_paper_writing")
+            try:
+                if await self._await_parent_phase_shutdown(
+                    "brainstorm aggregator shutdown for manual paper-writing override",
+                    self._brainstorm_aggregator.stop(),
+                ):
+                    logger.info("Brainstorm aggregator stopped by manual paper-writing override")
+            except Exception as stop_exc:
+                logger.warning(f"Error stopping aggregator during manual paper-writing override: {stop_exc}")
             
             return True
             
@@ -3563,10 +4121,15 @@ async def force_tier3_final_answer(self, mode: str = "complete_current") -> dict
                 logger.info("Force Tier 3: Main loop stopped")
                 
                 # Stop current aggregator if it exists (don't check tier - state is unreliable)
+                await self._stop_active_child_aggregators("forced Tier 3")
+
                 if self._brainstorm_aggregator:
                     try:
-                        await self._brainstorm_aggregator.stop()
-                        logger.info("Aggregator stopped for forced Tier 3")
+                        if await self._await_parent_phase_shutdown(
+                            "brainstorm aggregator shutdown for forced Tier 3",
+                            self._brainstorm_aggregator.stop(),
+                        ):
+                            logger.info("Aggregator stopped for forced Tier 3")
                     except Exception as e:
                         logger.warning(f"Error stopping aggregator: {e}")
                     
@@ -3581,17 +4144,35 @@ async def force_tier3_final_answer(self, mode: str = "complete_current") -> dict
                 # Stop compiler if it exists (don't check tier - state is unreliable)
                 if self._paper_compiler:
                     try:
-                        await self._paper_compiler.stop()
-                        logger.info("Compiler stopped for forced Tier 3")
+                        if await self._await_parent_phase_shutdown(
+                            "paper compiler shutdown for forced Tier 3",
+                            self._paper_compiler.stop(),
+                        ):
+                            logger.info("Compiler stopped for forced Tier 3")
                     except Exception as e:
                         logger.warning(f"Error stopping compiler: {e}")
                 
-                # CRITICAL: Wait for main loop to actually exit before resetting flags
-                # The main loop checks these flags, and if we reset them too quickly,
-                # the loop will see _running=True and continue creating brainstorms!
-                # This delay ensures the main loop's next iteration sees _running=False and exits.
-                await asyncio.sleep(0.5)
-                logger.info("Force Tier 3: Waited for main loop to exit")
+                # CRITICAL: Wait for the old main loop to actually exit before
+                # resetting flags for Tier 3. Otherwise a child branch can see the
+                # cleared stop flag and continue under the parent final phase.
+                current_task = asyncio.current_task()
+                main_task = self._main_task
+                if main_task and main_task is not current_task and not main_task.done():
+                    try:
+                        await asyncio.wait_for(
+                            asyncio.shield(main_task),
+                            timeout=_PARENT_PHASE_SHUTDOWN_TIMEOUT_SECONDS,
+                        )
+                        logger.info("Force Tier 3: Main loop exited cleanly")
+                    except asyncio.TimeoutError:
+                        logger.warning("Force Tier 3: Main loop did not exit in time; cancelling it")
+                        main_task.cancel()
+                        try:
+                            await main_task
+                        except asyncio.CancelledError:
+                            pass
+                else:
+                    await asyncio.sleep(0)
                 
                 # CRITICAL: Reset flags for Tier 3 execution
                 # Now that the main loop has exited, we can reset flags for Tier 3's internal loops
@@ -3633,8 +4214,9 @@ async def force_tier3_final_answer(self, mode: str = "complete_current") -> dict
                     logger.info("Force Tier 3: Restarting main research loop to generate more papers")
                     
                     # Flags are already in running state (set at lines 1737-1738)
-                    # Create a background task to resume the main research loop
-                    asyncio.create_task(self._resume_research_loop_after_tier3())
+                    # Create a tracked background task to resume the main research loop.
+                    self._main_task = asyncio.create_task(self._resume_research_loop_after_tier3())
+                    self._main_task.add_done_callback(self._on_main_task_done)
                     
                     return {
                         "success": True, 
@@ -4116,6 +4698,7 @@ async def _paper_title_exploration_phase(
                 last_rejections = 0
             else:
                 exploration_aggregator = AggregatorCoordinator()
+                self._track_child_aggregator(exploration_aggregator)
                 
                 await exploration_aggregator.initialize(
                     user_prompt=exploration_prompt,
@@ -4127,7 +4710,9 @@ async def _paper_title_exploration_phase(
                     validator_max_tokens=self._validator_max_tokens,
                     validator_provider=self._validator_provider,
                     validator_openrouter_provider=self._validator_openrouter_provider,
+                    validator_openrouter_reasoning_effort=self._validator_openrouter_reasoning_effort,
                     validator_lm_studio_fallback=self._validator_lm_studio_fallback,
+                    validator_supercharge_enabled=self._validator_supercharge_enabled,
                     enable_cleanup_review=False
                 )
                 
@@ -4229,6 +4814,8 @@ async def _paper_title_exploration_phase(
                     pass
             return ""
         finally:
+            self._untrack_child_aggregator(exploration_aggregator)
+
             system_config.shared_training_file = original_shared_path
             shared_training_memory.file_path = original_memory_path
             
@@ -4306,16 +4893,24 @@ async def _compile_paper(
                 # Pass OpenRouter provider configs for all compiler roles
                 validator_provider=self._validator_provider,
                 validator_openrouter_provider=self._validator_openrouter_provider,
+                validator_openrouter_reasoning_effort=self._validator_openrouter_reasoning_effort,
                 validator_lm_studio_fallback=self._validator_lm_studio_fallback,
                 high_context_provider=self._high_context_provider,
                 high_context_openrouter_provider=self._high_context_openrouter_provider,
+                high_context_openrouter_reasoning_effort=self._high_context_openrouter_reasoning_effort,
                 high_context_lm_studio_fallback=self._high_context_lm_studio_fallback,
                 high_param_provider=self._high_param_provider,
                 high_param_openrouter_provider=self._high_param_openrouter_provider,
+                high_param_openrouter_reasoning_effort=self._high_param_openrouter_reasoning_effort,
                 high_param_lm_studio_fallback=self._high_param_lm_studio_fallback,
                 critique_submitter_provider=self._critique_submitter_provider,
                 critique_submitter_openrouter_provider=self._critique_submitter_openrouter_provider,
-                critique_submitter_lm_studio_fallback=self._critique_submitter_lm_studio_fallback
+                critique_submitter_openrouter_reasoning_effort=self._critique_submitter_openrouter_reasoning_effort,
+                critique_submitter_lm_studio_fallback=self._critique_submitter_lm_studio_fallback,
+                validator_supercharge_enabled=self._validator_supercharge_enabled,
+                high_context_supercharge_enabled=self._high_context_supercharge_enabled,
+                high_param_supercharge_enabled=self._high_param_supercharge_enabled,
+                critique_submitter_supercharge_enabled=self._critique_submitter_supercharge_enabled
             )
             
             # Set WebSocket broadcaster for compiler events
@@ -4401,6 +4996,10 @@ async def _compile_paper(
             if reference_paper_ids:
                 logger.info(f"Loading {len(reference_paper_ids)} reference papers into compiler RAG")
                 for ref_paper_id in reference_paper_ids:
+                    ref_metadata = await paper_library.get_metadata(ref_paper_id)
+                    if not ref_metadata or ref_metadata.status != "complete":
+                        logger.info(f"Skipping non-complete compiler reference paper {ref_paper_id}")
+                        continue
                     # IMPORTANT: Use paper_library.get_paper_path() for session-aware path resolution
                     paper_path = paper_library.get_paper_path(ref_paper_id)
                     if os.path.exists(paper_path):
@@ -4423,6 +5022,10 @@ async def _compile_paper(
             if self._current_brainstorm_paper_ids:
                 logger.info(f"Loading {len(self._current_brainstorm_paper_ids)} prior brainstorm papers as auto-references")
                 for bp_id in self._current_brainstorm_paper_ids:
+                    bp_metadata = await paper_library.get_metadata(bp_id)
+                    if not bp_metadata or bp_metadata.status != "complete":
+                        logger.info(f"Skipping non-complete prior brainstorm paper {bp_id}")
+                        continue
                     bp_path = paper_library.get_paper_path(bp_id)
                     if os.path.exists(bp_path):
                         bp_content = await paper_library.get_paper_content(bp_id, strip_proofs=True)
@@ -4671,63 +5274,22 @@ async def _handle_paper_completion(
                 "word_count": paper_metadata.word_count
             })
 
-            await self._run_proof_verification(
-                content,
-                "paper",
-                paper_id,
-                source_title=title,
+            await self._save_workflow_state(
+                tier="tier2_paper_writing",
+                phase="paper_proof_verification",
             )
-
-            pending_retry_candidates: List[ProofCandidate] = []
-            retry_source_ids = paper_metadata.source_brainstorm_ids or ([self._current_topic_id] if self._current_topic_id else [])
-            for brainstorm_id in retry_source_ids:
-                pending_retries = await proof_database.get_pending_retries(
-                    brainstorm_id,
-                    retry_source_id=paper_id,
-                )
-                for pending_retry in pending_retries:
-                    combined_excerpt_parts = []
-                    if pending_retry.source_excerpt:
-                        combined_excerpt_parts.append(
-                            "ORIGINAL BRAINSTORM EXCERPT:\n" + pending_retry.source_excerpt
-                        )
-                    if content:
-                        combined_excerpt_parts.append(
-                            "REFINED PAPER CONTEXT:\n" + content[:6000]
-                        )
-
-                    retry_formal_sketch = pending_retry.formal_sketch
-                    if pending_retry.error_summary:
-                        retry_formal_sketch = (
-                            f"{retry_formal_sketch}\n\nPrior Lean 4 failure summary: {pending_retry.error_summary}"
-                        ).strip()
-
-                    pending_retry_candidates.append(
-                        ProofCandidate(
-                            theorem_id=pending_retry.theorem_id,
-                            statement=pending_retry.theorem_statement,
-                            formal_sketch=retry_formal_sketch,
-                            source_excerpt="\n\n".join(part for part in combined_excerpt_parts if part).strip(),
-                            origin_source_id=brainstorm_id,
-                        )
-                    )
-
-            if pending_retry_candidates:
-                await self._broadcast("proof_retry_scheduled", {
-                    "source_type": "paper",
-                    "source_id": paper_id,
-                    "source_title": title,
-                    "count": len(pending_retry_candidates),
-                    "brainstorm_ids": retry_source_ids,
-                })
-                await self._run_proof_verification(
-                    content,
-                    "paper",
+            await self._run_completed_paper_proof_checks(
+                paper_id=paper_id,
+                title=title,
+                content=content,
+                source_brainstorm_ids=paper_metadata.source_brainstorm_ids,
+            )
+            if self._stop_event.is_set():
+                logger.info(
+                    "Stop requested during paper proof verification for %s; preserving proof checkpoint",
                     paper_id,
-                    source_title=title,
-                    theorem_candidates=pending_retry_candidates,
-                    trigger="retry",
                 )
+                return
 
             # Trigger auto-critique generation in background (only if marking as complete)
             asyncio.create_task(self._auto_generate_paper_critique(
@@ -4748,6 +5310,81 @@ async def _handle_paper_completion(
         else:
             # Paper saved but still in progress - keep state
             logger.info(f"Paper saved (in progress): {paper_id} ({paper_metadata.word_count} words)")
+
+    async def _run_completed_paper_proof_checks(
+        self,
+        paper_id: str,
+        title: str,
+        content: str,
+        source_brainstorm_ids: List[str],
+    ) -> None:
+        """Run proof checks for a completed paper and any deferred brainstorm retries."""
+        self._state.current_tier = "tier2_paper_writing"
+        await self._save_workflow_state(
+            tier="tier2_paper_writing",
+            phase="paper_proof_verification",
+        )
+        # First pass: verify the paper content itself (no explicit theorem candidates are passed).
+        await self._run_proof_verification(
+            content,
+            "paper",
+            paper_id,
+            source_title=title,
+        )
+        # A stop requested during the first pass skips the deferred-retry pass entirely.
+        if self._stop_event.is_set():
+            return
+        # Gather pending retries per source brainstorm; with no source ids, fall back to the current topic (if any).
+        pending_retry_candidates: List[ProofCandidate] = []
+        retry_source_ids = source_brainstorm_ids or ([self._current_topic_id] if self._current_topic_id else [])
+        for brainstorm_id in retry_source_ids:
+            pending_retries = await proof_database.get_pending_retries(
+                brainstorm_id,
+                retry_source_id=paper_id,
+            )
+            for pending_retry in pending_retries:
+                combined_excerpt_parts = []
+                if pending_retry.source_excerpt:
+                    combined_excerpt_parts.append(
+                        "ORIGINAL BRAINSTORM EXCERPT:\n" + pending_retry.source_excerpt
+                    )
+                if content:
+                    combined_excerpt_parts.append(
+                        "REFINED PAPER CONTEXT:\n" + content[:6000]  # only the first 6000 characters of the paper
+                    )
+                # Append the earlier failure summary (when present) to the formal sketch.
+                retry_formal_sketch = pending_retry.formal_sketch
+                if pending_retry.error_summary:
+                    retry_formal_sketch = (
+                        f"{retry_formal_sketch}\n\nPrior Lean 4 failure summary: {pending_retry.error_summary}"
+                    ).strip()
+                # Queue the candidate, tagged with the brainstorm it originated from.
+                pending_retry_candidates.append(
+                    ProofCandidate(
+                        theorem_id=pending_retry.theorem_id,
+                        statement=pending_retry.theorem_statement,
+                        formal_sketch=retry_formal_sketch,
+                        source_excerpt="\n\n".join(part for part in combined_excerpt_parts if part).strip(),
+                        origin_source_id=brainstorm_id,
+                    )
+                )
+        # Second pass: announce and run the retries only if some exist and no stop was requested meanwhile.
+        if pending_retry_candidates and not self._stop_event.is_set():
+            await self._broadcast("proof_retry_scheduled", {
+                "source_type": "paper",
+                "source_id": paper_id,
+                "source_title": title,
+                "count": len(pending_retry_candidates),
+                "brainstorm_ids": retry_source_ids,
+            })
+            await self._run_proof_verification(
+                content,
+                "paper",
+                paper_id,
+                source_title=title,
+                theorem_candidates=pending_retry_candidates,
+                trigger="retry",
+            )
     
     async def _auto_generate_paper_critique(
         self,
@@ -4814,9 +5451,11 @@ async def _auto_generate_paper_critique(
                     model_id=self._validator_model,
                     openrouter_model_id=self._validator_model if self._validator_provider == "openrouter" else None,
                     openrouter_provider=self._validator_openrouter_provider,
+                    openrouter_reasoning_effort=self._validator_openrouter_reasoning_effort,
                     lm_studio_fallback_id=self._validator_lm_studio_fallback,
                     context_window=self._validator_context,
-                    max_output_tokens=self._validator_max_tokens
+                    max_output_tokens=self._validator_max_tokens,
+                    supercharge_enabled=self._validator_supercharge_enabled
                 )
             )
             
@@ -4944,7 +5583,12 @@ async def _check_paper_redundancy(self) -> None:
         
         if result and result.should_remove and result.paper_id:
             # Execute removal
-            success = await self._redundancy_checker.execute_removal(result.paper_id)
+            success = await self._redundancy_checker.execute_removal(
+                result.paper_id,
+                reason=result.reasoning,
+            )
+            if success:
+                await autonomous_rag_manager.remove_paper_from_rag(result.paper_id)
             
             await self._broadcast("paper_redundancy_review", {
                 "should_remove": True,
@@ -5829,16 +6473,24 @@ async def _compile_tier3_paper(
                 # Pass OpenRouter provider configs for all compiler roles
                 validator_provider=self._validator_provider,
                 validator_openrouter_provider=self._validator_openrouter_provider,
+                validator_openrouter_reasoning_effort=self._validator_openrouter_reasoning_effort,
                 validator_lm_studio_fallback=self._validator_lm_studio_fallback,
                 high_context_provider=self._high_context_provider,
                 high_context_openrouter_provider=self._high_context_openrouter_provider,
+                high_context_openrouter_reasoning_effort=self._high_context_openrouter_reasoning_effort,
                 high_context_lm_studio_fallback=self._high_context_lm_studio_fallback,
                 high_param_provider=self._high_param_provider,
                 high_param_openrouter_provider=self._high_param_openrouter_provider,
+                high_param_openrouter_reasoning_effort=self._high_param_openrouter_reasoning_effort,
                 high_param_lm_studio_fallback=self._high_param_lm_studio_fallback,
                 critique_submitter_provider=self._critique_submitter_provider,
                 critique_submitter_openrouter_provider=self._critique_submitter_openrouter_provider,
-                critique_submitter_lm_studio_fallback=self._critique_submitter_lm_studio_fallback
+                critique_submitter_openrouter_reasoning_effort=self._critique_submitter_openrouter_reasoning_effort,
+                critique_submitter_lm_studio_fallback=self._critique_submitter_lm_studio_fallback,
+                validator_supercharge_enabled=self._validator_supercharge_enabled,
+                high_context_supercharge_enabled=self._high_context_supercharge_enabled,
+                high_param_supercharge_enabled=self._high_param_supercharge_enabled,
+                critique_submitter_supercharge_enabled=self._critique_submitter_supercharge_enabled
             )
             
             # Set WebSocket broadcaster
@@ -6137,6 +6789,7 @@ def safe_rmtree(path: Path, max_retries: int = 5) -> bool:
         self._last_redundancy_check_at = 0
         self._last_completion_review_at = 0
         self._manual_paper_writing_triggered = False
+        self._brainstorm_hard_limit_triggered = False
         self._force_tier3_after_paper = False
         self._force_tier3_immediate = False
         self._tier3_active = False
diff --git a/backend/autonomous/core/autonomous_rag_manager.py b/backend/autonomous/core/autonomous_rag_manager.py
index dfabcb6..548f9ab 100644
--- a/backend/autonomous/core/autonomous_rag_manager.py
+++ b/backend/autonomous/core/autonomous_rag_manager.py
@@ -222,6 +222,10 @@ async def get_reference_papers_context(
         for paper_id in paper_ids:
             content = await paper_library.get_paper_content(paper_id, strip_proofs=True)
             metadata = await paper_library.get_metadata(paper_id)
+
+            if metadata and metadata.status != "complete":
+                logger.info(f"Skipping non-complete reference paper {paper_id} ({metadata.status})")
+                continue
             
             if content and metadata:
                 paper_tokens = count_tokens(content)
@@ -523,6 +527,20 @@ async def remove_brainstorm_from_rag(self, topic_id: str) -> None:
             except Exception as e:
                 logger.error(f"Failed to remove brainstorm {topic_id} from RAG: {e}")
 
+    async def remove_paper_from_rag(self, paper_id: str) -> None:
+        """Forget *paper_id* locally, then try to delete each RAG document name it may use."""
+        self._papers_indexed.discard(paper_id)
+        # One paper id can map to three source names; each spelling is attempted
+        # on its own so a failure on one does not stop the others.
+        name_templates = ("reference_paper_{}", "reference_paper_{}.txt", "prior_paper_{}.txt")
+        for template in name_templates:
+            rag_source = template.format(paper_id)
+            try:
+                await rag_manager.remove_document(rag_source)
+                logger.info(f"Removed pruned paper RAG source {rag_source}")
+            except Exception as err:
+                logger.debug(f"Reference paper RAG source {rag_source} not removed: {err}")
+
 
 # Global instance
 autonomous_rag_manager = AutonomousRAGManager()
diff --git a/backend/autonomous/core/proof_novelty.py b/backend/autonomous/core/proof_novelty.py
index 573d538..4b4cf6f 100644
--- a/backend/autonomous/core/proof_novelty.py
+++ b/backend/autonomous/core/proof_novelty.py
@@ -21,7 +21,13 @@
 
 
 VALID_NOVELTY_TIERS = frozenset(
-    {"not_novel", "novel_formulation", "novel_variant", "mathematical_discovery"}
+    {
+        "not_novel",
+        "novel_formulation",
+        "novel_variant",
+        "mathematical_discovery",
+        "major_mathematical_discovery",
+    }
 )
 
 
@@ -37,7 +43,7 @@ async def assess_proof_novelty(
     task_id: str,
     role_id: str = "autonomous_proof_novelty",
 ) -> Tuple[str, str]:
-    """Classify a Lean-4-verified theorem into one of four novelty tiers.
+    """Classify a Lean-4-verified theorem into one of five novelty tiers.
 
     Args:
         user_prompt: Top-level research prompt for context.
@@ -55,7 +61,8 @@ async def assess_proof_novelty(
 
     Returns:
         Tuple of (novelty_tier, reasoning) where novelty_tier is one of:
-        "not_novel", "novel_formulation", "novel_variant", "mathematical_discovery".
+        "not_novel", "novel_formulation", "novel_variant",
+        "mathematical_discovery", "major_mathematical_discovery".
         Falls back to ("not_novel", <message>) when the validator returns no
         usable response or an unrecognised tier string.
     """
diff --git a/backend/autonomous/core/proof_registration.py b/backend/autonomous/core/proof_registration.py
new file mode 100644
index 0000000..ab02d8f
--- /dev/null
+++ b/backend/autonomous/core/proof_registration.py
@@ -0,0 +1,216 @@
+"""
+Shared registration for Lean-verified proofs.
+
+Callers that already have Lean-accepted code use this module to classify the
+proof with the validator novelty prompt and store the resulting ProofRecord in
+the central proof database.
+"""
+from __future__ import annotations
+
+import logging
+from dataclasses import dataclass
+from typing import Any, Awaitable, Callable, Optional
+
+from backend.autonomous.core.proof_novelty import assess_proof_novelty
+from backend.shared.models import ProofAttemptFeedback, ProofDependency, ProofRecord
+
+logger = logging.getLogger(__name__)
+
+BroadcastFn = Optional[Callable[[str, dict[str, Any]], Awaitable[None]]]
+
+
+@dataclass
+class RegisteredProof:
+    """Result of registering or reusing a verified proof record."""
+    # record: the stored ProofRecord, or the pre-existing one when a duplicate was found.
+    record: ProofRecord
+    duplicate: bool = False  # True when an already-stored proof was returned instead
+
+
+def _normalize_for_duplicate_check(value: str) -> str:
+    return "\n".join((value or "").strip().splitlines())  # trim both ends; rejoin lines with "\n"
+
+
+async def _find_existing_proof(
+    proof_database,
+    *,
+    source_type: str,
+    source_id: str,
+    theorem_statement: str,
+    lean_code: str,
+) -> Optional[ProofRecord]:
+    """Find a stored proof matching this source, statement, and Lean code; None if absent."""
+    def _squash(text: str) -> str:
+        return " ".join((text or "").split())  # collapse every whitespace run to one space
+
+    wanted_statement = _squash(theorem_statement)
+    wanted_code = _normalize_for_duplicate_check(lean_code)
+    try:
+        for stored in await proof_database.get_all_proofs():
+            same_source = stored.source_type == source_type and stored.source_id == source_id
+            matches = same_source and _squash(stored.theorem_statement) == wanted_statement
+            if matches and _normalize_for_duplicate_check(stored.lean_code) == wanted_code:
+                return stored
+    except Exception as exc:  # best-effort lookup: any failure is logged and reads as "no match"
+        logger.debug("Existing proof lookup failed for %s %s: %s", source_type, source_id, exc)
+    return None
+
+
+async def _broadcast_registered_proof(
+    *,
+    broadcast_fn: BroadcastFn,
+    record: ProofRecord,
+    base_event: Optional[dict[str, Any]],
+    proof_label: str = "",
+    retry_origin_source_id: str = "",
+) -> None:
+    """Announce a newly stored proof; the event name depends on whether the record is novel."""
+    if not broadcast_fn:
+        return
+
+    # Record-derived fields are merged after base_event, so they take
+    # precedence whenever both define the same key.
+    record_fields: dict[str, Any] = {
+        "proof_id": record.proof_id,
+        "theorem_statement": record.theorem_statement,
+        "solver": record.solver,
+        "novelty_tier": record.novelty_tier,
+        "retry_origin_source_id": retry_origin_source_id,
+    }
+    if proof_label:
+        record_fields["proof_label"] = proof_label
+
+    event_name = "novel_proof_discovered" if record.novel else "known_proof_verified"
+    await broadcast_fn(event_name, {**(base_event or {}), **record_fields})
+
+
+async def _broadcast_duplicate_proof(
+    *,
+    broadcast_fn: BroadcastFn,
+    record: ProofRecord,
+    base_event: Optional[dict[str, Any]],
+    proof_label: str = "",
+) -> None:
+    """Emit proof_registration_duplicate describing the already-stored *record*."""
+    if not broadcast_fn:
+        return
+    record_fields: dict[str, Any] = {
+        "proof_id": record.proof_id,
+        "theorem_statement": record.theorem_statement,
+        "solver": record.solver,
+        "novelty_tier": record.novelty_tier,
+        "duplicate": True,
+    }
+    if proof_label:
+        record_fields["proof_label"] = proof_label
+    await broadcast_fn("proof_registration_duplicate", {**(base_event or {}), **record_fields})
+
+
+async def register_verified_lean_proof(
+    *,
+    proof_database,
+    user_prompt: str,
+    theorem_statement: str,
+    lean_code: str,
+    validator_model: str,
+    validator_context: int,
+    validator_max_tokens: int,
+    task_id: str,
+    role_id: str,
+    source_type: str,
+    source_id: str,
+    source_title: str = "",
+    theorem_id: str = "",
+    theorem_name: str = "",
+    formal_sketch: str = "",
+    solver: str = "Lean 4",
+    verification_notes: str = "Lean 4 accepted the submitted proof.",
+    attempt_count: int = 0,
+    attempts: Optional[list[ProofAttemptFeedback]] = None,
+    dependencies: Optional[list[ProofDependency]] = None,
+    solver_hints: Optional[list[str]] = None,
+    broadcast_fn: BroadcastFn = None,
+    base_event: Optional[dict[str, Any]] = None,
+    proof_label: str = "",
+    retry_origin_source_id: str = "",
+) -> RegisteredProof:
+    """
+    Classify and store Lean-verified proof code using the shared novelty tiers.
+
+    A stored record with the same source type/id, theorem statement, and Lean
+    code is returned as-is (duplicate=True) and no novelty API call is made.
+    Otherwise the proof is classified, stored, and announced via broadcast_fn.
+    """
+    existing = await _find_existing_proof(
+        proof_database,
+        source_type=source_type,
+        source_id=source_id,
+        theorem_statement=theorem_statement,
+        lean_code=lean_code,
+    )
+    if existing is not None:
+        await _broadcast_duplicate_proof(
+            broadcast_fn=broadcast_fn,
+            record=existing,
+            base_event=base_event,
+            proof_label=proof_label,
+        )
+        return RegisteredProof(record=existing, duplicate=True)
+
+    existing_novel_proofs = proof_database.get_novel_proofs_for_injection()
+    novelty_tier, novelty_reasoning = await assess_proof_novelty(
+        user_prompt=user_prompt,
+        theorem_statement=theorem_statement,
+        lean_code=lean_code,
+        validator_model=validator_model,
+        validator_context=validator_context,
+        validator_max_tokens=validator_max_tokens,
+        existing_novel_proofs=existing_novel_proofs,
+        task_id=task_id,
+        role_id=role_id,
+    )
+    is_novel = novelty_tier != "not_novel"  # every other tier marks the record as novel
+
+    record = ProofRecord(
+        proof_id="",  # NOTE(review): presumably assigned by the database on insert - confirm
+        theorem_id=theorem_id,
+        theorem_statement=theorem_statement,
+        theorem_name=theorem_name,
+        formal_sketch=formal_sketch,
+        source_type=source_type,
+        source_id=source_id,
+        source_title=source_title,
+        solver=solver,
+        lean_code=lean_code,
+        novel=is_novel,
+        novelty_tier=novelty_tier,
+        novelty_reasoning=novelty_reasoning,
+        verification_notes=verification_notes,
+        attempt_count=attempt_count,
+        attempts=list(attempts or []),
+        dependencies=list(dependencies or []),
+        solver_hints=list(solver_hints or []),
+    )
+    if hasattr(proof_database, "add_proof_if_absent"):  # use the duplicate-reporting insert if offered
+        stored, duplicate = await proof_database.add_proof_if_absent(record)
+    else:  # fallback for databases that only expose add_proof()
+        stored = await proof_database.add_proof(record)
+        duplicate = stored.proof_id != record.proof_id and record.proof_id != ""
+
+    if duplicate:
+        await _broadcast_duplicate_proof(
+            broadcast_fn=broadcast_fn,
+            record=stored,
+            base_event=base_event,
+            proof_label=proof_label,
+        )
+        return RegisteredProof(record=stored, duplicate=True)
+
+    await _broadcast_registered_proof(
+        broadcast_fn=broadcast_fn,
+        record=stored,
+        base_event=base_event,
+        proof_label=proof_label,
+        retry_origin_source_id=retry_origin_source_id,
+    )
+    return RegisteredProof(record=stored, duplicate=False)
diff --git a/backend/autonomous/core/proof_verification_stage.py b/backend/autonomous/core/proof_verification_stage.py
index c19178c..bd0e19a 100644
--- a/backend/autonomous/core/proof_verification_stage.py
+++ b/backend/autonomous/core/proof_verification_stage.py
@@ -15,8 +15,15 @@
 from backend.autonomous.agents.proof_identification_agent import ProofIdentificationAgent
 from backend.autonomous.memory.brainstorm_memory import brainstorm_memory
 from backend.autonomous.memory.paper_library import paper_library
+from backend.autonomous.core.proof_registration import register_verified_lean_proof
+from backend.aggregator.prompts.validator_prompts import build_validator_prompt
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.brainstorm_proof_gate import BRAINSTORM_LEAN_PROOF_MARKER
 from backend.shared.config import system_config
-from backend.shared.models import ProofAttemptFeedback, ProofAttemptResult, ProofCandidate, ProofRecord, ProofStageResult, SmtHint
+from backend.shared.json_parser import parse_json
+from backend.shared.lean_proof_integrity import validate_full_lean_proof_integrity
+from backend.shared.model_error_utils import is_non_retryable_model_error
+from backend.shared.models import ProofAttemptFeedback, ProofAttemptResult, ProofCandidate, ProofStageResult, SmtHint
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.smt_client import get_smt_client
 from .proof_dependency_extractor import ProofDependencyExtractor
@@ -32,6 +39,7 @@
 class _LeanVerificationOutcome:
     """Outcome of a single candidate's Lean 4 formalization pipeline (Phase A)."""
     candidate: ProofCandidate
+    proof_label: str
     success: bool
     theorem_name: str
     lean_code: str
@@ -46,6 +54,7 @@ class ProofVerificationStage:
 
     def __init__(self) -> None:
         self._novelty_task_sequence = 0
+        self._integrity_task_sequence = 0
         self._dependency_extractor = ProofDependencyExtractor()
 
     @classmethod
@@ -136,6 +145,22 @@ def _summarize_error(error_text: str, limit: int = 500) -> str:
         cleaned = " ".join(raw.split())
         return cleaned[:limit] + ("..." if len(cleaned) > limit else "")
 
+    @staticmethod
+    def _proof_label_for_index(index: int) -> str:
+        """Map a 1-based index to a repeated-letter label: A..Z, then AA, BB..ZZ, then AAA.."""
+        zero_based = max(1, int(index or 1)) - 1  # falsy or sub-1 indexes are treated as 1
+        # The quotient is the number of extra repetitions; the remainder picks the letter.
+        extra_repeats, letter_offset = divmod(zero_based, 26)
+        return chr(ord("A") + letter_offset) * (extra_repeats + 1)
+
+    def _lean_response_summary(self, feedback: ProofAttemptFeedback) -> str:
+        """Render a Lean attempt outcome as one sentence, including the condensed error if any."""
+        if not feedback.success:
+            error_summary = self._summarize_error(feedback.error_output, limit=960)
+            bare = "Lean 4 response: proof not verified."
+            return f"Lean 4 response: {error_summary} - proof not verified." if error_summary else bare
+        return "Lean 4 response: proof verified."
+
     @staticmethod
     def _extract_suggested_lemma_targets(error_text: str) -> list[str]:
         targets: list[str] = []
@@ -245,6 +270,7 @@ async def _run_smt_check(
         source_id: str,
         base_event: dict[str, Any],
         candidate: ProofCandidate,
+        proof_label: str,
         source_content: str,
         identification_agent: ProofIdentificationAgent,
         broadcast_fn: BroadcastFn,
@@ -252,16 +278,6 @@ async def _run_smt_check(
         if not system_config.smt_enabled or not self._is_smt_amenable(candidate):
             return None
 
-        await self._broadcast(
-            broadcast_fn,
-            "smt_check_started",
-            {
-                **base_event,
-                "theorem_id": candidate.theorem_id,
-                "theorem_statement": candidate.statement,
-            },
-        )
-
         started_at = time.monotonic()
         result_name = "unknown"
         try:
@@ -288,49 +304,23 @@ async def _run_smt_check(
                 z3_output=z3_raw[:2000],
             )
         except Exception as exc:
+            if is_non_retryable_model_error(exc):
+                raise
             logger.debug("SMT check failed for theorem %s in %s %s: %s", candidate.theorem_id, source_type, source_id, exc)
-            return SmtHint(result="unknown", suggested_tactics=[], smtlib="")
-        finally:
             elapsed_ms = int((time.monotonic() - started_at) * 1000)
             await self._broadcast(
                 broadcast_fn,
-                "smt_check_complete",
+                "smt_check_error",
                 {
                     **base_event,
                     "theorem_id": candidate.theorem_id,
                     "theorem_statement": candidate.statement,
-                    "result": result_name,
+                    "proof_label": proof_label,
+                    "error_summary": self._summarize_error(str(exc), limit=960),
                     "elapsed_ms": elapsed_ms,
                 },
             )
-
-    async def _assess_novelty(
-        self,
-        *,
-        user_prompt: str,
-        theorem_statement: str,
-        lean_code: str,
-        validator_model: str,
-        validator_context: int,
-        validator_max_tokens: int,
-        existing_novel_proofs: str,
-    ) -> tuple[str, str]:
-        from .proof_novelty import assess_proof_novelty
-
-        task_id = f"proof_novelty_{self._novelty_task_sequence:03d}"
-        self._novelty_task_sequence += 1
-
-        return await assess_proof_novelty(
-            user_prompt=user_prompt,
-            theorem_statement=theorem_statement,
-            lean_code=lean_code,
-            validator_model=validator_model,
-            validator_context=validator_context,
-            validator_max_tokens=validator_max_tokens,
-            existing_novel_proofs=existing_novel_proofs,
-            task_id=task_id,
-            role_id="autonomous_proof_novelty",
-        )
+            return SmtHint(result="unknown", suggested_tactics=[], smtlib="")
 
     async def _resolve_candidates(
         self,
@@ -377,6 +367,103 @@ async def _prepare_candidate(
             candidate = candidate.model_copy(update={"relevant_lemmas": relevant_lemmas})
         return candidate
 
+    @staticmethod
+    def _format_verified_proof_for_brainstorm_validation(
+        *,
+        theorem_statement: str,
+        formal_sketch: str,
+        lean_code: str,
+        attempt_count: int,
+    ) -> str:
+        """Build the submission text the brainstorm validator sees for one Lean-accepted proof."""
+        # Formalization notes form an optional block (blank line + notes) that is
+        # spliced in after the theorem statement only when notes were provided.
+        notes_block = ["", f"Formalization notes: {formal_sketch}"] if formal_sketch else []
+        lines = [
+            BRAINSTORM_LEAN_PROOF_MARKER,
+            "",
+            "Lean 4 has accepted the following proof. Decide whether it is useful, non-redundant brainstorm progress before it is appended to the brainstorm database.",
+            "",
+            f"Theorem statement: {theorem_statement}",
+            *notes_block,
+            "",
+            f"Lean verification: accepted after {attempt_count} attempt{'s' if attempt_count != 1 else ''}.",
+            "",
+            "Lean 4 code:",
+            "```lean",
+            lean_code,
+            "```",
+        ]
+        # Empty entries become blank lines; outer whitespace is trimmed at the end.
+        return "\n".join(lines).strip()
+
+    async def _validate_brainstorm_verified_proof_addition(
+        self,
+        *,
+        user_prompt: str,
+        source_content: str,
+        proof_submission: str,
+        validator_model: str,
+        validator_context: int,
+        validator_max_tokens: int,
+        task_id: str,
+        role_id: str,
+        broadcast_fn: BroadcastFn,
+        base_event: dict[str, Any],
+    ) -> bool:
+        """Run the brainstorm usefulness gate on a verified proof; True only on an 'accept' decision."""
+        # The brainstorm context is capped at its first 24000 characters. One slice
+        # replaces the former halving loop, which always ended at this same prefix.
+        context = (source_content or "")[:24000]
+        prompt = build_validator_prompt(
+            user_prompt=user_prompt,
+            submission_content=proof_submission,
+            context=f"CURRENT BRAINSTORM DATABASE:\n{context}",
+        )
+        try:
+            response = await api_client_manager.generate_completion(
+                task_id=task_id,
+                role_id=role_id,
+                model=validator_model,
+                messages=[{"role": "user", "content": prompt}],
+                max_tokens=validator_max_tokens,
+                temperature=0.0,
+            )
+            if not response or not response.get("choices"):
+                raise ValueError("Proof brainstorm validator returned no choices.")
+            message = response["choices"][0].get("message", {})
+            content = message.get("content") or message.get("reasoning") or ""
+            raw = parse_json(content)
+            if isinstance(raw, list):  # a JSON array: only its first element is considered
+                raw = raw[0] if raw else {}
+            if not isinstance(raw, dict):  # anything else unusable reads as "no decision"
+                raw = {}
+            accepted = str(raw.get("decision") or "").strip().lower() == "accept"
+            await self._broadcast(
+                broadcast_fn,
+                "proof_brainstorm_validation_complete",
+                {
+                    **base_event,
+                    "accepted": accepted,
+                    "reasoning": str(raw.get("reasoning") or raw.get("summary") or ""),
+                },
+            )
+            return accepted
+        except Exception as exc:
+            if is_non_retryable_model_error(exc):  # these errors propagate to the caller
+                raise
+            logger.warning("Verified brainstorm proof usefulness validation failed: %s", exc)
+            await self._broadcast(
+                broadcast_fn,
+                "proof_brainstorm_validation_complete",
+                {
+                    **base_event,
+                    "accepted": False,
+                    "reasoning": f"Validator failed before producing a usable decision: {exc}",
+                },
+            )
+            return False
+
     async def run(
         self,
         content: str,
@@ -397,6 +484,7 @@ async def run(
         trigger: str = "automatic",
         source_reserved: bool = False,
         should_stop: ShouldStopFn = None,
+        append_to_source: bool = True,
     ) -> ProofStageResult:
         """Run proof identification, formalization, Lean 4 checking, and novelty review."""
         result = ProofStageResult(source_type=source_type, source_id=source_id)
@@ -488,18 +576,22 @@ def _stop_requested() -> bool:
                 {
                     **base_event,
                     "count": len(resolved_candidates),
-                    "theorems_preview": [candidate.statement[:180] for candidate in resolved_candidates],
+                    "theorems_preview": [
+                        f"Proof {self._proof_label_for_index(index)}: {candidate.statement[:180]}"
+                        for index, candidate in enumerate(resolved_candidates, start=1)
+                    ],
                 },
             )
 
             max_parallel = max(1, int(getattr(system_config, "proof_max_parallel_candidates", 6) or 1))
             semaphore = asyncio.Semaphore(max_parallel)
 
-            async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOutcome:
+            async def run_phase_a(theorem_candidate: ProofCandidate, proof_label: str) -> _LeanVerificationOutcome:
                 async with semaphore:
                     if _stop_requested():
                         return _LeanVerificationOutcome(
                             candidate=theorem_candidate,
+                            proof_label=proof_label,
                             success=False,
                             theorem_name="",
                             lean_code="",
@@ -508,6 +600,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                     return await self._run_lean_pipeline_for_candidate(
                         theorem_candidate=theorem_candidate,
                         base_event=base_event,
+                        proof_label=proof_label,
                         user_prompt=user_prompt,
                         source_type=source_type,
                         source_id=source_id,
@@ -523,8 +616,8 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                     )
 
             verification_tasks = [
-                asyncio.create_task(run_phase_a(candidate))
-                for candidate in resolved_candidates
+                asyncio.create_task(run_phase_a(candidate, self._proof_label_for_index(index)))
+                for index, candidate in enumerate(resolved_candidates, start=1)
             ]
 
             pending_tasks = set(verification_tasks)
@@ -586,6 +679,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                         break
 
                     candidate = outcome.candidate
+                    proof_label = outcome.proof_label
                     attempts = outcome.attempts
                     lean_code = outcome.lean_code
 
@@ -614,44 +708,118 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                         )
                         continue
 
-                    result.verified_count += 1
-                    existing_novel_proofs = novel_proofs_db.get_novel_proofs_for_injection()
-                    novelty_tier, novelty_reasoning = await self._assess_novelty(
+                    integrity_task_id = f"proof_integrity_{self._integrity_task_sequence:03d}"
+                    self._integrity_task_sequence += 1
+                    integrity = await validate_full_lean_proof_integrity(
                         user_prompt=user_prompt,
                         theorem_statement=candidate.statement,
+                        formal_sketch=candidate.formal_sketch,
                         lean_code=lean_code,
+                        source_excerpt=candidate.source_excerpt or content,
+                        allowed_baseline="",
                         validator_model=validator_model,
                         validator_context=validator_context,
                         validator_max_tokens=validator_max_tokens,
-                        existing_novel_proofs=existing_novel_proofs,
+                        task_id=integrity_task_id,
+                        role_id="autonomous_proof_novelty",
+                        require_statement_alignment=True,
                     )
-                    is_novel = novelty_tier != "not_novel"
+                    if not integrity.valid:
+                        integrity_feedback = ProofAttemptFeedback(
+                            attempt=(attempts[-1].attempt + 1 if attempts else 1),
+                            theorem_id=candidate.theorem_id,
+                            reasoning="Post-Lean proof integrity check failed.",
+                            lean_code=lean_code,
+                            error_output=integrity.reason,
+                            strategy="full_script",
+                            success=False,
+                        )
+                        attempts = list(attempts) + [integrity_feedback]
+                        error_summary = self._summarize_error(integrity.reason)
+                        suggested_targets = self._extract_suggested_lemma_targets(integrity.reason)
+                        if source_type == "brainstorm" and trigger != "retry":
+                            await novel_proofs_db.record_failed_candidate(
+                                source_id,
+                                candidate,
+                                error_summary,
+                                suggested_lemma_targets=suggested_targets,
+                            )
+                        await self._broadcast(
+                            broadcast_fn,
+                            "proof_integrity_rejected",
+                            {
+                                **base_event,
+                                "theorem_id": candidate.theorem_id,
+                                "theorem_statement": candidate.statement,
+                                "proof_label": proof_label,
+                                "category": integrity.category,
+                                "reason": integrity.reason,
+                            },
+                        )
+                        result.results.append(
+                            ProofAttemptResult(
+                                theorem_id=candidate.theorem_id,
+                                theorem_statement=candidate.statement,
+                                lean_code=lean_code,
+                                success=False,
+                                novel=False,
+                                attempts_used=len(attempts),
+                                error_summary=error_summary,
+                            )
+                        )
+                        continue
+
+                    novelty_task_id = f"proof_novelty_{self._novelty_task_sequence:03d}"
+                    self._novelty_task_sequence += 1
 
                     solver_hints = []
                     if self._first_attempt_used_smt_hint(attempts, candidate.smt_hint):
                         solver_hints.append("smt-z3")
 
-                    proof_record = ProofRecord(
-                        proof_id="",
-                        theorem_id=candidate.theorem_id,
+                    registration = await register_verified_lean_proof(
+                        proof_database=novel_proofs_db,
+                        user_prompt=user_prompt,
                         theorem_statement=candidate.statement,
-                        theorem_name=outcome.theorem_name,
-                        formal_sketch=candidate.formal_sketch,
+                        lean_code=lean_code,
+                        validator_model=validator_model,
+                        validator_context=validator_context,
+                        validator_max_tokens=validator_max_tokens,
+                        task_id=novelty_task_id,
+                        role_id="autonomous_proof_novelty",
                         source_type=source_type,
                         source_id=source_id,
                         source_title=source_title,
+                        theorem_id=candidate.theorem_id,
+                        theorem_name=outcome.theorem_name,
+                        formal_sketch=candidate.formal_sketch,
                         solver="Lean 4",
-                        lean_code=lean_code,
-                        novel=is_novel,
-                        novelty_tier=novelty_tier,
-                        novelty_reasoning=novelty_reasoning,
                         verification_notes="Lean 4 accepted the submitted proof.",
                         attempt_count=len(attempts),
                         attempts=attempts,
-                        dependencies=[],
                         solver_hints=solver_hints,
+                        broadcast_fn=broadcast_fn,
+                        base_event=base_event,
+                        proof_label=proof_label,
+                        retry_origin_source_id=candidate.origin_source_id,
+                    )
+                    stored_record = registration.record
+                    is_novel = stored_record.novel
+                    novelty_tier = stored_record.novelty_tier
+                    result.verified_count += 1
+
+                    await self._broadcast(
+                        broadcast_fn,
+                        "proof_verified",
+                        {
+                            **base_event,
+                            "proof_id": stored_record.proof_id,
+                            "theorem_id": candidate.theorem_id,
+                            "theorem_statement": candidate.statement,
+                            "proof_label": proof_label,
+                            "strategy": attempts[-1].strategy if attempts else "full_script",
+                            "retry_origin_source_id": candidate.origin_source_id,
+                        },
                     )
-                    stored_record = await novel_proofs_db.add_proof(proof_record)
 
                     # Dependency extraction runs in Phase B so later candidates
                     # in the same paper can see earlier proofs. We instantiate
@@ -687,6 +855,7 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                                     **base_event,
                                     "proof_id": stored_record.proof_id,
                                     "theorem_name": stored_record.theorem_name,
+                                    "proof_label": proof_label,
                                     "dependencies": [
                                         dependency.model_dump(mode="json")
                                         for dependency in dependencies
@@ -707,43 +876,44 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
                             stored_record.proof_id,
                         )
 
-                    if is_novel:
+                    if is_novel and not registration.duplicate:
                         result.novel_count += 1
                         # Novel proofs are appended to their source document so the
                         # paper/brainstorm they came from retains a record of them.
                         # They are also stored in ProofDatabase and direct-injected
                         # into all prompts via inject_into_prompt().
-                        if source_type == "brainstorm":
-                            await brainstorm_memory.append_proofs_section(source_id, stored_record)
-                        elif source_type == "paper":
+                        if append_to_source and source_type == "brainstorm":
+                            validator_accepted = await self._validate_brainstorm_verified_proof_addition(
+                                user_prompt=user_prompt,
+                                source_content=content,
+                                proof_submission=self._format_verified_proof_for_brainstorm_validation(
+                                    theorem_statement=candidate.statement,
+                                    formal_sketch=candidate.formal_sketch,
+                                    lean_code=lean_code,
+                                    attempt_count=len(attempts),
+                                ),
+                                validator_model=validator_model,
+                                validator_context=validator_context,
+                                validator_max_tokens=validator_max_tokens,
+                                task_id=f"proof_brainstorm_val_{self._novelty_task_sequence:03d}",
+                                role_id="autonomous_proof_novelty",
+                                broadcast_fn=broadcast_fn,
+                                base_event={
+                                    **base_event,
+                                    "theorem_id": candidate.theorem_id,
+                                    "theorem_statement": candidate.statement,
+                                    "proof_id": stored_record.proof_id,
+                                    "proof_label": proof_label,
+                                },
+                            )
+                            if validator_accepted:
+                                await brainstorm_memory.append_proofs_section(source_id, stored_record)
+                        elif append_to_source and source_type == "paper":
                             await paper_library.append_proofs_section(source_id, stored_record)
-                        await self._broadcast(
-                            broadcast_fn,
-                            "novel_proof_discovered",
-                            {
-                                **base_event,
-                                "proof_id": stored_record.proof_id,
-                                "theorem_statement": stored_record.theorem_statement,
-                                "solver": "Lean 4",
-                                "novelty_tier": novelty_tier,
-                                "retry_origin_source_id": candidate.origin_source_id,
-                            },
-                        )
-                    else:
-                        # Non-novel (known) proofs are stored in ProofDatabase only.
-                        # They are NOT appended to brainstorm/paper files to avoid
-                        # polluting compiler and RAG context with standard Lean 4 code.
-                        # They remain browsable via proof_database.get_known_proofs_summary_for_browsing().
-                        await self._broadcast(
-                            broadcast_fn,
-                            "known_proof_verified",
-                            {
-                                **base_event,
-                                "proof_id": stored_record.proof_id,
-                                "theorem_statement": stored_record.theorem_statement,
-                                "retry_origin_source_id": candidate.origin_source_id,
-                            },
-                        )
+                    # Non-novel (known) proofs are stored in ProofDatabase only.
+                    # They are NOT appended to brainstorm/paper files to avoid
+                    # polluting compiler and RAG context with standard Lean 4 code.
+                    # They remain browsable via proof_database.get_known_proofs_summary_for_browsing().
 
                     result.results.append(
                         ProofAttemptResult(
@@ -780,6 +950,8 @@ async def run_phase_a(theorem_candidate: ProofCandidate) -> _LeanVerificationOut
         except FreeModelExhaustedError:
             raise
         except Exception as exc:
+            if is_non_retryable_model_error(exc):
+                raise
             logger.error(
                 "Proof verification stage failed for %s %s: %s",
                 source_type,
@@ -809,6 +981,7 @@ async def _run_lean_pipeline_for_candidate(
         *,
         theorem_candidate: ProofCandidate,
         base_event: dict[str, Any],
+        proof_label: str,
         user_prompt: str,
         source_type: str,
         source_id: str,
@@ -861,6 +1034,7 @@ async def _run_lean_pipeline_for_candidate(
             source_id=source_id,
             base_event=base_event,
             candidate=candidate,
+            proof_label=proof_label,
             source_content=source_content,
             identification_agent=identification_agent,
             broadcast_fn=broadcast_fn,
@@ -886,6 +1060,7 @@ async def on_attempt_started(
                     **base_event,
                     "theorem_id": current_candidate.theorem_id,
                     "theorem_statement": current_candidate.statement,
+                    "proof_label": proof_label,
                     "attempt": attempt_number,
                     "strategy": strategy,
                     "retry_origin_source_id": current_candidate.origin_source_id,
@@ -896,16 +1071,21 @@ async def on_attempt_feedback(feedback, current_candidate=candidate) -> None:
             if feedback.success:
                 await self._broadcast(
                     broadcast_fn,
-                    "proof_verified",
+                    "proof_lean_accepted",
                     {
                         **base_event,
                         "theorem_id": current_candidate.theorem_id,
                         "theorem_statement": current_candidate.statement,
+                        "proof_label": proof_label,
+                        "attempt": feedback.attempt,
                         "strategy": feedback.strategy,
+                        "lean_response": self._lean_response_summary(feedback),
+                        "proof_verified": True,
                         "retry_origin_source_id": current_candidate.origin_source_id,
                     },
                 )
             else:
+                lean_response = self._lean_response_summary(feedback)
                 await self._broadcast(
                     broadcast_fn,
                     "proof_attempt_failed",
@@ -913,9 +1093,12 @@ async def on_attempt_feedback(feedback, current_candidate=candidate) -> None:
                         **base_event,
                         "theorem_id": current_candidate.theorem_id,
                         "theorem_statement": current_candidate.statement,
+                        "proof_label": proof_label,
                         "attempt": feedback.attempt,
                         "strategy": feedback.strategy,
                         "error_summary": self._summarize_error(feedback.error_output),
+                        "lean_response": lean_response,
+                        "proof_verified": False,
                         "retry_origin_source_id": current_candidate.origin_source_id,
                     },
                 )
@@ -961,12 +1144,14 @@ async def on_attempt_feedback(feedback, current_candidate=candidate) -> None:
                     **base_event,
                     "theorem_id": candidate.theorem_id,
                     "theorem_statement": candidate.statement,
+                    "proof_label": proof_label,
                     "retry_origin_source_id": candidate.origin_source_id,
                 },
             )
 
         return _LeanVerificationOutcome(
             candidate=candidate,
+            proof_label=proof_label,
             success=success,
             theorem_name=theorem_name,
             lean_code=lean_code,
diff --git a/backend/autonomous/memory/autonomous_api_logger.py b/backend/autonomous/memory/autonomous_api_logger.py
index 723857a..fb2e649 100644
--- a/backend/autonomous/memory/autonomous_api_logger.py
+++ b/backend/autonomous/memory/autonomous_api_logger.py
@@ -3,18 +3,32 @@
 Stores logs in a persistent file for viewing in the Autonomous Logs tab.
 """
 import asyncio
+import hashlib
 import json
 import logging
 import os
+from collections import deque
 from datetime import datetime
 from typing import Dict, Any, List, Optional
 from pathlib import Path
 
 from backend.shared.config import system_config
+from backend.shared.log_redaction import redact_log_text
 
 logger = logging.getLogger(__name__)
 
 
+def _payload_metadata(value: str, preview_chars: int) -> Dict[str, Any]:
+    """Build the preview/size/sha256 record describing a prompt or response payload."""
+    payload = value if value else ""
+    encoded = payload.encode("utf-8", errors="replace")
+    return {
+        "preview": redact_log_text(payload, preview_chars),
+        "size": len(payload),
+        "sha256": hashlib.sha256(encoded).hexdigest() if payload else "",
+    }
+
+
 class AutonomousAPILogger:
     """
     Logger for autonomous research API call outputs.
@@ -38,6 +52,7 @@ def __init__(self):
         
         self._initialized = True
         self._ensure_log_file()
+        self._scrub_persisted_full_payloads()
         logger.info("AutonomousAPILogger initialized")
     
     def _ensure_log_file(self) -> None:
@@ -51,6 +66,64 @@ def _ensure_log_file(self) -> None:
     def _get_log_path(self) -> Path:
         """Return the instance-scoped autonomous API log path."""
         return Path(system_config.data_dir) / "auto_api_log.txt"
+
+    def _scrub_persisted_full_payloads(self) -> None:
+        """Rewrite the on-disk JSONL log without full prompt/response bodies.
+
+        JSON-object lines lose ``prompt_full``/``response_full``; their preview
+        is re-derived via ``redact_log_text`` and size/SHA-256 filled in if
+        absent. Blank lines are dropped, other lines are kept verbatim. The file
+        is rewritten only if an entry changed; failures are logged, not raised.
+        """
+        # NOTE(review): runs even when api_log_store_full_payloads is enabled,
+        # so opted-in full payloads are dropped on the next start - confirm.
+        log_path = self._get_log_path()
+        if not log_path.exists():
+            return
+        changed = False
+        scrubbed_lines: List[str] = []
+        try:
+            with open(log_path, "r", encoding="utf-8") as f:
+                lines = f.readlines()
+            for line in lines:
+                stripped = line.strip()
+                if not stripped:
+                    continue
+                try:
+                    entry = json.loads(stripped)
+                except json.JSONDecodeError:
+                    entry = None
+                if not isinstance(entry, dict):
+                    # Valid JSON that is not an object (list, string, number)
+                    # used to abort the whole scrub; keep such lines untouched.
+                    scrubbed_lines.append(line)
+                    continue
+                original_entry = dict(entry)
+                for kind, preview_chars in (("prompt", 1000), ("response", 2000)):
+                    full = str(entry.pop(f"{kind}_full", "") or "")
+                    source = full or str(entry.get(f"{kind}_preview") or "")
+                    if not source:
+                        continue
+                    meta = _payload_metadata(source, preview_chars)
+                    entry[f"{kind}_preview"] = meta["preview"]
+                    entry[f"{kind}_size"] = int(entry.get(f"{kind}_size") or meta["size"])
+                    entry.setdefault(f"{kind}_sha256", meta["sha256"])
+                entry["prompt_redacted"] = True
+                entry["response_redacted"] = True
+                entry["has_full_prompt"] = False
+                entry["has_full_response"] = False
+                if entry.get("error"):
+                    entry["error"] = redact_log_text(entry["error"], 1000)
+                # Popping a *_full key already makes the entry differ.
+                changed = changed or entry != original_entry
+                scrubbed_lines.append(json.dumps(entry) + "\n")
+
+            if changed:
+                with open(log_path, "w", encoding="utf-8") as f:
+                    f.writelines(scrubbed_lines)
+                logger.info("Scrubbed legacy full prompt/response payloads from autonomous API log")
+        except Exception as e:
+            logger.warning(f"Failed to scrub legacy autonomous API log payloads: {e}")
     
     async def log_api_call(
         self,
@@ -64,7 +137,8 @@ async def log_api_call(
         duration_ms: Optional[float] = None,
         success: bool = True,
         error: Optional[str] = None,
-        phase: str = "unknown"
+        phase: str = "unknown",
+        workflow: str = "autonomous",
     ) -> None:
         """
         Log an autonomous research API call.
@@ -81,9 +155,14 @@ async def log_api_call(
             success: Whether the call succeeded
             error: Error message if call failed
             phase: Research phase ("topic_selection", "brainstorm", "paper_compilation", "tier3")
+            workflow: Workflow namespace for this call ("autonomous" or "leanoj")
         """
         async with self._lock:
             try:
+                prompt_meta = _payload_metadata(prompt, 1000)
+                response_meta = _payload_metadata(response_content, 2000)
+                store_full_payloads = bool(system_config.api_log_store_full_payloads)
+
                 log_entry = {
                     "timestamp": datetime.now().isoformat(),
                     "task_id": task_id,
@@ -91,15 +170,25 @@ async def log_api_call(
                     "model": model,
                     "provider": provider,
                     "phase": phase,
-                    "prompt_preview": prompt[:1000] if prompt else "",
-                    "prompt_full": prompt,
-                    "response_preview": response_content[:2000] if response_content else "",
-                    "response_full": response_content,
+                    "workflow": workflow,
+                    "prompt_preview": prompt_meta["preview"],
+                    "prompt_size": prompt_meta["size"],
+                    "prompt_sha256": prompt_meta["sha256"],
+                    "prompt_redacted": not store_full_payloads,
+                    "has_full_prompt": store_full_payloads and bool(prompt),
+                    "response_preview": response_meta["preview"],
+                    "response_size": response_meta["size"],
+                    "response_sha256": response_meta["sha256"],
+                    "response_redacted": not store_full_payloads,
+                    "has_full_response": store_full_payloads and bool(response_content),
                     "tokens_used": tokens_used,
                     "duration_ms": duration_ms,
                     "success": success,
-                    "error": error
+                    "error": redact_log_text(error, 1000)
                 }
+                if store_full_payloads:
+                    log_entry["prompt_full"] = prompt
+                    log_entry["response_full"] = response_content
                 
                 # Append to log file
                 with open(self._get_log_path(), "a", encoding="utf-8") as f:
@@ -129,7 +218,7 @@ async def _trim_log_if_needed(self) -> None:
         except Exception as e:
             logger.error(f"Failed to trim autonomous API log: {e}")
     
-    async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
+    async def get_logs(self, limit: int = 100, include_full: bool = True) -> List[Dict[str, Any]]:
         """
         Get recent autonomous API call logs.
         
@@ -146,7 +235,7 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
                     return []
                 
                 with open(log_path, "r", encoding="utf-8") as f:
-                    lines = f.readlines()
+                    lines = deque(f, maxlen=max(1, limit))
                 
                 logs = []
                 for line in lines:
@@ -154,6 +243,17 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
                     if line:
                         try:
                             log_entry = json.loads(line)
+                            if not include_full or not system_config.api_log_store_full_payloads:
+                                prompt_full = str(log_entry.pop("prompt_full", "") or "")
+                                response_full = str(log_entry.pop("response_full", "") or "")
+                                log_entry["prompt_size"] = int(log_entry.get("prompt_size") or len(prompt_full))
+                                log_entry["response_size"] = int(log_entry.get("response_size") or len(response_full))
+                                log_entry["has_full_prompt"] = False
+                                log_entry["has_full_response"] = False
+                                if prompt_full and not log_entry.get("prompt_sha256"):
+                                    log_entry["prompt_sha256"] = hashlib.sha256(prompt_full.encode("utf-8", errors="replace")).hexdigest()
+                                if response_full and not log_entry.get("response_sha256"):
+                                    log_entry["response_sha256"] = hashlib.sha256(response_full.encode("utf-8", errors="replace")).hexdigest()
                             logs.append(log_entry)
                         except json.JSONDecodeError:
                             continue
@@ -165,11 +265,49 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
             except Exception as e:
                 logger.error(f"Failed to get autonomous API logs: {e}")
                 return []
-    
-    async def clear_logs(self) -> None:
-        """Clear all autonomous API logs."""
+
+    @staticmethod
+    def _entry_workflow(entry: Dict[str, Any]) -> str:
+        """Return the entry's workflow, inferring it from ID prefixes if unset."""
+        explicit = str(entry.get("workflow") or "").strip().lower()
+        if explicit:
+            return explicit
+        # Entries without a workflow tag: a "leanoj_" role/task prefix marks
+        # the leanoj workflow; everything else counts as "autonomous".
+        ids = (str(entry.get("role_id") or ""), str(entry.get("task_id") or ""))
+        is_leanoj = any(value.startswith("leanoj_") for value in ids)
+        return "leanoj" if is_leanoj else "autonomous"
+
+    async def clear_logs(self, workflow: Optional[str] = None) -> None:
+        """Clear autonomous API logs, optionally scoped to one workflow."""
         async with self._lock:
             try:
+                if workflow:
+                    log_path = self._get_log_path()
+                    if not os.path.exists(log_path):
+                        return
+
+                    with open(log_path, "r", encoding="utf-8") as f:
+                        lines = f.readlines()
+
+                    retained_lines: List[str] = []
+                    for line in lines:
+                        stripped = line.strip()
+                        if not stripped:
+                            continue
+                        try:
+                            entry = json.loads(stripped)
+                        except json.JSONDecodeError:
+                            retained_lines.append(line)
+                            continue
+                        if self._entry_workflow(entry) != workflow:
+                            retained_lines.append(line)
+
+                    with open(log_path, "w", encoding="utf-8") as f:
+                        f.writelines(retained_lines)
+                    logger.info("Autonomous API logs cleared for workflow %s", workflow)
+                    return
+
                 with open(self._get_log_path(), "w", encoding="utf-8") as f:
                     f.write("")
                 logger.info("Autonomous API logs cleared")
diff --git a/backend/autonomous/memory/final_answer_memory.py b/backend/autonomous/memory/final_answer_memory.py
index 44b827b..b0b4d5a 100644
--- a/backend/autonomous/memory/final_answer_memory.py
+++ b/backend/autonomous/memory/final_answer_memory.py
@@ -750,6 +750,26 @@ def _get_source_papers_dir(self) -> Path:
     def _get_source_brainstorms_dir(self) -> Path:
         """Get path to source brainstorms archive directory."""
         return self._base_dir / "source_brainstorms"
+
+    def _get_archived_paper_paths(self, paper_id: str) -> Dict[str, Path]:
+        """Map each archived-paper artifact kind to its path for ``paper_id``."""
+        checked_id = validate_single_path_component(paper_id, "paper ID")
+        root = self._get_source_papers_dir()
+        suffixes = {"content": ".txt", "abstract": "_abstract.txt",
+                    "outline": "_outline.txt", "metadata": "_metadata.json"}
+        return {
+            kind: resolve_path_within_root(root, f"paper_{checked_id}{suffix}")
+            for kind, suffix in suffixes.items()
+        }
+
+    def _get_archived_brainstorm_paths(self, topic_id: str) -> Dict[str, Path]:
+        """Build the content and metadata archive paths for ``topic_id``."""
+        checked_id = validate_single_path_component(topic_id, "topic ID")
+        root = self._get_source_brainstorms_dir()
+        stem = f"brainstorm_{checked_id}"
+        content_path = resolve_path_within_root(root, f"{stem}.txt")
+        metadata_path = resolve_path_within_root(root, f"{stem}_metadata.json")
+        return {"content": content_path, "metadata": metadata_path}
     
     async def save_chapter_paper(
         self,
@@ -804,26 +824,24 @@ async def _archive_paper(self, paper_id: str) -> bool:
         try:
             source_papers_dir = self._get_source_papers_dir()
             source_papers_dir.mkdir(parents=True, exist_ok=True)
+            archive_paths = self._get_archived_paper_paths(paper_id)
             
             # Copy paper content
             content = await paper_library.get_paper_content(paper_id)
             if content:
-                paper_path = source_papers_dir / f"paper_{paper_id}.txt"
-                async with aiofiles.open(paper_path, 'w', encoding='utf-8') as f:
+                async with aiofiles.open(archive_paths["content"], 'w', encoding='utf-8') as f:
                     await f.write(content)
             
             # Copy abstract
             abstract = await paper_library.get_abstract(paper_id)
             if abstract:
-                abstract_path = source_papers_dir / f"paper_{paper_id}_abstract.txt"
-                async with aiofiles.open(abstract_path, 'w', encoding='utf-8') as f:
+                async with aiofiles.open(archive_paths["abstract"], 'w', encoding='utf-8') as f:
                     await f.write(abstract)
             
             # Copy outline
             outline = await paper_library.get_outline(paper_id)
             if outline:
-                outline_path = source_papers_dir / f"paper_{paper_id}_outline.txt"
-                async with aiofiles.open(outline_path, 'w', encoding='utf-8') as f:
+                async with aiofiles.open(archive_paths["outline"], 'w', encoding='utf-8') as f:
                     await f.write(outline)
             
             # Copy metadata
@@ -834,8 +852,7 @@ async def _archive_paper(self, paper_id: str) -> bool:
                     if isinstance(value, datetime):
                         metadata_data[key] = value.isoformat()
                 
-                metadata_path = source_papers_dir / f"paper_{paper_id}_metadata.json"
-                async with aiofiles.open(metadata_path, 'w', encoding='utf-8') as f:
+                async with aiofiles.open(archive_paths["metadata"], 'w', encoding='utf-8') as f:
                     await f.write(json.dumps(metadata_data, indent=2))
             
             logger.info(f"Archived paper {paper_id} to final answer source_papers")
@@ -860,12 +877,12 @@ async def _archive_brainstorm(self, topic_id: str) -> bool:
         try:
             source_brainstorms_dir = self._get_source_brainstorms_dir()
             source_brainstorms_dir.mkdir(parents=True, exist_ok=True)
+            archive_paths = self._get_archived_brainstorm_paths(topic_id)
             
             # Copy brainstorm database
             content = await brainstorm_memory.get_database_content(topic_id)
             if content:
-                db_path = source_brainstorms_dir / f"brainstorm_{topic_id}.txt"
-                async with aiofiles.open(db_path, 'w', encoding='utf-8') as f:
+                async with aiofiles.open(archive_paths["content"], 'w', encoding='utf-8') as f:
                     await f.write(content)
             
             # Copy metadata
@@ -876,8 +893,7 @@ async def _archive_brainstorm(self, topic_id: str) -> bool:
                     if isinstance(value, datetime):
                         metadata_data[key] = value.isoformat()
                 
-                metadata_path = source_brainstorms_dir / f"brainstorm_{topic_id}_metadata.json"
-                async with aiofiles.open(metadata_path, 'w', encoding='utf-8') as f:
+                async with aiofiles.open(archive_paths["metadata"], 'w', encoding='utf-8') as f:
                     await f.write(json.dumps(metadata_data, indent=2))
             
             logger.info(f"Archived brainstorm {topic_id} to final answer source_brainstorms")
@@ -975,11 +991,11 @@ async def get_archived_paper(self, paper_id: str) -> Optional[Dict[str, Any]]:
         Returns:
             Dictionary with paper content, abstract, outline, metadata
         """
-        source_papers_dir = self._get_source_papers_dir()
+        archive_paths = self._get_archived_paper_paths(paper_id)
         
         try:
             # Read content
-            paper_path = source_papers_dir / f"paper_{paper_id}.txt"
+            paper_path = archive_paths["content"]
             if not paper_path.exists():
                 return None
             
@@ -987,21 +1003,21 @@ async def get_archived_paper(self, paper_id: str) -> Optional[Dict[str, Any]]:
                 content = await f.read()
             
             # Read abstract
-            abstract_path = source_papers_dir / f"paper_{paper_id}_abstract.txt"
+            abstract_path = archive_paths["abstract"]
             abstract = ""
             if abstract_path.exists():
                 async with aiofiles.open(abstract_path, 'r', encoding='utf-8') as f:
                     abstract = await f.read()
             
             # Read outline
-            outline_path = source_papers_dir / f"paper_{paper_id}_outline.txt"
+            outline_path = archive_paths["outline"]
             outline = ""
             if outline_path.exists():
                 async with aiofiles.open(outline_path, 'r', encoding='utf-8') as f:
                     outline = await f.read()
             
             # Read metadata
-            metadata_path = source_papers_dir / f"paper_{paper_id}_metadata.json"
+            metadata_path = archive_paths["metadata"]
             metadata = {}
             if metadata_path.exists():
                 async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
@@ -1054,11 +1070,11 @@ async def get_archived_brainstorm(self, topic_id: str) -> Optional[Dict[str, Any
         Returns:
             Dictionary with brainstorm content and metadata
         """
-        source_brainstorms_dir = self._get_source_brainstorms_dir()
+        archive_paths = self._get_archived_brainstorm_paths(topic_id)
         
         try:
             # Read database content
-            db_path = source_brainstorms_dir / f"brainstorm_{topic_id}.txt"
+            db_path = archive_paths["content"]
             if not db_path.exists():
                 return None
             
@@ -1066,7 +1082,7 @@ async def get_archived_brainstorm(self, topic_id: str) -> Optional[Dict[str, Any
                 content = await f.read()
             
             # Read metadata
-            metadata_path = source_brainstorms_dir / f"brainstorm_{topic_id}_metadata.json"
+            metadata_path = archive_paths["metadata"]
             metadata = {}
             if metadata_path.exists():
                 async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
@@ -1390,7 +1406,7 @@ async def list_all_final_answers(self) -> List[Dict[str, Any]]:
         - word_count: Total words
         - chapter_count: Number of chapters (long form only)
         - completion_date: When it was completed
-        - location: Path to the answer
+        - location: Logical answer scope (never an absolute filesystem path)
         - session_id: Session identifier (or "legacy" for old format)
         """
         final_answers = []
@@ -1455,7 +1471,7 @@ async def list_all_final_answers(self) -> List[Dict[str, Any]]:
                             "word_count": word_count,
                             "chapter_count": chapter_count,
                             "completion_date": completion_date,
-                            "location": str(legacy_dir),
+                            "location": "legacy",
                             "session_id": "legacy"
                         })
                 except Exception as e:
@@ -1534,7 +1550,7 @@ async def list_all_final_answers(self) -> List[Dict[str, Any]]:
                             "word_count": word_count,
                             "chapter_count": chapter_count,
                             "completion_date": completion_date,
-                            "location": str(final_answer_dir),
+                            "location": session_folder.name,
                             "session_id": session_folder.name
                         })
                 except Exception as e:
@@ -1622,7 +1638,7 @@ async def get_final_answer_by_id(self, answer_id: str) -> Optional[Dict[str, Any
                     "word_count": len(full_content.split()),
                     "chapter_count": len(chapters),
                     "completion_date": completion_date,
-                    "location": str(base_dir),
+                    "location": answer_id,
                     "session_id": answer_id
                 },
                 "content": full_content,
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index 415d752..2a05597 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -36,6 +36,7 @@ def __init__(self):
         self._lock = asyncio.Lock()
         self._base_dir = Path(system_config.auto_papers_dir)
         self._archive_dir = Path(system_config.auto_papers_archive_dir)
+        self._pruned_dir = self._base_dir / "pruned"
         self._session_manager = None
     
     def set_session_manager(self, session_manager) -> None:
@@ -44,6 +45,7 @@ def set_session_manager(self, session_manager) -> None:
         if session_manager and session_manager.is_session_active:
             self._base_dir = session_manager.get_papers_dir()
             self._archive_dir = session_manager.get_papers_dir() / "archive"
+            self._pruned_dir = session_manager.get_papers_dir() / "pruned"
             logger.info(f"Paper library using session path: {self._base_dir}")
     
     async def initialize(self) -> None:
@@ -52,9 +54,11 @@ async def initialize(self) -> None:
         if self._session_manager and self._session_manager.is_session_active:
             self._base_dir = self._session_manager.get_papers_dir()
             self._archive_dir = self._base_dir / "archive"
+            self._pruned_dir = self._base_dir / "pruned"
         
         self._base_dir.mkdir(parents=True, exist_ok=True)
         self._archive_dir.mkdir(parents=True, exist_ok=True)
+        self._pruned_dir.mkdir(parents=True, exist_ok=True)
         logger.info(f"Paper library initialized at {self._base_dir}")
     
     def _safe_paper_id(self, paper_id: str) -> str:
@@ -64,6 +68,10 @@ def _safe_paper_id(self, paper_id: str) -> str:
     def _get_paper_path(self, paper_id: str) -> Path:
         """Get path to paper file."""
         return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}.txt"
+
+    def _get_pruned_paper_path(self, paper_id: str) -> Path:
+        """Locate the preserved text file of a pruned paper inside the pruned directory."""
+        return self._pruned_dir.joinpath(f"pruned_paper_{self._safe_paper_id(paper_id)}.txt")
     
     def get_paper_path(self, paper_id: str) -> str:
         """
@@ -88,23 +96,43 @@ def get_outline_path(self, paper_id: str) -> str:
     def _get_abstract_path(self, paper_id: str) -> Path:
         """Get path to abstract file."""
         return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_abstract.txt"
+
+    def _get_pruned_abstract_path(self, paper_id: str) -> Path:
+        """Locate the abstract file of a pruned paper inside the pruned directory."""
+        return self._pruned_dir.joinpath(f"pruned_paper_{self._safe_paper_id(paper_id)}_abstract.txt")
     
     def _get_source_brainstorm_path(self, paper_id: str) -> Path:
         """Get path to cached source brainstorm file."""
         return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_source_brainstorm.txt"
+
+    def _get_pruned_source_brainstorm_path(self, paper_id: str) -> Path:
+        """Locate the cached source-brainstorm file of a pruned paper inside the pruned directory."""
+        return self._pruned_dir.joinpath(f"pruned_paper_{self._safe_paper_id(paper_id)}_source_brainstorm.txt")
     
     def _get_outline_path(self, paper_id: str) -> Path:
         """Get path to paper outline file."""
         return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_outline.txt"
+
+    def _get_pruned_outline_path(self, paper_id: str) -> Path:
+        """Locate the outline file of a pruned paper inside the pruned directory."""
+        return self._pruned_dir.joinpath(f"pruned_paper_{self._safe_paper_id(paper_id)}_outline.txt")
     
     def _get_metadata_path(self, paper_id: str) -> Path:
         """Get path to paper metadata JSON file."""
         return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_metadata.json"
+
+    def _get_pruned_metadata_path(self, paper_id: str) -> Path:
+        """Locate the metadata JSON file of a pruned paper inside the pruned directory."""
+        return self._pruned_dir.joinpath(f"pruned_paper_{self._safe_paper_id(paper_id)}_metadata.json")
     
     def _get_rejections_path(self, paper_id: str) -> Path:
         """Get path to paper compiler rejections file."""
         return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_last_10_rejections.txt"
 
+    def _get_pruned_rejections_path(self, paper_id: str) -> Path:
+        """Locate the compiler-rejections file of a pruned paper inside the pruned directory."""
+        return self._pruned_dir.joinpath(f"pruned_paper_{self._safe_paper_id(paper_id)}_last_10_rejections.txt")
+
     # ========================================================================
     # HISTORY HELPERS
     # ========================================================================
@@ -115,6 +143,7 @@ def _build_scoped_library(base_dir: Path) -> "PaperLibrary":
         scoped_library = PaperLibrary()
         scoped_library._base_dir = base_dir
         scoped_library._archive_dir = base_dir / "archive"
+        scoped_library._pruned_dir = base_dir / "pruned"
         return scoped_library
 
     @staticmethod
@@ -222,6 +251,7 @@ def _format_verified_proof_entry(cls, proof: Any, source_context: str = "") -> s
         novelty_tier = str(cls._proof_value(proof, "novelty_tier", "") or "").strip()
 
         tier_labels = {
+            "major_mathematical_discovery": "Major Mathematical Discovery",
             "mathematical_discovery": "Mathematical Discovery",
             "novel_variant": "Novel Reformulation",
             "novel_formulation": "Novel Formalization",
@@ -294,9 +324,27 @@ def attach_verified_proofs_to_content(
             return before + appendix_block + after
 
         fallback_header = "=== PROOFS ATTACHED TO THIS PAPER (Lean 4 Verified) ==="
+        self_review_match = re.search(
+            r"(?:^|\n)\s*(?:#+\s*)?AI Self-Review and Limitations\s*\n",
+            existing_content,
+            re.IGNORECASE,
+        )
+
+        def insert_before_self_review(proof_block: str) -> str:
+            if not self_review_match:
+                return existing_content.rstrip() + "\n\n" + proof_block.rstrip() + "\n"
+            insert_at = self_review_match.start()
+            if insert_at > 0 and existing_content[insert_at] == "\n":
+                insert_at += 1
+            before_review = existing_content[:insert_at].rstrip()
+            review_and_after = existing_content[insert_at:].lstrip()
+            return f"{before_review}\n\n{proof_block.rstrip()}\n\n{review_and_after}"
+
         if fallback_header in existing_content:
-            return existing_content.rstrip() + "\n\n" + new_entries + "\n"
-        return existing_content.rstrip() + "\n\n" + fallback_header + "\n\n" + new_entries + "\n"
+            return insert_before_self_review(new_entries)
+
+        proof_section = f"{fallback_header}\n\n{new_entries}"
+        return insert_before_self_review(proof_section)
 
     @staticmethod
     def strip_verified_proofs_from_content(content: str) -> str:
@@ -328,40 +376,141 @@ def strip_verified_proofs_from_content(content: str) -> str:
 
         return stripped.rstrip()
 
-    async def _list_history_papers_from_directory(self, papers_dir: Path, session_id: str) -> List[Dict[str, Any]]:
-        """List complete, non-archived papers from one legacy/session papers directory."""
+    @staticmethod
+    def _pruned_banner(
+        *,
+        paper_id: str,
+        pruned_at: datetime,
+        pruned_by: str,
+        reason: str,
+    ) -> str:
+        """Compose the header text (ending in an 80-char '=' divider) that labels a preserved pruned paper."""
+        if pruned_by in {"system", "legacy"}:
+            actor_note = "The system decided autonomously that this paper hurt context cumulation."
+        else:
+            actor_note = "The user removed this paper from model context accumulation."
+        header_lines = [
+            "PRUNED PAPER - REMOVED FROM MODEL CONTEXT\n",
+            actor_note,
+            "This file is preserved for user review and download only. "
+            "It must not be used as future model context.\n",
+            f"Original Paper ID: {paper_id}",
+            f"Pruned At: {pruned_at.isoformat()}",
+            f"Pruned By: {pruned_by}",
+            f"Prune Reason: {reason or 'No reason recorded.'}",
+            "=" * 80,
+        ]
+        return "\n".join(header_lines) + "\n\n"
+
+    @staticmethod
+    def _strip_existing_pruned_banner(content: str) -> str:
+        """Return content without a leading pruned banner, if one is present.
+
+        Keeps a re-pruned paper from accumulating stacked banners.
+        """
+        if content.startswith("PRUNED PAPER - REMOVED FROM MODEL CONTEXT"):
+            _banner, divider, body = content.partition(f"{'=' * 80}\n\n")
+            return body if divider else content
+        return content
+
+    @staticmethod
+    def _metadata_to_dict(metadata: PaperMetadata) -> Dict[str, Any]:
+        """Convert metadata to a plain dict: model_dump() when the object has it, dict() otherwise."""
+        has_model_dump = hasattr(metadata, "model_dump")
+        serializer = metadata.model_dump if has_model_dump else metadata.dict
+        return serializer()
+
+    async def _read_metadata_file(self, metadata_path: Path) -> Optional[PaperMetadata]:
+        """Load PaperMetadata from a JSON file; None when the file is missing or fails to load."""
+        if metadata_path.exists():
+            try:
+                async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as handle:
+                    raw_json = await handle.read()
+                fields = json.loads(raw_json)
+                return PaperMetadata(**fields)
+            except Exception as e:
+                logger.error(f"Failed to load paper metadata from {metadata_path}: {e}")
+        return None
+
+    async def _save_metadata_to_path(self, metadata: PaperMetadata, metadata_path: Path) -> None:
+        """Write metadata as indented JSON to metadata_path, creating its parent directories first."""
+        metadata_path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(metadata_path, 'w', encoding='utf-8') as f:
+            await f.write(json.dumps(self._metadata_to_dict(metadata), indent=2, default=str))  # default=str stringifies values json cannot encode natively
+
+    async def _read_text_file(self, path: Path) -> str:
+        """Return the UTF-8 text stored at path, or "" when it is missing or cannot be read."""
+        if path.exists():
+            try:
+                async with aiofiles.open(path, 'r', encoding='utf-8') as handle:
+                    text = await handle.read()
+                return text
+            except Exception as e:
+                logger.error(f"Failed to read {path}: {e}")
+        return ""
+
+    def _pruned_note_for(self, metadata: PaperMetadata) -> str:
+        """Return the user-facing note; system/legacy prunes and archived papers get the system wording, as in the banner."""
+        if metadata.pruned_by in {"system", "legacy"} or metadata.status == "archived":
+            return "The system decided autonomously that this paper hurt context cumulation."
+        return "The user removed this paper from model context accumulation."
+
+    async def _build_history_entry(
+        self,
+        *,
+        metadata: PaperMetadata,
+        session_id: str,
+        papers_dir: Path,
+        pruned: bool = False,
+    ) -> Dict[str, Any]:
+        """Build one Stage 2 history dict from metadata; pruned=True also adds the is_pruned/pruned_* fields."""
         from backend.shared.critique_memory import get_latest_critique
 
+        latest_critique = await get_latest_critique(
+            paper_type="autonomous_paper",
+            paper_id=metadata.paper_id,
+            base_dir=papers_dir
+        )
+
+        entry = {
+            "history_id": f"{session_id}:{metadata.paper_id}",
+            "session_id": session_id,
+            "paper_id": metadata.paper_id,
+            "title": metadata.title,
+            "abstract": metadata.abstract,
+            "word_count": metadata.word_count,
+            "source_brainstorm_ids": metadata.source_brainstorm_ids,
+            "referenced_papers": metadata.referenced_papers,
+            "status": metadata.status,
+            "created_at": metadata.created_at.isoformat() if metadata.created_at else None,
+            "model_usage": metadata.model_usage,
+            "user_prompt": await self._get_history_user_prompt(session_id),  # NOTE(review): awaited on every call, so listing loops fetch it once per paper
+            "critique_avg": self._calculate_critique_average(latest_critique),
+        }
+        if pruned:
+            entry.update({
+                "is_pruned": True,
+                "pruned_at": metadata.pruned_at.isoformat() if metadata.pruned_at else None,
+                "pruned_reason": metadata.pruned_reason,
+                "pruned_by": metadata.pruned_by or ("legacy" if metadata.status == "archived" else None),  # archived records with no recorded actor are labeled "legacy"
+                "pruned_note": self._pruned_note_for(metadata),
+            })
+        return entry
+
+    async def _list_history_papers_from_directory(self, papers_dir: Path, session_id: str) -> List[Dict[str, Any]]:
+        """List history entries for papers whose status is "complete" in one legacy/session papers directory."""
         scoped_library = self._build_scoped_library(papers_dir)
-        user_prompt = await self._get_history_user_prompt(session_id)
         papers = await scoped_library.get_all_papers(validate_completeness=True)
 
         history_papers = []
         for metadata in papers:
             if metadata.status != "complete":
                 continue
-
-            latest_critique = await get_latest_critique(
-                paper_type="autonomous_paper",
-                paper_id=metadata.paper_id,
-                base_dir=papers_dir
-            )
-
-            history_papers.append({
-                "history_id": f"{session_id}:{metadata.paper_id}",
-                "session_id": session_id,
-                "paper_id": metadata.paper_id,
-                "title": metadata.title,
-                "abstract": metadata.abstract,
-                "word_count": metadata.word_count,
-                "source_brainstorm_ids": metadata.source_brainstorm_ids,
-                "referenced_papers": metadata.referenced_papers,
-                "status": metadata.status,
-                "created_at": metadata.created_at.isoformat() if metadata.created_at else None,
-                "model_usage": metadata.model_usage,
-                "user_prompt": user_prompt,
-                "critique_avg": self._calculate_critique_average(latest_critique),
-            })
+            history_papers.append(await scoped_library._build_history_entry(  # entry shape shared with the pruned listings
+                metadata=metadata,
+                session_id=session_id,
+                papers_dir=papers_dir,
+            ))
 
         return history_papers
 
@@ -389,10 +538,71 @@ async def list_history_papers(self) -> List[Dict[str, Any]]:
         history_papers.sort(key=lambda paper: paper.get("created_at") or "", reverse=True)
         return history_papers
 
+    async def _list_pruned_history_papers_from_directory(self, papers_dir: Path, session_id: str) -> List[Dict[str, Any]]:
+        """List pruned entries from papers_dir/pruned plus legacy archived entries from papers_dir/archive."""
+        scoped_library = self._build_scoped_library(papers_dir)
+        pruned_papers: List[Dict[str, Any]] = []
+
+        if scoped_library._pruned_dir.exists():
+            for metadata_path in scoped_library._pruned_dir.glob("pruned_paper_*_metadata.json"):
+                metadata = await scoped_library._read_metadata_file(metadata_path)
+                if not metadata:
+                    continue
+                metadata.status = "pruned"  # set on the in-memory object only; the file is not rewritten here
+                pruned_papers.append(await scoped_library._build_history_entry(
+                    metadata=metadata,
+                    session_id=session_id,
+                    papers_dir=papers_dir,
+                    pruned=True,
+                ))
+
+        # Legacy archived papers are exposed as pruned history for user access.
+        if scoped_library._archive_dir.exists():
+            for metadata_path in scoped_library._archive_dir.glob("paper_*_metadata.json"):
+                metadata = await scoped_library._read_metadata_file(metadata_path)
+                if not metadata:
+                    continue
+                metadata.status = "archived"
+                metadata.pruned_by = metadata.pruned_by or "legacy"  # fill defaults only when the file recorded none
+                metadata.pruned_reason = metadata.pruned_reason or "Legacy archived paper preserved as pruned history."
+                pruned_papers.append(await scoped_library._build_history_entry(
+                    metadata=metadata,
+                    session_id=session_id,
+                    papers_dir=papers_dir,
+                    pruned=True,
+                ))
+
+        return pruned_papers
+
+    async def list_pruned_history_papers(self) -> List[Dict[str, Any]]:
+        """Collect pruned Stage 2 papers from legacy and per-session storage.
+
+        Entries are ordered by pruned_at (falling back to created_at), descending.
+        """
+        # (papers directory, session id) pairs: legacy first, then sessions in reverse order.
+        sources: List[Any] = [
+            (Path(system_config.auto_papers_dir), "legacy"),
+        ]
+
+        sessions_root = Path(system_config.auto_sessions_base_dir)
+        if sessions_root.exists():
+            session_dirs = [entry for entry in sessions_root.iterdir() if entry.is_dir()]
+            session_dirs.sort(reverse=True)
+            sources += [(folder / "papers", folder.name) for folder in session_dirs]
+
+        collected: List[Dict[str, Any]] = []
+        for papers_dir, session_id in sources:
+            if not papers_dir.exists():
+                continue
+            collected += await self._list_pruned_history_papers_from_directory(papers_dir, session_id)
+
+        def recency(paper: Dict[str, Any]) -> str:
+            return paper.get("pruned_at") or paper.get("created_at") or ""
+
+        return sorted(collected, key=recency, reverse=True)
+
     async def get_history_paper(self, session_id: str, paper_id: str) -> Optional[Dict[str, Any]]:
         """Get one complete, non-archived Stage 2 paper from legacy/session history."""
-        from backend.shared.critique_memory import get_latest_critique
-
         papers_dir = self.get_history_papers_dir(session_id)
         if papers_dir is None:
             return None
@@ -407,26 +617,64 @@ async def get_history_paper(self, session_id: str, paper_id: str) -> Optional[Di
 
         content = await scoped_library.get_paper_content(paper_id)
         outline = await scoped_library.get_outline(paper_id)
-        latest_critique = await get_latest_critique(
-            paper_type="autonomous_paper",
-            paper_id=paper_id,
-            base_dir=papers_dir
+        entry = await scoped_library._build_history_entry(
+            metadata=metadata,
+            session_id=session_id,
+            papers_dir=papers_dir,
         )
 
         return {
-            "history_id": f"{session_id}:{paper_id}",
-            "session_id": session_id,
-            "paper_id": metadata.paper_id,
-            "title": metadata.title,
-            "abstract": metadata.abstract,
-            "word_count": metadata.word_count,
-            "source_brainstorm_ids": metadata.source_brainstorm_ids,
-            "referenced_papers": metadata.referenced_papers,
-            "status": metadata.status,
-            "created_at": metadata.created_at.isoformat() if metadata.created_at else None,
-            "model_usage": metadata.model_usage,
-            "user_prompt": await self._get_history_user_prompt(session_id),
-            "critique_avg": self._calculate_critique_average(latest_critique),
+            **entry,
+            "content": content,
+            "outline": outline,
+        }
+
+    async def get_pruned_history_paper(self, session_id: str, paper_id: str) -> Optional[Dict[str, Any]]:
+        """Get one pruned (or legacy archived) Stage 2 paper with content and outline; None if not found."""
+        papers_dir = self.get_history_papers_dir(session_id)
+        if papers_dir is None:
+            return None
+
+        scoped_library = self._build_scoped_library(papers_dir)
+        metadata = await scoped_library._read_metadata_file(
+            scoped_library._get_pruned_metadata_path(paper_id)
+        )
+        content_path = scoped_library._get_pruned_paper_path(paper_id)
+        outline_path = scoped_library._get_pruned_outline_path(paper_id)
+        is_legacy_archive = False
+
+        # Fallback: legacy archives used the old paper_ prefix inside archive/.
+        if metadata is None:
+            archive_metadata_path = scoped_library._archive_dir / f"paper_{scoped_library._safe_paper_id(paper_id)}_metadata.json"
+            metadata = await scoped_library._read_metadata_file(archive_metadata_path)
+            content_path = scoped_library._archive_dir / f"paper_{scoped_library._safe_paper_id(paper_id)}.txt"
+            outline_path = scoped_library._archive_dir / f"paper_{scoped_library._safe_paper_id(paper_id)}_outline.txt"
+            if metadata:
+                is_legacy_archive = True
+                metadata.status = "archived"
+                metadata.pruned_by = metadata.pruned_by or "legacy"
+                metadata.pruned_reason = metadata.pruned_reason or "Legacy archived paper preserved as pruned history."
+
+        if metadata is None:
+            return None
+
+        content = await scoped_library._read_text_file(content_path)
+        if is_legacy_archive and content and not content.startswith("PRUNED PAPER - REMOVED FROM MODEL CONTEXT"):  # banner is added to the returned text only; the archived file is not modified
+            content = scoped_library._pruned_banner(
+                paper_id=paper_id,
+                pruned_at=metadata.pruned_at or metadata.created_at or datetime.now(),
+                pruned_by=metadata.pruned_by or "legacy",
+                reason=metadata.pruned_reason or "Legacy archived paper preserved as pruned history.",
+            ) + content
+        outline = await scoped_library._read_text_file(outline_path)
+        entry = await scoped_library._build_history_entry(
+            metadata=metadata,
+            session_id=session_id,
+            papers_dir=papers_dir,
+            pruned=True,
+        )
+        return {
+            **entry,
             "content": content,
             "outline": outline,
         }
@@ -827,13 +1075,20 @@ async def get_metadata(self, paper_id: str) -> Optional[PaperMetadata]:
             logger.error(f"Failed to load metadata for {paper_id}: {e}")
             return None
     
-    async def get_all_papers(self, include_archived: bool = False, include_in_progress: bool = False, validate_completeness: bool = True) -> List[PaperMetadata]:
+    async def get_all_papers(
+        self,
+        include_archived: bool = False,
+        include_in_progress: bool = False,
+        include_pruned: bool = False,
+        validate_completeness: bool = True,
+    ) -> List[PaperMetadata]:
         """
         Get metadata for all papers.
         
         Args:
-            include_archived: If True, include archived papers
+            include_archived: If True, include legacy archived papers
             include_in_progress: If True, include papers with status="in_progress" (default False)
+            include_pruned: If True, include pruned papers from active metadata (legacy compatibility)
             validate_completeness: If True, only return papers with all required sections (default True)
         
         Returns:
@@ -852,11 +1107,10 @@ async def get_all_papers(self, include_archived: bool = False, include_in_progre
                     data = json.loads(content)
                     metadata = PaperMetadata(**data)
                     
-                    # Filter by archive status
                     if metadata.status == "archived" and not include_archived:
                         continue
-                    
-                    # Filter by in_progress status
+                    if metadata.status == "pruned" and not include_pruned:
+                        continue
                     if metadata.status == "in_progress" and not include_in_progress:
                         logger.debug(f"Skipping in_progress paper {metadata.paper_id}")
                         continue
@@ -903,8 +1157,8 @@ async def get_most_recent_incomplete_paper(self) -> Optional[PaperMetadata]:
                     data = json.loads(content)
                     metadata = PaperMetadata(**data)
                     
-                    # Skip archived papers
-                    if metadata.status == "archived":
+                    # Skip archived/pruned papers
+                    if metadata.status in {"archived", "pruned"}:
                         continue
                     
                     # Check if paper is incomplete
@@ -935,46 +1189,83 @@ async def is_paper_complete(self, paper_id: str) -> bool:
         return await self._is_paper_complete(paper_id)
     
     # ========================================================================
-    # ARCHIVE OPERATIONS
+    # PRUNE OPERATIONS
     # ========================================================================
-    
-    async def archive_paper(self, paper_id: str) -> bool:
-        """
-        Archive a paper (move to archive directory).
-        Used when paper is marked as redundant.
-        """
+
+    async def prune_paper(
+        self,
+        paper_id: str,
+        *,
+        reason: str = "",
+        pruned_by: str = "system",
+    ) -> bool:
+        """Soft-prune a paper into pruned/ behind a banner; True on success or if already pruned, else False."""
         async with self._lock:
             try:
-                # Get metadata
                 metadata = await self.get_metadata(paper_id)
                 if metadata is None:
-                    logger.error(f"Cannot archive paper {paper_id}: metadata not found")
+                    if self._get_pruned_metadata_path(paper_id).exists():
+                        logger.info(f"Paper {paper_id} is already pruned")
+                        return True
+                    logger.error(f"Cannot prune paper {paper_id}: metadata not found")
                     return False
-                
-                # Update status
-                metadata.status = "archived"
-                await self._save_metadata(metadata)
-                
-                # Move files to archive directory
+
+                self._pruned_dir.mkdir(parents=True, exist_ok=True)
+                pruned_at = datetime.now()
+                metadata.status = "pruned"
+                metadata.pruned_at = pruned_at
+                metadata.pruned_reason = reason or "No pruning reason recorded."
+                metadata.pruned_by = pruned_by if pruned_by in {"system", "user", "legacy"} else "system"
+
+                paper_path = self._get_paper_path(paper_id)
+                if paper_path.exists():
+                    # Read directly (not via _read_text_file, which maps errors to "") so a failed read aborts the prune.
+                    async with aiofiles.open(paper_path, 'r', encoding='utf-8') as f:
+                        content = await f.read()
+                    pruned_content = self._pruned_banner(
+                        paper_id=paper_id,
+                        pruned_at=pruned_at,
+                        pruned_by=metadata.pruned_by,
+                        reason=metadata.pruned_reason,
+                    ) + self._strip_existing_pruned_banner(content)
+                    async with aiofiles.open(self._get_pruned_paper_path(paper_id), 'w', encoding='utf-8') as f:
+                        await f.write(pruned_content)
+                    paper_path.unlink(missing_ok=True)
+
                 files_to_move = [
-                    (self._get_paper_path(paper_id), self._archive_dir / f"paper_{paper_id}.txt"),
-                    (self._get_abstract_path(paper_id), self._archive_dir / f"paper_{paper_id}_abstract.txt"),
-                    (self._get_outline_path(paper_id), self._archive_dir / f"paper_{paper_id}_outline.txt"),
-                    (self._get_source_brainstorm_path(paper_id), self._archive_dir / f"paper_{paper_id}_source_brainstorm.txt"),
-                    (self._get_metadata_path(paper_id), self._archive_dir / f"paper_{paper_id}_metadata.json"),
-                    (self._get_rejections_path(paper_id), self._archive_dir / f"paper_{paper_id}_last_10_rejections.txt")
+                    (self._get_abstract_path(paper_id), self._get_pruned_abstract_path(paper_id)),
+                    (self._get_outline_path(paper_id), self._get_pruned_outline_path(paper_id)),
+                    (self._get_source_brainstorm_path(paper_id), self._get_pruned_source_brainstorm_path(paper_id)),
+                    (self._get_rejections_path(paper_id), self._get_pruned_rejections_path(paper_id)),
                 ]
-                
+
                 for source, dest in files_to_move:
                     if source.exists():
+                        dest.parent.mkdir(parents=True, exist_ok=True)
                         shutil.move(str(source), str(dest))
-                
-                logger.info(f"Paper {paper_id} archived successfully")
+
+                await self._save_metadata_to_path(metadata, self._get_pruned_metadata_path(paper_id))
+                self._get_metadata_path(paper_id).unlink(missing_ok=True)
+
+                logger.info(f"Paper {paper_id} pruned successfully")
                 return True
-                
+
             except Exception as e:
-                logger.error(f"Failed to archive paper {paper_id}: {e}")
+                logger.error(f"Failed to prune paper {paper_id}: {e}")
                 return False
+
+    async def archive_paper(self, paper_id: str) -> bool:
+        """
+        Legacy compatibility wrapper around prune_paper.
+
+        Delegates with pruned_by="system" and a fixed legacy reason, and
+        returns prune_paper's result unchanged.
+        """
+        return await self.prune_paper(
+            paper_id,
+            reason="Legacy archive request treated as a pruned paper.",
+            pruned_by="system",
+        )
     
     async def get_papers_summary(self) -> List[Dict[str, Any]]:
         """
@@ -1021,24 +1312,58 @@ async def get_all_papers_with_outlines(self) -> List[Dict[str, Any]]:
         return summaries
     
     async def count_papers(self) -> Dict[str, int]:
-        """Count total, archived, in_progress, and active (complete) papers."""
-        all_papers = await self.get_all_papers(include_archived=True, include_in_progress=True, validate_completeness=False)
+        """Count total, pruned, archived, in_progress, and active (complete) papers, each record once."""
+        all_papers = await self.get_all_papers(
+            include_archived=True,
+            include_in_progress=True,
+            include_pruned=True,
+            validate_completeness=False,
+        )
         
         total = len(all_papers)
         archived = sum(1 for p in all_papers if p.status == "archived")
+        pruned = sum(1 for p in all_papers if p.status == "pruned")
         in_progress = sum(1 for p in all_papers if p.status == "in_progress")
-        active = total - archived - in_progress  # Only "complete" papers are active
+
+        # total already holds the in-place pruned/archived records from all_papers, so add
+        # only the records that were moved into pruned/ and archive/ (none counted twice).
+        moved_pruned = list(self._pruned_dir.glob("pruned_paper_*_metadata.json")) if self._pruned_dir.exists() else []
+        moved_archived = list(self._archive_dir.glob("paper_*_metadata.json")) if self._archive_dir.exists() else []
+        pruned, archived = pruned + len(moved_pruned), archived + len(moved_archived)
+        total += len(moved_pruned) + len(moved_archived)
+        active = sum(1 for p in all_papers if p.status == "complete")
         
         return {
             "total": total,
             "active": active,
             "in_progress": in_progress,
-            "archived": archived
+            "archived": archived,
+            "pruned": pruned
         }
     
     # ========================================================================
     # DELETE OPERATIONS
     # ========================================================================
+
+    async def delete_all_pruned_papers(self) -> int:
+        """Permanently delete every file in pruned/ and archive/; return the number of metadata records removed."""
+        async with self._lock:
+            deleted_count = 0
+            try:
+                for directory in (self._pruned_dir, self._archive_dir):
+                    if not directory.exists():
+                        continue
+                    # Snapshot the listing, then count a record only once its metadata file is actually gone.
+                    for path in list(directory.glob("*")):
+                        if path.is_file():
+                            path.unlink()
+                            deleted_count += int(path.match("*paper_*_metadata.json"))
+                    # Leave the directory itself in place for future prunes.
+                logger.info(f"Deleted {deleted_count} pruned/archived paper records from {self._base_dir}")
+                return deleted_count
+            except Exception as e:
+                logger.error(f"Failed to delete pruned papers from {self._base_dir}: {e}")
+                return deleted_count
     
     async def delete_paper(self, paper_id: str) -> bool:
         """
@@ -1084,6 +1409,21 @@ async def delete_paper(self, paper_id: str) -> bool:
                         path.unlink()
                         deleted_any = True
                         logger.debug(f"Deleted from archive: {path}")
+
+                pruned_files = [
+                    self._get_pruned_paper_path(paper_id),
+                    self._get_pruned_abstract_path(paper_id),
+                    self._get_pruned_outline_path(paper_id),
+                    self._get_pruned_source_brainstorm_path(paper_id),
+                    self._get_pruned_metadata_path(paper_id),
+                    self._get_pruned_rejections_path(paper_id),
+                ]
+
+                for path in pruned_files:
+                    if path.exists():
+                        path.unlink()
+                        deleted_any = True
+                        logger.debug(f"Deleted from pruned papers: {path}")
                 
                 if deleted_any:
                     logger.info(f"Paper {paper_id} deleted successfully")
diff --git a/backend/autonomous/memory/proof_database.py b/backend/autonomous/memory/proof_database.py
index b2bff96..fd88121 100644
--- a/backend/autonomous/memory/proof_database.py
+++ b/backend/autonomous/memory/proof_database.py
@@ -7,6 +7,7 @@
 import asyncio
 import json
 import logging
+import re
 import shutil
 from datetime import datetime
 from pathlib import Path
@@ -100,6 +101,31 @@ def _rebuild_reverse_indexes(self) -> None:
                 if proof_id not in self._mathlib_reverse_short_index[short_name]:
                     self._mathlib_reverse_short_index[short_name].append(proof_id)
 
+    def _rebuild_index_from_record_files_sync(self) -> Dict[str, Any]:
+        """Rebuild the index dict (proofs by created_at descending, next id) from ``proof_*.json`` files."""
+        proofs: List[Dict[str, Any]] = []
+        for record_path in self._base_dir.glob("proof_*.json"):
+            if record_path.name.endswith("_metadata.json"):
+                continue
+            try:
+                data = json.loads(record_path.read_text(encoding="utf-8"))
+            except Exception as exc:
+                logger.warning("Skipping unreadable proof record during index rebuild: %s (%s)", record_path, exc)
+                continue
+            if isinstance(data, dict) and data.get("proof_id"):
+                proofs.append(data)
+        # A null/non-string created_at must not abort recovery with a TypeError while sorting.
+        proofs.sort(key=lambda proof: str(proof.get("created_at") or ""), reverse=True)
+        max_numeric_id = 0
+        for proof in proofs:
+            match = re.search(r"(\d+)$", str(proof["proof_id"]))
+            if match:
+                max_numeric_id = max(max_numeric_id, int(match.group(1)))
+        return {
+            "next_proof_id": max(max_numeric_id + 1, len(proofs) + 1, 1),
+            "proofs": proofs,
+        }
+
     async def initialize(self) -> None:
         """Ensure storage exists and load the index."""
         if self._session_manager and self._session_manager.is_session_active:
@@ -117,8 +143,11 @@ async def _load_index(self) -> None:
                     self._index_data = json.loads(await handle.read())
             except Exception as exc:
                 logger.error("Failed to load proofs index: %s", exc)
-                self._index_data = self._default_index()
-                await self._save_index()
+                self._index_data = await asyncio.to_thread(self._rebuild_index_from_record_files_sync)
+                logger.warning(
+                    "Rebuilt proofs index from %s record file(s) after index load failure",
+                    len(self._index_data.get("proofs", [])),
+                )
         else:
             self._index_data = self._default_index()
             await self._save_index()
@@ -140,7 +169,7 @@ def _ensure_index_loaded_sync(self) -> None:
                 self._index_data = json.loads(index_path.read_text(encoding="utf-8"))
             except Exception as exc:
                 logger.error("Failed to synchronously load proofs index: %s", exc)
-                self._index_data = self._default_index()
+                self._index_data = self._rebuild_index_from_record_files_sync()
         else:
             self._index_data = self._default_index()
 
@@ -206,10 +235,26 @@ async def _save_failed_candidates(
 
     async def add_proof(self, record: ProofRecord) -> ProofRecord:
         """Persist a proof record and return the stored copy."""
+        stored_record, _duplicate = await self.add_proof_if_absent(record)  # the was-duplicate flag is dropped
+        return stored_record  # for an identical existing proof this is the already-stored record
+
+    async def add_proof_if_absent(self, record: ProofRecord) -> tuple[ProofRecord, bool]:
+        """Persist a proof record unless an identical source/theorem/code exists."""
         async with self._lock:
             if self._index_data is None:
                 await self._load_index()
 
+            normalized_statement = " ".join((record.theorem_statement or "").split())
+            normalized_code = "\n".join((record.lean_code or "").strip().splitlines())
+            for existing in self._index_data.get("proofs", []):
+                if existing.get("source_type") != record.source_type or existing.get("source_id") != record.source_id:
+                    continue
+                if " ".join(str(existing.get("theorem_statement") or "").split()) != normalized_statement:
+                    continue
+                if "\n".join(str(existing.get("lean_code") or "").strip().splitlines()) != normalized_code:
+                    continue
+                return self._deserialize_record(existing), True
+
             proof_id = record.proof_id or f"proof_{self._index_data['next_proof_id']:03d}"
             stored_record = record.model_copy(update={"proof_id": proof_id})
             serialized = self._serialize_record(stored_record)
@@ -241,7 +286,7 @@ async def add_proof(self, record: ProofRecord) -> ProofRecord:
                 stored_record.source_type,
                 stored_record.source_id,
             )
-            return stored_record
+            return stored_record, False
 
     async def record_failed_candidate(
         self,
@@ -627,12 +672,13 @@ def get_novel_proofs_for_injection(self) -> str:
         lines = [
             "=== VERIFIED NOVEL MATHEMATICAL PROOFS (Lean 4 Verified) ===",
             "[These proofs have been formally verified. They represent proven mathematical truths.",
-            "Novelty tiers: Mathematical Discovery (highest — new result), Novel Reformulation (novel reformulation of known proof), Novel Formalization (first Lean 4 formalization of known result).]",
+            "Novelty tiers: Major Mathematical Discovery (highest — possible prize-level discovery), Mathematical Discovery (new result), Novel Reformulation (novel reformulation of known proof), Novel Formalization (first Lean 4 formalization of known result).]",
             "",
         ]
         for index, proof in enumerate(novel_proofs, start=1):
             tier = proof.get("novelty_tier", "")
             tier_label = {
+                "major_mathematical_discovery": "Major Mathematical Discovery",
                 "mathematical_discovery": "Mathematical Discovery",
                 "novel_variant": "Novel Reformulation",
                 "novel_formulation": "Novel Formalization",
diff --git a/backend/autonomous/memory/research_metadata.py b/backend/autonomous/memory/research_metadata.py
index c3c6732..ee076f5 100644
--- a/backend/autonomous/memory/research_metadata.py
+++ b/backend/autonomous/memory/research_metadata.py
@@ -58,6 +58,7 @@ def _get_default_stats(self) -> Dict[str, Any]:
             "total_brainstorms_completed": 0,
             "total_papers_completed": 0,
             "total_papers_archived": 0,
+            "total_papers_pruned": 0,
             "total_submissions_accepted": 0,
             "total_submissions_rejected": 0,
             "topic_selection_rejections": 0,
@@ -108,6 +109,9 @@ async def _ensure_initialized(self) -> None:
             if self._stats is None:
                 self._stats = self._get_default_stats()
                 await self._save_stats()
+            else:
+                for key, value in self._get_default_stats().items():
+                    self._stats.setdefault(key, value)
     
     async def initialize(self, user_research_prompt: str = "") -> None:
         """Initialize or load research metadata."""
@@ -506,11 +510,33 @@ async def register_paper(self, metadata: PaperMetadata) -> None:
     
     async def archive_paper(self, paper_id: str) -> None:
         """Mark a paper as archived in central metadata."""
+        await self.prune_paper(  # delegates: the stored status becomes "pruned", not "archived"
+            paper_id,
+            reason="Legacy archive request treated as a pruned paper.",
+            pruned_by="system",
+        )
+
+    async def prune_paper(
+        self,
+        paper_id: str,
+        *,
+        reason: str = "",
+        pruned_by: str = "system",
+    ) -> None:
+        """Mark a paper as pruned in central metadata."""
         async with self._lock:
             for i, p in enumerate(self._data.get("papers", [])):
                 if p.get("paper_id") == paper_id:
-                    self._data["papers"][i]["status"] = "archived"
+                    self._data["papers"][i]["status"] = "pruned"
+                    self._data["papers"][i]["pruned_at"] = datetime.now().isoformat()
+                    self._data["papers"][i]["pruned_reason"] = reason or "No pruning reason recorded."
+                    self._data["papers"][i]["pruned_by"] = pruned_by
                     break
+            for i, b in enumerate(self._data.get("brainstorms", [])):
+                papers_generated = b.get("papers_generated", [])
+                if paper_id in papers_generated:
+                    papers_generated.remove(paper_id)
+                    self._data["brainstorms"][i]["papers_generated"] = papers_generated
             await self._save_metadata()
             
             # Update stats
@@ -518,6 +544,14 @@ async def archive_paper(self, paper_id: str) -> None:
                 1 for p in self._data.get("papers", [])
                 if p.get("status") == "archived"
             )
+            self._stats["total_papers_pruned"] = sum(
+                1 for p in self._data.get("papers", [])
+                if p.get("status") == "pruned"
+            )
+            self._stats["total_papers_completed"] = sum(
+                1 for p in self._data.get("papers", [])
+                if p.get("status") == "complete"
+            )
             await self._save_stats()
     
     def _paper_to_dict(self, metadata: PaperMetadata) -> Dict[str, Any]:
@@ -530,7 +564,10 @@ def _paper_to_dict(self, metadata: PaperMetadata) -> Dict[str, Any]:
             "source_brainstorm_ids": metadata.source_brainstorm_ids,
             "referenced_papers": metadata.referenced_papers,
             "status": metadata.status,
-            "created_at": metadata.created_at.isoformat() if metadata.created_at else None
+            "created_at": metadata.created_at.isoformat() if metadata.created_at else None,
+            "pruned_at": metadata.pruned_at.isoformat() if metadata.pruned_at else None,
+            "pruned_reason": metadata.pruned_reason,
+            "pruned_by": metadata.pruned_by,
         }
     
     # ========================================================================
@@ -700,6 +737,10 @@ async def delete_paper(self, paper_id: str) -> bool:
                     1 for p in self._data.get("papers", [])
                     if p.get("status") == "archived"
                 )
+                self._stats["total_papers_pruned"] = sum(
+                    1 for p in self._data.get("papers", [])
+                    if p.get("status") == "pruned"
+                )
                 await self._save_stats()
                 
                 logger.info(f"Removed paper {paper_id} from central metadata")
diff --git a/backend/autonomous/memory/session_manager.py b/backend/autonomous/memory/session_manager.py
index 5b334b1..f166c98 100644
--- a/backend/autonomous/memory/session_manager.py
+++ b/backend/autonomous/memory/session_manager.py
@@ -21,6 +21,42 @@
 logger = logging.getLogger(__name__)
 
 
+def _session_paper_has_section(content: str, section_name: str) -> bool:
+    """Return True if ``content`` matches a Markdown, plain or LaTeX heading for ``section_name``."""
+    name = re.escape(section_name)  # match the name literally, even if it has regex metacharacters
+    base_patterns = [
+        rf"##\s*{name}",
+        rf"#\s*{name}",
+        rf"\*\*{name}\*\*",
+        rf"^{name}\s*$",
+        rf"^\\(?:section|chapter)\*?\{{{name}\}}\s*$",
+    ]
+    if section_name == "Introduction":
+        base_patterns += [rf"^I\.\s*{name}", rf"^\\(?:section|chapter)\*?\{{I\.?\s*{name}\}}\s*$"]
+    elif section_name == "Conclusion":
+        base_patterns.append(rf"^[IVXLC]+\.\s*{name}")
+    return any(re.search(pattern, content, re.IGNORECASE | re.MULTILINE) for pattern in base_patterns)
+
+
+def _detect_session_paper_phase(paper_content: str) -> str:
+    """Infer the paper-writing phase to resume from the sections present in ``paper_content``.
+
+    A section counts as missing while its hard-coded placeholder is still present.
+    Returns "body", "conclusion", "introduction" or "abstract".
+    """
+    paper_content = paper_content or ""  # None is treated as an empty paper
+    has_intro = _session_paper_has_section(paper_content, "Introduction")
+    has_conclusion = _session_paper_has_section(paper_content, "Conclusion")
+    has_intro_placeholder = "[HARD CODED PLACEHOLDER FOR INTRODUCTION SECTION" in paper_content
+    has_conclusion_placeholder = "[HARD CODED PLACEHOLDER FOR THE CONCLUSION SECTION" in paper_content
+    has_body_content = bool(re.search(r"^[IVX]+\.\s+\w", paper_content, re.MULTILINE))
+    if not has_conclusion or has_conclusion_placeholder:
+        return "conclusion" if has_body_content else "body"
+    if not has_intro or has_intro_placeholder:
+        return "introduction"
+    return "abstract"  # abstract still pending or paper complete: both resume at "abstract"
+
+
 class SessionManager:
     """
     Manages prompt-based session folder organization.
@@ -308,21 +344,31 @@ async def find_interrupted_session(self, base_dir: Optional[str] = None) -> Opti
                 continue
                 
             workflow_state_path = session_dir / "workflow_state.json"
-            if not workflow_state_path.exists():
-                continue
-                
+            workflow_state = None
             try:
-                async with aiofiles.open(workflow_state_path, 'r', encoding='utf-8') as f:
-                    raw = await f.read()
-                if not raw.strip().strip('\x00'):
-                    continue  # Empty or null-padded file — skip silently
-                workflow_state = json.loads(raw)
-                
-                # Check if this session is resumable
-                # Resumable means: has a tier AND (has a topic OR has completed papers)
-                has_tier = workflow_state.get("current_tier") is not None
-                has_topic = workflow_state.get("current_topic_id") is not None
-                has_papers = workflow_state.get("papers_completed_count", 0) > 0
+                if workflow_state_path.exists():
+                    async with aiofiles.open(workflow_state_path, 'r', encoding='utf-8') as f:
+                        raw = await f.read()
+                    if raw.strip().strip('\x00'):
+                        workflow_state = json.loads(raw)
+                # Check if this session is resumable.
+                # Resumable means: has a tier AND (has a topic OR has completed papers).
+                has_tier = bool(workflow_state and workflow_state.get("current_tier") is not None)
+                has_topic = bool(workflow_state and workflow_state.get("current_topic_id") is not None)
+                has_papers = bool(workflow_state and workflow_state.get("papers_completed_count", 0) > 0)
+
+                # A stale idle workflow_state.json can coexist with valid session
+                # stats/brainstorm files. Try the durable-file recovery before
+                # deciding the session is not resumable.
+                if not (has_tier and (has_topic or has_papers)):
+                    recovered_state = await self._recover_workflow_state_from_session_files(session_dir)
+                    if recovered_state is not None:
+                        workflow_state = recovered_state
+                        has_tier = workflow_state.get("current_tier") is not None
+                        has_topic = workflow_state.get("current_topic_id") is not None
+                        has_papers = workflow_state.get("papers_completed_count", 0) > 0
+                if workflow_state is None:
+                    continue
                 
                 if has_tier and (has_topic or has_papers):
                     # Load session metadata for user prompt
@@ -357,6 +403,147 @@ async def find_interrupted_session(self, base_dir: Optional[str] = None) -> Opti
         
         return most_recent
 
+    async def _recover_workflow_state_from_session_files(self, session_dir: Path) -> Optional[Dict[str, Any]]:
+        """Build a conservative resume state from session stats/brainstorm/paper files.
+
+        Used when the workflow checkpoint is stale or absent but durable metadata
+        still shows work in progress: an in-progress paper, the brainstorm named in
+        the stats file, an in-progress brainstorm, or a completed brainstorm with no
+        paper yet.  Returns a workflow-state dict, or None if nothing is resumable.
+        """
+        try:
+            stats = {}
+            stats_path = session_dir / "session_stats.json"
+            if stats_path.exists():
+                async with aiofiles.open(stats_path, 'r', encoding='utf-8') as f:
+                    stats = json.loads(await f.read())
+
+            topic_id = stats.get("current_brainstorm_id")
+            paper_id = stats.get("current_paper_id")
+            topic_metadata = None
+            paper_metadata = None
+            paper_title = None
+            reference_paper_ids = []
+
+            brainstorms_dir = session_dir / "brainstorms"
+            papers_dir = session_dir / "papers"
+            if paper_id:  # validate the pointer even when papers/ is missing, so a stale id is cleared
+                paper_metadata_path = papers_dir / f"paper_{paper_id}_metadata.json"
+                if paper_metadata_path.exists():
+                    async with aiofiles.open(paper_metadata_path, 'r', encoding='utf-8') as f:
+                        paper_metadata = json.loads(await f.read())
+                    if paper_metadata.get("status") == "in_progress":
+                        paper_title = paper_metadata.get("title")
+                        reference_paper_ids = paper_metadata.get("referenced_papers") or []
+                        if not topic_id:
+                            source_ids = paper_metadata.get("source_brainstorm_ids") or []
+                            topic_id = source_ids[0] if source_ids else None
+                    else:
+                        # `current_paper_id` is sticky in stats; a completed paper
+                        # must not make a stale/idle session look like active paper writing.
+                        paper_id = None
+                else:
+                    paper_id = None  # no metadata on disk for this id: treat the pointer as stale
+
+            if not paper_id and papers_dir.exists():
+                paper_candidates = []
+                for paper_metadata_path in papers_dir.glob("paper_*_metadata.json"):
+                    try:
+                        async with aiofiles.open(paper_metadata_path, 'r', encoding='utf-8') as f:
+                            data = json.loads(await f.read())
+                        if data.get("status") == "in_progress":
+                            paper_candidates.append(data)
+                    except Exception:
+                        continue
+                if paper_candidates:
+                    paper_candidates.sort(key=lambda item: item.get("created_at", ""), reverse=True)
+                    paper_metadata = paper_candidates[0]
+                    paper_id = paper_metadata.get("paper_id")
+                    paper_title = paper_metadata.get("title")
+                    reference_paper_ids = paper_metadata.get("referenced_papers") or []
+                    if not topic_id:
+                        source_ids = paper_metadata.get("source_brainstorm_ids") or []
+                        topic_id = source_ids[0] if source_ids else None
+
+            if topic_id and brainstorms_dir.exists():
+                metadata_path = brainstorms_dir / f"brainstorm_{topic_id}_metadata.json"
+                if metadata_path.exists():
+                    async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
+                        topic_metadata = json.loads(await f.read())
+
+            if topic_metadata is None and brainstorms_dir.exists():
+                candidates = []
+                for metadata_path in brainstorms_dir.glob("brainstorm_*_metadata.json"):
+                    try:
+                        async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
+                            data = json.loads(await f.read())
+                        status = data.get("status")
+                        papers_generated = data.get("papers_generated") or []
+                        if status == "in_progress" or (status == "complete" and not papers_generated):
+                            candidates.append(data)
+                    except Exception:
+                        continue
+                if candidates:
+                    candidates.sort(key=lambda item: item.get("last_activity", ""), reverse=True)
+                    topic_metadata = candidates[0]
+                    topic_id = topic_metadata.get("topic_id")
+
+            if not topic_id and not paper_id:
+                return None
+
+            current_tier = "tier2_paper_writing" if paper_id else "tier1_aggregation"
+            paper_phase = None
+            if paper_id:
+                paper_path = papers_dir / f"paper_{paper_id}.txt"
+                if paper_path.exists():
+                    async with aiofiles.open(paper_path, 'r', encoding='utf-8') as f:
+                        paper_phase = _detect_session_paper_phase(await f.read())
+                else:
+                    paper_phase = "body"
+            acceptance_count = int((topic_metadata or {}).get("submission_count") or 0)
+            if (
+                topic_metadata
+                and topic_metadata.get("status") == "complete"
+                and not paper_id
+                and not (topic_metadata.get("papers_generated") or [])
+            ):
+                current_tier = "tier2_paper_writing"
+                paper_phase = "brainstorm_proof_verification"
+            elif topic_metadata and topic_metadata.get("status") == "complete" and not paper_id:
+                return None  # completed brainstorm that already produced a paper: nothing to resume
+
+            return {
+                "is_running": False,
+                "current_tier": current_tier,
+                "current_topic_id": topic_id,
+                "current_paper_id": paper_id,
+                "current_paper_title": paper_title,
+                "paper_phase": paper_phase,
+                "reference_paper_ids": reference_paper_ids,
+                "acceptance_count": acceptance_count,
+                "rejection_count": 0,
+                "consecutive_rejections": 0,
+                "exhaustion_signals": 0,
+                "papers_completed_count": stats.get("total_papers_completed", 0),
+                "last_redundancy_check_at": 0,
+                "last_completion_review_at": 0,
+                "last_tier3_check_at": 0,
+                "brainstorm_paper_count": 0,
+                "current_brainstorm_paper_ids": [],
+                "proof_framing_active": False,
+                "proof_framing_context": "",
+                "proof_framing_reasoning": "",
+                "tier3_active": False,
+                "tier3_enabled": False,
+                "tier3_format": None,
+                "tier3_phase": None,
+                "model_config": {},
+                "last_updated": stats.get("last_updated") or (topic_metadata or {}).get("last_activity", ""),
+            }
+        except Exception as exc:
+            logger.debug(f"Failed to recover workflow state from session files {session_dir.name}: {exc}")
+            return None
+
     async def list_all_sessions(self, base_dir: Optional[str] = None) -> List[Dict[str, Any]]:
         """
         List all research sessions.
@@ -377,7 +564,7 @@ async def list_all_sessions(self, base_dir: Optional[str] = None) -> List[Dict[s
                     try:
                         async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
                             metadata = json.loads(await f.read())
-                            metadata["path"] = str(session_dir)
+                            metadata["path"] = session_dir.name
                             
                             # Count items in subdirectories
                             brainstorms_dir = session_dir / "brainstorms"
diff --git a/backend/autonomous/prompts/completion_prompts.py b/backend/autonomous/prompts/completion_prompts.py
index 8ac3c59..c0f7bca 100644
--- a/backend/autonomous/prompts/completion_prompts.py
+++ b/backend/autonomous/prompts/completion_prompts.py
@@ -37,18 +37,23 @@ def get_completion_review_system_prompt() -> str:
 CRITICAL UNDERSTANDING:
 This is an assessment of topic exploration completeness using all resources at your disposal. Consider whether you can contribute more valuable mathematical insights using your knowledge, web search capabilities (if available), and analysis of what's been covered.
 
+DIRECT-SOLUTION PREFERENCE:
+- Prefer moving to paper writing once the brainstorm can support the strongest rigorous direct answer currently justified
+- Continue brainstorming only when you can identify concrete additional work that is likely to produce a more direct solution, stronger partial solution, impossibility result, or sharper constraint
+- Do not extend brainstorming merely for breadth if the best direct answer is already ready to synthesize
+
 DECISION CRITERIA:
 
 Choose CONTINUE_BRAINSTORM if:
-- You can identify specific mathematical areas not yet covered in the submissions
-- You have additional theorems, proofs, or techniques relevant to the topic (from your knowledge or discoverable via web search)
-- The brainstorm would benefit from deeper exploration in specific directions
-- You can still contribute valuable insights using available resources (base knowledge, web search if available)
+- You can identify specific mathematical areas not yet covered in the submissions that are likely to improve the direct answer
+- You have additional theorems, proofs, techniques, constructions, or impossibility arguments relevant to the topic (from your knowledge or discoverable via web search)
+- The brainstorm would benefit from deeper exploration in specific directions that materially strengthen direct resolution
+- You can still contribute valuable direct-progress insights using available resources (base knowledge, web search if available)
 
 Choose WRITE_PAPER if:
 - All major mathematical avenues for this topic have been explored
 - Additional submissions would likely be redundant with existing content
-- The brainstorm database is comprehensive enough for a quality paper
+- The brainstorm database is comprehensive enough for a quality paper that gives the strongest currently justified direct answer
 - Available resources (base knowledge, web search if available) have been sufficiently utilized for this topic
 - You genuinely cannot think of significant new contributions using available resources
 
@@ -57,6 +62,7 @@ def get_completion_review_system_prompt() -> str:
 - Don't artificially extend brainstorming if exhausted
 - Don't prematurely end if valuable knowledge remains
 - Consider the mathematical depth achieved, not just submission count
+- Prefer best-answer readiness over breadth for breadth's sake
 
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
@@ -131,14 +137,14 @@ def get_completion_self_validation_system_prompt() -> str:
 
 Validate as TRUE (confirm your assessment) if:
 - Your assessment accurately reflects the current state of the brainstorm using all available resources (base knowledge, web search if available)
-- If you said "continue_brainstorm": You genuinely have more valuable insights to contribute using available resources
-- If you said "write_paper": You genuinely cannot think of significant new contributions
+- If you said "continue_brainstorm": You genuinely have more valuable direct-progress insights to contribute using available resources
+- If you said "write_paper": You genuinely cannot think of significant new contributions that would materially strengthen the direct answer
 - The reasoning in your assessment is sound and honest
 
 Validate as FALSE if:
 - Upon reflection, the assessment was CLEARLY incorrect
-- If "continue_brainstorm": The suggested additions are trivial, irrelevant, or already extensively covered
-- If "write_paper": You have CONCRETE, SPECIFIC valuable additions you overlooked (not vague possibilities)
+- If "continue_brainstorm": The suggested additions are trivial, irrelevant, already extensively covered, or too indirect to justify delay
+- If "write_paper": You have CONCRETE, SPECIFIC valuable additions you overlooked that would materially improve direct resolution (not vague possibilities)
 - The reasoning contains obvious flawed logic
 
 BALANCED VALIDATION APPROACH:
diff --git a/backend/autonomous/prompts/final_answer_prompts.py b/backend/autonomous/prompts/final_answer_prompts.py
index 72bf2f4..82ea213 100644
--- a/backend/autonomous/prompts/final_answer_prompts.py
+++ b/backend/autonomous/prompts/final_answer_prompts.py
@@ -44,6 +44,10 @@ def get_certainty_assessment_system_prompt() -> str:
 YOUR TASK:
 Review all existing research papers and determine what can be answered WITH CERTAINTY - without speculation or theoretical hand-waving.
 
+DIRECT-ANSWER-FIRST REQUIREMENT:
+- Identify the strongest direct answer the papers justify, not just nearby facts
+- Prefer a precise answer, partial answer, impossibility result, or sharp limitation statement over broad summary
+
 ASSESSMENT CRITERIA:
 
 1. TOTAL_ANSWER - The user's question can be FULLY answered with high confidence
@@ -74,6 +78,7 @@ def get_certainty_assessment_system_prompt() -> str:
 - Identify what is KNOWN WITH CERTAINTY vs what is SPECULATIVE
 - Do not claim certainty where uncertainty exists
 - Summarize the key certainties that have been established
+- State the best direct answer those certainties support
 
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
@@ -144,6 +149,7 @@ def get_certainty_validator_system_prompt() -> str:
 - The reasoning properly references the papers
 - No overclaiming certainty where uncertainty exists
 - No underclaiming (missing obvious certainties)
+- The assessment captures the strongest direct answer the papers justify
 
 REJECT the assessment if:
 - Certainty level doesn't match the evidence
@@ -222,6 +228,8 @@ def get_format_selection_system_prompt() -> str:
 - Whether a single coherent narrative is possible
 - Whether the papers naturally form a cohesive volume
 - The certainty level from Phase 1
+- Prefer short form whenever one paper can honestly provide the strongest direct answer
+- Choose long form only when multiple chapters are genuinely necessary to deliver that answer well
 
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
@@ -287,12 +295,14 @@ def get_format_validator_system_prompt() -> str:
 - The reasoning is sound
 - Short form is chosen only when a single paper suffices
 - Long form is chosen when multiple perspectives are needed
+- The choice preserves the clearest path to a direct answer
 
 REJECT the selection if:
 - Short form is chosen for a question requiring extensive treatment
 - Long form is chosen unnecessarily for a focused question
 - The reasoning doesn't support the choice
 - The selection ignores important factors
+- The selection adds unnecessary structural breadth instead of optimizing for a direct answer
 
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
@@ -415,6 +425,10 @@ def get_volume_organization_system_prompt() -> str:
 3. Plans an INTRODUCTION paper that frames the collection
 4. Plans a CONCLUSION paper that synthesizes findings and answers the question
 
+DIRECT-ANSWER-FIRST REQUIREMENT:
+- Include only the chapters needed to deliver the strongest rigorous direct answer
+- Do not add gap papers for breadth alone; add them only when they are necessary to close a real answer gap
+
 VOLUME STRUCTURE REQUIREMENTS:
 
 BODY CHAPTERS (from existing papers or gaps):
@@ -422,6 +436,7 @@ def get_volume_organization_system_prompt() -> str:
 - Order them logically (foundations → main results → applications)
 - Identify gaps: topics that need coverage but no paper exists
 - Gap papers will be written before introduction/conclusion
+- Exclude chapters that are merely adjacent if they do not materially strengthen the answer
 
 INTRODUCTION PAPER:
 - Frames the user's question
@@ -565,6 +580,7 @@ def get_volume_validator_system_prompt() -> str:
 - Introduction and conclusion are properly planned
 - The reasoning is sound
 - If outline_complete=true, the structure is ready for writing
+- The structure stays focused on the strongest rigorous direct answer without unnecessary breadth
 
 REJECT the organization if:
 - Important existing papers are missing
@@ -573,6 +589,7 @@ def get_volume_validator_system_prompt() -> str:
 - Introduction/conclusion are missing or poorly planned
 - The structure doesn't effectively answer the question
 - outline_complete=true but structure has issues
+- The structure includes chapters that broaden scope without materially improving the answer
 
 Provide specific feedback for rejected organizations.
 
@@ -615,6 +632,7 @@ def get_gap_paper_context_prompt() -> str:
 - Use ONLY existing Tier 2 papers as references (no brainstorm databases)
 - The paper must integrate with the volume's other chapters
 - Focus on the specific gap identified in the chapter description
+- Write only the material needed to close that answer gap directly and rigorously
 
 REFERENCE PAPERS:
 The papers listed are from the existing Tier 2 library. Use them as context and references.
@@ -641,6 +659,7 @@ def get_volume_intro_paper_context_prompt() -> str:
 - You have access to ALL chapter content to accurately describe them
 - The introduction should make the volume's value clear
 - Frame the answer that will be provided
+- Keep the framing centered on the direct answer, not on exploratory wanderings
 
 REFERENCE: Use the chapter papers as context for accurate descriptions."""
 
@@ -665,6 +684,7 @@ def get_volume_conclusion_paper_context_prompt() -> str:
 - All body chapters exist, so you can reference their content
 - Be definitive about certainties, honest about uncertainties
 - This is the climactic answer to the user's question
+- Make the direct answer explicit as early and clearly as the evidence allows
 
 REFERENCE: Use the body chapter papers to inform the synthesis."""
 
diff --git a/backend/autonomous/prompts/paper_continuation_prompts.py b/backend/autonomous/prompts/paper_continuation_prompts.py
index 93420e5..c8062a9 100644
--- a/backend/autonomous/prompts/paper_continuation_prompts.py
+++ b/backend/autonomous/prompts/paper_continuation_prompts.py
@@ -35,16 +35,21 @@ def get_continuation_decision_system_prompt() -> str:
 YOUR TASK:
 Decide whether the brainstorm database contains enough distinct, unexplored material to warrant writing ANOTHER paper, or whether the user's research goal is better served by moving on to a new brainstorm topic.
 
+DIRECT-SOLUTION PREFERENCE:
+- Write another paper only if it would materially strengthen the best rigorous direct answer to the user's goal
+- Move on when remaining material is mostly supportive, repetitive, or too indirect to justify another paper
+
 DECISION OPTIONS:
 1. WRITE_ANOTHER_PAPER - The brainstorm has significant material that the existing paper(s) did NOT cover, and another paper would meaningfully advance the user's research goal
 2. MOVE_ON - The existing paper(s) adequately cover this brainstorm, or a new topic would better serve the user's goal
 
 WRITE ANOTHER PAPER if:
 - The brainstorm database contains substantial material not covered by existing paper(s)
-- Another paper would address a meaningfully DIFFERENT angle, perspective, or subset of the brainstorm
+- Another paper would address a meaningfully DIFFERENT angle, perspective, or subset of the brainstorm that improves direct resolution of the user's goal
 - The uncovered material is rich enough for a complete, distinct paper (not just leftover fragments)
 - Writing another paper from this brainstorm advances the user's goal MORE than starting a new topic
 - The existing paper(s) focused on specific aspects, leaving other important aspects unexplored
+- Another paper would provide a stronger direct partial answer, tighter impossibility result, or sharper constraint
 
 MOVE ON if:
 - The existing paper(s) adequately cover the brainstorm's valuable content
@@ -52,6 +57,7 @@ def get_continuation_decision_system_prompt() -> str:
 - A new brainstorm topic would better advance the user's research goal
 - Another paper would largely duplicate content already in the existing paper(s)
 - The brainstorm's unique contributions have been captured
+- The remaining material is mostly indirect support rather than meaningful direct progress
 
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
@@ -114,10 +120,10 @@ def get_continuation_validator_system_prompt() -> str:
  ---
 
 YOUR TASK:
-Validate whether the proposed continuation decision is the best use of research resources.
+Validate whether the proposed continuation decision is the best use of research resources for improving the strongest rigorous direct answer.
 
 ACCEPT the decision if:
-1. WRITE_ANOTHER_PAPER: The brainstorm genuinely has enough distinct unexplored material for another paper AND the reasoning correctly identifies what material remains
+1. WRITE_ANOTHER_PAPER: The brainstorm genuinely has enough distinct unexplored material for another paper AND the reasoning correctly identifies what material remains AND why it materially strengthens direct resolution
 2. MOVE_ON: The existing papers adequately cover the brainstorm OR a new topic would genuinely better serve the goal AND the reasoning is sound
 
 REJECT the decision if:
@@ -126,6 +132,7 @@ def get_continuation_validator_system_prompt() -> str:
 3. MOVE_ON: There is clearly substantial uncovered material that warrants another paper
 4. MOVE_ON: The reasoning ignores valuable unexplored content in the brainstorm
 5. The reasoning is flawed, vague, or contradicts the evidence
+6. The decision prefers indirect leftover material over a clearly stronger direct-answer path
 
 REJECTION FEEDBACK FORMAT:
 If rejecting, provide CONCRETE, ACTIONABLE guidance:
diff --git a/backend/autonomous/prompts/paper_redundancy_prompts.py b/backend/autonomous/prompts/paper_redundancy_prompts.py
index eb57753..c0c710d 100644
--- a/backend/autonomous/prompts/paper_redundancy_prompts.py
+++ b/backend/autonomous/prompts/paper_redundancy_prompts.py
@@ -46,13 +46,15 @@ def get_paper_redundancy_system_prompt() -> str:
 3. Contains information SUPERSEDED by better, more complete papers
 4. Was MARGINALLY useful initially but provides no unique value given current library
 5. Covers the same mathematical territory as a newer, superior paper
+6. Is more indirect or auxiliary while another paper provides a stronger rigorous direct answer on the same territory
 
 REASONS TO KEEP - A paper should be kept if it:
-1. Provides ANY unique mathematical content not covered elsewhere
-2. Offers a different perspective or approach even if related to other papers
-3. Contains specific proofs, theorems, or techniques not present elsewhere
-4. Contributes to research diversity in any meaningful way
-5. Covers distinct mathematical subtopics within a broader area
+1. Provides a stronger direct answer, sharper impossibility result, or tighter constraint than overlapping papers
+2. Provides ANY unique mathematical content not covered elsewhere
+3. Offers a different perspective or approach even if related to other papers
+4. Contains specific proofs, theorems, or techniques not present elsewhere
+5. Contributes to research diversity in any meaningful way
+6. Covers distinct mathematical subtopics within a broader area
 
 CONSERVATIVE APPROACH:
 - When in doubt, DO NOT recommend removal
@@ -63,6 +65,9 @@ def get_paper_redundancy_system_prompt() -> str:
 CRITICAL SELECTION RULE:
 When multiple papers overlap, select the WEAKEST one for removal - the one that provides the LEAST unique value. NEVER remove a more comprehensive paper in favor of keeping a less comprehensive one.
 
+DIRECT-SOLUTION PRIORITY:
+If overlapping papers differ in how directly they answer the user's research goal, preserve the paper with the strongest rigorous direct answer and remove the more auxiliary one first when all else is equal.
+
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
 2. Quotes: Escape double quotes inside strings as \\"
diff --git a/backend/autonomous/prompts/paper_reference_prompts.py b/backend/autonomous/prompts/paper_reference_prompts.py
index 19bbb11..9d0450b 100644
--- a/backend/autonomous/prompts/paper_reference_prompts.py
+++ b/backend/autonomous/prompts/paper_reference_prompts.py
@@ -52,6 +52,10 @@ def get_pre_brainstorm_expansion_system_prompt(max_papers: int) -> str:
 YOUR TASK:
 Determine which papers (if any) would be VERY USEFUL to inform and enhance your brainstorm exploration.
 
+DIRECT-SOLUTION PREFERENCE:
+- Prefer papers that most directly help produce a rigorous direct answer, direct partial answer, impossibility result, explicit construction, exact reduction, or sharp constraint
+- Do not select papers merely because they are broadly related if they do not materially strengthen the most direct route to the goal
+
 WHY THIS MATTERS - COMPOUNDING KNOWLEDGE:
 This is the crucial mechanism that allows the system to compound knowledge across research cycles.
 By selecting reference papers BEFORE brainstorming, you can:
@@ -61,9 +65,9 @@ def get_pre_brainstorm_expansion_system_prompt(max_papers: int) -> str:
 - Accelerate convergence on valuable insights by standing on prior work
 
 THRESHOLD: "VERY USEFUL FOR BRAINSTORMING"
-- Papers that provide mathematical foundations you'll build upon
-- Papers that cover related concepts you can extend or connect to
-- Papers that offer techniques or methods relevant to your topic
+- Papers that provide mathematical foundations you'll directly build upon
+- Papers that cover related concepts you can extend or connect to in service of a more direct answer
+- Papers that offer techniques or methods that materially strengthen the most direct route to your topic
 - Don't request papers that are merely tangentially related
 
 OPTIONS:
@@ -114,15 +118,19 @@ def get_additional_reference_expansion_system_prompt(max_total_papers: int) -> s
 YOUR TASK:
 Determine if any ADDITIONAL papers would be valuable for paper compilation, based on what you learned during brainstorming.
 
+DIRECT-SOLUTION PREFERENCE:
+- Add papers only when they materially strengthen the best rigorous direct answer you can now write
+- Do not add broadly relevant papers that do not improve direct resolution of the user's goal
+
 CONTEXT:
 - You already selected reference papers before brainstorming (shown as "ALREADY SELECTED")
 - During brainstorming, you may have discovered new connections or topics
 - This is your chance to add more relevant papers (if any)
 
 THRESHOLD: "VALUABLE BASED ON BRAINSTORM INSIGHTS"
-- Papers that address topics that emerged during brainstorming
-- Papers that provide additional techniques you now realize are relevant
-- Papers that cover connections you discovered during exploration
+- Papers that address topics that emerged during brainstorming and materially strengthen direct resolution
+- Papers that provide additional techniques you now realize are relevant to the strongest direct answer
+- Papers that cover connections you discovered during exploration only when those connections improve direct progress
 - Don't add papers just to fill slots
 
 OPTIONS:
@@ -170,8 +178,12 @@ def get_reference_expansion_system_prompt(max_papers: int = 6) -> str:
 YOUR TASK:
 Determine which papers (if any) would be VERY USEFUL for writing your upcoming paper, and request to see their full content before making final selection.
 
+DIRECT-SOLUTION PREFERENCE:
+- Prefer papers that will help you write the strongest rigorous direct answer to the user's goal
+- Do not expand papers that are merely adjacent background unless they are needed for direct resolution
+
 THRESHOLD: "VERY USEFUL"
-- A paper is "very useful" if it provides substantial mathematical context, techniques, or insights directly relevant to your brainstorm topic
+- A paper is "very useful" if it provides substantial mathematical context, techniques, or insights that materially strengthen the most direct answer to your brainstorm topic
 - Don't request papers that are merely tangentially related
 - Quality over quantity - only request papers you genuinely need to evaluate
 
@@ -251,11 +263,15 @@ def get_reference_selection_system_prompt(max_papers: int) -> str:
 YOUR TASK:
 Make your final selection of reference papers (maximum {max_papers}) that will be included in your context during paper compilation.
 
+DIRECT-SOLUTION PREFERENCE:
+- Select papers that most directly strengthen the answer you intend to write
+- Prefer papers that support the core proof, construction, impossibility argument, or key reduction over broader background
+
 SELECTION CRITERIA:
-- Papers that provide essential mathematical background
-- Papers that offer techniques or methods relevant to your topic
-- Papers that establish theoretical foundations you'll build upon
-- Papers that present related results you'll reference or extend
+- Papers that provide essential mathematical background for the direct answer
+- Papers that offer techniques or methods central to your topic's strongest resolution path
+- Papers that establish theoretical foundations you'll directly build upon
+- Papers that present related results you'll reference or extend in order to answer the question more directly
 
 CONSTRAINT:
 - Maximum {max_papers} papers can be selected (hard limit for context budget)
diff --git a/backend/autonomous/prompts/paper_title_exploration_prompts.py b/backend/autonomous/prompts/paper_title_exploration_prompts.py
index 9193ec0..cd40cd3 100644
--- a/backend/autonomous/prompts/paper_title_exploration_prompts.py
+++ b/backend/autonomous/prompts/paper_title_exploration_prompts.py
@@ -38,6 +38,10 @@ def build_title_exploration_user_prompt(
     parts.append("Instead, your task is to propose ONE CANDIDATE PAPER TITLE per submission.")
     parts.append("The system will collect 5 validated candidate titles before a later final")
     parts.append("selection chooses the actual title.\n")
+    parts.append("Prefer titles that make the paper's direct answer-bearing contribution clear")
+    parts.append("when the source material supports one. Do not use generic exploratory titles")
+    parts.append("when a theorem, construction, impossibility result, or sharp constraint can be")
+    parts.append("accurately foregrounded.\n")
     parts.append("Each submission should contain:")
     parts.append("- One candidate paper title")
     parts.append("- Brief reasoning for why the title is strong, accurate, and distinct\n")
@@ -49,6 +53,7 @@ def build_title_exploration_user_prompt(
     parts.append("WHAT MAKES A GOOD CANDIDATE TITLE:")
     parts.append("- Accurately captures the paper's likely mathematical content")
     parts.append("- Specific enough to communicate the core focus")
+    parts.append("- Foregrounds the direct answer, core result, or limitation when justified")
     parts.append("- Professional and suitable for a mathematical research paper")
     parts.append("- Distinct from already-accepted candidate titles")
     parts.append("- Distinct from related completed papers listed below")
diff --git a/backend/autonomous/prompts/paper_title_prompts.py b/backend/autonomous/prompts/paper_title_prompts.py
index fa25fc3..f77b3b5 100644
--- a/backend/autonomous/prompts/paper_title_prompts.py
+++ b/backend/autonomous/prompts/paper_title_prompts.py
@@ -35,6 +35,10 @@ def get_paper_title_system_prompt() -> str:
 YOUR TASK:
 Choose a title that accurately captures the mathematical content and scope of the planned paper.
 
+DIRECT-SOLUTION PREFERENCE:
+- When the paper reaches a direct conclusion, theorem, impossibility result, or explicit construction, let the title foreground that result rather than sounding like generic exploration
+- Prefer titles that make the paper's answer-bearing content clear, while staying accurate to the actual scope
+
 IMPORTANT CLARIFICATION:
 - The brainstorm submissions are the SOURCE MATERIAL for your paper
 - Your title SHOULD reflect what's in the brainstorm - that's expected and correct!
@@ -47,6 +51,7 @@ def get_paper_title_system_prompt() -> str:
 - Is professional and suitable for a mathematical research paper
 - Differentiates from EXISTING COMPLETED PAPERS from the same brainstorm (if any exist - check the list below)
 - Avoids being overly broad or generic
+- Makes the paper's strongest direct contribution clear when the content justifies it
 
 TITLE STYLE:
 - Use standard mathematical paper title conventions
@@ -139,6 +144,7 @@ def get_paper_title_validator_system_prompt() -> str:
 - It follows mathematical paper title conventions
 - The reasoning is sound
 - If "EXISTING PAPERS FROM THIS BRAINSTORM: None" - there's nothing to differentiate from, so accept if other criteria are met
+- It makes any justified direct conclusion or core result clear rather than sounding needlessly exploratory
 
 REJECT the title if:
 - It is too similar to an EXISTING COMPLETED PAPER from the same brainstorm (NOT brainstorm submissions - those are the source material!)
@@ -146,6 +152,7 @@ def get_paper_title_validator_system_prompt() -> str:
 - It is too vague or generic
 - It doesn't follow professional conventions
 - The reasoning is flawed
+- It obscures a clear direct result behind generic exploratory wording
 
 DO NOT REJECT simply because the title reflects brainstorm submission content - that is the INTENDED behavior.
 
diff --git a/backend/autonomous/prompts/proof_prompts.py b/backend/autonomous/prompts/proof_prompts.py
index de9e4a7..f39d782 100644
--- a/backend/autonomous/prompts/proof_prompts.py
+++ b/backend/autonomous/prompts/proof_prompts.py
@@ -9,11 +9,14 @@
 
 
 PROOF_FRAMING_CONTEXT = """[PROOF FRAMING CONTEXT -- This research prompt targets formal mathematical proof.
-Submissions should aggressively pursue NOVEL, NON-TRIVIAL theorems that push the
-boundaries of what is known. The Lean 4 proof assistant is available for formal
-verification. Prioritize ambitious conjectures, original results, and theorems that
-would represent genuine mathematical contributions over safe restatements of textbook
-facts. Standard identities and well-known Mathlib lemmas are NOT valuable targets.]"""
+All proof work must serve the user's research prompt. Submissions should pursue
+theorems, lemmas, and formalizations that directly help answer, support, or advance
+that prompt. Novel/non-trivial results are valuable only when they are relevant to
+the user's goal. The Lean 4 proof assistant is available for formal verification.
+Prioritize ambitious conjectures, original results, and theorems that would represent
+genuine mathematical contributions toward the prompt over safe restatements of
+textbook facts. Standard identities, irrelevant curiosities, and well-known Mathlib
+lemmas are NOT valuable targets.]"""
 
 
 def _json_only_footer(example: str) -> str:
@@ -159,7 +162,7 @@ def format_failure_hints_for_injection(failure_hints: Iterable[Any]) -> str:
 
     lines = [
         "=== OPEN LEMMA TARGETS LEAN 4 COULD NOT YET CLOSE ===",
-        "[These are recent proof attempts that failed. Prefer brainstorms that generate missing lemmas, stronger assumptions, or cleaner formal theorem statements.]",
+        "[These are recent proof attempts that failed. Prefer brainstorms that generate missing lemmas, stronger assumptions, or cleaner formal theorem statements only when they directly support the user's research prompt.]",
         "",
     ]
     for index, hint in enumerate(hints, start=1):
@@ -188,7 +191,8 @@ def format_failure_hints_for_injection(failure_hints: Iterable[Any]) -> str:
                 "Note: the previous formalization attempt was rejected because "
                 "it used `sorry`/`admit` or axiomatized the theorem's concepts "
                 "to make the goal trivial. Prefer brainstorms that state a "
-                "narrower, concretely provable lemma instead of the full claim."
+                "narrower, concretely provable lemma instead of the full claim, "
+                "provided it still supports the user's research prompt."
             )
         lines.extend(
             [
@@ -206,20 +210,20 @@ def format_failure_hints_for_injection(failure_hints: Iterable[Any]) -> str:
 
 def build_proof_framing_gate_prompt(user_prompt: str) -> str:
     """Ask whether the research goal should be framed toward formal proof."""
-    return f"""You are deciding whether a research program should be explicitly framed toward formal mathematical proof and novel theorem discovery.
+    return f"""You are deciding whether a research program should be explicitly framed toward formal mathematical proof and novel theorem discovery that helps answer the user's prompt.
 
 USER RESEARCH PROMPT:
 {user_prompt}
 
-Return TRUE if the prompt would benefit from working toward formally provable theorems in Lean 4, especially novel or non-trivial ones.
+Return TRUE if the prompt would benefit from working toward Lean 4-formalized theorems that directly help answer, support, or advance the user's research goal.
 Return FALSE only if the prompt is purely empirical, engineering-focused, descriptive, or has no meaningful mathematical content.
 
 Consider:
 - Does the research involve mathematical structures, proofs, bounds, or formal reasoning?
-- Could novel theorems or formalizations emerge from this research direction?
-- Would formal verification add rigor or uncover new results?
+- Could prompt-relevant theorems, lemmas, or formalizations emerge from this research direction?
+- Would formal verification add rigor or uncover new results that matter for the user's goal?
 
-Err on the side of TRUE -- if there is any mathematical substance worth formalizing, enable the proof pipeline.
+Err on the side of TRUE when there is mathematical substance worth formalizing for the prompt. Do not enable proof framing solely for off-topic mathematical curiosities.
 
 {_json_only_footer('{"is_proof_amenable": true, "reasoning": "brief explanation"}')}
 """
@@ -231,7 +235,7 @@ def build_proof_identification_prompt(
     source_id: str,
     source_content: str,
 ) -> str:
-    """Identify novel, non-trivial theorem candidates from a brainstorm or paper."""
+    """Identify prompt-relevant theorem candidates from a brainstorm or paper."""
     example_json = """{
   "has_provable_theorems": true,
   "theorems": [
@@ -239,22 +243,24 @@ def build_proof_identification_prompt(
       "theorem_id": "thm_1",
       "statement": "natural-language theorem statement",
       "formal_sketch": "optional note about assumptions, notation, or likely Lean formalization strategy",
-      "novelty_rationale": "why this theorem is non-trivial and worth formalizing"
+      "novelty_rationale": "why this theorem helps the user prompt and is worth formalizing"
     }
   ]
 }"""
-    return f"""You are a theorem-discovery agent for MOTO. Your mission is to find NOVEL, NON-TRIVIAL mathematical claims in the source below that deserve formal verification in Lean 4.
+    return f"""You are a theorem-discovery agent for MOTO. Your mission is to find mathematical claims in the source below that directly help answer, support, or advance the USER RESEARCH PROMPT and deserve formal verification in Lean 4.
 
-MOTO's goal is to push the frontier of mathematical knowledge. You are the gatekeeper that decides which theorems are worth the cost of formal verification. Be ambitious -- seek out the most original, surprising, or substantive results the source offers.
+MOTO's goal is to push the frontier of mathematical knowledge in service of the user's stated problem. You are the gatekeeper that decides which theorems are worth the cost of formal verification. Be ambitious, but do not chase unrelated mathematical curiosities: a proof candidate must be useful for the user's prompt, not merely non-trivial in isolation.
 
 WHAT TO EXTRACT (prioritize these):
-- Novel theorems, lemmas, or propositions that represent genuine mathematical insight
-- Bold conjectures that can be sharpened into provable statements
-- Non-obvious connections, bounds, inequalities, or structural results
-- Original formalizations of results not yet in Mathlib
-- Ambitious claims even if they need narrowing -- the formalization agent can refine them
+- Theorems, lemmas, or propositions that directly help answer or advance the USER RESEARCH PROMPT
+- Supporting lemmas needed to prove prompt-central claims
+- Novel mathematical insights only when they are relevant to the user's stated goal
+- Non-obvious connections, bounds, inequalities, or structural results that strengthen the prompt's argument
+- Original formalizations of prompt-relevant results not yet in Mathlib
+- Ambitious prompt-relevant claims even if they need narrowing -- the formalization agent can refine them
 
 WHAT TO REJECT (never extract these):
+- Mathematically interesting claims that do not materially help the USER RESEARCH PROMPT
 - Trivial identities (e.g. n + 0 = n, a * 1 = a, commutativity of addition)
 - Direct restatements of well-known Mathlib lemmas or standard textbook results
 - Results closable by a single tactic like `simp`, `omega`, `norm_num`, `decide`, or `rfl`
@@ -262,11 +268,12 @@ def build_proof_identification_prompt(
 - Routine algebraic manipulations with no conceptual content
 
 Rules:
-- Return TRUE when at least one non-trivial, novel-potential theorem is found.
-- Return FALSE only if the source genuinely contains nothing beyond trivial or well-known results.
-- Rank candidates by novelty potential. Return at most 5 of the most promising theorems.
-- For each candidate, include a brief novelty_rationale explaining why it is worth formalizing.
-- Welcome bold or speculative claims -- if the source proposes something ambitious that might be provable with the right formalization, extract it. The downstream formalization agent will handle narrowing if needed.
+- Return TRUE when at least one prompt-relevant, non-trivial theorem is found.
+- Return FALSE if the source contains no theorem that would materially help answer, support, or advance the USER RESEARCH PROMPT.
+- Order candidates by direct usefulness to the USER RESEARCH PROMPT first, then by novelty/formalization value. This ordering is not a cap.
+- Return every prompt-relevant theorem that is non-trivial and worth attempting.
+- For each candidate, include a brief novelty_rationale explaining both why it helps the USER RESEARCH PROMPT and why it is worth formalizing.
+- Welcome bold or speculative claims only when they are prompt-relevant -- if the source proposes something ambitious that might be provable with the right formalization, extract it. The downstream formalization agent will handle narrowing if needed.
 - Use theorem IDs that are stable strings such as "thm_1", "thm_2", etc.
 
 USER RESEARCH PROMPT:
@@ -305,6 +312,7 @@ def build_lemma_search_prompt(
 - Return 5-10 candidate lemma/theorem names when possible.
 - Prefer concrete declaration names over descriptions.
 - Use familiar Mathlib naming when possible (for example `Nat.add_comm`, `mul_assoc`, `Finset.card_union_add_card_inter`).
+- Keep suggestions tied to the target theorem and the USER RESEARCH PROMPT; do not drift toward merely adjacent or interesting Mathlib facts.
 - If the theorem is too vague or no good candidates are evident, return an empty list.
 
 USER RESEARCH PROMPT:
@@ -347,6 +355,7 @@ def build_smt_translation_prompt(
 - Prefer quantifier-free arithmetic fragments when possible.
 - If the theorem is underspecified, only encode the part that is clearly justified by the theorem statement and notes.
 - Do not invent new assumptions that are not strongly implied by the theorem.
+- Do not translate a different or weaker theorem merely because it is easier; the SMT check must still support the USER RESEARCH PROMPT through the selected target theorem.
 - Return an empty `smtlib` string if you cannot produce a faithful SMT translation.
 - Use only SMT-LIB text in the `smtlib` field.
 
@@ -397,6 +406,9 @@ def build_proof_formalization_prompt(
 - Include needed imports.
 - State assumptions explicitly.
 - Prefer correct, minimal, compilable code over stylistic elegance.
+- Keep the USER RESEARCH PROMPT as the relevance boundary. If you narrow an
+  underspecified theorem, the narrowed lemma must still help answer, support,
+  or advance the user's prompt.
 - PRESERVE the theorem's non-trivial content. Do not simplify or weaken the
   statement into a trivial identity just to make it compile. The goal is to
   formalize the ACTUAL claim, not a watered-down version of it.
@@ -474,6 +486,9 @@ def build_proof_tactic_script_prompt(
 - Return a short, ordered list of tactics that can be appended under a `by` block.
 - Each tactic entry must include the Lean tactic string and one short reasoning note.
 - Prefer small, composable tactics over a single opaque script.
+- Keep the USER RESEARCH PROMPT as the relevance boundary. If you narrow an
+  underspecified theorem, the narrowed lemma must still help answer, support,
+  or advance the user's prompt.
 - PRESERVE the theorem's non-trivial content. Do not simplify or weaken the
   statement into a trivial identity just to make it compile.
 - NEVER include `sorry` or `admit` in the tactic list. A script that uses
@@ -522,7 +537,7 @@ def build_proof_novelty_prompt(
     lean_code: str,
     existing_novel_proofs: str,
 ) -> str:
-    """Ask the validator to classify a Lean-verified theorem into one of four novelty tiers."""
+    """Ask the validator to classify a Lean-verified theorem into one of five novelty tiers."""
     existing_proofs_block = existing_novel_proofs or "[No previously stored novel proofs.]"
     return f"""This proof has been FORMALLY VERIFIED by Lean 4. It is mathematically valid.
 
@@ -555,10 +570,17 @@ def build_proof_novelty_prompt(
 - It constitutes a novel alternative proof of an existing result whose existence changes mathematical understanding (e.g., a constructive proof where only non-constructive proofs were known).
 - Assign this tier when the proof would be a publishable or citable contribution in its own right.
 
+"major_mathematical_discovery"
+- The result appears to be an exceptional mathematical breakthrough, not merely a publishable or citable new result.
+- It may be competitive for a major prize or medal in a related field if confirmed, contextualized, and accepted by domain experts.
+- It resolves an important open problem, creates a powerful new theory or framework, or proves a result with unusually broad consequences.
+- Assign this tier only when the proof's significance appears field-level or prize-level, above an ordinary mathematical discovery.
+
 Rules:
 - Do NOT re-check validity. Lean 4 already verified it.
 - Choose the single best-fitting tier. When a proof could fit multiple tiers, choose the highest applicable one.
-- Consider the research prompt context. A result textbook-standard in one field may qualify as "novel_formulation" if it is the first mechanized Lean 4 proof of that result for this research program.
+- Consider the research prompt context. A result textbook-standard in one field may qualify as "novel_formulation" if it is the first mechanized Lean 4 proof of that result for this research program and it helps the USER RESEARCH PROMPT.
+- Do not assign a high novelty tier to a theorem that is mathematically interesting but irrelevant to the USER RESEARCH PROMPT.
 - Err toward recognizing higher tiers for results that required multi-step reasoning, non-trivial formalization work, or original proof strategy.
 
 USER RESEARCH PROMPT:
@@ -575,3 +597,48 @@ def build_proof_novelty_prompt(
 
 {_json_only_footer('{"novelty_tier": "mathematical_discovery", "reasoning": "brief explanation"}')}
 """
+
+
+def build_proof_statement_alignment_prompt(
+    user_prompt: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    lean_code: str,
+    source_excerpt: str,
+) -> str:
+    """Build the prompt asking a validator whether Lean-accepted code matches the intended theorem candidate."""
+    return f"""You are validating a Lean 4 proof candidate after Lean 4 has accepted the code.
+
+Lean 4 already verified that the code is logically valid. Your task is narrower:
+decide whether the accepted Lean code actually corresponds to the intended theorem
+candidate below. Reject code that proves an unrelated trivial theorem, proves only a
+weakened/irrelevant result, or avoids the intended statement by changing the target.
+
+Accept if the Lean code formalizes the same mathematical claim, a clearly equivalent
+claim, or a faithful narrowed form explicitly justified by the formal sketch and still
+useful for the USER RESEARCH PROMPT.
+
+USER RESEARCH PROMPT:
+{user_prompt}
+
+INTENDED THEOREM CANDIDATE:
+{theorem_statement}
+
+FORMAL SKETCH / EXPECTED SHAPE:
+{formal_sketch or '[none provided]'}
+
+SOURCE EXCERPT:
+{source_excerpt or '[none provided]'}
+
+LEAN 4-ACCEPTED CODE:
+{lean_code}
+
+Reject examples:
+- The code proves only `True`, `1 = 1`, or a routine identity unrelated to the candidate.
+- The theorem name/statement in Lean bears no relationship to the intended theorem.
+- The proof introduces a different result and ignores the claimed theorem.
+- The result is materially weaker than the intended theorem without being a useful, explicitly scoped lemma.
+- The result may be mathematically valid but does not help answer, support, or advance the USER RESEARCH PROMPT.
+
+{_json_only_footer('{"decision": "accept", "reasoning": "why the Lean code matches or does not match the intended theorem", "summary": "short rejection feedback if rejected"}')}
+"""
diff --git a/backend/autonomous/prompts/topic_exploration_prompts.py b/backend/autonomous/prompts/topic_exploration_prompts.py
index f367fe6..98f025b 100644
--- a/backend/autonomous/prompts/topic_exploration_prompts.py
+++ b/backend/autonomous/prompts/topic_exploration_prompts.py
@@ -30,13 +30,16 @@ def build_exploration_user_prompt(
     parts = []
     
     parts.append("=== TOPIC EXPLORATION PHASE ===\n")
-    parts.append("You are in a TOPIC EXPLORATION phase. You are NOT solving a mathematical problem directly.")
-    parts.append("Instead, your task is to propose CANDIDATE BRAINSTORM QUESTIONS — specific mathematical")
-    parts.append("avenues worth exploring for the research goal below.\n")
+    parts.append("You are in a TOPIC EXPLORATION phase. Your task is to propose CANDIDATE BRAINSTORM QUESTIONS")
+    parts.append("that maximize the chance of a rigorous DIRECT answer to the research goal below.\n")
+    parts.append("Prefer candidate questions aimed at direct solutions, direct partial solutions, impossibility")
+    parts.append("results, exact reductions, explicit constructions, or sharp constraints. Use indirect/support")
+    parts.append("avenues only when no stronger direct path is currently available.\n")
     parts.append("Each submission should contain ONE candidate brainstorm question and reasoning for why")
     parts.append("it is a valuable, distinct direction. The validator will check quality and DIVERSITY —")
     parts.append("candidates that overlap with already-accepted ones will be REJECTED.\n")
     parts.append("WHAT MAKES A GOOD CANDIDATE QUESTION:")
+    parts.append("- Most directly targets answering the user's problem or a clearly necessary subproblem")
     parts.append("- Specific enough to guide focused mathematical exploration (not vague)")
     parts.append("- Novel relative to already-accepted candidates and existing brainstorms")
     parts.append("- Relevant to the research goal below")
@@ -45,8 +48,9 @@ def build_exploration_user_prompt(
     parts.append("- Actionable — a brainstorm session could produce meaningful insights from it\n")
     parts.append("DIVERSITY IS PARAMOUNT:")
     parts.append("Your candidate MUST be SUBSTANTIVELY DIFFERENT from already-accepted candidates.")
-    parts.append("The goal is to map the exploration landscape BROADLY before committing to a direction.")
-    parts.append("Do not propose variations of existing candidates — propose genuinely different avenues.\n")
+    parts.append("The goal is to compare the BEST direct-answer paths before committing to one.")
+    parts.append("Do not propose shallow variations of existing candidates — propose genuinely different,")
+    parts.append("high-value avenues with a preference for the most direct rigorous routes.\n")
     parts.append("FORMAT YOUR SUBMISSION AS:")
     parts.append("State the candidate brainstorm question clearly, then explain why it is valuable and")
     parts.append("distinct from any existing candidates.\n")
diff --git a/backend/autonomous/prompts/topic_prompts.py b/backend/autonomous/prompts/topic_prompts.py
index 449fef2..48fb61b 100644
--- a/backend/autonomous/prompts/topic_prompts.py
+++ b/backend/autonomous/prompts/topic_prompts.py
@@ -31,7 +31,12 @@ def get_topic_selection_system_prompt() -> str:
 ---
 
 YOUR TASK:
-Select the optimal research avenue that best advances the user's research goal.
+Select the optimal research avenue that most directly advances the user's research goal toward a rigorous answer.
+
+DIRECT-SOLUTION PREFERENCE:
+- Prefer avenues likely to produce a direct solution, direct partial solution, impossibility result, explicit construction, exact reduction, or sharp constraint
+- Use broader exploratory or background-heavy avenues only when no stronger direct path is currently available
+- Do not choose an avenue merely because it is broad or interesting if a more direct rigorous path exists
 
 DECISION OPTIONS:
 1. NEW_TOPIC - Create a brand new brainstorm topic to explore
@@ -42,25 +47,29 @@ def get_topic_selection_system_prompt() -> str:
 
 When to choose NEW_TOPIC:
 - All existing topics are complete OR
-- A genuinely new mathematical avenue would provide more research value than continuing existing work
+- A genuinely new mathematical avenue would provide more direct-answer value than continuing existing work
 - The new topic addresses an unexplored area relevant to the research goal
 - Existing papers don't adequately cover this mathematical territory
+- The new topic offers a stronger direct route to resolving the user's question than current options
 
 When to choose CONTINUE_EXISTING:
 - An incomplete brainstorm has significant untapped mathematical depth
 - The brainstorm has few submissions relative to its mathematical richness
-- Continuing would yield more valuable insights than starting fresh
+- Continuing would yield more valuable direct progress than starting fresh
+- The unfinished topic still contains a realistic path to a stronger direct answer
 
 When to choose COMBINE_TOPICS:
 - Multiple existing brainstorms are deeply interconnected
 - A unified exploration would reveal insights neither topic could provide alone
 - The mathematical concepts naturally bridge multiple brainstorms
+- The combination produces a more direct route to answering the user's question than keeping them separate
 
 CRITICAL REQUIREMENTS:
 - Focus on mathematical rigor and logical soundness
 - Avoid redundancy with existing work
 - Ensure topic selection serves the user's research goal
 - Consider the existing paper library to avoid redundant explorations
+- Prefer the avenue with the strongest justified direct-answer potential
 
 CRITICAL JSON ESCAPE RULES:
 1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
@@ -143,7 +152,7 @@ def get_topic_validator_system_prompt() -> str:
 ---
 
 YOUR TASK:
-Validate whether the proposed topic selection represents the best use of research resources.
+Validate whether the proposed topic selection represents the best use of research resources for obtaining the strongest rigorous direct answer.
 
 VALIDATION CRITERIA:
 
@@ -154,6 +163,7 @@ def get_topic_validator_system_prompt() -> str:
 4. The choice is relevant to the user's research goal
 5. The reasoning is sound and mathematically grounded
 6. The topic doesn't duplicate existing completed work
+7. The choice is at least as direct a route to answering the user's question as the available alternatives
 
 REJECT the topic selection if:
 1. NEW_TOPIC: The topic duplicates an existing brainstorm or completed paper
@@ -162,6 +172,7 @@ def get_topic_validator_system_prompt() -> str:
 4. The choice ignores more valuable research avenues
 5. The reasoning is flawed or lacks mathematical rigor
 6. The selection would lead to redundant work
+7. A clearly more direct rigorous avenue was available and unjustifiably ignored
 
 REJECTION FEEDBACK FORMAT:
 If rejecting, provide CONCRETE, ACTIONABLE guidance:
diff --git a/backend/autonomous/validation/paper_redundancy_checker.py b/backend/autonomous/validation/paper_redundancy_checker.py
index 276e827..c5591ac 100644
--- a/backend/autonomous/validation/paper_redundancy_checker.py
+++ b/backend/autonomous/validation/paper_redundancy_checker.py
@@ -164,9 +164,9 @@ async def check_redundancy(
                 self.task_tracking_callback("completed", task_id)
             return self._create_no_removal(f"Error: {str(e)}")
     
-    async def execute_removal(self, paper_id: str) -> bool:
+    async def execute_removal(self, paper_id: str, reason: str = "") -> bool:
         """
-        Execute paper removal by archiving it.
+        Execute paper removal by pruning it from model context.
         
         Args:
             paper_id: ID of paper to remove
@@ -175,15 +175,21 @@ async def execute_removal(self, paper_id: str) -> bool:
             True if removal successful
         """
         try:
-            # Archive the paper
-            success = await paper_library.archive_paper(paper_id)
+            success = await paper_library.prune_paper(
+                paper_id,
+                reason=reason,
+                pruned_by="system",
+            )
             
             if success:
-                # Update central metadata
-                await research_metadata.archive_paper(paper_id)
-                logger.info(f"PaperRedundancyChecker: Successfully archived paper {paper_id}")
+                await research_metadata.prune_paper(
+                    paper_id,
+                    reason=reason,
+                    pruned_by="system",
+                )
+                logger.info(f"PaperRedundancyChecker: Successfully pruned paper {paper_id}")
             else:
-                logger.error(f"PaperRedundancyChecker: Failed to archive paper {paper_id}")
+                logger.error(f"PaperRedundancyChecker: Failed to prune paper {paper_id}")
             
             return success
             
diff --git a/backend/compiler/agents/critique_submitter.py b/backend/compiler/agents/critique_submitter.py
index 45b74f0..7040399 100644
--- a/backend/compiler/agents/critique_submitter.py
+++ b/backend/compiler/agents/critique_submitter.py
@@ -1,14 +1,12 @@
 """
 Critique Submitter - generates peer review feedback on body section.
-Also makes rewrite vs continue decision after 5 critiques received.
 """
-import asyncio
-from typing import Optional, Dict, Callable, List
+from typing import Optional, Callable
 import logging
 import uuid
 from datetime import datetime
 
-from backend.shared.config import rag_config, system_config
+from backend.shared.config import rag_config
 from backend.shared.models import Submission
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
@@ -16,8 +14,6 @@
 from backend.shared.utils import count_tokens
 from backend.compiler.prompts.critique_prompts import (
     build_critique_prompt,
-    build_rewrite_decision_prompt,
-    build_iterative_edit_prompt
 )
 from backend.compiler.memory.critique_rejection_memory import CritiqueRejectionMemory
 
@@ -27,7 +23,7 @@
 class CritiqueSubmitterAgent:
     """
     Critique submitter agent for peer review aggregation phase.
-    Generates critiques of body section and makes rewrite vs continue decisions.
+    Generates critiques of the body section for the final self-review.
     """
     
     def __init__(
@@ -226,290 +222,6 @@ async def submit_critique(
             logger.error(f"Error generating critique: {e}", exc_info=True)
             return None
     
-    async def submit_rewrite_decision(
-        self,
-        user_prompt: str,
-        current_body: str,
-        current_outline: str,
-        current_title: str,
-        aggregator_db: str,
-        critique_feedback: str,
-        pre_critique_paper: str,
-        reference_papers: Optional[str] = None,
-        accumulated_history: Optional[str] = None
-    ) -> Optional[Dict]:
-        """
-        Decide whether to rewrite body or continue to conclusion.
-        
-        Args:
-            user_prompt: User's compiler-directing prompt
-            current_body: Body section being evaluated
-            current_outline: Paper outline
-            current_title: Current paper title
-            aggregator_db: Aggregator database content
-            critique_feedback: All accepted critiques (typically 1-3 out of 5 total attempts)
-            pre_critique_paper: Paper snapshot from START of critique phase (for context)
-            reference_papers: Optional reference paper content
-            accumulated_history: Optional accumulated critique history from previous failed versions
-            
-        Returns:
-            Dict with decision details or None if generation failed
-            Format: {
-                "decision": "total_rewrite" | "partial_revision" | "continue",
-                "new_title": str or None,
-                "new_outline": str or None,
-                "reasoning": str
-            }
-            Note: For partial_revision, edit operations are proposed iteratively (not upfront)
-        """
-        try:
-            # Build prompt
-            prompt = build_rewrite_decision_prompt(
-                user_prompt=user_prompt,
-                current_body=current_body,
-                current_outline=current_outline,
-                current_title=current_title,
-                aggregator_db=aggregator_db,
-                critique_feedback=critique_feedback,
-                pre_critique_paper=pre_critique_paper,
-                reference_papers=reference_papers,
-                accumulated_history=accumulated_history
-            )
-            
-            # Validate prompt size
-            prompt_tokens = count_tokens(prompt)
-            max_allowed = rag_config.get_available_input_tokens(
-                self.context_window,
-                self.max_tokens
-            )
-            
-            if prompt_tokens > max_allowed:
-                logger.error(
-                    f"Rewrite decision prompt ({prompt_tokens} tokens) exceeds context window "
-                    f"({max_allowed} tokens available)"
-                )
-                return None
-            
-            logger.debug(f"Rewrite decision prompt: {prompt_tokens} tokens (max: {max_allowed})")
-            
-            # Generate task ID and notify start
-            task_id = f"critique_decision_{self.task_sequence:03d}"
-            self.task_sequence += 1
-            
-            if self.task_tracking_callback:
-                self.task_tracking_callback("started", task_id)
-            
-            # Call LLM (uses same role as critique generation)
-            response = await api_client_manager.generate_completion(
-                task_id=task_id,
-                role_id=self.role_id,  # Use same role config as critique generation
-                model=self.model,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=0.0,
-                max_tokens=self.max_tokens
-            )
-            
-            # Notify completion
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
-            
-            # Extract content from API response
-            # Some reasoning models output JSON in 'reasoning' field instead of 'content'
-            if not response.get("choices") or not response["choices"][0].get("message"):
-                logger.error("Rewrite decision: LLM returned empty response structure")
-                return None
-            
-            message = response["choices"][0]["message"]
-            llm_output = message.get("content") or message.get("reasoning") or ""
-            
-            # Parse JSON response
-            data = parse_json(llm_output)
-            
-            if data is None:
-                logger.error("Failed to parse rewrite decision JSON response")
-                return None
-            
-            # Handle array responses (extract first element)
-            if isinstance(data, list):
-                logger.warning("Rewrite decision returned array instead of object - using first element")
-                if not data:
-                    logger.error("Empty array response from rewrite decision")
-                    return None
-                data = data[0]
-            
-            # Validate required fields
-            required_fields = ["decision", "reasoning"]
-            for field in required_fields:
-                if field not in data:
-                    logger.error(f"Rewrite decision response missing '{field}' field")
-                    return None
-            
-            # Validate decision value
-            if data["decision"] not in ["total_rewrite", "partial_revision", "continue"]:
-                logger.error(f"Invalid decision value: {data['decision']} (must be 'total_rewrite', 'partial_revision', or 'continue')")
-                return None
-            
-            # Note: For partial_revision, edit_operations are now proposed iteratively (not upfront)
-            # So we no longer validate edit_operations field here
-            
-            logger.info(f"Rewrite decision generated: {data['decision']}")
-            
-            return data
-            
-        except FreeModelExhaustedError:
-            raise
-        except RuntimeError as e:
-            if "credits exhausted" in str(e).lower():
-                raise
-            logger.error(f"Error generating rewrite decision: {e}", exc_info=True)
-            return None
-        except Exception as e:
-            logger.error(f"Error generating rewrite decision: {e}", exc_info=True)
-            return None
-    
-    async def submit_iterative_edit(
-        self,
-        user_prompt: str,
-        pre_critique_paper: str,
-        current_paper: str,
-        current_outline: str,
-        critique_feedback: str,
-        edits_applied: List[Dict],
-        reference_papers: Optional[str] = None,
-        accumulated_history: Optional[str] = None
-    ) -> Optional[Dict]:
-        """
-        Propose ONE edit for iterative partial revision.
-        
-        Called repeatedly until more_edits_needed=false or max iterations reached.
-        Each call sees the updated paper after previous edits were applied.
-        
-        Args:
-            user_prompt: User's compiler-directing prompt
-            pre_critique_paper: Paper snapshot from START of critique phase
-            current_paper: Current paper body (after any edits applied so far)
-            current_outline: Paper outline
-            critique_feedback: All accepted critiques from this revision cycle
-            edits_applied: List of edits already applied in this iteration
-            reference_papers: Optional reference paper content
-            accumulated_history: Optional accumulated critique history from previous failed versions
-            
-        Returns:
-            Dict with edit details or None if generation failed
-            Format: {
-                "operation": "replace" | "insert_after" | "delete",
-                "old_string": str,
-                "new_string": str,
-                "reasoning": str,
-                "more_edits_needed": bool
-            }
-        """
-        try:
-            # Build prompt
-            prompt = build_iterative_edit_prompt(
-                user_prompt=user_prompt,
-                pre_critique_paper=pre_critique_paper,
-                current_paper=current_paper,
-                current_outline=current_outline,
-                critique_feedback=critique_feedback,
-                edits_applied=edits_applied,
-                reference_papers=reference_papers,
-                accumulated_critique_history=accumulated_history or ""
-            )
-            
-            # Validate prompt size
-            prompt_tokens = count_tokens(prompt)
-            max_allowed = rag_config.get_available_input_tokens(
-                self.context_window,
-                self.max_tokens
-            )
-            
-            if prompt_tokens > max_allowed:
-                logger.error(
-                    f"Iterative edit prompt ({prompt_tokens} tokens) exceeds context window "
-                    f"({max_allowed} tokens available)"
-                )
-                return None
-            
-            logger.debug(f"Iterative edit prompt: {prompt_tokens} tokens (max: {max_allowed})")
-            
-            # Generate task ID and notify start
-            task_id = f"partial_edit_{self.task_sequence:03d}"
-            self.task_sequence += 1
-            
-            if self.task_tracking_callback:
-                self.task_tracking_callback("started", task_id)
-            
-            # Call LLM
-            response = await api_client_manager.generate_completion(
-                task_id=task_id,
-                role_id=self.role_id,
-                model=self.model,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=0.0,
-                max_tokens=self.max_tokens
-            )
-            
-            # Notify completion
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
-            
-            # Extract content from API response
-            if not response.get("choices") or not response["choices"][0].get("message"):
-                logger.error("Iterative edit: LLM returned empty response structure")
-                return None
-            
-            message = response["choices"][0]["message"]
-            llm_output = message.get("content") or message.get("reasoning") or ""
-            
-            # Parse JSON response
-            data = parse_json(llm_output)
-            
-            if data is None:
-                logger.error("Failed to parse iterative edit JSON response")
-                return None
-            
-            # Handle array responses
-            if isinstance(data, list):
-                logger.warning("Iterative edit returned array instead of object - using first element")
-                if not data:
-                    logger.error("Empty array response from iterative edit")
-                    return None
-                data = data[0]
-            
-            # Validate required fields
-            required_fields = ["operation", "old_string", "new_string", "reasoning", "more_edits_needed"]
-            for field in required_fields:
-                if field not in data:
-                    logger.error(f"Iterative edit response missing '{field}' field")
-                    return None
-            
-            # Validate operation type
-            if data["operation"] not in ["replace", "insert_after", "delete"]:
-                logger.error(f"Invalid operation: {data['operation']} (must be 'replace', 'insert_after', or 'delete')")
-                return None
-            
-            # Validate more_edits_needed is boolean
-            if not isinstance(data["more_edits_needed"], bool):
-                logger.warning(f"more_edits_needed is not boolean: {data['more_edits_needed']}, converting to bool")
-                data["more_edits_needed"] = bool(data["more_edits_needed"])
-            
-            edit_num = len(edits_applied) + 1
-            logger.info(f"Iterative edit #{edit_num} proposed: {data['operation']} (more_edits_needed={data['more_edits_needed']})")
-            
-            return data
-            
-        except FreeModelExhaustedError:
-            raise
-        except RuntimeError as e:
-            if "credits exhausted" in str(e).lower():
-                raise
-            logger.error(f"Error generating iterative edit: {e}", exc_info=True)
-            return None
-        except Exception as e:
-            logger.error(f"Error generating iterative edit: {e}", exc_info=True)
-            return None
-    
     async def handle_acceptance(self) -> None:
         """Handle critique acceptance (for compatibility with aggregator interface)."""
         # No special action needed for critique acceptances
diff --git a/backend/compiler/agents/high_context_submitter.py b/backend/compiler/agents/high_context_submitter.py
index fa1cb0d..f224824 100644
--- a/backend/compiler/agents/high_context_submitter.py
+++ b/backend/compiler/agents/high_context_submitter.py
@@ -3,6 +3,7 @@
 Handles 3 modes: construction, outline update, and review.
 """
 import asyncio
+import hashlib
 import json
 import logging
 import uuid
@@ -14,7 +15,7 @@
 from backend.shared.models import CompilerSubmission
 from backend.shared.config import system_config, rag_config
 from backend.shared.utils import count_tokens
-from backend.shared.json_parser import parse_json
+from backend.shared.json_parser import parse_json, sanitize_model_output_for_retry_context
 from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.validation.json_validator import json_validator
 from backend.compiler.prompts.outline_prompts import (
@@ -46,11 +47,34 @@
 # =============================================================================
 # The main writer may invoke Wolfram Alpha as a real OpenAI-style tool during
 # construction mode. Each submission gets a budget of 20 calls; the loop
-# forces finalization once the budget is exhausted. Callers attach the full
-# audit trail to `CompilerSubmission.metadata["wolfram_calls"]`.
+# forces finalization once the budget is exhausted. Tool results are returned
+# to the model, while logs/WebSocket events only expose redacted metadata.
 
 WOLFRAM_MAX_CALLS_PER_SUBMISSION = 20
 
+
+def _hash_text_for_audit(value: str) -> str:
+    """Return the SHA-256 hex digest of the UTF-8 encoded value, or an empty string when it is empty/None."""
+    return hashlib.sha256(value.encode("utf-8", errors="replace")).hexdigest() if value else ""
+
+
+def _redacted_wolfram_audit_entry(query: str, purpose: str, result: str) -> Dict[str, Any]:
+    """Build a Wolfram audit record that exposes only lengths and SHA-256 digests."""
+    fields = (("query", query), ("purpose", purpose), ("result", result))
+    entry: Dict[str, Any] = {
+        "query": "[redacted]",
+        # A missing purpose stays empty rather than receiving a placeholder.
+        "purpose": "[redacted]" if purpose else "",
+        "result": "[redacted]",
+    }
+    # Update order keeps the key layout: redaction flags, lengths, then digests.
+    entry.update({f"{name}_redacted": True for name, _ in fields})
+    # `or ""` lets a None/empty field report length 0 instead of raising.
+    entry.update({f"{name}_length": len(text or "") for name, text in fields})
+    # Digests come from the module's audit hash helper, one per raw field.
+    entry.update({f"{name}_sha256": _hash_text_for_audit(text) for name, text in fields})
+    return entry
+
 WOLFRAM_TOOL_SCHEMA: Dict[str, Any] = {
     "type": "function",
     "function": {
@@ -489,8 +513,6 @@ async def submit_construction(
         is_first_portion: bool = False, 
         section_phase: Optional[str] = None,
         rejection_feedback: Optional[str] = None,
-        critique_feedback: Optional[str] = None,
-        pre_critique_paper: Optional[str] = None,
         brainstorm_content: Optional[str] = None,
         brainstorm_source_name: Optional[str] = None
     ) -> Optional[CompilerSubmission]:
@@ -502,8 +524,6 @@ async def submit_construction(
             section_phase: Phase constraint for construction ("body", "conclusion", "introduction", "abstract")
                           When provided, uses phase-specific prompts with explicit section_complete feedback.
             rejection_feedback: Feedback from a previous rejection to guide the model (e.g., "Introduction not found in document")
-            critique_feedback: Accepted critique feedback from peer review (for body rewrites only)
-            pre_critique_paper: Paper state before critique phase (for body rewrites - shows what failed)
             brainstorm_content: Full brainstorm database with submission numbers (for retroactive corrections)
             brainstorm_source_name: RAG source name for brainstorm (e.g., "brainstorm_abc123.txt") to exclude from retrieval
         
@@ -512,8 +532,7 @@ async def submit_construction(
         """
         phase_info = f", phase={section_phase}" if section_phase else ""
         feedback_info = f", retry with feedback" if rejection_feedback else ""
-        critique_info = f", rewrite with critique" if critique_feedback else ""
-        logger.info(f"Starting construction submission generation (first={is_first_portion}{phase_info}{feedback_info}{critique_info})")
+        logger.info(f"Starting construction submission generation (first={is_first_portion}{phase_info}{feedback_info})")
         
         try:
             # Get current outline and paper
@@ -577,8 +596,6 @@ async def submit_construction(
                     rag_evidence=context_pack.text,
                     is_first_portion=is_first_portion,
                     rejection_feedback=rejection_feedback,
-                    critique_feedback=critique_feedback,
-                    pre_critique_paper=pre_critique_paper,
                     brainstorm_content=brainstorm_content
                 )
             elif section_phase == "conclusion":
@@ -617,9 +634,7 @@ async def submit_construction(
                     rag_evidence=context_pack.text,
                     is_first_portion=is_first_portion,
                     section_phase=section_phase,
-                    rejection_feedback=rejection_feedback,
-                    critique_feedback=critique_feedback,
-                    pre_critique_paper=pre_critique_paper
+                    rejection_feedback=rejection_feedback
                 )
             logger.info(f"Prompt built: {len(prompt)} chars")
             
@@ -993,7 +1008,7 @@ async def _generate_completion_with_wolfram_tool(
           to the single-shot path.
 
         Websocket events:
-        - `compiler_wolfram_call` broadcast per call with query + preview.
+        - `compiler_wolfram_call` broadcast per call with redacted metadata.
         """
         wolfram_enabled = _wolfram_tool_available()
 
@@ -1115,16 +1130,14 @@ async def _generate_completion_with_wolfram_tool(
                     logger.warning(f"Wolfram query raised: {exc}")
                     result_text = None
                 result_text = result_text or "Wolfram Alpha returned no result."
-                wolfram_calls.append({
-                    "query": query,
-                    "purpose": purpose,
-                    "result": result_text,
-                })
+                wolfram_calls.append(_redacted_wolfram_audit_entry(query, purpose, result_text))
                 logger.info(
-                    "Wolfram Alpha call %d/%d: %s",
+                    "Wolfram Alpha call %d/%d completed (query_len=%d, purpose_len=%d, result_len=%d)",
                     len(wolfram_calls),
                     WOLFRAM_MAX_CALLS_PER_SUBMISSION,
-                    query[:120],
+                    len(query or ""),
+                    len(purpose or ""),
+                    len(result_text),
                 )
                 try:
                     await self._broadcast_wolfram_event(
@@ -1181,9 +1194,14 @@ async def _broadcast_wolfram_event(
                 "compiler_wolfram_call",
                 {
                     "task_id": task_id,
-                    "query": query,
-                    "purpose": purpose,
-                    "result_preview": (result or "")[:200],
+                    "query": "[redacted]",
+                    "purpose": "[redacted]" if purpose else "",
+                    "result_preview": "",
+                    "query_redacted": True,
+                    "result_redacted": True,
+                    "query_length": len(query or ""),
+                    "purpose_length": len(purpose or ""),
+                    "result_length": len(result or ""),
                     "calls_used": calls_used,
                     "calls_remaining": max(0, WOLFRAM_MAX_CALLS_PER_SUBMISSION - calls_used),
                     "max_calls": WOLFRAM_MAX_CALLS_PER_SUBMISSION,
@@ -1229,6 +1247,7 @@ async def _parse_json_response_with_retry(
         try:
             # Generate a retry task ID (append _retry to distinguish from original)
             retry_task_id = f"{self.get_current_task_id()}_retry"
+            retry_context = sanitize_model_output_for_retry_context(response)
             
             retry_response = await api_client_manager.generate_completion(
                 task_id=retry_task_id,
@@ -1236,7 +1255,7 @@ async def _parse_json_response_with_retry(
                 model=self.model_name,
                 messages=[
                     {"role": "user", "content": original_prompt},
-                    {"role": "assistant", "content": response},
+                    {"role": "assistant", "content": retry_context},
                     {"role": "user", "content": retry_prompt}
                 ],
                 temperature=0.0,  # Deterministic JSON formatting
diff --git a/backend/compiler/agents/high_param_submitter.py b/backend/compiler/agents/high_param_submitter.py
index ec03eda..b46bf3e 100644
--- a/backend/compiler/agents/high_param_submitter.py
+++ b/backend/compiler/agents/high_param_submitter.py
@@ -10,10 +10,11 @@
         for up to 5 Lean 4 attempts with error-feedback chaining.
     Stage 3 (novelty): classify the verified proof and persist it via
         proof_database.add_proof.
-    Stage 4 (placement): propose an inline edit that introduces the
+    Stage 4 (placement): either propose an inline edit that introduces the
         theorem with a "verified in Lean 4" marker and an appendix
-        reference. The coordinator owns the 2-attempt validator retry loop
-        and the appendix fallback.
+        reference, or explicitly request appendix-only storage for extension
+        theorems. The coordinator owns the 2-attempt validator retry loop
+        and appendix insertion.
 
 The Wolfram sub-mode that used to live here has been removed in Phase 2.
 Wolfram Alpha is now a tool available to HighContextSubmitter.submit_construction
@@ -39,13 +40,13 @@
 )
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.config import rag_config, system_config
-from backend.shared.json_parser import parse_json
+from backend.shared.json_parser import parse_json, sanitize_model_output_for_retry_context
+from backend.shared.lean_proof_integrity import validate_full_lean_proof_integrity
 from backend.shared.lm_studio_client import lm_studio_client
 from backend.shared.models import (
     CompilerSubmission,
     ProofAttemptFeedback,
     ProofCandidate,
-    ProofRecord,
 )
 from backend.shared.utils import count_tokens
 
@@ -96,6 +97,7 @@ def format_theorem_appendix_entry(
     """
     header_name = theorem_name.strip() or proof_id
     tier_labels = {
+        "major_mathematical_discovery": "Major Mathematical Discovery",
         "mathematical_discovery": "Mathematical Discovery",
         "novel_variant": "Novel Reformulation",
         "novel_formulation": "Novel Formalization",
@@ -103,6 +105,7 @@ def format_theorem_appendix_entry(
     novelty_label = tier_labels.get(novelty_tier, "Novel" if is_novel else "Known")
     status_suffix = {
         "appendix_fallback": "inline placement rejected; preserved here because Lean 4 verified the math",
+        "appendix_requested": "stored here by rigor discovery request",
         "inline": "also placed inline in the body",
     }.get(placement_outcome, placement_outcome)
 
@@ -138,6 +141,8 @@ class RigorTheoremResult:
     # Retained for retry-prompt assembly
     formal_sketch: str = ""
     source_excerpt: str = ""
+    theorem_origin: str = "existing_paper_claim"
+    placement_preference: str = "inline"
     # Metadata pass-through
     metadata: Dict[str, Any] = field(default_factory=dict)
 
@@ -156,6 +161,10 @@ def __init__(
         model_name: str,
         user_prompt: str,
         websocket_broadcaster: Optional[Callable[[str, Dict[str, Any]], Awaitable[None]]] = None,
+        *,
+        validator_model: str = "",
+        validator_context_window: Optional[int] = None,
+        validator_max_tokens: Optional[int] = None,
     ):
         self.model_name = model_name
         # NOTE: proof_database.inject_into_prompt prepends all novel proofs
@@ -163,6 +172,9 @@ def __init__(
         self.user_prompt = proof_database.inject_into_prompt(user_prompt)
         self.raw_user_prompt = user_prompt
         self.websocket_broadcaster = websocket_broadcaster
+        self.validator_model = validator_model or model_name
+        self.validator_context_window = validator_context_window or system_config.compiler_validator_context_window
+        self.validator_max_tokens = validator_max_tokens or system_config.compiler_validator_max_output_tokens
         self._initialized = False
         self._standalone_session_id = f"standalone_{uuid.uuid4().hex[:12]}"
 
@@ -192,6 +204,8 @@ async def initialize(self) -> None:
 
         self.context_window = system_config.compiler_high_param_context_window
         self.max_output_tokens = system_config.compiler_high_param_max_output_tokens
+        self.validator_context_window = self.validator_context_window or system_config.compiler_validator_context_window
+        self.validator_max_tokens = self.validator_max_tokens or system_config.compiler_validator_max_output_tokens
         self.available_input_tokens = rag_config.get_available_input_tokens(
             self.context_window, self.max_output_tokens
         )
@@ -298,11 +312,31 @@ async def submit_rigor_lean_theorem(self) -> Optional[RigorTheoremResult]:
         formal_sketch = str(discovery.get("formal_sketch") or "").strip()
         source_excerpt = str(discovery.get("source_excerpt") or "").strip()
         retry_failure_id = str(discovery.get("retry_existing_failure_id") or "").strip()
+        theorem_origin = str(discovery.get("theorem_origin") or "").strip()
+        placement_preference = str(discovery.get("placement_preference") or "").strip()
 
         if not theorem_statement:
             logger.info("Rigor cycle: discovery returned empty theorem_statement; declining")
             return None
 
+        if theorem_origin not in {
+            "existing_paper_claim",
+            "extension_from_partial_work",
+            "extension_from_user_prompt",
+        }:
+            theorem_origin = "existing_paper_claim"
+
+        if placement_preference not in {"inline", "appendix_only"}:
+            placement_preference = "inline"
+
+        if theorem_origin in {
+            "extension_from_partial_work",
+            "extension_from_user_prompt",
+        }:
+            # Extension proofs are useful evidence for the paper, but they
+            # should not silently mutate the main body narrative.
+            placement_preference = "appendix_only"
+
         logger.info(
             "Rigor cycle: Stage 2 - Lean 4 formalization (up to 5 attempts), "
             f"retry_failure_id={retry_failure_id or 'none'}"
@@ -323,13 +357,16 @@ async def submit_rigor_lean_theorem(self) -> Optional[RigorTheoremResult]:
         theorem_name, lean_code, attempts = formalizer_result
 
         logger.info("Rigor cycle: Stage 3 - novelty classification + persistence")
-        is_novel, novelty_reasoning, stored_record = await self._step_assess_novelty_and_store(
+        novelty_result = await self._step_assess_novelty_and_store(
             theorem_statement=theorem_statement,
             theorem_name=theorem_name,
             lean_code=lean_code,
             formal_sketch=formal_sketch,
             attempts=attempts,
         )
+        if novelty_result is None:
+            return None
+        is_novel, novelty_reasoning, stored_record = novelty_result
 
         await self._broadcast(
             "proof_verified",
@@ -355,14 +392,22 @@ async def submit_rigor_lean_theorem(self) -> Optional[RigorTheoremResult]:
             except Exception as exc:
                 logger.debug("mark_resolved_retry failed (non-fatal): %s", exc)
 
-        logger.info("Rigor cycle: Stage 4 - initial placement proposal")
-        initial_submission = await self._step_initial_placement(
-            proof_id=stored_record.proof_id,
-            theorem_statement=theorem_statement,
-            theorem_name=theorem_name,
-            lean_code=lean_code,
-            is_novel=is_novel,
-        )
+        initial_submission = None
+        if placement_preference == "appendix_only":
+            logger.info(
+                "Rigor cycle: discovery requested appendix-only placement "
+                "(origin=%s)",
+                theorem_origin,
+            )
+        else:
+            logger.info("Rigor cycle: Stage 4 - initial placement proposal")
+            initial_submission = await self._step_initial_placement(
+                proof_id=stored_record.proof_id,
+                theorem_statement=theorem_statement,
+                theorem_name=theorem_name,
+                lean_code=lean_code,
+                is_novel=is_novel,
+            )
 
         return RigorTheoremResult(
             proof_id=stored_record.proof_id,
@@ -370,16 +415,20 @@ async def submit_rigor_lean_theorem(self) -> Optional[RigorTheoremResult]:
             theorem_name=theorem_name,
             lean_code=lean_code,
             is_novel=is_novel,
-            novelty_tier=novelty_tier,
+            novelty_tier=stored_record.novelty_tier,
             novelty_reasoning=novelty_reasoning,
             attempts=attempts,
             source_id=self._compiler_source_id(),
             initial_placement_submission=initial_submission,
             formal_sketch=formal_sketch,
             source_excerpt=source_excerpt,
+            theorem_origin=theorem_origin,
+            placement_preference=placement_preference,
             metadata={
                 "retry_failure_id": retry_failure_id,
                 "attempt_count": len(attempts),
+                "theorem_origin": theorem_origin,
+                "placement_preference": placement_preference,
             },
         )
 
@@ -489,6 +538,17 @@ async def _step_formalize(
             max_output_tokens=self.max_output_tokens,
             role_id="compiler_rigor_formalization",
         )
+        proof_label = "A"
+
+        def _lean_response_summary(feedback: ProofAttemptFeedback) -> str:
+            if feedback.success:
+                return "Lean 4 response: proof verified."
+            error = " ".join((feedback.error_output or "").split())
+            if len(error) > 960:
+                error = f"{error[:960]}..."
+            if error:
+                return f"Lean 4 response: {error} - proof not verified."
+            return "Lean 4 response: proof not verified."
 
         async def _on_attempt_started(attempt_number: int, strategy: str) -> None:
             await self._broadcast(
@@ -498,13 +558,14 @@ async def _on_attempt_started(attempt_number: int, strategy: str) -> None:
                     "source_id": self._compiler_source_id(),
                     "theorem_id": candidate.theorem_id,
                     "theorem_statement": theorem_statement,
+                    "proof_label": proof_label,
                     "attempt": attempt_number,
                     "strategy": strategy,
                 },
             )
 
         async def _on_attempt_feedback(feedback: ProofAttemptFeedback) -> None:
-            event = "proof_verified" if feedback.success else "proof_attempt_failed"
+            event = "proof_lean_accepted" if feedback.success else "proof_attempt_failed"
             await self._broadcast(
                 event,
                 {
@@ -512,9 +573,12 @@ async def _on_attempt_feedback(feedback: ProofAttemptFeedback) -> None:
                     "source_id": self._compiler_source_id(),
                     "theorem_id": candidate.theorem_id,
                     "theorem_statement": theorem_statement,
+                    "proof_label": proof_label,
                     "attempt": feedback.attempt,
                     "strategy": feedback.strategy,
                     "error_output": feedback.error_output[:500] if feedback.error_output else "",
+                    "lean_response": _lean_response_summary(feedback),
+                    "proof_verified": feedback.success,
                 },
             )
 
@@ -574,6 +638,61 @@ async def _on_attempt_feedback(feedback: ProofAttemptFeedback) -> None:
             )
             return None
 
+        integrity = await validate_full_lean_proof_integrity(
+            user_prompt=self.raw_user_prompt,
+            theorem_statement=theorem_statement,
+            formal_sketch=candidate.formal_sketch,
+            lean_code=lean_code,
+            source_excerpt=candidate.source_excerpt or current_paper,
+            allowed_baseline="",
+            validator_model=self.validator_model,
+            validator_context=self.validator_context_window,
+            validator_max_tokens=self.validator_max_tokens,
+            task_id=f"{self.get_current_task_id()}_integrity",
+            role_id="compiler_rigor_novelty",
+            require_statement_alignment=True,
+        )
+        if not integrity.valid:
+            integrity_feedback = ProofAttemptFeedback(
+                attempt=(attempts[-1].attempt + 1 if attempts else 1),
+                theorem_id=candidate.theorem_id,
+                reasoning="Post-Lean proof integrity check failed.",
+                lean_code=lean_code,
+                error_output=integrity.reason,
+                strategy="full_script",
+                success=False,
+            )
+            attempts = list(attempts) + [integrity_feedback]
+            try:
+                await proof_database.record_failed_candidate(
+                    source_brainstorm_id=self._compiler_source_id(),
+                    theorem_candidate=candidate,
+                    error_summary=integrity.reason[:2000],
+                )
+            except Exception as exc:
+                logger.debug("record_failed_candidate failed after integrity rejection: %s", exc)
+            await self._broadcast(
+                "proof_integrity_rejected",
+                {
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "theorem_id": candidate.theorem_id,
+                    "theorem_statement": theorem_statement,
+                    "category": integrity.category,
+                    "reason": integrity.reason,
+                },
+            )
+            await self._broadcast(
+                "proof_check_complete",
+                {
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "verified_count": 0,
+                    "message": "Lean proof failed post-verification integrity checks",
+                },
+            )
+            return None
+
         return theorem_name, lean_code, attempts
 
     # --------------------------------------------------------- stage 3
@@ -586,60 +705,58 @@ async def _step_assess_novelty_and_store(
         lean_code: str,
         formal_sketch: str,
         attempts: List[ProofAttemptFeedback],
-    ) -> tuple:
+    ) -> Optional[tuple]:
         """Classify the verified proof and persist it via proof_database.
 
-        Returns (is_novel, novelty_reasoning, stored_record).
+        Returns (is_novel, novelty_reasoning, stored_record), or None when proof registration raises.
         """
-        # Lazy import to break an early-load circular chain through the
-        # autonomous.core package __init__.
-        from backend.autonomous.core.proof_novelty import assess_proof_novelty
-
-        existing_block = proof_database.get_novel_proofs_for_injection()
-
         task_id = f"{self.get_current_task_id()}_novelty"
         self.task_sequence += 1
 
         try:
-            novelty_tier, novelty_reasoning = await assess_proof_novelty(
+            # Lazy import avoids an early-load cycle through autonomous.core.
+            from backend.autonomous.core.proof_registration import register_verified_lean_proof
+
+            registration = await register_verified_lean_proof(
+                proof_database=proof_database,
                 user_prompt=self.raw_user_prompt,
                 theorem_statement=theorem_statement,
                 lean_code=lean_code,
-                validator_model=self.model_name,
-                validator_context=self.context_window,
-                validator_max_tokens=self.max_output_tokens,
-                existing_novel_proofs=existing_block,
+                validator_model=self.validator_model,
+                validator_context=self.validator_context_window,
+                validator_max_tokens=self.validator_max_tokens,
                 task_id=task_id,
                 role_id="compiler_rigor_novelty",
+                source_type="paper",
+                source_id=self._compiler_source_id(),
+                source_title="Compiler Rigor Theorem",
+                theorem_name=theorem_name,
+                formal_sketch=formal_sketch,
+                solver="Lean 4",
+                verification_notes="Produced by compiler rigor loop (HighParamSubmitter).",
+                attempt_count=len(attempts),
+                attempts=list(attempts),
+                broadcast_fn=self.websocket_broadcaster,
+                base_event={
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "trigger": "rigor_loop",
+                },
             )
-            is_novel = novelty_tier != "not_novel"
+            stored = registration.record
+            return stored.novel, stored.novelty_reasoning, stored
         except Exception as exc:
-            logger.warning("Novelty assessment failed (%s); defaulting to non-novel", exc)
-            novelty_tier, novelty_reasoning, is_novel = "not_novel", f"Novelty assessment error: {exc}", False
-
-        record = ProofRecord(
-            proof_id="",  # proof_database assigns proof_XXX on add_proof
-            theorem_id="",
-            theorem_statement=theorem_statement,
-            theorem_name=theorem_name,
-            formal_sketch=formal_sketch,
-            source_type="paper",  # compiler rigor proofs live under the "paper" channel
-            source_id=self._compiler_source_id(),
-            source_title="Compiler Rigor Theorem",
-            solver="Lean 4",
-            lean_code=lean_code,
-            novel=is_novel,
-            novelty_tier=novelty_tier,
-            novelty_reasoning=novelty_reasoning,
-            verification_notes="Produced by compiler rigor loop (HighParamSubmitter).",
-            attempt_count=len(attempts),
-            attempts=list(attempts),
-            dependencies=[],
-            solver_hints=[],
-        )
-
-        stored = await proof_database.add_proof(record)
-        return is_novel, novelty_reasoning, stored
+            logger.warning("Novelty assessment failed; rigor proof will not be stored: %s", exc)
+            await self._broadcast(
+                "proof_check_complete",
+                {
+                    "source_type": "compiler_rigor",
+                    "source_id": self._compiler_source_id(),
+                    "verified_count": 0,
+                    "message": f"novelty validation failed: {exc}",
+                },
+            )
+            return None
 
     # --------------------------------------------------------- stage 4
 
@@ -870,9 +987,7 @@ async def _call_llm_and_parse(
         )
 
         try:
-            truncated_preview = llm_output[:2000] + (
-                "\n[...truncated...]" if len(llm_output) > 2000 else ""
-            )
+            truncated_preview = sanitize_model_output_for_retry_context(llm_output, max_chars=2000)
             retry_response = await api_client_manager.generate_completion(
                 task_id=f"{task_id}_retry",
                 role_id=self.role_id,
diff --git a/backend/compiler/core/compiler_coordinator.py b/backend/compiler/core/compiler_coordinator.py
index 9d0964d..6acd695 100644
--- a/backend/compiler/core/compiler_coordinator.py
+++ b/backend/compiler/core/compiler_coordinator.py
@@ -17,6 +17,7 @@
 from backend.shared.workflow_predictor import workflow_predictor
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError, OpenRouterInvalidResponseError
+from backend.shared.brainstorm_proof_gate import BRAINSTORM_LEAN_PROOF_MARKER
 from backend.shared.free_model_manager import free_model_manager
 from backend.shared.json_parser import parse_json
 from backend.shared.utils import count_tokens
@@ -39,6 +40,21 @@
 
 logger = logging.getLogger(__name__)
 
+CRITIQUE_ATTEMPT_TARGET = 3
+
+LEAN_PROOF_EDIT_DENIAL_REASON = (
+    "REJECTION REASON: Protected Lean 4 Proof\n\n"
+    "ISSUE: The paper-writing retroactive brainstorm operation attempted to edit, delete, "
+    "or add context to a Lean 4 verified proof in the brainstorm database.\n\n"
+    "WHY THIS IS AN ISSUE: Lean 4 proof blocks are immutable from paper-writing modes. "
+    "Paper writing may cite or discuss verified proofs in the paper, but it cannot mutate "
+    "the proof text or attach context to the proof record. Only the normal brainstorm prune "
+    "system may remove Lean 4 proof entries.\n\n"
+    "FIX REQUIRED: Do not target Lean 4 proof submissions with brainstorm_operation. If a proof "
+    "is unhelpful, let the scheduled brainstorm prune system handle removal. If the paper needs "
+    "commentary, write that commentary in the paper prose instead of editing the proof."
+)
+
 
 def _classify_submitter_error(err: BaseException) -> tuple[str, str]:
     """
@@ -113,7 +129,7 @@ def __init__(self):
         self.autonomous_mode = False
         self.autonomous_section_phase = None  # "body", "conclusion", "introduction", "abstract"
         self._current_topic_id = None  # Set by autonomous coordinator for retroactive brainstorm corrections
-        self._current_reference_paper_ids: List[str] = []  # Autonomous/Tier 3 references preserved for critique and rewrite context
+        self._current_reference_paper_ids: List[str] = []  # Autonomous/Tier 3 references preserved for critique context
         
         # Critique phase state (post-body peer review)
         self.critique_submitter = None  # CritiqueSubmitterAgent instance
@@ -121,15 +137,8 @@ def __init__(self):
         self.in_critique_phase = False
         self.critique_acceptances = 0
         self.paper_version = 1  # Track version number
-        self.rewrite_count = 0  # Track COMPLETED rewrites (max 1)
-        self.rewrite_pending = False  # Track if rewrite initiated but not yet succeeded
-        self.accumulated_critique_history: List[Dict] = []  # Store all critiques from all versions
-        self.previous_body_versions: List[Dict] = []  # Store prior versions
-        self.needs_critique_after_rewrite = False  # Flag to trigger another critique round
         self.paper_title: Optional[str] = None  # Track current paper title
         self._skip_critique_requested = False  # Pre-emptive skip flag (user can set before critique phase)
-        self.pre_critique_paper: Optional[str] = None  # Snapshot of paper at critique phase start
-        self.current_critique_feedback: Optional[str] = None  # Accepted critiques for current version (for rewrite context)
         
         # Aggregator monitoring for incremental re-RAG
         self.aggregator_acceptances_last_rag = 0
@@ -162,19 +171,27 @@ async def initialize(
         # OpenRouter provider config for validator
         validator_provider: str = "lm_studio",
         validator_openrouter_provider: Optional[str] = None,
+        validator_openrouter_reasoning_effort: str = "auto",
         validator_lm_studio_fallback: Optional[str] = None,
         # OpenRouter provider config for high-context submitter
         high_context_provider: str = "lm_studio",
         high_context_openrouter_provider: Optional[str] = None,
+        high_context_openrouter_reasoning_effort: str = "auto",
         high_context_lm_studio_fallback: Optional[str] = None,
         # OpenRouter provider config for high-param submitter
         high_param_provider: str = "lm_studio",
         high_param_openrouter_provider: Optional[str] = None,
+        high_param_openrouter_reasoning_effort: str = "auto",
         high_param_lm_studio_fallback: Optional[str] = None,
         # OpenRouter provider config for critique submitter
         critique_submitter_provider: str = "lm_studio",
         critique_submitter_openrouter_provider: Optional[str] = None,
-        critique_submitter_lm_studio_fallback: Optional[str] = None
+        critique_submitter_openrouter_reasoning_effort: str = "auto",
+        critique_submitter_lm_studio_fallback: Optional[str] = None,
+        validator_supercharge_enabled: bool = False,
+        high_context_supercharge_enabled: bool = False,
+        high_param_supercharge_enabled: bool = False,
+        critique_submitter_supercharge_enabled: bool = False
     ) -> None:
         """
         Initialize the compiler coordinator.
@@ -184,19 +201,23 @@ async def initialize(
             validator_model: Model for validator
             high_context_model: Model for high-context submitter
             high_param_model: Model for high-param submitter
-            critique_submitter_model: Model for critique generation and rewrite decisions
+            critique_submitter_model: Model for critique generation
             skip_aggregator_db: If True, don't load Part 1 aggregator database (for autonomous mode)
             validator_provider: Provider for validator ("lm_studio" or "openrouter")
             validator_openrouter_provider: OpenRouter host provider for validator
+            validator_openrouter_reasoning_effort: OpenRouter reasoning effort for validator
             validator_lm_studio_fallback: LM Studio fallback model for validator
             high_context_provider: Provider for high-context submitter
             high_context_openrouter_provider: OpenRouter host provider for high-context submitter
+            high_context_openrouter_reasoning_effort: OpenRouter reasoning effort for high-context submitter
             high_context_lm_studio_fallback: LM Studio fallback model for high-context submitter
             high_param_provider: Provider for high-param submitter
             high_param_openrouter_provider: OpenRouter host provider for high-param submitter
+            high_param_openrouter_reasoning_effort: OpenRouter reasoning effort for high-param submitter
             high_param_lm_studio_fallback: LM Studio fallback model for high-param submitter
             critique_submitter_provider: Provider for critique submitter
             critique_submitter_openrouter_provider: OpenRouter host provider for critique submitter
+            critique_submitter_openrouter_reasoning_effort: OpenRouter reasoning effort for critique submitter
             critique_submitter_lm_studio_fallback: LM Studio fallback model for critique submitter
         """
         logger.info("Initializing compiler coordinator...")
@@ -212,16 +233,24 @@ async def initialize(
         # Store OpenRouter provider configs for all roles
         self.validator_provider = validator_provider
         self.validator_openrouter_provider = validator_openrouter_provider
+        self.validator_openrouter_reasoning_effort = validator_openrouter_reasoning_effort
         self.validator_lm_studio_fallback = validator_lm_studio_fallback
         self.high_context_provider = high_context_provider
         self.high_context_openrouter_provider = high_context_openrouter_provider
+        self.high_context_openrouter_reasoning_effort = high_context_openrouter_reasoning_effort
         self.high_context_lm_studio_fallback = high_context_lm_studio_fallback
         self.high_param_provider = high_param_provider
         self.high_param_openrouter_provider = high_param_openrouter_provider
+        self.high_param_openrouter_reasoning_effort = high_param_openrouter_reasoning_effort
         self.high_param_lm_studio_fallback = high_param_lm_studio_fallback
         self.critique_submitter_provider = critique_submitter_provider
         self.critique_submitter_openrouter_provider = critique_submitter_openrouter_provider
+        self.critique_submitter_openrouter_reasoning_effort = critique_submitter_openrouter_reasoning_effort
         self.critique_submitter_lm_studio_fallback = critique_submitter_lm_studio_fallback
+        self.validator_supercharge_enabled = validator_supercharge_enabled
+        self.high_context_supercharge_enabled = high_context_supercharge_enabled
+        self.high_param_supercharge_enabled = high_param_supercharge_enabled
+        self.critique_submitter_supercharge_enabled = critique_submitter_supercharge_enabled
         
         # Reset workflow state for fresh start
         self.outline_accepted = False
@@ -321,16 +350,21 @@ async def initialize(
                 provider=self.high_context_provider,
                 model_id=high_context_model,
                 openrouter_provider=self.high_context_openrouter_provider,
+                openrouter_reasoning_effort=self.high_context_openrouter_reasoning_effort,
                 lm_studio_fallback_id=self.high_context_lm_studio_fallback,
                 context_window=system_config.compiler_high_context_context_window,
-                max_output_tokens=system_config.compiler_high_context_max_output_tokens
+                max_output_tokens=system_config.compiler_high_context_max_output_tokens,
+                supercharge_enabled=self.high_context_supercharge_enabled
             )
         )
         
         self.high_param_submitter = HighParamSubmitter(
             high_param_model, 
             compiler_prompt,
-            websocket_broadcaster=self.websocket_broadcaster
+            websocket_broadcaster=self.websocket_broadcaster,
+            validator_model=validator_model,
+            validator_context_window=self.validator_context_window,
+            validator_max_tokens=self.validator_max_tokens,
         )
         await self.high_param_submitter.initialize()
         # Set up task tracking callback for workflow panel integration
@@ -342,11 +376,41 @@ async def initialize(
                 provider=self.high_param_provider,
                 model_id=high_param_model,
                 openrouter_provider=self.high_param_openrouter_provider,
+                openrouter_reasoning_effort=self.high_param_openrouter_reasoning_effort,
                 lm_studio_fallback_id=self.high_param_lm_studio_fallback,
                 context_window=system_config.compiler_high_param_context_window,
-                max_output_tokens=system_config.compiler_high_param_max_output_tokens
+                max_output_tokens=system_config.compiler_high_param_max_output_tokens,
+                supercharge_enabled=self.high_param_supercharge_enabled
             )
         )
+        high_param_role_config = ModelConfig(
+            provider=self.high_param_provider,
+            model_id=high_param_model,
+            openrouter_provider=self.high_param_openrouter_provider,
+            openrouter_reasoning_effort=self.high_param_openrouter_reasoning_effort,
+            lm_studio_fallback_id=self.high_param_lm_studio_fallback,
+            context_window=system_config.compiler_high_param_context_window,
+            max_output_tokens=system_config.compiler_high_param_max_output_tokens,
+            supercharge_enabled=self.high_param_supercharge_enabled
+        )
+        api_client_manager.configure_role(
+            role_id="compiler_rigor_formalization",
+            config=high_param_role_config,
+        )
+        validator_role_config = ModelConfig(
+            provider=self.validator_provider,
+            model_id=validator_model,
+            openrouter_provider=self.validator_openrouter_provider,
+            openrouter_reasoning_effort=self.validator_openrouter_reasoning_effort,
+            lm_studio_fallback_id=self.validator_lm_studio_fallback,
+            context_window=self.validator_context_window,
+            max_output_tokens=self.validator_max_tokens,
+            supercharge_enabled=self.validator_supercharge_enabled
+        )
+        api_client_manager.configure_role(
+            role_id="compiler_rigor_novelty",
+            config=validator_role_config,
+        )
         
         self.validator = CompilerValidator(
             validator_model, 
@@ -363,9 +427,11 @@ async def initialize(
                 provider=self.validator_provider,
                 model_id=validator_model,
                 openrouter_provider=self.validator_openrouter_provider,
+                openrouter_reasoning_effort=self.validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=self.validator_lm_studio_fallback,
                 context_window=self.validator_context_window,
-                max_output_tokens=self.validator_max_tokens
+                max_output_tokens=self.validator_max_tokens,
+                supercharge_enabled=self.validator_supercharge_enabled
             )
         )
         
@@ -577,15 +643,6 @@ def _is_body_complete(self, paper: str) -> bool:
         Returns:
             True if body is complete (should skip rigor/outline updates), False otherwise
         """
-        # If rewrite is pending (initiated but not yet succeeded), body is NOT complete
-        if self.rewrite_pending:
-            return False
-        
-        # Check if max rewrites completed - skip critique entirely
-        if self.rewrite_count >= 1:
-            logger.info("Max rewrites completed (1) - treating body as complete")
-            return True
-        
         # Autonomous mode: use explicit phase tracking
         if self.autonomous_mode:
             return self.autonomous_section_phase != "body"
@@ -615,8 +672,12 @@ async def start(self) -> None:
         # Start main workflow loop
         self._main_task = asyncio.create_task(self._main_workflow())
         
-        # Start aggregator monitoring for incremental re-RAG
-        self._aggregator_monitor_task = asyncio.create_task(self._monitor_aggregator_for_rerag())
+        # Manual Part 2 can watch Part 1 for incremental context. Autonomous/Tier 3
+        # paper writing owns its brainstorm context and must not spawn child monitors.
+        if not self.autonomous_mode:
+            self._aggregator_monitor_task = asyncio.create_task(self._monitor_aggregator_for_rerag())
+        else:
+            self._aggregator_monitor_task = None
         
         await self._broadcast("compiler_started", {"message": "Compiler started"})
         logger.info("Compiler started successfully")
@@ -711,7 +772,7 @@ async def _main_workflow(self) -> None:
             })
             await asyncio.sleep(120)  # Wait before retrying (all models exhausted)
             if self.is_running:
-                asyncio.create_task(self._main_workflow())
+                self._main_task = asyncio.create_task(self._main_workflow())
         except Exception as e:
             logger.error(f"Compiler workflow error: {e}", exc_info=True)
             self.is_running = False
@@ -1244,14 +1305,6 @@ async def _submit_and_validate_construction(self, rejection_feedback: Optional[s
         # Single attempt - None means no work needed, not error
         section_phase = self.autonomous_section_phase if self.autonomous_mode else None
         
-        # Pass critique context during body rewrite (when critique_feedback is set)
-        critique_feedback_for_construction = None
-        pre_critique_paper_for_construction = None
-        if section_phase == "body" and self.current_critique_feedback:
-            critique_feedback_for_construction = self.current_critique_feedback
-            pre_critique_paper_for_construction = self.pre_critique_paper
-            logger.info("Body construction with critique context (rewrite mode)")
-        
         # Load brainstorm content for retroactive corrections (autonomous mode only)
         brainstorm_content_for_submitter = None
         brainstorm_source_for_submitter = None
@@ -1271,8 +1324,6 @@ async def _submit_and_validate_construction(self, rejection_feedback: Optional[s
                 is_first_portion=False,
                 section_phase=section_phase,
                 rejection_feedback=rejection_feedback,
-                critique_feedback=critique_feedback_for_construction,
-                pre_critique_paper=pre_critique_paper_for_construction,
                 brainstorm_content=brainstorm_content_for_submitter,
                 brainstorm_source_name=brainstorm_source_for_submitter
             )
@@ -1608,12 +1659,6 @@ def has_real_section_content(section_pattern: str, paper_text: str) -> bool:
             self.construction_acceptances += 1
             self._track_submission_wolfram_calls(submission)
             
-            # If rewrite was pending, mark it as completed now (first successful acceptance)
-            if self.rewrite_pending:
-                self.rewrite_count += 1
-                self.rewrite_pending = False
-                logger.info(f"Rewrite #{self.rewrite_count} completed successfully (first acceptance after rewrite)")
-            
             await compiler_rejection_log.add_acceptance(
                 submission.submission_id,
                 "construction",
@@ -1684,6 +1729,18 @@ async def _handle_brainstorm_retroactive_operation(self, brainstorm_op) -> None:
                 logger.warning(f"Brainstorm {topic_id} is empty, skipping retroactive operation")
                 return
             
+            denial_reason = self._get_lean_proof_retroactive_denial_reason(
+                brainstorm_op,
+                brainstorm_content,
+            )
+            if denial_reason:
+                await self._reject_brainstorm_retroactive_operation(
+                    brainstorm_op,
+                    topic_id,
+                    denial_reason,
+                )
+                return
+
             result = await self.validator.validate_brainstorm_operation(
                 brainstorm_op, brainstorm_content
             )
@@ -1738,6 +1795,109 @@ async def _handle_brainstorm_retroactive_operation(self, brainstorm_op) -> None:
                 })
         except Exception as e:
             logger.error(f"Error handling retroactive brainstorm operation: {e}")
+
+    @staticmethod
+    def _parse_brainstorm_submission_content(brainstorm_content: str, submission_number: int) -> str:  # returns "" when nothing matches
+        separator = "=" * 80  # chunks are delimited by a run of 80 '=' characters
+        parts = (brainstorm_content or "").split(separator)  # None/empty input yields a single empty chunk
+        for index, part in enumerate(parts):
+            if "SUBMISSION #" not in part:  # cheap substring test before running the regex
+                continue
+            match = re.search(r"SUBMISSION #(\d+)\s*\|", part)  # header form: "SUBMISSION #<n> |"
+            if not match or int(match.group(1)) != submission_number:  # skip headers for other submission numbers
+                continue
+            if index + 1 < len(parts):  # a matching header in the last chunk has no following chunk to return
+                return parts[index + 1].strip()  # the chunk right after the matching header chunk, whitespace-trimmed
+        return ""
+
+    @staticmethod
+    def _is_lean_verified_brainstorm_content(content: str) -> bool:  # True on marker match or when all three labels below appear
+        text = content or ""  # tolerate None / empty input
+        if BRAINSTORM_LEAN_PROOF_MARKER in text:  # case-sensitive check for the marker constant
+            return True
+        lowered = text.lower()  # the label checks below are case-insensitive
+        return (
+            "lean 4 code:" in lowered
+            and "lean verification: accepted" in lowered
+            and "theorem statement:" in lowered
+        )  # all three labels must be present; any one missing gives False
+
+    @staticmethod
+    def _looks_like_lean_proof_annotation_attempt(brainstorm_op) -> bool:  # keyword heuristic over the op's new_content and reasoning
+        text = f"{getattr(brainstorm_op, 'new_content', '')}\n{getattr(brainstorm_op, 'reasoning', '')}".lower()  # missing attrs default to ""; matching is case-insensitive
+        if BRAINSTORM_LEAN_PROOF_MARKER.lower() in text:  # the marker alone is sufficient, no intent phrase needed
+            return True
+        proof_reference = (
+            "lean 4 proof" in text
+            or "lean-verified proof" in text
+            or "lean verified proof" in text
+            or "verified proof" in text  # NOTE(review): this substring already matches both "lean…verified proof" phrases above
+            or "proof id:" in text
+        )
+        annotation_intent = any(
+            phrase in text
+            for phrase in (
+                "add context",
+                "additional context",
+                "annotate",
+                "annotation",
+                "clarify proof",
+                "context for proof",
+                "context to proof",
+                "update proof",
+                "edit proof",
+            )
+        )
+        return proof_reference and annotation_intent  # requires both a proof reference and an annotation-style phrase
+
+    def _get_lean_proof_retroactive_denial_reason(self, brainstorm_op, brainstorm_content: str) -> str:  # "" means the operation is not denied
+        action = getattr(brainstorm_op, "action", "")  # ops without an action attribute fall through to the final return ""
+        if action in {"edit", "delete"}:
+            submission_number = getattr(brainstorm_op, "submission_number", None)
+            if submission_number is None:  # no target submission to inspect, so no denial
+                return ""
+            target_content = self._parse_brainstorm_submission_content(
+                brainstorm_content,
+                int(submission_number),  # int() raises if the value is not int-convertible; not handled in this method
+            )
+            if self._is_lean_verified_brainstorm_content(target_content):  # deny edit/delete when the target submission tests as Lean-verified
+                return LEAN_PROOF_EDIT_DENIAL_REASON
+        if action == "add" and self._looks_like_lean_proof_annotation_attempt(brainstorm_op):  # deny adds that match the annotation heuristic
+            return LEAN_PROOF_EDIT_DENIAL_REASON
+        return ""
+
+    async def _reject_brainstorm_retroactive_operation(  # logs, records, and broadcasts an automatic rejection
+        self,
+        brainstorm_op,
+        topic_id: str,
+        reasoning: str,
+    ) -> None:
+        logger.info(
+            "Retroactive brainstorm %s automatically rejected for protected Lean 4 proof mutation: %s",
+            getattr(brainstorm_op, "action", ""),
+            getattr(brainstorm_op, "submission_number", None),
+        )
+        result = CompilerValidationResult(  # rejection result built locally with a fresh UUID as its id
+            submission_id=str(uuid.uuid4()),
+            decision="reject",
+            reasoning=reasoning,
+            summary=reasoning[:750],  # summary is the first 750 characters of the reasoning
+            json_valid=True,
+            validation_stage="pre-validation",
+        )
+        await compiler_rejection_log.add_rejection(
+            result,
+            "brainstorm_retroactive",
+            getattr(brainstorm_op, "new_content", "") or getattr(brainstorm_op, "reasoning", ""),  # falls back to the op's reasoning when new_content is empty or missing
+        )
+        await self._broadcast("brainstorm_retroactive_rejected", {
+            "action": getattr(brainstorm_op, "action", ""),
+            "topic_id": topic_id,
+            "submission_number": getattr(brainstorm_op, "submission_number", None),
+            "reasoning": reasoning[:500],  # broadcast payload carries at most 500 characters of the reasoning
+            "automatic": True,
+            "protected_lean_proof": True,
+        })
     
     async def _submit_and_validate_outline_update(self) -> bool:
         """Submit and validate outline update. Returns True if accepted."""
@@ -2089,9 +2249,9 @@ async def _submit_and_validate_rigor(self) -> bool:
     async def _place_or_appendix_fallback(self, lean_result) -> bool:
         """Drive the 2-attempt placement validator loop.
 
-        On double rejection (or when the submitter never produced a legal
-        attempt), the theorem is appended to the Theorems Appendix and the
-        cycle is counted as a rigor_acceptance.
+        On explicit appendix-only discovery, double rejection, or when the
+        submitter never produced a legal attempt, the theorem is appended to
+        the Theorems Appendix and the cycle is counted as a rigor_acceptance.
         """
         from backend.compiler.agents.high_param_submitter import (
             format_theorem_appendix_entry,
@@ -2099,13 +2259,26 @@ async def _place_or_appendix_fallback(self, lean_result) -> bool:
 
         submission = lean_result.initial_placement_submission
         validator_feedback = ""
+        requested_appendix_only = (
+            getattr(lean_result, "placement_preference", "") == "appendix_only"
+            or (getattr(lean_result, "metadata", {}) or {}).get("placement_preference")
+            == "appendix_only"
+        )
+        appendix_outcome = (
+            "appendix_requested" if requested_appendix_only else "appendix_fallback"
+        )
 
         for placement_attempt in (1, 2):
             if submission is None:
+                route_reason = (
+                    "discovery requested appendix-only placement"
+                    if requested_appendix_only
+                    else "submitter returned no placement submission"
+                )
                 logger.info(
-                    "Rigor placement attempt %s: submitter returned no placement submission; "
-                    "routing directly to appendix fallback",
+                    "Rigor placement attempt %s: %s; routing directly to appendix",
                     placement_attempt,
+                    route_reason,
                 )
                 break
 
@@ -2251,9 +2424,10 @@ async def _place_or_appendix_fallback(self, lean_result) -> bool:
                     lean_result, validator_feedback
                 )
 
-        # Appendix fallback: both placement attempts failed (or attempt 1 was
-        # impossible). The math is already Lean-verified, so the theorem is
-        # preserved in the Theorems Appendix and counted as a rigor_acceptance.
+        # Appendix storage: either explicitly requested by discovery or used
+        # as fallback when inline placement failed / was impossible. The math
+        # is already Lean-verified, so the theorem is preserved and counted as
+        # a rigor_acceptance.
         appendix_entry = format_theorem_appendix_entry(
             proof_id=lean_result.proof_id,
             theorem_statement=lean_result.theorem_statement,
@@ -2261,7 +2435,7 @@ async def _place_or_appendix_fallback(self, lean_result) -> bool:
             is_novel=lean_result.is_novel,
             theorem_name=lean_result.theorem_name,
             novelty_tier=lean_result.novelty_tier,
-            placement_outcome="appendix_fallback",
+            placement_outcome=appendix_outcome,
         )
         appended = await paper_memory.append_to_theorems_appendix(appendix_entry)
         if not appended:
@@ -2281,18 +2455,18 @@ async def _place_or_appendix_fallback(self, lean_result) -> bool:
                 "submission_id": (
                     lean_result.initial_placement_submission.submission_id
                     if lean_result.initial_placement_submission
-                    else f"rigor_appendix_{lean_result.proof_id}"
+                    else f"rigor_{appendix_outcome}_{lean_result.proof_id}"
                 ),
-                "placement_outcome": "appendix_fallback",
+                "placement_outcome": appendix_outcome,
                 "lean_proof_id": lean_result.proof_id,
                 "is_novel": lean_result.is_novel,
             },
         )
         await self._broadcast("paper_updated", {"word_count": word_count})
         logger.info(
-            "Rigor theorem %s stored in Theorems Appendix (both placement attempts "
-            "failed or unavailable)",
+            "Rigor theorem %s stored in Theorems Appendix (%s)",
             lean_result.proof_id,
+            appendix_outcome,
         )
         return True
 
@@ -2614,31 +2788,11 @@ async def _start_critique_phase(self) -> None:
         self.in_critique_phase = True
         self.critique_acceptances = 0
         
-        # Snapshot paper at critique phase start (for rewrite context)
-        self.pre_critique_paper = await paper_memory.get_paper()
-        logger.info(f"Snapshot pre-critique paper: {len(self.pre_critique_paper)} chars")
-        
-        # Clear current critique feedback for this round
-        self.current_critique_feedback = None
-        
         # Initialize critique memory
         paper_id = f"paper_v{self.paper_version}"
         critique_memory.initialize(paper_id)
-        
-        # Before clearing, accumulate any existing critiques from previous phases
-        existing = await critique_memory.get_all_critiques()
-        if existing.strip():
-            self.accumulated_critique_history.append({
-                "version": self.paper_version,
-                "critiques": existing
-            })
-            logger.info(f"Accumulated {len(self.accumulated_critique_history)} critique history version(s)")
-        
         await critique_memory.clear()
-        
-        # Load from file for crash recovery (if file exists)
-        await critique_memory.load_from_file()
-        
+
         logger.info(f"Critique memory initialized for {paper_id}")
         
         # Create critique submitter agent
@@ -2668,9 +2822,11 @@ async def _start_critique_phase(self) -> None:
                 provider=self.critique_submitter_provider,
                 model_id=self.critique_submitter_model,
                 openrouter_provider=self.critique_submitter_openrouter_provider,
+                openrouter_reasoning_effort=self.critique_submitter_openrouter_reasoning_effort,
                 lm_studio_fallback_id=self.critique_submitter_lm_studio_fallback,
                 context_window=system_config.compiler_critique_submitter_context_window,
-                max_output_tokens=system_config.compiler_critique_submitter_max_tokens
+                max_output_tokens=system_config.compiler_critique_submitter_max_tokens,
+                supercharge_enabled=self.critique_submitter_supercharge_enabled
             )
         )
         
@@ -2681,9 +2837,11 @@ async def _start_critique_phase(self) -> None:
                 provider=self.validator_provider,
                 model_id=self.validator_model,
                 openrouter_provider=self.validator_openrouter_provider,
+                openrouter_reasoning_effort=self.validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=self.validator_lm_studio_fallback,
                 context_window=self.validator_context_window,
-                max_output_tokens=self.validator_max_tokens
+                max_output_tokens=self.validator_max_tokens,
+                supercharge_enabled=self.validator_supercharge_enabled
             )
         )
         
@@ -2694,16 +2852,18 @@ async def _start_critique_phase(self) -> None:
                 provider=self.validator_provider,
                 model_id=self.validator_model,
                 openrouter_provider=self.validator_openrouter_provider,
+                openrouter_reasoning_effort=self.validator_openrouter_reasoning_effort,
                 lm_studio_fallback_id=self.validator_lm_studio_fallback,
                 context_window=self.validator_context_window,
-                max_output_tokens=self.validator_max_tokens
+                max_output_tokens=self.validator_max_tokens,
+                supercharge_enabled=self.validator_supercharge_enabled
             )
         )
         
         # Broadcast critique phase started
         await self._broadcast("critique_phase_started", {
             "paper_version": self.paper_version,
-            "target_critiques": 5
+            "target_critiques": CRITIQUE_ATTEMPT_TARGET
         })
         
         # Start critique aggregation loop
@@ -2714,12 +2874,10 @@ async def _get_reference_papers_context_for_critique(
         current_outline: str = "",
         current_body: str = "",
         aggregator_db: str = "",
-        critique_feedback: str = "",
-        pre_critique_paper: str = "",
-        accumulated_history: str = ""
+        critique_feedback: str = ""
     ) -> Optional[str]:
         """
-        Prepare reference-paper context for critique/rewrite prompts in autonomous mode.
+        Prepare reference-paper context for critique prompts in autonomous mode.
 
         This preserves the reference papers selected for the paper instead of
         silently dropping them once the critique phase begins.
@@ -2744,8 +2902,6 @@ async def _get_reference_papers_context_for_critique(
                     current_body or "",
                     aggregator_db or "",
                     critique_feedback or "",
-                    pre_critique_paper or "",
-                    accumulated_history or "",
                 ]
                 if part
             )
@@ -2773,7 +2929,6 @@ async def _get_reference_papers_context_for_critique(
                     current_outline or "",
                     current_body or "",
                     critique_feedback or "",
-                    pre_critique_paper or "",
                 ]
                 if part
             )
@@ -2792,10 +2947,13 @@ async def _get_reference_papers_context_for_critique(
     
     async def _run_critique_aggregation(self) -> None:
         """
-        Run critique aggregation until 5 total attempts.
+        Run critique aggregation until the configured total attempt target.
         Uses simple generate-validate loop similar to aggregator workflow.
         """
-        logger.info("Starting critique aggregation loop (target: 5 total attempts, accepted OR rejected)")
+        logger.info(
+            "Starting critique aggregation loop "
+            f"(target: {CRITIQUE_ATTEMPT_TARGET} total attempts, accepted OR rejected)"
+        )
         
         rejection_count = 0
         consecutive_rejections = 0
@@ -2812,25 +2970,26 @@ async def _run_critique_aggregation(self) -> None:
                     "acceptances": critique_count,
                     "rejections": rejection_count,
                     "total_attempts": total_attempts,
-                    "target": 5,  # Now means total attempts, not just acceptances
+                    "target": CRITIQUE_ATTEMPT_TARGET,
                     "version": self.paper_version
                 })
                 
                 # Check if target reached
-                if total_attempts >= 5:
+                if total_attempts >= CRITIQUE_ATTEMPT_TARGET:
                     logger.info(f"Critique phase complete: {total_attempts} total attempts ({critique_count} accepted, {rejection_count} rejected)")
-                    
-                    # If 0 acceptances, skip rewrite and continue
+
                     if critique_count == 0:
-                        logger.info("No critiques accepted - skipping rewrite phase, moving to next section")
-                        await self._skip_rewrite_and_continue()
+                        logger.info("No critiques accepted - moving to next section")
+                        await self._continue_without_self_review()
                     else:
-                        # Trigger rewrite decision with accepted critiques
-                        await self._trigger_rewrite_decision()
+                        await self._append_accepted_critiques_as_self_review()
                     break
                 
                 # Generate critique
-                logger.info(f"Generating critique (attempts: {total_attempts}/5, accepted: {critique_count}, rejected: {rejection_count})")
+                logger.info(
+                    f"Generating critique (attempts: {total_attempts}/{CRITIQUE_ATTEMPT_TARGET}, "
+                    f"accepted: {critique_count}, rejected: {rejection_count})"
+                )
                 
                 current_body = await paper_memory.get_paper()
                 current_outline = await outline_memory.get_outline()
@@ -2842,16 +3001,12 @@ async def _run_critique_aggregation(self) -> None:
                 # Get existing critiques
                 existing_critiques = await critique_memory.get_all_critiques()
                 
-                # Format accumulated critique history from previous failed versions
-                accumulated_history = self._format_accumulated_critique_history()
-
-                # Keep autonomous reference papers available during critique/rewrite.
+                # Keep autonomous reference papers available during critique.
                 reference_papers = await self._get_reference_papers_context_for_critique(
                     current_outline=current_outline,
                     current_body=current_body,
                     aggregator_db=aggregator_db,
-                    critique_feedback=existing_critiques,
-                    accumulated_history=accumulated_history
+                    critique_feedback=existing_critiques
                 )
                 
                 # Generate critique submission
@@ -2861,8 +3016,7 @@ async def _run_critique_aggregation(self) -> None:
                     current_outline=current_outline,
                     aggregator_db=aggregator_db,
                     reference_papers=reference_papers,
-                    existing_critiques=existing_critiques,
-                    accumulated_history=accumulated_history
+                    existing_critiques=existing_critiques
                 )
                 
                 if submission is None:
@@ -2872,13 +3026,7 @@ async def _run_critique_aggregation(self) -> None:
                 
                 logger.info(f"Critique generated: {submission.submission_id}")
                 
-                # Validate critique using aggregator validator prompts
-                from backend.aggregator.agents.validator import ValidatorAgent
-                from backend.aggregator.memory.shared_training import shared_training_memory
-                from backend.aggregator.prompts.validator_prompts import build_validator_prompt
-                
-                # Build critique validation prompt (reuses aggregator validator structure)
-                # We'll use the validator's validate method but with critique-specific context
+                # Validate critique using critique-specific validator prompts.
                 validation_result = await self._validate_critique(submission)
                 
                 # Handle decline submissions differently
@@ -2894,7 +3042,7 @@ async def _run_critique_aggregation(self) -> None:
                             "reasoning": submission.reasoning,
                             "version": self.paper_version,
                             "total_attempts": total_attempts,
-                            "target": 5
+                            "target": CRITIQUE_ATTEMPT_TARGET
                         })
                     else:
                         # Validator disagrees - there ARE issues that need critique
@@ -2907,7 +3055,7 @@ async def _run_critique_aggregation(self) -> None:
                             "reasoning": validation_result.reasoning if validation_result else "Unknown",
                             "consecutive": consecutive_rejections,
                             "total_attempts": total_attempts,
-                            "target": 5
+                            "target": CRITIQUE_ATTEMPT_TARGET
                         })
                 else:
                     # Regular critique submission
@@ -2919,12 +3067,12 @@ async def _run_critique_aggregation(self) -> None:
                         await critique_memory.add_accepted_critique(submission.content)
                         
                         new_count = await critique_memory.get_critique_count()
-                        logger.info(f"Critique ACCEPTED ({new_count}/5): {submission.submission_id}")
+                        logger.info(f"Critique ACCEPTED ({new_count}/{CRITIQUE_ATTEMPT_TARGET}): {submission.submission_id}")
                         
                         await self._broadcast("critique_accepted", {
                             "critique_id": submission.submission_id,
                             "count": new_count,
-                            "target": 5,
+                            "target": CRITIQUE_ATTEMPT_TARGET,
                             "version": self.paper_version,
                             "total_attempts": total_attempts,
                             "rejections": rejection_count
@@ -2953,7 +3101,7 @@ async def _run_critique_aggregation(self) -> None:
                             "reasoning": validation_result.reasoning if validation_result else "Unknown",
                             "consecutive": consecutive_rejections,
                             "total_attempts": total_attempts,
-                            "target": 5
+                            "target": CRITIQUE_ATTEMPT_TARGET
                         })
                 
                 # Brief delay between critiques
@@ -2975,9 +3123,6 @@ async def _validate_critique(self, submission) -> Optional[ValidationResult]:
             ValidationResult or None
         """
         try:
-            # Import prompt builders
-            from backend.aggregator.prompts.validator_prompts import build_validator_prompt
-            
             # Build validation prompt for critique
             # We pass the critique as "submission" and existing critiques as "context"
             current_body = await paper_memory.get_paper()
@@ -3132,480 +3277,29 @@ async def _perform_critique_cleanup(self) -> None:
         except Exception as e:
             logger.error(f"Error in critique cleanup: {e}", exc_info=True)
     
-    async def _trigger_rewrite_decision(self) -> None:
-        """
-        Trigger rewrite vs continue decision after 5 critiques.
-        Includes retry logic if decision is rejected by validator.
-        """
-        max_retries = 5
-        retry_count = 0
-        
-        while retry_count < max_retries:
-            try:
-                logger.info("=" * 80)
-                logger.info(f"Critique phase complete (5 total attempts) - triggering rewrite decision (attempt {retry_count + 1})")
-                logger.info("=" * 80)
-                
-                # Get all critiques
-                critique_feedback = await critique_memory.get_all_critiques()
-                current_body = await paper_memory.get_paper()
-                current_outline = await outline_memory.get_outline()
-                current_title = self.paper_title if self.paper_title else self.user_prompt
-                
-                # Get context (aggregator DB, reference papers, etc.)
-                from backend.aggregator.memory.shared_training import shared_training_memory
-                aggregator_db = await shared_training_memory.get_all_content()
-                # Format accumulated critique history from previous failed versions
-                accumulated_history = self._format_accumulated_critique_history()
-
-                reference_papers = await self._get_reference_papers_context_for_critique(
-                    current_outline=current_outline,
-                    current_body=current_body,
-                    aggregator_db=aggregator_db,
-                    critique_feedback=critique_feedback,
-                    pre_critique_paper=self.pre_critique_paper or "",
-                    accumulated_history=accumulated_history
-                )
-                
-                # Critique submitter makes decision
-                logger.info("Critique submitter generating rewrite decision...")
-                decision_result = await self.critique_submitter.submit_rewrite_decision(
-                    user_prompt=self.user_prompt,
-                    current_body=current_body,
-                    current_outline=current_outline,
-                    current_title=current_title,
-                    aggregator_db=aggregator_db,
-                    critique_feedback=critique_feedback,
-                    pre_critique_paper=self.pre_critique_paper,  # Paper snapshot from start of critique phase
-                    reference_papers=reference_papers,
-                    accumulated_history=accumulated_history
-                )
-                
-                if decision_result is None:
-                    logger.error("Rewrite decision generation returned None")
-                    retry_count += 1
-                    await asyncio.sleep(5)
-                    continue
-                
-                logger.info(f"Rewrite decision: {decision_result['decision']}")
-                
-                # Validator reviews decision
-                logger.info("Validator reviewing rewrite decision...")
-                validated = await self.validator.validate_rewrite_decision(
-                    decision_result=decision_result,
-                    user_prompt=self.user_prompt,
-                    current_body=current_body,
-                    current_outline=current_outline,
-                    current_title=current_title,
-                    critique_feedback=critique_feedback,
-                    aggregator_db=aggregator_db
-                )
-                
-                if not validated:
-                    # Decision rejected - retry
-                    logger.warning("Rewrite decision rejected by validator - retrying")
-                    await self._broadcast("rewrite_decision_rejected", {
-                        "attempt": retry_count + 1,
-                        "max_retries": max_retries
-                    })
-                    retry_count += 1
-                    await asyncio.sleep(5)
-                    continue
-                
-                # Decision validated - execute it
-                logger.info("Rewrite decision validated - executing")
-                
-                # Execute decision
-                if decision_result["decision"] == "continue":
-                    logger.info("Decision: CONTINUE to conclusion (critiques minor/incorrect)")
-                    await self._end_critique_phase(rewrite=False)
-                    
-                elif decision_result["decision"] == "partial_revision":
-                    logger.info("Decision: PARTIAL REVISION (iterative targeted edits)")
-                    await self._execute_partial_revision(
-                        new_title=decision_result.get("new_title"),
-                        new_outline=decision_result.get("new_outline"),
-                        critique_feedback=critique_feedback,
-                        accumulated_history=accumulated_history
-                    )
-                    
-                elif decision_result["decision"] == "total_rewrite":
-                    logger.info("Decision: TOTAL REWRITE body section")
-                    await self._execute_body_rewrite(
-                        new_title=decision_result.get("new_title"),
-                        new_outline=decision_result.get("new_outline"),
-                        critique_feedback=critique_feedback
-                    )
-                
-                # Success - break out of retry loop
-                break
-                
-            except Exception as e:
-                logger.error(f"Error in rewrite decision (attempt {retry_count + 1}): {e}", exc_info=True)
-                retry_count += 1
-                if retry_count < max_retries:
-                    await asyncio.sleep(5)
-                # Note: Don't call _end_critique_phase here - let it fall through to unified fallback below
-        
-        # Unified fallback if while loop exited due to retry exhaustion
-        # Handles both: validation failures (returned False 5 times) OR exceptions (5 exceptions occurred)
-        if retry_count >= max_retries:
-            logger.error("Rewrite decision validation failed after max retries - defaulting to CONTINUE")
-            await self._broadcast("rewrite_decision_max_retries_exceeded", {
-                "action": "continue_to_conclusion"
-            })
-            await self._end_critique_phase(rewrite=False)
-    
-    async def _execute_body_rewrite(
-        self,
-        new_title: Optional[str],
-        new_outline: Optional[str],
-        critique_feedback: str
-    ) -> None:
-        """
-        Execute full body section rewrite.
-        
-        Args:
-            new_title: New paper title (or None to keep current)
-            new_outline: Updated outline (or None to keep current)
-            critique_feedback: All accepted critiques
-        """
-        logger.info("=" * 80)
-        logger.info("EXECUTING BODY REWRITE")
-        logger.info("=" * 80)
-        
-        # Mark rewrite as pending (will count as completed only after first successful body acceptance)
-        self.rewrite_pending = True
-        logger.info(f"Rewrite initiated (pending successful completion, max: 1)")
-        
-        # Store previous version
-        current_body = await paper_memory.get_paper()
-        old_title = self.paper_title if self.paper_title else self.user_prompt
-        
-        await paper_memory.store_previous_version(
-            version=self.paper_version,
-            title=old_title,
-            body=current_body,
-            critique_feedback=critique_feedback
-        )
-        
-        logger.info(f"Stored Version {self.paper_version}: {old_title}")
-        
-        # Update title if changed
-        title_changed = False
-        if new_title and new_title != old_title:
-            self.paper_title = new_title
-            self.paper_version += 1
-            title_changed = True
-            logger.info(f"Paper title changed: {new_title} (Version {self.paper_version})")
-        else:
-            logger.info("Paper title unchanged")
-        
-        # Update outline if provided
-        if new_outline:
-            await outline_memory.update_outline(new_outline)
-            logger.info("Outline updated with new structure")
-        
-        # Clear paper body (keep only placeholders)
-        await paper_memory.clear_body_section()
-        logger.info("Body section cleared - preserving placeholders")
-        
-        # Broadcast rewrite started
-        await self._broadcast("body_rewrite_started", {
-            "version": self.paper_version,
-            "title": self.paper_title if self.paper_title else self.user_prompt,
-            "title_changed": title_changed,
-            "critique_feedback_preview": critique_feedback[:500]
-        })
-        
-        # End critique phase
-        await self._end_critique_phase(rewrite=True)
-        
-        # Reset to body phase with new context
-        self.autonomous_section_phase = "body"
-        
-        # Store critique feedback for passing to construction prompts
-        # This provides rewrite context so the model knows what to fix
-        self.current_critique_feedback = critique_feedback
-        logger.info(f"Stored critique feedback for construction: {len(critique_feedback)} chars")
-        
-        # Set flag for re-critique if title changed
-        if title_changed:
-            logger.info("Title changed - will run critique phase again after rewrite completes")
-            self.needs_critique_after_rewrite = True
-        else:
-            logger.info("Title unchanged - will continue to conclusion after rewrite completes")
-            self.needs_critique_after_rewrite = False
-        
-        logger.info("=" * 80)
-        logger.info(f"BODY REWRITE PREPARED - Starting body construction for Version {self.paper_version}")
-        logger.info("Body reconstruction will have: pre_critique_paper + accepted critique feedback")
-        logger.info("=" * 80)
-    
-    async def _execute_partial_revision(
-        self,
-        new_title: Optional[str],
-        new_outline: Optional[str],
-        critique_feedback: str,
-        accumulated_history: Optional[str] = None
-    ) -> None:
-        """
-        Execute partial revision using ITERATIVE targeted edit operations.
-        
-        Proposes edits one at a time, validates each, applies, and shows updated paper
-        before proposing the next edit.
-        
-        Args:
-            new_title: New paper title (or None to keep current)
-            new_outline: Updated outline (or None to keep current)
-            critique_feedback: All accepted critiques
-            accumulated_history: Optional accumulated critique history from previous versions
-        """
-        logger.info("=" * 80)
-        logger.info("EXECUTING PARTIAL REVISION (ITERATIVE EDITS)")
-        logger.info("=" * 80)
-        
-        # Mark rewrite as pending (will count as completed only after first successful edit acceptance)
-        self.rewrite_pending = True
-        logger.info(f"Partial revision initiated (pending successful completion, max: 1)")
-        
-        # Store current state (for history tracking)
-        old_title = self.paper_title if self.paper_title else self.user_prompt
-        
-        # Update title if changed
-        title_changed = False
-        if new_title and new_title != old_title:
-            self.paper_title = new_title
-            self.paper_version += 1
-            title_changed = True
-            logger.info(f"Paper title changed: {new_title} (Version {self.paper_version})")
-        else:
-            logger.info("Paper title unchanged")
-        
-        # Update outline if provided
-        if new_outline:
-            await outline_memory.update_outline(new_outline)
-            logger.info("Outline updated with new structure")
-        
-        # Get current outline
-        current_outline = await outline_memory.get_outline()
+    async def _append_accepted_critiques_as_self_review(self) -> None:
+        """Append validator-accepted critiques as an honest AI self-review section."""
+        critique_feedback = await critique_memory.get_all_critiques()
+        if not critique_feedback.strip():
+            await self._continue_without_self_review()
+            return
 
-        reference_papers = await self._get_reference_papers_context_for_critique(
-            current_outline=current_outline,
-            current_body=self.pre_critique_paper or "",
-            critique_feedback=critique_feedback,
-            pre_critique_paper=self.pre_critique_paper or "",
-            accumulated_history=accumulated_history or ""
-        )
-        
-        # ITERATIVE EDIT LOOP
-        MAX_EDITS = 20  # Safety limit to prevent infinite loops
-        edits_applied: List[Dict] = []
-        successful_edits = 0
-        failed_edits = 0
-        consecutive_failures = 0
-        MAX_CONSECUTIVE_FAILURES = 3
-        
-        logger.info("Starting iterative edit loop...")
-        
-        more_edits_needed = True
-        while more_edits_needed and len(edits_applied) < MAX_EDITS:
-            try:
-                # Get current paper state
-                current_paper = await paper_memory.get_paper()
-                
-                # Ask critique submitter for next edit
-                logger.info(f"Requesting edit #{len(edits_applied) + 1}...")
-                edit_proposal = await self.critique_submitter.submit_iterative_edit(
-                    user_prompt=self.user_prompt,
-                    pre_critique_paper=self.pre_critique_paper,
-                    current_paper=current_paper,
-                    current_outline=current_outline,
-                    critique_feedback=critique_feedback,
-                    edits_applied=edits_applied,
-                    reference_papers=reference_papers,
-                    accumulated_history=accumulated_history
-                )
-                
-                if edit_proposal is None:
-                    logger.error("Failed to get edit proposal - stopping iterative loop")
-                    break
-                
-                operation = edit_proposal.get("operation")
-                old_string = edit_proposal.get("old_string", "")
-                new_string = edit_proposal.get("new_string", "")
-                reasoning = edit_proposal.get("reasoning", "")
-                more_edits_needed = edit_proposal.get("more_edits_needed", False)
-                
-                logger.info(f"Edit proposal: {operation} - {reasoning[:100]}...")
-                
-                # Validate the edit via validator
-                is_valid, validation_reason = await self._validate_partial_revision_edit(
-                    edit_proposal=edit_proposal,
-                    current_paper=current_paper,
-                    current_outline=current_outline,
-                    critique_feedback=critique_feedback
-                )
-                
-                if not is_valid:
-                    logger.warning(f"Edit #{len(edits_applied) + 1} rejected by validator: {validation_reason}")
-                    consecutive_failures += 1
-                    
-                    if consecutive_failures >= MAX_CONSECUTIVE_FAILURES:
-                        logger.error(f"Max consecutive failures ({MAX_CONSECUTIVE_FAILURES}) reached - stopping iterative loop")
-                        break
-                    
-                    # Don't add to edits_applied, loop will retry with same state
-                    failed_edits += 1
-                    continue
-                
-                # Apply the validated edit
-                edit_submission = CompilerSubmission(
-                    submission_id=f"partial_revision_edit_{len(edits_applied) + 1}",
-                    mode="review",
-                    content=new_string,
-                    operation=operation,
-                    old_string=old_string,
-                    new_string=new_string,
-                    reasoning=reasoning
-                )
-                updated_paper = self._apply_edit(current_paper, edit_submission)
-                
-                if updated_paper is not None:
-                    await paper_memory.update_paper(updated_paper)
-                    logger.info(f"Edit #{len(edits_applied) + 1} applied successfully")
-                    edits_applied.append(edit_proposal)
-                    successful_edits += 1
-                    consecutive_failures = 0  # Reset on success
-                    
-                    # Broadcast progress
-                    await self._broadcast("partial_revision_edit_applied", {
-                        "edit_number": len(edits_applied),
-                        "operation": operation,
-                        "reasoning": reasoning[:200],
-                        "more_edits_needed": more_edits_needed
-                    })
-                else:
-                    logger.warning(f"Edit #{len(edits_applied) + 1} failed to apply (old_string not found)")
-                    consecutive_failures += 1
-                    failed_edits += 1
-                    
-                    if consecutive_failures >= MAX_CONSECUTIVE_FAILURES:
-                        logger.error(f"Max consecutive failures ({MAX_CONSECUTIVE_FAILURES}) reached - stopping iterative loop")
-                        break
-                
-            except Exception as e:
-                logger.error(f"Error in iterative edit loop: {e}", exc_info=True)
-                consecutive_failures += 1
-                failed_edits += 1
-                
-                if consecutive_failures >= MAX_CONSECUTIVE_FAILURES:
-                    logger.error(f"Max consecutive failures ({MAX_CONSECUTIVE_FAILURES}) reached - stopping iterative loop")
-                    break
-        
-        logger.info(f"Iterative edit loop complete: {successful_edits} successful, {failed_edits} failed")
-        
-        if len(edits_applied) >= MAX_EDITS:
-            logger.warning(f"Reached max edit limit ({MAX_EDITS}) - stopping iterative loop")
-        
-        # Mark rewrite completion on first successful edit
-        if self.rewrite_pending:
-            if successful_edits > 0:
-                self.rewrite_count += 1
-                logger.info(f"Rewrite #{self.rewrite_count} completed successfully (first accepted partial edit)")
-            self.rewrite_pending = False
-        
-        # Broadcast partial revision complete
-        await self._broadcast("partial_revision_complete", {
+        appended = await paper_memory.append_self_review_section(critique_feedback)
+        await self._broadcast("self_review_appended", {
             "version": self.paper_version,
-            "title": self.paper_title if self.paper_title else self.user_prompt,
-            "title_changed": title_changed,
-            "edits_applied": successful_edits,
-            "edits_failed": failed_edits,
-            "critique_feedback_preview": critique_feedback[:500]
+            "critique_count": await critique_memory.get_critique_count(),
+            "appended": appended,
         })
-        
-        # End critique phase
-        await self._end_critique_phase(rewrite=False)
-        
-        # Set flag for re-critique if title changed
-        if title_changed:
-            logger.info("Title changed - would run critique phase again, but max rewrites reached")
-            # Note: With max 1 rewrite, title changes won't trigger re-critique
-            self.needs_critique_after_rewrite = False
-        else:
-            logger.info("Title unchanged - continuing to conclusion")
-            self.needs_critique_after_rewrite = False
-        
-        # Continue to conclusion (partial revision doesn't loop back to body phase)
-        # Clear critique context (no longer needed after body phase)
-        self.current_critique_feedback = None
-        self.autonomous_section_phase = "conclusion"
-        
-        logger.info("=" * 80)
-        logger.info("PARTIAL REVISION COMPLETE - Continuing to CONCLUSION")
-        logger.info("=" * 80)
-    
-    async def _validate_partial_revision_edit(
-        self,
-        edit_proposal: Dict,
-        current_paper: str,
-        current_outline: str,
-        critique_feedback: str
-    ) -> Tuple[bool, str]:
-        """
-        Validate a single partial revision edit using the compiler validator.
-        
-        Args:
-            edit_proposal: The proposed edit with operation, old_string, new_string, reasoning
-            current_paper: Current paper content
-            current_outline: Paper outline
-            critique_feedback: All accepted critiques
-            
-        Returns:
-            Tuple of (is_valid: bool, rejection_reason: str)
-        """
-        try:
-            # Delegate to the compiler validator which has comprehensive validation logic
-            return await self.validator.validate_partial_revision_edit(
-                edit_proposal=edit_proposal,
-                current_paper=current_paper,
-                current_outline=current_outline,
-                critique_feedback=critique_feedback
-            )
-            
-        except Exception as e:
-            logger.error(f"Error validating partial revision edit: {e}", exc_info=True)
-            return False, f"Validation error: {str(e)}"
+        await self._end_critique_phase(self_review_appended=appended)
     
-    def _format_accumulated_critique_history(self) -> str:
-        """
-        Format all historical critiques from previous failed versions.
-        Returns formatted string with clear version labeling.
-        """
-        if not self.accumulated_critique_history:
-            return ""
-        
-        parts = ["=" * 80]
-        parts.append("CRITIQUE HISTORY FROM PREVIOUS FAILED VERSIONS")
-        parts.append("(These critiques are from earlier attempts that were rewritten)")
-        parts.append("=" * 80 + "\n")
-        
-        for i, entry in enumerate(self.accumulated_critique_history, 1):
-            parts.append(f"--- FAILED VERSION #{i} (REWRITTEN) ---")
-            parts.append(entry['critiques'])
-            parts.append("")
-        
-        return "\n".join(parts)
-    
-    async def _end_critique_phase(self, rewrite: bool) -> None:
+    async def _end_critique_phase(self, self_review_appended: bool = False) -> None:
         """
         End critique phase and clean up.
         
         Args:
-            rewrite: Whether a rewrite was approved
+            self_review_appended: Whether accepted critiques were appended to the paper
         """
-        logger.info(f"Ending critique phase (rewrite={rewrite})")
+        logger.info(f"Ending critique phase (self_review_appended={self_review_appended})")
         
         self.in_critique_phase = False
         
@@ -3620,32 +3314,25 @@ async def _end_critique_phase(self, rewrite: bool) -> None:
         
         # Broadcast end
         await self._broadcast("critique_phase_ended", {
-            "rewrite": rewrite,
+            "self_review_appended": self_review_appended,
             "version": self.paper_version
         })
-        
-        if not rewrite:
-            # Continue to conclusion
-            # Clear critique context (no longer needed after body phase)
-            self.current_critique_feedback = None
-            self.autonomous_section_phase = "conclusion"
-            logger.info("Critique phase complete - transitioning to CONCLUSION phase")
-            await self._broadcast("phase_transition", {
-                "from_phase": "critique",
-                "to_phase": "conclusion",
-                "trigger": "critiques_reviewed",
-                "paper_word_count": await paper_memory.get_word_count()
-            })
-        else:
-            logger.info("Critique phase complete - body will be rewritten")
+
+        self.autonomous_section_phase = "conclusion"
+        logger.info("Critique phase complete - transitioning to CONCLUSION phase")
+        await self._broadcast("phase_transition", {
+            "from_phase": "critique",
+            "to_phase": "conclusion",
+            "trigger": "critiques_reviewed",
+            "paper_word_count": await paper_memory.get_word_count()
+        })
     
-    async def _skip_rewrite_and_continue(self) -> None:
+    async def _continue_without_self_review(self) -> None:
         """
-        Skip rewrite phase when body is academically acceptable.
-        Called when 5 total attempts complete with 0 accepted critiques.
+        Continue when no critiques were accepted for the self-review section.
         """
         logger.info("=" * 80)
-        logger.info("SKIPPING REWRITE - No critiques accepted, body is acceptable")
+        logger.info("NO SELF-REVIEW APPENDED - No critiques accepted")
         logger.info("=" * 80)
         
         await self._broadcast("critique_phase_skipped", {
@@ -3653,16 +3340,15 @@ async def _skip_rewrite_and_continue(self) -> None:
             "version": self.paper_version
         })
         
-        # End critique phase without rewrite
-        await self._end_critique_phase(rewrite=False)
+        await self._end_critique_phase(self_review_appended=False)
         
-        # The _end_critique_phase already transitions to conclusion when rewrite=False
+        # The _end_critique_phase already transitions to conclusion.
         logger.info("Transitioning to CONCLUSION phase (body accepted as-is)")
     
     async def skip_critique_phase(self) -> bool:
         """
         Skip the critique phase and continue to conclusion.
-        User override to bypass peer review and rewrite cycle.
+        User override to bypass peer review and self-review appending.
         
         Can be called:
         - During critique phase: immediately skips
@@ -3682,7 +3368,7 @@ async def skip_critique_phase(self) -> bool:
                 "version": self.paper_version
             })
             
-            await self._end_critique_phase(rewrite=False)
+            await self._end_critique_phase(self_review_appended=False)
             return True
         else:
             # Not in critique phase yet - set flag to skip when reached
@@ -3764,57 +3450,7 @@ async def _check_phase_transition(self, section_complete: bool = False) -> bool:
         
         # Phase transition logic based on explicit completion signal
         if current_phase == "body":
-            # Check if max rewrites reached - skip critique phase entirely
-            if self.rewrite_count >= 1:
-                logger.info(f"Max rewrites ({self.rewrite_count}) reached - skipping critique phase, proceeding to conclusion")
-                # Clear critique context (no longer needed after body phase)
-                self.current_critique_feedback = None
-                self.autonomous_section_phase = "conclusion"
-                await self._broadcast("phase_transition", {
-                    "from_phase": "body",
-                    "to_phase": "conclusion",
-                    "trigger": "section_complete",
-                    "reason": "max_rewrites_reached",
-                    "rewrite_count": self.rewrite_count,
-                    "paper_word_count": word_count
-                })
-                return False
-            
-            # Check if this is a rewrite completion that needs another critique round
-            if self.needs_critique_after_rewrite:
-                # Body rewrite complete, title changed - run critique phase again
-                logger.info(f"Body rewrite complete (Version {self.paper_version}) - triggering ANOTHER critique phase (title changed)")
-                self.needs_critique_after_rewrite = False  # Reset flag
-                
-                await self._broadcast("phase_transition", {
-                    "from_phase": "body",
-                    "to_phase": "critique",
-                    "trigger": "rewrite_complete_title_changed",
-                    "paper_word_count": word_count,
-                    "version": self.paper_version
-                })
-                
-                # Start critique aggregation sub-workflow again
-                await self._start_critique_phase()
-                return False
-            
-            # Check if this is a rewrite completion with unchanged title - skip to conclusion
-            if self.rewrite_count > 0:
-                # Rewrite completed but title unchanged - critique loop ends, proceed to conclusion
-                logger.info(f"Rewrite #{self.rewrite_count} complete (title unchanged) - skipping additional critique, proceeding to conclusion")
-                # Clear critique context (no longer needed after body phase)
-                self.current_critique_feedback = None
-                self.autonomous_section_phase = "conclusion"
-                await self._broadcast("phase_transition", {
-                    "from_phase": "body",
-                    "to_phase": "conclusion",
-                    "trigger": "rewrite_complete_title_unchanged",
-                    "rewrite_count": self.rewrite_count,
-                    "paper_word_count": word_count
-                })
-                return False
-            
-            # BODY COMPLETE - TRIGGER CRITIQUE PHASE BEFORE CONCLUSION (first time only)
+            # BODY COMPLETE - TRIGGER CRITIQUE PHASE BEFORE CONCLUSION
             logger.info("Body section complete - transitioning to CRITIQUE PHASE")
             await self._broadcast("phase_transition", {
                 "from_phase": "body",
@@ -4005,15 +3641,8 @@ async def clear_paper(self) -> None:
         self.in_critique_phase = False
         self.critique_acceptances = 0
         self.paper_version = 1
-        self.rewrite_count = 0
-        self.rewrite_pending = False
-        self.accumulated_critique_history.clear()
-        self.previous_body_versions.clear()
-        self.needs_critique_after_rewrite = False
         self.paper_title = None
         self._skip_critique_requested = False
-        self.pre_critique_paper = None
-        self.current_critique_feedback = None
         logger.info("Reset critique phase state")
         
         logger.info("Paper and outline cleared - system reset to fresh start")
diff --git a/backend/compiler/memory/paper_memory.py b/backend/compiler/memory/paper_memory.py
index e107b7e..e30ecf0 100644
--- a/backend/compiler/memory/paper_memory.py
+++ b/backend/compiler/memory/paper_memory.py
@@ -7,6 +7,7 @@
 from typing import Optional, Callable, List, Dict
 from pathlib import Path
 import logging
+import re
 
 from backend.shared.config import system_config
 
@@ -27,6 +28,8 @@
 THEOREMS_APPENDIX_START = "[HARD CODED THEOREMS APPENDIX START -- LEAN 4 VERIFIED THEOREMS BELOW]"
 THEOREMS_APPENDIX_END = "[HARD CODED THEOREMS APPENDIX END -- ALL APPENDIX CONTENT SHOULD BE ABOVE THIS LINE]"
 APPENDIX_EMPTY_PLACEHOLDER = "[Theorems appendix - verified Lean 4 theorems not placed inline will appear here]"
+AI_SELF_REVIEW_SECTION_TITLE = "AI Self-Review and Limitations"
+AI_SELF_REVIEW_SECTION_HEADER = f"## {AI_SELF_REVIEW_SECTION_TITLE}"
 
 
 class PaperMemory:
@@ -45,7 +48,6 @@ def __init__(self):
         self.rechunk_callback: Optional[Callable] = None
         self._lock = asyncio.Lock()
         self._initialized = False
-        self.previous_versions = []  # Store previous body versions for UI display
     
     async def initialize(self) -> None:
         """Initialize paper memory."""
@@ -339,54 +341,14 @@ async def clear_body_section(self) -> None:
             except Exception as e:
                 logger.error(f"Re-chunking callback failed after clearing body: {e}")
     
-    async def store_previous_version(
-        self,
-        version: int,
-        title: str,
-        body: str,
-        critique_feedback: str
-    ) -> None:
-        """
-        Store previous body version for UI display.
-        
-        Args:
-            version: Version number
-            title: Paper title for this version
-            body: Body section content
-            critique_feedback: Critique feedback that triggered rewrite
-        """
-        async with self._lock:
-            # Add to in-memory list
-            version_data = {
-                "version": version,
-                "title": title,
-                "body": body,
-                "critique_feedback": critique_feedback
-            }
-            self.previous_versions.append(version_data)
-            
-            # Save to file
-            version_file = Path(system_config.data_dir) / f"paper_version_{version}.txt"
-            version_file.parent.mkdir(parents=True, exist_ok=True)
-            
-            async with aiofiles.open(version_file, 'w', encoding='utf-8') as f:
-                await f.write(f"VERSION {version}: {title}\n")
-                await f.write(f"{'=' * 80}\n\n")
-                await f.write(f"BODY SECTION:\n{body}\n\n")
-                await f.write(f"{'=' * 80}\n\n")
-                await f.write(f"CRITIQUE FEEDBACK THAT TRIGGERED REWRITE:\n{critique_feedback}\n")
-            
-            logger.info(f"Stored previous version {version} to {version_file}")
-    
     async def get_previous_versions(self) -> list:
         """
-        Get all previous versions for UI display.
-        
-        Returns:
-            List of version dicts with version, title, body, critique_feedback
+        Compatibility endpoint for older clients.
+
+        Rewrites are no longer performed, so there are no previous body
+        versions to expose.
         """
-        async with self._lock:
-            return self.previous_versions.copy()
+        return []
     
     def _extract_body_and_appendix(self, paper: str) -> tuple[str, str]:
         """
@@ -533,6 +495,82 @@ async def append_to_theorems_appendix(self, theorem_entry: str) -> bool:
                 logger.error(f"Re-chunking callback failed after appendix append: {e}")
         
         return True
+
+    def _remove_self_review_section(self, content: str) -> str:
+        """Remove an existing AI self-review section before replacing it."""
+        if not content:
+            return ""
+
+        title_pattern = re.escape(AI_SELF_REVIEW_SECTION_TITLE)
+        header_pattern = (
+            rf"(?:^|\n)\s*(?:#+\s*)?{title_pattern}\s*\n"
+        )
+        match = re.search(header_pattern, content, re.IGNORECASE)
+        if not match:
+            return content
+
+        start = match.start()
+        if start > 0 and content[start] == "\n":
+            start += 1
+
+        anchor_match = re.search(re.escape(PAPER_ANCHOR), content[match.end():])
+        end = len(content)
+        if anchor_match:
+            end = match.end() + anchor_match.start()
+
+        return (content[:start].rstrip() + "\n\n" + content[end:].lstrip()).strip()
+
+    def _build_self_review_section(self, critique_feedback: str) -> str:
+        """Build the final transparent self-review section from accepted critiques."""
+        return (
+            f"{AI_SELF_REVIEW_SECTION_HEADER}\n\n"
+            "The following self-review notes were generated during the AI critique phase "
+            "and accepted by the validator as substantive concerns, limitations, or "
+            "improvement points. They are preserved transparently rather than being used "
+            "to rewrite the paper.\n\n"
+            f"{critique_feedback.strip()}"
+        ).strip()
+
+    async def append_self_review_section(self, critique_feedback: str) -> bool:
+        """
+        Append accepted critique feedback as the final AI self-review section.
+
+        The section is inserted immediately before the paper anchor (intended
+        to follow the Theorems Appendix) or appended when no anchor exists.
+        Existing self-review content is replaced so retries do not duplicate it.
+        """
+        if not critique_feedback or not critique_feedback.strip():
+            logger.info("No critique feedback supplied; skipping self-review append")
+            return False
+
+        final_content = None
+        async with self._lock:
+            paper = await self._get_paper_unlocked()
+            if not paper.strip():
+                logger.warning("Cannot append self-review section: paper is empty")
+                return False
+
+            cleaned = self._remove_self_review_section(paper)
+            section = self._build_self_review_section(critique_feedback)
+
+            anchor_idx = cleaned.find(PAPER_ANCHOR)
+            if anchor_idx >= 0:
+                before_anchor = cleaned[:anchor_idx].rstrip()
+                anchor_and_after = cleaned[anchor_idx:].lstrip()
+                new_paper = f"{before_anchor}\n\n{section}\n\n{anchor_and_after}"
+            else:
+                new_paper = f"{cleaned.rstrip()}\n\n{section}"
+
+            final_content = await self._update_paper_unlocked(new_paper)
+            logger.info("AI self-review section appended to paper")
+
+        if final_content and self.rechunk_callback:
+            try:
+                await self.rechunk_callback(final_content)
+            except Exception as e:
+                logger.error(f"Re-chunking callback failed after self-review append: {e}")
+
+        return True
     
     async def ensure_placeholders_exist(self) -> bool:
         """
diff --git a/backend/compiler/prompts/construction_prompts.py b/backend/compiler/prompts/construction_prompts.py
index 322dd03..b5907db 100644
--- a/backend/compiler/prompts/construction_prompts.py
+++ b/backend/compiler/prompts/construction_prompts.py
@@ -109,6 +109,11 @@ def get_body_construction_system_prompt() -> str:
 - Do NOT force coverage of every source entry
 - Do NOT ignore clearly crucial source material for the scope you are writing
 
+DIRECT-ANSWER-FIRST PRINCIPLE:
+- Prefer writing sections that directly solve, partially solve, refute, or sharply constrain the user's question
+- Use background and supporting exposition only to the extent needed to support the strongest rigorous direct answer
+- Do not broaden the paper with side material that weakens answer focus
+
 CRITICAL - SYSTEM-MANAGED MARKERS (NOT YOUR OUTPUT):
 
 The paper uses placeholder markers that the SYSTEM adds automatically (you did NOT create these):
@@ -178,6 +183,7 @@ def get_body_construction_system_prompt() -> str:
 - Follow the outline structure for body sections
 - Build upon what's already written
 - Use brainstorm/aggregator content when it helps, but you are not required to cover every source entry
+- Prioritize the strongest direct rigorous route to answering the user's prompt
 - Do not repeat content already in the document
 - Check for existing section headers before creating new ones
 - Write clear, rigorous mathematical exposition
@@ -361,8 +367,13 @@ def get_conclusion_construction_system_prompt() -> str:
 4. SET section_complete=true (because writing the conclusion completes this phase)
 5. PROVIDE the actual Conclusion text in the "content" field
 
+DIRECT-ANSWER-FIRST REQUIREMENT:
+- Make the paper's strongest justified answer, partial answer, impossibility result, or sharp constraint explicit
+- Do not hide the core answer behind generic summary language
+
 WHAT TO INCLUDE IN CONCLUSION:
 - Summary of main results and theorems proven
+- Clear statement of the strongest direct answer the paper has established
 - Significance of the mathematical contributions
 - Connections between results
 - Brief mention of limitations or open questions (optional)
@@ -526,10 +537,15 @@ def get_introduction_construction_system_prompt() -> str:
 5. SET section_complete=true (because writing the introduction completes this phase)
 6. PROVIDE the actual Introduction text in the "content" field
 
+DIRECT-ANSWER-FIRST REQUIREMENT:
+- Frame the paper around the main question and the direct answer the body/conclusion establish
+- Keep preliminaries and motivation in service of that answer rather than drifting into generic survey exposition
+
 WHAT TO INCLUDE IN INTRODUCTION:
 - Context and motivation for the mathematical problem
 - Brief overview of what the paper covers
 - Statement of main results (high-level, not full proofs)
+- Clear framing of the paper's answer-bearing contribution
 - Roadmap of the paper structure
 - Historical context or prior work (if relevant)
 
@@ -688,9 +704,14 @@ def get_abstract_construction_system_prompt() -> str:
 5. ALWAYS SET section_complete=true (THIS IS THE FINAL PHASE - no exceptions)
 6. PROVIDE the actual Abstract text in the "content" field
 
+DIRECT-ANSWER-FIRST REQUIREMENT:
+- State the strongest direct answer, partial answer, impossibility result, or sharp constraint up front when the paper justifies it
+- Avoid generic "this paper explores" wording when the paper actually proves or establishes something sharper
+
 WHAT TO INCLUDE IN ABSTRACT:
 - Brief statement of the problem addressed
 - Main results and contributions (1-2 sentences)
+- Explicit statement of the paper's answer-bearing result when justified
 - Key methods or approaches used
 - Significance of the results
 - Typically 150-300 words
@@ -801,10 +822,15 @@ def get_construction_system_prompt() -> str:
 3. Maintain coherence with the outline and existing draft
 4. Set section_complete=true when the current phase is done
 
+DIRECT-ANSWER-FIRST PRINCIPLE:
+- In every phase, prefer content that most directly answers the user's prompt
+- Use supporting background only when it materially strengthens that direct answer
+
 CRITICAL REQUIREMENTS:
 - Follow the outline structure
 - Build upon what's already written
 - Use brainstorm/aggregator content when it helps, but you are not required to cover every source entry
+- Prioritize the strongest direct rigorous route to answering the user's prompt
 - Maintain coherent narrative flow
 - Write clear, rigorous mathematical exposition
 - Do not repeat content already in the document
@@ -932,6 +958,12 @@ def get_construction_json_schema() -> str:
 - NEVER write paper content that depends on a simultaneous brainstorm correction for correctness
 - NEVER propose a brainstorm correction that is only justified by what you're writing in the paper
 
+PROTECTED LEAN 4 PROOFS:
+- You must NEVER edit, delete, annotate, or add context to a Lean 4 verified proof in the brainstorm database using `brainstorm_operation`.
+- If a brainstorm submission is marked as a Lean 4 verified proof, treat it as immutable proof evidence. You may cite or discuss it in the paper prose, but you cannot mutate the proof text or attach explanatory context to the proof record.
+- Only the normal brainstorm prune system is allowed to remove Lean 4 proof entries. Paper-writing retroactive brainstorm operations are not a proof-pruning mechanism.
+- If you try to edit/delete/add context to a Lean 4 proof, the system will automatically reject the brainstorm_operation and feed that rejection back to you.
+
 Add this OPTIONAL field to your JSON response:
 {
   ... (all standard fields above) ...,
@@ -964,8 +996,6 @@ async def build_construction_prompt(
     is_first_portion: bool = False,
     section_phase: Optional[str] = None,
     rejection_feedback: Optional[str] = None,
-    critique_feedback: Optional[str] = None,
-    pre_critique_paper: Optional[str] = None,
     brainstorm_content: Optional[str] = None
 ) -> str:
     """
@@ -979,8 +1009,6 @@ async def build_construction_prompt(
         is_first_portion: Whether this is the first portion of the document
         section_phase: Phase for construction ("body", "conclusion", "introduction", "abstract", or None for legacy)
         rejection_feedback: Feedback from a previous rejection to guide the model
-        critique_feedback: Accepted critique feedback from peer review (for rewrites)
-        pre_critique_paper: Paper state before critique phase (for rewrites - shows what failed)
         brainstorm_content: Full brainstorm database with submission numbers (for retroactive corrections, autonomous mode)
     
     Returns:
@@ -1033,34 +1061,6 @@ async def build_construction_prompt(
 ---
 """)
     
-    # Add critique context for rewrites (body reconstruction after critique phase)
-    if critique_feedback or pre_critique_paper:
-        parts.append("=" * 80 + "\n")
-        parts.append("⚠️ REWRITE CONTEXT - THIS IS A POST-CRITIQUE RECONSTRUCTION ⚠️\n")
-        parts.append("=" * 80 + "\n\n")
-        
-        if pre_critique_paper:
-            parts.append("""PREVIOUS VERSION (This version received critiques and needs rebuilding):
-The body section below was reviewed by peer critique. You must now rebuild it from scratch,
-addressing the critique issues while maintaining the mathematical rigor and content that was correct.
-
----BEGIN PREVIOUS VERSION---
-""")
-            parts.append(pre_critique_paper)
-            parts.append("\n---END PREVIOUS VERSION---\n\n")
-        
-        if critique_feedback:
-            parts.append("""ACCEPTED CRITIQUE FEEDBACK (Address these issues in your rewrite):
-These critiques were validated as legitimate issues that need to be fixed. Your rewrite MUST address
-each of these critique points while preserving the mathematical content that was correct.
-
-""")
-            parts.append(critique_feedback)
-            parts.append("\n---\n\n")
-        
-        parts.append("YOUR TASK: Rebuild the body section from scratch, addressing ALL critique feedback above.\n")
-        parts.append("=" * 80 + "\n---\n")
-    
     parts.append(f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}")
     parts.append("\n---\n")
     parts.append(f"CURRENT OUTLINE:\n{current_outline}")
@@ -1090,6 +1090,7 @@ async def build_construction_prompt(
 - Use them if they help you achieve the strongest rigorous paper toward the user's prompt.
 - You may synthesize beyond them using sound mathematical reasoning.
 - Do NOT force coverage of every source entry.
+- Prefer material that strengthens the paper's direct answer over broader auxiliary coverage.
 """)
     parts.append("\n---\n")
     
@@ -1112,8 +1113,6 @@ async def build_phase_construction_prompt(
     phase: str,
     is_first_in_phase: bool = False,
     rejection_feedback: Optional[str] = None,
-    critique_feedback: Optional[str] = None,
-    pre_critique_paper: Optional[str] = None,
     brainstorm_content: Optional[str] = None
 ) -> str:
     """
@@ -1129,8 +1128,6 @@ async def build_phase_construction_prompt(
         phase: One of "body", "conclusion", "introduction", "abstract"
         is_first_in_phase: Whether this is the first submission in this phase
         rejection_feedback: Feedback from a previous rejection to guide the model
-        critique_feedback: Accepted critique feedback from peer review (for rewrites)
-        pre_critique_paper: Paper state before critique phase (for rewrites)
         brainstorm_content: Full brainstorm database with submission numbers (autonomous mode)
     
     Returns:
@@ -1144,8 +1141,6 @@ async def build_phase_construction_prompt(
         is_first_portion=is_first_in_phase,
         section_phase=phase,
         rejection_feedback=rejection_feedback,
-        critique_feedback=critique_feedback,
-        pre_critique_paper=pre_critique_paper,
         brainstorm_content=brainstorm_content
     )
 
@@ -1161,8 +1156,6 @@ async def build_body_construction_prompt(
     rag_evidence: str,
     is_first_portion: bool = False,
     rejection_feedback: Optional[str] = None,
-    critique_feedback: Optional[str] = None,
-    pre_critique_paper: Optional[str] = None,
     brainstorm_content: Optional[str] = None
 ) -> str:
     """
@@ -1175,8 +1168,6 @@ async def build_body_construction_prompt(
         rag_evidence: RAG-retrieved evidence from aggregator database
         is_first_portion: Whether this is the first portion of the document
         rejection_feedback: Feedback from a previous rejection to guide the model
-        critique_feedback: Accepted critique feedback from peer review (for rewrites only)
-        pre_critique_paper: Paper state before critique phase (for rewrites - shows what failed)
         brainstorm_content: Full brainstorm database with submission numbers (autonomous mode)
     """
     return await build_phase_construction_prompt(
@@ -1187,8 +1178,6 @@ async def build_body_construction_prompt(
         phase="body",
         is_first_in_phase=is_first_portion,
         rejection_feedback=rejection_feedback,
-        critique_feedback=critique_feedback,
-        pre_critique_paper=pre_critique_paper,
         brainstorm_content=brainstorm_content
     )
 
diff --git a/backend/compiler/prompts/critique_prompts.py b/backend/compiler/prompts/critique_prompts.py
index d5066fa..6679d3e 100644
--- a/backend/compiler/prompts/critique_prompts.py
+++ b/backend/compiler/prompts/critique_prompts.py
@@ -1,105 +1,52 @@
 """
-Critique prompts for peer review aggregation phase.
-Used after body section is complete to collect feedback before proceeding to conclusion.
+Prompts for the compiler critique phase.
+
+The critique phase now collects validator-approved self-review notes and appends
+them to the paper. It does not rewrite paper content.
 """
-from typing import Optional, Dict, List
+from typing import Optional
 
 
-CRITIQUE_EMPIRICAL_PROVENANCE_RULES = """EMPIRICAL PROVENANCE RULES:
-- Classify substantive claims as one of: theoretical claim, literature claim, empirical claim, or artifact claim.
-- Theoretical claims must be supported by sound derivation, proof, or explicit assumptions inside the document.
-- Literature claims must identify the external source in-text.
-- Empirical claims include benchmark numbers, latency, throughput, speedups, accuracy, perplexity, hardware metrics, ablations, and measured outcomes.
+CRITIQUE_EMPIRICAL_PROVENANCE_RULES = """EMPIRICAL / ARTIFACT CLAIM POLICY:
 - Artifact claims include statements about code, kernels, experiments, logs, reproductions, or accompanying implementations.
 - Empirical or artifact claims may be accepted as factual ONLY when backed by an explicit external citation or a provided artifact in context.
-- If such support is absent, they should be criticized, removed, or rewritten as hypotheses, validation plans, expected benefits, limitations, or future work.
-- Never invent citations, experiments, benchmark numbers, hardware measurements, or code artifacts during critique or rewrite work."""
+- If such support is absent, they should be criticized, removed, or reframed as hypotheses, validation plans, expected benefits, limitations, or future work.
+- Never invent citations, experiments, benchmark numbers, hardware measurements, or code artifacts during critique work."""
 
 
 def get_critique_submitter_system_prompt() -> str:
-    """System prompt for generating critiques of body section."""
-    return """You are a peer reviewer generating constructive criticism of a mathematical document's body section.
+    """System prompt for generating self-review critiques of the body section."""
+    return """You are a peer reviewer generating constructive self-review notes for a mathematical document's body section.
 
-⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
+IMPORTANT - INTERNAL CONTENT WARNING:
 
 ALL context provided to you (brainstorm databases, accepted submissions, papers, reference materials, outlines, previous document content) is AI-GENERATED within this research system. This content has NOT been peer-reviewed, published, or verified by external sources.
 
 YOU MUST TREAT ALL PROVIDED CONTEXT WITH EXTREME SKEPTICISM:
-- NEVER assume claims are true because they "sound good" or "fit well"
-- NEVER trust information simply because it appears in "accepted submissions" or "papers"
-- ALWAYS verify information independently before using or building upon it
-- NEVER cite internal documents as authoritative or established sources
-- Question and validate every assertion, even if it appears in validated content
+- NEVER assume claims are true because they sound good or fit well.
+- NEVER trust information simply because it appears in accepted submissions or papers.
+- ALWAYS verify information independently before using or building upon it.
+- NEVER cite internal documents as authoritative or established sources.
+- Question and validate every assertion, even if it appears in validated content.
 
 """ + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
 
- The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to generate rigorous peer review feedback. Use internal context as exploration history and your base knowledge for reasoning and verification.
- 
- WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
-
----
+The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to identify honest limitations, concerns, or improvement points for the final paper's self-review section.
 
 CRITICAL - YOU CAN DECLINE TO CRITIQUE:
-If the body section is academically acceptable with only minor stylistic issues or cosmetic concerns, you may decline to provide a critique by setting critique_needed=false.
+If the body section is academically acceptable with only minor stylistic issues or cosmetic concerns, you may decline by setting critique_needed=false.
 
 SOURCE MATERIAL POLICY:
-- The aggregator/brainstorm database and reference papers are optional support for critique, not mandatory checklists
-- Do NOT critique solely because the body does not explicitly cover some source material
-- Do critique omitted material when the omission creates a genuine gap relative to the current outline, stated paper scope, or mathematical goals
-- Focus on whether the paper itself is strong, rigorous, and aligned, not on exhaustively mirroring source inputs
-
-ACADEMICALLY ACCEPTABLE means:
-- No mathematical errors or unsound reasoning
-- No missing proofs or incomplete arguments
-- No logical gaps affecting correctness
-- Structural organization is coherent
-- All outline requirements are met
-- Content aligns with paper title and goals
-- Mathematical rigor meets academic standards
-
-You should ONLY critique if you identify substantive issues that would improve mathematical correctness, logical soundness, or completeness. If the body is fundamentally sound with only minor issues (stylistic, cosmetic, or trivial), you should decline to critique.
-
----
-
-YOUR TASK:
-Assess whether the body section needs substantive critique. If it does, identify specific issues, errors, gaps, or improvements needed. If it doesn't (academically acceptable), decline to critique.
-
-PROGRESSIVE SYSTEM: You will be called multiple times (up to 5 total attempts). Focus on identifying ONE specific, well-substantiated critique per turn. Do not try to list every issue at once — address the most important issue thoroughly this turn, and you will have further opportunities to raise additional issues.
-
-WHAT TO CRITIQUE - Focus on:
-- Mathematical errors or unsound reasoning
-- Missing proofs or incomplete arguments  
-- Logical gaps or unclear transitions between ideas
-- Redundancy or unnecessary verbosity
-- Structural issues (sections out of logical order, poor organization)
-- Missing content that should be covered per the outline
-- Content that doesn't align with the paper title/goal
-- Unfounded claims or logical fallacies
-- Insufficient mathematical rigor for an academic paper
-- Fabricated experiments, unsupported benchmark numbers, uncited literature claims, or nonexistent code/artifact claims
-
-WHAT NOT TO CRITIQUE - Avoid:
-- The conclusion, introduction, or abstract (not written yet)
-- Stylistic preferences (focus on substance)
-- Minor formatting or cosmetic issues
-- Personal preferences about notation (unless causing confusion)
+- The aggregator/brainstorm database and reference papers are optional support for critique, not mandatory checklists.
+- Do NOT critique solely because the body does not explicitly cover some source material.
+- Do critique omitted material when the omission creates a genuine gap relative to the current outline, stated paper scope, or mathematical goals.
+- Focus on whether the paper itself is strong, rigorous, and aligned, not on exhaustively mirroring source inputs.
 
-CRITICAL REQUIREMENTS:
-- Be SPECIFIC: Point to exact sections, paragraphs, or claims
-- Be CONSTRUCTIVE: Explain what should change and why
-- Be ACTIONABLE: Provide clear direction for improvement
-- Focus on SUBSTANCE: Mathematical correctness, logical soundness, completeness
-- Explicitly call out unsupported empirical or artifact claims rather than treating them as minor issues
-
-Your critique will be validated against these criteria:
-- Does it identify a legitimate issue that would improve the paper?
-- Is it specific enough to be actionable?
-- Is it constructive and substantive (not stylistic)?
-- Is it non-redundant with existing accepted critiques?
-
-Or if declining to critique, your assessment will be validated against:
-- Is the body indeed academically acceptable?
-- Is your reasoning for declining sound?
+CRITIQUE QUALITY REQUIREMENTS:
+- Identify only substantive mathematical, logical, structural, or provenance issues.
+- Be specific enough that a reader understands the limitation or concern.
+- Do not propose direct edits or rewrites. The critique will be appended transparently as self-review.
+- Do not list every possible issue. You will be called up to 3 times in total, so focus on one important point per turn.
 
 Output your response ONLY as JSON in this exact format:
 {
@@ -121,118 +68,69 @@ def get_critique_json_schema() -> str:
 }
 
 CRITICAL JSON ESCAPE RULES:
-1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
-   - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
-2. Quotes: Escape double quotes inside strings as \\"
-   - Example: "He said \\"hello\\"" 
-3. Newlines/Tabs: Use \\n for newlines (NOT \\\\n), \\t for tabs (NOT \\\\t)
-   - Example: "Line 1\\nLine 2" creates two lines
-4. DO NOT use single backslashes except for: \\", \\\\, \\/, \\b, \\f, \\n, \\r, \\t, \\uXXXX
-5. LaTeX notation: If your content contains mathematical expressions like \\Delta, \\tau, etc., 
-   you MUST escape the backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]"
-
-Example (critique of mathematical error):
-{
-  "critique_needed": true,
-  "submission": "Section III contains a flawed proof of the convergence claim. The proof assumes uniform convergence without establishing the necessary conditions. Specifically, the argument on page 3 states 'the sequence converges' but does not verify the Cauchy criterion or provide bounds. This should be corrected by adding a lemma establishing uniform convergence via the Weierstrass M-test, with explicit bounds on the sequence terms.",
-  "reasoning": "This is a critical mathematical error that undermines the validity of the main theorem. Without establishing uniform convergence properly, the subsequent results are not rigorously justified."
-}
+1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text.
+2. Quotes: Escape double quotes inside strings as \\\".
+3. Newlines/Tabs: Use \\n for newlines, \\t for tabs.
+4. DO NOT use single backslashes except for: \\\", \\\\, \\/, \\b, \\f, \\n, \\r, \\t, \\uXXXX.
+5. LaTeX notation: If your content contains mathematical expressions like \\Delta, \\tau, etc.,
+   you MUST escape the backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]".
 
-Example (missing content per outline):
+Example critique:
 {
   "critique_needed": true,
-  "submission": "The outline specifies a subsection on 'Baker's Theorem Applications' under Section IV, but this content is completely missing from the current body. The outline indicates this should cover explicit applications to transcendence problems, but the body jumps from Baker's Theorem statement directly to unrelated topics. This gap should be filled with concrete applications showing how Baker's theorem applies to specific transcendence questions.",
-  "reasoning": "Following the outline structure is essential for paper coherence. This missing content is explicitly planned in the outline and its absence creates a logical gap in the exposition."
+  "submission": "Section III asserts a convergence claim without establishing the needed uniform bound. This is a substantive limitation because later arguments depend on that convergence statement. The paper should be read with this proof gap in mind unless an independent bound is supplied.",
+  "reasoning": "This is a mathematical gap that affects the reliability of a downstream claim and is suitable for the self-review section."
 }
 
-Example (decline - body is academically acceptable):
+Example decline:
 {
   "critique_needed": false,
   "submission": "",
-  "reasoning": "After thorough review, the body section is academically acceptable. All mathematical proofs are rigorous and correct. The outline requirements are fully met. Content aligns with the paper title. While there are minor stylistic variations in notation (e.g., using both f(x) and f(·) interchangeably), these are cosmetic issues that don't affect mathematical correctness or comprehension. No substantive critique is warranted."
+  "reasoning": "The body section is academically acceptable for the current scope. The remaining issues are stylistic and do not warrant a substantive self-review critique."
 }
 """
 
 
 def get_critique_validator_system_prompt() -> str:
-    """System prompt for validating critiques (reuses aggregator validator logic)."""
-    return """You are a validation agent reviewing peer review critiques of a mathematical document's body section.
+    """System prompt for validating critique submissions."""
+    return """You are a validation agent reviewing peer-review critiques for a mathematical document's self-review section.
 
-⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
+IMPORTANT - INTERNAL CONTENT WARNING:
 
 ALL context provided to you (brainstorm databases, accepted submissions, papers, reference materials, outlines, previous document content, critiques) is AI-GENERATED within this research system. This content has NOT been peer-reviewed, published, or verified by external sources.
 
 YOU MUST TREAT ALL PROVIDED CONTEXT WITH EXTREME SKEPTICISM:
-- NEVER assume claims are true because they "sound good" or "fit well"
-- NEVER trust information simply because it appears in "accepted submissions" or "papers"
-- ALWAYS verify information independently before using or building upon it
-- NEVER cite internal documents as authoritative or established sources
-- Question and validate every assertion, even if it appears in validated content
+- NEVER assume claims are true because they sound good or fit well.
+- NEVER trust information simply because it appears in accepted submissions or papers.
+- ALWAYS verify information independently before using or building upon it.
+- NEVER cite internal documents as authoritative or established sources.
+- Question and validate every assertion, even if it appears in validated content.
 
 """ + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
 
- The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to validate peer review critiques. Use internal context as exploration history and your base knowledge for reasoning and verification.
- 
- WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
-
----
-
 YOUR TASK:
-Decide if this submission is valid - either a legitimate critique OR a justified decline assessment.
-
-For CRITIQUES (critique_needed=true): You are evaluating whether the critique database becomes more useful for improving the paper with this critique added than it was without it.
-
-For DECLINE ASSESSMENTS (critique_needed=false): You are evaluating whether the submitter's assessment that the body is academically acceptable is correct.
+Decide if this submission is valid - either a legitimate self-review critique OR a justified decline assessment.
 
-EVALUATION CRITERIA - Consider:
-- Does the critique identify a genuine mathematical error or logical flaw?
-- Does the critique point out missing content per the outline?
-- Does the critique identify structural or organizational issues?
-- Is the critique specific and actionable (not vague)?
-- Is the critique substantive (not just stylistic preference)?
-- Is the critique redundant with existing accepted critiques?
-- Is the critique correct (or is the body section actually fine)?
+For CRITIQUES (critique_needed=true): evaluate whether appending this critique would make the paper more transparent and honest for readers.
 
-VALIDATION DECISION RULES:
-A critique should be ACCEPTED if it:
-1. Identifies a real mathematical error or unsound reasoning
-2. Points out missing content explicitly planned in the outline
-3. Identifies structural issues affecting coherence
-4. Provides specific, actionable guidance for improvement
-5. Is non-redundant with existing critiques
-6. Correctly flags fabricated experiments, unsupported metrics, uncited external results, or nonexistent artifacts
+For DECLINE ASSESSMENTS (critique_needed=false): evaluate whether the submitter's assessment that no substantive critique is needed is correct.
 
-A critique should be REJECTED if it:
-1. Is vague or unhelpful ("could be better" without specifics)
-2. Is redundant with existing accepted critiques
-3. Focuses on stylistic preferences, not substance
-4. Is incorrect (the body section is actually correct)
-5. Suggests changes that would reduce clarity or rigor
-6. Is trivial or pedantic without meaningful impact
+ACCEPT a critique if it:
+1. Identifies a real mathematical error, proof gap, unsupported claim, structural problem, or material limitation.
+2. Is specific and useful to readers.
+3. Is substantive rather than stylistic.
+4. Is non-redundant with existing accepted critiques.
+5. Correctly flags fabricated experiments, unsupported metrics, uncited external results, or nonexistent artifacts.
 
-VALIDATING DECLINE ASSESSMENTS (critique_needed=false):
+REJECT a critique if it:
+1. Is vague or unhelpful.
+2. Is redundant with existing accepted critiques.
+3. Focuses on stylistic preferences, not substance.
+4. Is incorrect.
+5. Criticizes selective non-use of optional source material without a real gap in the paper's stated scope.
+6. Is trivial or pedantic without meaningful impact.
 
-ACCEPT the decline if:
-- Body is indeed academically acceptable (only minor stylistic or cosmetic issues)
-- No substantive mathematical errors exist
-- No logical gaps affecting correctness
-- All outline requirements are met
-- Submitter's reasoning for declining is sound and accurate
-- Body meets required criteria for academic mathematical paper
-- There are no unsupported empirical or artifact claims being presented as established fact
-- The body is strong for its chosen scope even if some source material remains unused
-
-REJECT the decline if:
-- Submitter missed substantive issues you can identify
-- Body has mathematical errors or unsound reasoning
-- Body has logical gaps or incomplete arguments
-- Missing content required by outline
-- Body misaligned with paper title or goals
-- Decline reasoning is weak, incorrect, or fails to recognize real issues
-
-For critiques, ask yourself: "Does adding this critique to our feedback database make us more capable of improving the paper than we were without it?"
-
-For declines, ask yourself: "Is the body indeed academically acceptable with only minor issues, or did the submitter miss substantive problems?"
+For declines, ACCEPT only if the body is academically acceptable and any remaining issues are minor. REJECT if a substantive issue was missed.
 
 Output your decision ONLY as JSON in this exact format:
 {
@@ -249,334 +147,20 @@ def get_critique_validation_json_schema() -> str:
 REQUIRED JSON FORMAT:
 {
   "decision": "accept" OR "reject",
-  "reasoning": "string - detailed explanation of your decision",
-  "summary": "string - brief summary (max 750 chars, used for rejection feedback)"
-}
-
-CRITICAL JSON ESCAPE RULES:
-1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
-   - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
-2. Quotes: Escape double quotes inside strings as \\"
-   - Example: "He said \\"hello\\"" 
-3. Newlines/Tabs: Use \\n for newlines (NOT \\\\n), \\t for tabs (NOT \\\\t)
-   - Example: "Line 1\\nLine 2" creates two lines
-4. DO NOT use single backslashes except for: \\", \\\\, \\/, \\b, \\f, \\n, \\r, \\t, \\uXXXX
-5. LaTeX notation: If your content contains mathematical expressions like \\Delta, \\tau, etc., 
-   you MUST escape the backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]"
-
-Example (Accept):
-{
-  "decision": "accept",
-  "reasoning": "This critique correctly identifies a missing convergence proof in Section III. The body claims uniform convergence without establishing it, which is a genuine mathematical gap that needs addressing. The critique is specific, actionable, and substantive.",
-  "summary": ""
-}
-
-Example (Reject - Vague):
-{
-  "decision": "reject",
-  "reasoning": "This critique says 'Section II could be clearer' without identifying specific issues or suggesting concrete improvements. It's too vague to be actionable.",
-  "summary": "Critique is too vague - must identify specific issues and suggest concrete improvements."
-}
-
-Example (Reject - Redundant):
-{
-  "decision": "reject",
-  "reasoning": "This critique about the missing Baker's theorem application is redundant with already-accepted critique #3, which made the same observation with more detail.",
-  "summary": "Redundant with critique #3 which already identified this gap."
-}
-
-Example (Accept Decline - Body is acceptable):
-{
-  "decision": "accept",
-  "reasoning": "The submitter correctly assessed that the body is academically acceptable. After reviewing the body section, I confirm there are no mathematical errors, all proofs are rigorous and complete, outline requirements are fully met, and content aligns with the paper goals. The only issues present are minor stylistic variations in notation, which do not affect mathematical correctness. The decline is justified.",
-  "summary": ""
-}
-
-Example (Reject Decline - Submitter missed issues):
-{
-  "decision": "reject",
-  "reasoning": "The submitter declined to critique, claiming the body is academically acceptable. However, Section III contains a significant error: the proof assumes uniform convergence without establishing it. This is a substantive mathematical gap that requires critique. The decline assessment is incorrect.",
-  "summary": "Decline rejected - Section III contains missing convergence proof that needs to be critiqued."
-}
-"""
-
-
-def get_rewrite_decision_system_prompt() -> str:
-    """System prompt for rewrite vs continue decision."""
-    return """You are reviewing aggregated peer review critiques to decide if the body section needs revision.
-
-⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
-
-ALL context provided to you (brainstorm databases, accepted submissions, papers, reference materials, outlines, previous document content, critiques) is AI-GENERATED within this research system. This content has NOT been peer-reviewed, published, or verified by external sources.
-
-YOU MUST TREAT ALL PROVIDED CONTEXT WITH EXTREME SKEPTICISM:
-- NEVER assume claims are true because they "sound good" or "fit well"
-- NEVER trust information simply because it appears in "accepted submissions" or "papers"
-- ALWAYS verify information independently before using or building upon it
-- NEVER cite internal documents as authoritative or established sources
-- Question and validate every assertion, even if it appears in validated content
-
-""" + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
-
- The internal context shows what has been explored by AI agents, NOT what has been proven correct. Your role is to make an informed rewrite decision. Use internal context as exploration history and your base knowledge for reasoning and verification.
- 
- WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
-
----
-
-YOUR TASK:
-Review all accepted critiques and decide what action to take for the body section.
-
-**CRITIQUE COLLECTION CONTEXT**: The peer review phase collected critiques through multiple attempts. ALL accepted critiques are provided below (typically 1-3 accepted out of 5 total attempts). Review each accepted critique on its individual merits.
-
-DECISION OPTIONS:
-1. **CONTINUE** - Critiques are minor/incorrect. Proceed to conclusion phase.
-2. **PARTIAL_REVISION** - Critiques identify fixable issues. You will then apply edits ONE AT A TIME in an iterative loop.
-3. **TOTAL_REWRITE** - Critiques reveal catastrophic flaws. Delete entire body and rebuild from scratch.
-
-CRITICAL GUIDANCE ON WHEN TO USE EACH:
-
-**Use CONTINUE when:**
-- Critiques are stylistic preferences without substance
-- Critiques are incorrect (the body is actually fine)
-- Small gaps that can be addressed in future editing phases
-- Issues don't affect overall mathematical correctness
-
-**Use PARTIAL_REVISION when:**
-- Specific sections have errors that can be fixed with targeted edits
-- Missing content can be inserted at specific locations
-- Redundant paragraphs need removal
-- Most of the body is sound, only specific parts need correction
-- Critiques point to fixable issues in isolated sections
-
-IMPORTANT - PARTIAL_REVISION IS ITERATIVE:
-If you choose PARTIAL_REVISION, you will then be prompted to propose edits ONE AT A TIME.
-Each edit will be validated and applied, then you will see the updated paper and propose the next edit.
-This continues until you indicate all edits are complete.
-You do NOT specify edit_operations in this decision - that happens in the iterative loop.
-
-**Use TOTAL_REWRITE when (ONLY AS LAST RESORT):**
-- Fundamental mathematical errors pervasive throughout the body
-- Body is fundamentally misaligned with paper title/stated goal
-- Structural problems require complete reorganization
-- Multiple critical gaps that can't be addressed with isolated edits
-- The body fundamentally doesn't achieve what the paper claims
-
-**IMPORTANT - NEXT STEPS CONTEXT:**
-
-If you choose PARTIAL_REVISION or TOTAL_REWRITE, you can also:
-1. Change the paper title (if body reveals scope drift)
-2. Update the outline (if structure needs changes)
-
-This means you have FULL control to revise the paper comprehensively. However:
-- TOTAL_REWRITE should ONLY be used when absolutely necessary
-- Total rewrites are difficult and can introduce errors in areas that were previously correct
-- Even with feedback, rewriting from scratch can lose coherence
-- Prefer PARTIAL_REVISION whenever the issues are localized and fixable
-
-CRITICAL - REWRITE SCOPE:
-If you choose TOTAL_REWRITE, the ENTIRE body section will be deleted and rewritten from scratch. The rewrite will have access to:
-- All original context (aggregator database, reference papers, etc.)
-- The PRE-CRITIQUE PAPER (what the body looked like before this revision cycle)
-- ALL critiques from ALL previous failed versions (accumulated feedback history)
-- Current version's accepted critiques
-
-ACCUMULATED CRITIQUE HISTORY:
-If this is not the first critique phase, you will see critiques from ALL previous failed versions.
-These are labeled clearly as "FAILED - REWRITTEN" versions. Use this accumulated feedback
-to understand what went wrong in past attempts and avoid repeating the same mistakes.
-
-SOURCE MATERIAL POLICY:
-- The aggregator/brainstorm database and reference papers are optional supports during rewrite decisions, not mandatory checklists
-- Do NOT choose PARTIAL_REVISION or TOTAL_REWRITE solely to force coverage of unused source material
-- Do choose revision when the current body is genuinely weaker, incomplete for its chosen scope, misaligned with the outline/title, or mathematically unsound
-
-Output your decision ONLY as JSON in this exact format:
-{
-  "decision": "continue | partial_revision | total_rewrite",
-  "new_title": "New paper title (or null if keeping current)",
-  "new_outline": "Updated outline content (or null if keeping current)",
-  "reasoning": "Detailed explanation of your decision and rationale for any title/outline changes"
-}
-"""
-
-
-def get_rewrite_decision_json_schema() -> str:
-    """Get JSON schema specification for rewrite decision."""
-    return """
-REQUIRED JSON FORMAT:
-{
-  "decision": "continue" OR "partial_revision" OR "total_rewrite",
-  "new_title": "string (new paper title) OR null (keep current)",
-  "new_outline": "string (updated outline) OR null (keep current)",
-  "reasoning": "string - detailed explanation of decision"
-}
-
-NOTE ON PARTIAL_REVISION:
-If you choose "partial_revision", you will NOT specify edit operations here.
-Instead, you will be prompted to propose edits ONE AT A TIME in an iterative loop.
-Each edit will be validated and applied, then you'll see the updated paper before proposing the next edit.
-
-CRITICAL JSON ESCAPE RULES:
-1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
-   - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
-2. Quotes: Escape double quotes inside strings as \\"
-   - Example: "He said \\"hello\\"" 
-3. Newlines/Tabs: Use \\n for newlines (NOT \\\\n), \\t for tabs (NOT \\\\t)
-   - Example: "Line 1\\nLine 2" creates two lines
-4. DO NOT use single backslashes except for: \\", \\\\, \\/, \\b, \\f, \\n, \\r, \\t, \\uXXXX
-5. LaTeX notation: If your content contains mathematical expressions like \\Delta, \\tau, etc., 
-   you MUST escape the backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]"
-
-Example (CONTINUE - Minor Issues):
-{
-  "decision": "continue",
-  "new_title": null,
-  "new_outline": null,
-  "reasoning": "After reviewing the accepted critiques, the issues identified are minor and do not warrant any revision. Critiques #1 and #3 point out small notation inconsistencies that can be addressed in review phase. Critique #2 suggests stylistic changes without substantive mathematical impact. The body section is fundamentally sound and aligned with the paper title. Proceeding to conclusion phase."
-}
-
-Example (PARTIAL_REVISION - Triggers Iterative Edit Loop):
-{
-  "decision": "partial_revision",
-  "new_title": null,
-  "new_outline": null,
-  "reasoning": "Critiques identify two fixable issues: (1) missing convergence proof in Section III, (2) missing Corollary 3.1. These can be addressed with targeted edits without rewriting the entire body, which is otherwise mathematically sound. Will propose edits one at a time in the iterative loop."
-}
-
-Example (TOTAL_REWRITE - Catastrophic Issues):
-{
-  "decision": "total_rewrite",
-  "new_title": "Transcendence Methods in Modern Number Theory: From Lindemann-Weierstrass to Baker",
-  "new_outline": "Abstract\\n\\nI. Introduction\\n   A. Historical development\\n   B. Scope and goals\\n\\nII. Classical Transcendence Theory\\n   A. Lindemann-Weierstrass theorem\\n   B. Applications to geometric constructibility\\n\\nIII. Baker's Theorem and Linear Forms\\n   A. Statement and proof outline\\n   B. Applications to Diophantine equations\\n\\nIV. Modern Developments\\n   A. Recent refinements\\n   B. Computational aspects\\n\\nV. Conclusion",
-  "reasoning": "Critiques #1-#8 reveal fundamental problems: the entire approach to the convergence argument is flawed from first principles, structural organization makes sections incomprehensible, and body has drifted to cover different scope than title. These issues are too pervasive for targeted edits. A complete rebuild is necessary."
-}
-"""
-
-
-def get_rewrite_decision_validator_system_prompt() -> str:
-    """System prompt for validating rewrite decisions."""
-    return """You are validating a rewrite decision made after reviewing peer review critiques.
-
-⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
-
-ALL context provided to you (brainstorm databases, accepted submissions, papers, reference materials, outlines, previous document content, critiques, decisions) is AI-GENERATED within this research system. This content has NOT been peer-reviewed, published, or verified by external sources.
-
-YOU MUST TREAT ALL PROVIDED CONTEXT WITH EXTREME SKEPTICISM:
-- NEVER assume claims are true because they "sound good" or "fit well"
-- NEVER trust information simply because it appears in "accepted submissions" or "papers"
-- ALWAYS verify information independently before using or building upon it
-- NEVER cite internal documents as authoritative or established sources
-- Question and validate every assertion, even if it appears in validated content
-
-""" + CRITIQUE_EMPIRICAL_PROVENANCE_RULES + """
-
- The internal context shows what has been explored by AI agents, NOT what has been proven correct. Use internal context and your base knowledge for validation.
- 
- WHEN IN DOUBT: Verify independently. Do not assume. Do not trust unverified internal context as truth.
-
----
-
-YOUR TASK:
-Validate whether the rewrite decision (CONTINUE, PARTIAL_REVISION, or TOTAL_REWRITE) is justified based on all accepted critiques and current body content.
-
-VALIDATION CRITERIA - Consider:
-
-**ACCEPT "continue" decision if:**
-- Critiques are indeed minor or incorrect
-- Body is fundamentally sound despite critique issues
-- Issues can be addressed without any revision
-- Title and body remain aligned
-
-**ACCEPT "partial_revision" decision if:**
-- Critiques identify specific, localized issues
-- Proposed edit operations would fix the identified problems
-- Edit operations are appropriate (correct operation types, reasonable old_string/new_string)
-- Most of the body is sound, only targeted fixes needed
-- Title change (if proposed) is justified
-- Outline update (if proposed) improves structure
-
-**ACCEPT "total_rewrite" decision if:**
-- Critiques reveal catastrophic issues (pervasive math errors, fundamental misalignment, structural chaos)
-- Total rewrite is justified - issues too widespread for targeted edits
-- Partial revision would not be sufficient
-- Title change (if proposed) is justified by scope drift
-- Outline update (if proposed) improves structure
-
-**REJECT decision if:**
-- Reasoning doesn't match the critiques (illogical conclusion)
-- "Continue" chosen despite substantive issues in critiques
-- "Total_rewrite" chosen for minor or fixable issues (should use partial_revision)
-- "Partial_revision" chosen but edit operations are vague or incorrect
-- Title change proposed without justification from critiques
-- Decision appears arbitrary or not evidence-based
-
-SOURCE MATERIAL POLICY:
-- The source database is optional support, not a mandatory checklist
-- Do NOT reject a decision solely because it leaves some source material unused
-- Do reject if the decision ignores source material only when that omission clearly makes the chosen scope weaker, incoherent, or misaligned with the outline/title
-
-Ask yourself: "Is this decision the right response to the accepted critiques? Is the chosen level of revision appropriate?"
-
-Output your decision ONLY as JSON in this exact format:
-{
-  "decision": "accept or reject",
-  "reasoning": "Detailed explanation of your validation decision"
-}
-"""
-
-
-def get_rewrite_decision_validation_json_schema() -> str:
-    """Get JSON schema specification for rewrite decision validation."""
-    return """
-REQUIRED JSON FORMAT:
-{
-  "decision": "accept" OR "reject",
-  "reasoning": "string - detailed explanation of your validation decision"
+  "reasoning": "string - detailed explanation",
+  "summary": "string - rejection summary if rejected, empty string if accepted"
 }
 
 CRITICAL JSON ESCAPE RULES:
-1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
-   - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
-2. Quotes: Escape double quotes inside strings as \\"
-   - Example: "He said \\"hello\\"" 
-3. Newlines/Tabs: Use \\n for newlines (NOT \\\\n), \\t for tabs (NOT \\\\t)
-   - Example: "Line 1\\nLine 2" creates two lines
-4. DO NOT use single backslashes except for: \\", \\\\, \\/, \\b, \\f, \\n, \\r, \\t, \\uXXXX
-5. LaTeX notation: If your content contains mathematical expressions like \\Delta, \\tau, etc., 
-   you MUST escape the backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]"
-
-Example (Accept continue decision):
-{
-  "decision": "accept",
-  "reasoning": "The decision to CONTINUE is justified. The critiques are indeed minor issues: 3 stylistic suggestions, 4 notation clarifications, 2 incorrect critiques (the proofs are actually valid), and 1 small gap that can be filled in review phase. No fundamental mathematical errors were identified. Proceeding to conclusion is appropriate."
-}
-
-Example (Accept partial_revision decision):
-{
-  "decision": "accept",
-  "reasoning": "The decision to use PARTIAL_REVISION is justified. The critiques identify 2 specific, fixable issues: missing convergence proof in Section III and missing Corollary 3.1. The proposed edit operations correctly target these issues with appropriate old_string/new_string replacements. Most of the body is mathematically sound - targeted edits are more appropriate than a complete rewrite."
-}
-
-Example (Accept total_rewrite decision):
-{
-  "decision": "accept",
-  "reasoning": "The decision to use TOTAL_REWRITE is justified. The critiques reveal catastrophic problems: 4 critiques identify fundamental errors in the convergence arguments that permeate multiple sections, 3 point out missing content explicitly in the outline, 2 show the body has drifted to cover different scope than the title. These issues are too pervasive for targeted edits. A complete rebuild is necessary."
-}
-
-Example (Reject - should use partial_revision instead):
-{
-  "decision": "reject",
-  "reasoning": "The decision to use TOTAL_REWRITE is NOT justified. The critiques identify only 2 specific issues: missing convergence proof in Section III and missing corollary. These are localized problems that can be fixed with targeted edits. The rest of the body is mathematically sound. The decision should be PARTIAL_REVISION, not TOTAL_REWRITE."
-}
+1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text.
+2. Quotes: Escape double quotes inside strings as \\\".
+3. Newlines/Tabs: Use \\n for newlines, \\t for tabs.
+4. DO NOT use single backslashes except for: \\\", \\\\, \\/, \\b, \\f, \\n, \\r, \\t, \\uXXXX.
+5. LaTeX notation: If your content contains mathematical expressions like \\Delta, \\tau, etc.,
+   you MUST escape the backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]".
 """
 
 
-# =============================================================================
-# PROMPT BUILDERS
-# =============================================================================
-
-
 def build_critique_prompt(
     user_prompt: str,
     current_body: str,
@@ -587,22 +171,7 @@ def build_critique_prompt(
     rejection_feedback: Optional[str] = None,
     accumulated_history: Optional[str] = None
 ) -> str:
-    """
-    Build complete prompt for critique generation.
-    
-    Args:
-        user_prompt: The user's compiler-directing prompt
-        current_body: The body section to critique
-        current_outline: The paper outline
-        aggregator_db: The aggregator database content
-        reference_papers: Optional reference paper content
-        critique_feedback: Optional existing critiques (for context)
-        rejection_feedback: Optional rejection feedback (last 5 rejections)
-        accumulated_history: Optional accumulated critique history from previous failed versions
-        
-    Returns:
-        Complete assembled prompt
-    """
+    """Build complete prompt for critique generation."""
     parts = [
         get_critique_submitter_system_prompt(),
         "\n---\n",
@@ -610,7 +179,7 @@ def build_critique_prompt(
         "\n---\n",
         f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
         "\n---\n",
-        f"PAPER TITLE:\n{user_prompt}",  # Using compiler prompt as title context
+        f"PAPER TITLE:\n{user_prompt}",
         "\n---\n",
         f"CURRENT OUTLINE:\n{current_outline}",
         "\n---\n",
@@ -620,480 +189,39 @@ def build_critique_prompt(
 - The source database below is optional support, not a mandatory checklist.
 - Use it to identify genuine gaps or contradictions if helpful.
 - Do NOT critique solely because some source entries were not used.
+- Do use it if it reveals that the body missed a stronger direct-answer path.
 """,
         "\n---\n",
         f"SOURCE DATABASE (optional support - use if helpful):\n{aggregator_db}",
     ]
-    
+
     if reference_papers:
         parts.extend([
             "\n---\n",
             f"REFERENCE PAPERS:\n{reference_papers}"
         ])
-    
+
     if accumulated_history:
         parts.extend([
             "\n---\n",
             accumulated_history
         ])
-    
+
     if critique_feedback:
         parts.extend([
             "\n---\n",
             f"EXISTING ACCEPTED CRITIQUES (CURRENT VERSION):\n{critique_feedback}"
         ])
-    
+
     if rejection_feedback:
         parts.extend([
             "\n---\n",
             f"YOUR LAST 5 REJECTIONS (Learn from these):\n{rejection_feedback}"
         ])
-    
-    parts.extend([
-        "\n---\n",
-        "Now generate your critique as JSON:"
-    ])
-    
-    return ''.join(parts)
 
-
-def build_rewrite_decision_prompt(
-    user_prompt: str,
-    current_body: str,
-    current_outline: str,
-    current_title: str,
-    aggregator_db: str,
-    critique_feedback: str,
-    pre_critique_paper: str,
-    reference_papers: Optional[str] = None,
-    accumulated_history: Optional[str] = None
-) -> str:
-    """
-    Build complete prompt for rewrite vs continue decision.
-    
-    Args:
-        user_prompt: The user's compiler-directing prompt
-        current_body: The body section being evaluated
-        current_outline: The paper outline
-        current_title: The current paper title
-        aggregator_db: The aggregator database content
-        critique_feedback: All accepted critiques (typically 1-3 out of 5 total attempts)
-        pre_critique_paper: Paper snapshot from START of critique phase (for rewrite context)
-        reference_papers: Optional reference paper content
-        accumulated_history: Optional accumulated critique history from previous failed versions
-        
-    Returns:
-        Complete assembled prompt
-    """
-    parts = [
-        get_rewrite_decision_system_prompt(),
-        "\n---\n",
-        get_rewrite_decision_json_schema(),
-        "\n---\n",
-        f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
-        "\n---\n",
-        f"CURRENT PAPER TITLE:\n{current_title}",
-        "\n---\n",
-        f"CURRENT OUTLINE:\n{current_outline}",
-        "\n---\n",
-        f"PRE-CRITIQUE PAPER (body at START of this revision cycle):\n{pre_critique_paper}",
-        "\n---\n",
-        f"CURRENT BODY SECTION (after critique phase):\n{current_body}",
-    ]
-    
-    if accumulated_history:
-        parts.extend([
-            "\n---\n",
-            accumulated_history
-        ])
-    
-    parts.extend([
-        "\n---\n",
-        f"ALL ACCEPTED CRITIQUES (CURRENT VERSION):\n{critique_feedback}",
-        "\n---\n",
-        """OPTIONAL SOURCE MATERIAL POLICY:
-- The source database below is optional support, not a mandatory checklist.
-- Use it if it helps judge whether the body's chosen scope is genuinely weak, incomplete, or misaligned.
-- Do NOT force rewrite solely to cover unused source material.
-""",
-        "\n---\n",
-        f"SOURCE DATABASE (optional support - use if helpful):\n{aggregator_db}",
-    ])
-    
-    if reference_papers:
-        parts.extend([
-            "\n---\n",
-            f"REFERENCE PAPERS:\n{reference_papers}"
-        ])
-    
     parts.extend([
         "\n---\n",
-        "Review all critiques and decide whether to REWRITE the body or CONTINUE to conclusion. Respond as JSON:"
-    ])
-    
-    return ''.join(parts)
-
-
-def build_rewrite_decision_validation_prompt(
-    user_prompt: str,
-    current_body: str,
-    current_outline: str,
-    current_title: str,
-    critique_feedback: str,
-    decision_result: Dict,
-    aggregator_db: str
-) -> str:
-    """
-    Build complete prompt for validating the rewrite decision.
-    
-    Args:
-        user_prompt: The user's compiler-directing prompt
-        current_body: The body section
-        current_outline: The paper outline
-        current_title: Current paper title
-        critique_feedback: All accepted critiques (typically 1-3 out of 5 total attempts)
-        decision_result: The decision being validated
-        aggregator_db: The aggregator database content
-        
-    Returns:
-        Complete assembled prompt
-    """
-    decision = decision_result.get('decision', 'unknown')
-    new_title = decision_result.get('new_title', None)
-    new_outline = decision_result.get('new_outline', None)
-    reasoning = decision_result.get('reasoning', '')
-    
-    parts = [
-        get_rewrite_decision_validator_system_prompt(),
-        "\n---\n",
-        get_rewrite_decision_validation_json_schema(),
-        "\n---\n",
-        f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
-        "\n---\n",
-        f"CURRENT PAPER TITLE:\n{current_title}",
-        "\n---\n",
-        f"CURRENT OUTLINE:\n{current_outline}",
-        "\n---\n",
-        f"CURRENT BODY SECTION:\n{current_body}",
-        "\n---\n",
-        f"ALL ACCEPTED CRITIQUES:\n{critique_feedback}",
-        "\n---\n",
-        """OPTIONAL SOURCE MATERIAL POLICY:
-- The source database below is optional support, not a mandatory checklist.
-- Use it if needed to judge whether the proposed decision is genuinely stronger or weaker.
-- Do NOT reject solely because not all source material is being used.
-""",
-        "\n---\n",
-        f"SOURCE DATABASE (optional support - use if helpful):\n{aggregator_db}",
-        "\n---\n",
-        f"PROPOSED DECISION:\n",
-        f"Decision: {decision}\n",
-        f"New Title: {new_title if new_title else '(keep current)'}\n",
-        f"New Outline: {new_outline if new_outline else '(keep current)'}\n",
-        f"Reasoning: {reasoning}",
-        "\n---\n",
-        "Validate whether this decision is justified based on the critiques. Respond as JSON:"
-    ]
-    
-    return ''.join(parts)
-
-
-# ============================================================================
-# ITERATIVE PARTIAL REVISION PROMPTS
-# ============================================================================
-
-def get_iterative_edit_system_prompt() -> str:
-    """System prompt for iterative partial revision - proposing one edit at a time."""
-    return """You are making targeted edits to a mathematical document body to address peer review critiques.
-
-⚠️ CRITICAL - INTERNAL CONTENT WARNING ⚠️
-
-ALL context provided to you (papers, outlines, critiques) is AI-GENERATED within this research system. 
-This content has NOT been peer-reviewed, published, or verified by external sources.
-Treat all provided context with extreme skepticism.
-
-YOUR TASK:
-You are in an ITERATIVE EDIT LOOP. You have been shown:
-1. The PRE-CRITIQUE PAPER (how the body looked before this revision cycle started)
-2. The CURRENT PAPER (the body after any edits applied so far in this loop)
-3. The ACCEPTED CRITIQUES (problems identified that need fixing)
-4. The EDITS ALREADY APPLIED (what has been changed so far)
-
-Your job is to propose ONE EDIT at a time to address the remaining critique issues.
-After each edit is validated and applied, you will see the updated paper and can propose the next edit.
-
-EDIT OPERATIONS USE EXACT STRING MATCHING:
-- old_string must exist VERBATIM and UNIQUELY in the CURRENT paper body
-- Include enough context (3-5 lines) to ensure uniqueness
-- If the exact string is not found or is ambiguous, the edit will be rejected
-
-OPERATION TYPES:
-- **replace**: Find old_string, replace with new_string
-- **insert_after**: Find old_string, insert new_string immediately after it
-- **delete**: Find old_string, remove it (new_string should be empty)
-
-WHEN TO SET more_edits_needed:
-- TRUE: More critique issues remain to be addressed
-- FALSE: All critique issues have been addressed (or best effort has been made)
-
-IMPORTANT:
-- Focus on ONE edit at a time
-- Address the most critical issues first
-- Each edit should be substantial and address specific critique feedback
-- Do NOT make cosmetic changes - focus on mathematical/structural issues identified in critiques
-- If you believe all issues are addressed, set more_edits_needed to false
-- If critique issues involve unsupported empirical or artifact claims, remove them or rewrite them as hypotheses, validation plans, expected benefits, limitations, or future work
-- Never preserve fabricated experiments, unsupported benchmark numbers, or nonexistent code claims as if they were verified
-
-Output your response ONLY as JSON in the exact format specified.
-"""
-
-
-def get_iterative_edit_json_schema() -> str:
-    """Get JSON schema for iterative edit response."""
-    return """
-REQUIRED JSON FORMAT:
-{
-  "operation": "replace | insert_after | delete",
-  "old_string": "Exact text to find in the CURRENT paper body (must be unique)",
-  "new_string": "Replacement/insertion text (empty string for delete)",
-  "reasoning": "Which critique issue this edit addresses and why this change fixes it",
-  "more_edits_needed": true OR false
-}
-
-CRITICAL JSON ESCAPE RULES:
-1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
-   - Example: Write "\\\\tau" not "\\tau", write "\\\\(" not "\\("
-2. Quotes: Escape double quotes inside strings as \\"
-   - Example: "He said \\"hello\\"" 
-3. Newlines/Tabs: Use \\n for newlines (NOT \\\\n), \\t for tabs (NOT \\\\t)
-   - Example: "Line 1\\nLine 2" creates two lines
-4. DO NOT use single backslashes except for: \\", \\\\, \\/, \\b, \\f, \\n, \\r, \\t, \\uXXXX
-5. LaTeX notation: MUST escape backslash: write "\\\\Delta", "\\\\tau", "\\\\[", "\\\\]"
-
-Example (Replace - Fix missing proof):
-{
-  "operation": "replace",
-  "old_string": "The proof assumes uniform convergence without establishing the necessary conditions.",
-  "new_string": "We establish uniform convergence via the Weierstrass M-test. The series satisfies |f_n(x)| ≤ M_n with ∑M_n < ∞, therefore uniform convergence follows immediately.",
-  "reasoning": "Critique #1 identified that the convergence proof was assumed rather than proven. Adding the rigorous justification using Weierstrass M-test.",
-  "more_edits_needed": true
-}
-
-Example (Insert After - Add missing corollary):
-{
-  "operation": "insert_after",
-  "old_string": "This completes the proof of Theorem 3. ∎",
-  "new_string": "\\n\\nCorollary 3.1. As an immediate consequence of Theorem 3, we obtain the following bound on the error term:\\n\\n|R_n(x)| ≤ C · n^{-α}\\n\\nfor some constant C > 0 independent of n.",
-  "reasoning": "Critique #3 noted that Corollary 3.1 from the outline was missing. Adding it directly after the proof of Theorem 3 where it logically belongs.",
-  "more_edits_needed": false
-}
-
-Example (Delete - Remove redundant section):
-{
-  "operation": "delete",
-  "old_string": "We pause to note that this result is analogous to several classical results in the literature, including the work of Smith (1995), Jones (2001), and Brown (2010). While a full comparison is beyond the scope of this paper, the interested reader may consult these references for additional context.",
-  "new_string": "",
-  "reasoning": "Critique #2 identified this paragraph as redundant filler that doesn't add mathematical substance. Removing to improve focus.",
-  "more_edits_needed": true
-}
-"""
-
-
-def build_iterative_edit_prompt(
-    user_prompt: str,
-    pre_critique_paper: str,
-    current_paper: str,
-    current_outline: str,
-    critique_feedback: str,
-    edits_applied: List[Dict],
-    reference_papers: Optional[str] = None,
-    accumulated_critique_history: str = ""
-) -> str:
-    """
-    Build prompt for iterative partial revision edit.
-    
-    Args:
-        user_prompt: The user's compiler-directing prompt
-        pre_critique_paper: Paper snapshot from START of critique phase
-        current_paper: Current paper body (after any edits applied so far)
-        current_outline: The paper outline
-        critique_feedback: All accepted critiques from this revision cycle
-        edits_applied: List of edits already applied in this iteration
-        reference_papers: Optional reference paper content
-        accumulated_critique_history: Critiques from previous failed versions (if any)
-        
-    Returns:
-        Complete assembled prompt
-    """
-    parts = [
-        get_iterative_edit_system_prompt(),
-        "\n---\n",
-        get_iterative_edit_json_schema(),
-        "\n---\n",
-        f"USER COMPILER-DIRECTING PROMPT:\n{user_prompt}",
-        "\n---\n",
-        f"CURRENT OUTLINE:\n{current_outline}",
-        "\n---\n",
-    ]
-    
-    # Add accumulated history if present
-    if accumulated_critique_history:
-        parts.extend([
-            f"ACCUMULATED CRITIQUE HISTORY (from previous failed versions):\n{accumulated_critique_history}",
-            "\n---\n",
-        ])
-    
-    parts.extend([
-        f"ACCEPTED CRITIQUES (issues to address):\n{critique_feedback}",
-        "\n---\n",
-        f"PRE-CRITIQUE PAPER (how the body looked before this revision cycle):\n{pre_critique_paper}",
-        "\n---\n",
-        f"CURRENT PAPER (after {len(edits_applied)} edit(s) applied):\n{current_paper}",
-        "\n---\n",
+        "Now generate your critique as JSON:"
     ])
 
-    if reference_papers:
-        parts.extend([
-            f"REFERENCE PAPERS:\n{reference_papers}",
-            "\n---\n",
-        ])
-    
-    # Show edits already applied
-    if edits_applied:
-        edits_str = "\n".join([
-            f"Edit {i+1}: {e['operation']} - {e.get('reasoning', 'N/A')[:100]}..."
-            for i, e in enumerate(edits_applied)
-        ])
-        parts.extend([
-            f"EDITS ALREADY APPLIED:\n{edits_str}",
-            "\n---\n",
-        ])
-    else:
-        parts.extend([
-            "EDITS ALREADY APPLIED: None yet - this is the first edit.",
-            "\n---\n",
-        ])
-    
-    parts.append(
-        "Propose your NEXT edit to address remaining critique issues, or set more_edits_needed=false if all issues are resolved. Respond as JSON:"
-    )
-    
-    return ''.join(parts)
-
-
-# ============================================================================
-# PARTIAL REVISION EDIT VALIDATION PROMPTS
-# ============================================================================
-
-def get_partial_revision_validation_system_prompt() -> str:
-    """System prompt for validating individual partial revision edits."""
-    return """You are validating a proposed edit to a mathematical document.
-
-The edit is part of an iterative partial revision to address peer review critiques.
-
-EMPIRICAL PROVENANCE RULES:
-- Empirical claims (benchmarks, speedups, latency, accuracy, perplexity, hardware measurements) must not remain stated as fact unless backed by explicit citation or provided artifact support.
-- Artifact claims (code, kernels, experiments, logs, accompanying implementations) must not remain stated as fact unless backed by explicit citation or provided artifact support.
-- If the edit rewrites unsupported empirical/artifact claims into hypotheses, validation plans, expected benefits, limitations, or future work, that is a valid improvement.
-
-YOUR TASK:
-Validate whether this specific edit should be ACCEPTED or REJECTED.
-
-ACCEPT the edit if:
-1. It addresses one or more issues identified in the accepted critiques
-2. The old_string exists in the current paper and is unambiguous
-3. The new_string improves the mathematical content or addresses critique feedback
-4. The edit maintains coherence with the surrounding text
-5. The edit is mathematically sound
-
-REJECT the edit if:
-1. The edit does NOT address any critique issues
-2. The old_string does not exist or is ambiguous in the current paper
-3. The new_string introduces errors or reduces quality
-4. The edit breaks coherence with surrounding content
-5. The edit is mathematically unsound or introduces logical errors
-6. The edit is purely cosmetic and doesn't address critiques
-7. The edit preserves fabricated experiments, unsupported metrics, or nonexistent artifact claims as established fact
-
-Output your decision as JSON.
-"""
-
-
-def get_partial_revision_validation_json_schema() -> str:
-    """Get JSON schema for partial revision edit validation."""
-    return """
-REQUIRED JSON FORMAT:
-{
-  "decision": "accept" OR "reject",
-  "reasoning": "string - explanation of why the edit should or should not be accepted"
-}
-
-CRITICAL JSON ESCAPE RULES:
-1. Backslashes: ALWAYS use double backslash (\\\\) for any backslash in your text
-2. Quotes: Escape double quotes inside strings as \\"
-3. Newlines/Tabs: Use \\n for newlines (NOT \\\\n), \\t for tabs
-
-Example (Accept):
-{
-  "decision": "accept",
-  "reasoning": "The edit correctly addresses critique #1 which identified a missing convergence proof. The new text adds a rigorous Weierstrass M-test argument that establishes uniform convergence. The old_string exists exactly as specified in the current paper."
-}
-
-Example (Reject):
-{
-  "decision": "reject",
-  "reasoning": "The proposed edit does not address any of the accepted critiques. It appears to be a stylistic change (rewording a sentence) rather than fixing the mathematical issues identified. Additionally, the old_string appears twice in the document, making it ambiguous."
-}
-"""
-
-
-def build_partial_revision_validation_prompt(
-    current_paper: str,
-    current_outline: str,
-    critique_feedback: str,
-    edit_proposal: Dict
-) -> str:
-    """
-    Build prompt for validating a single partial revision edit.
-    
-    Args:
-        current_paper: Current paper body
-        current_outline: Paper outline
-        critique_feedback: All accepted critiques
-        edit_proposal: Dict with operation, old_string, new_string, reasoning
-        
-    Returns:
-        Complete assembled validation prompt
-    """
-    operation = edit_proposal.get("operation", "")
-    old_string = edit_proposal.get("old_string", "")
-    new_string = edit_proposal.get("new_string", "")
-    reasoning = edit_proposal.get("reasoning", "")
-    
-    # Truncate long strings for prompt
-    old_str_display = old_string[:500] + "..." if len(old_string) > 500 else old_string
-    new_str_display = new_string[:500] + "..." if len(new_string) > 500 else new_string
-    
-    parts = [
-        get_partial_revision_validation_system_prompt(),
-        "\n---\n",
-        get_partial_revision_validation_json_schema(),
-        "\n---\n",
-        f"CURRENT OUTLINE:\n{current_outline}",
-        "\n---\n",
-        f"ACCEPTED CRITIQUES (issues being addressed):\n{critique_feedback}",
-        "\n---\n",
-        f"CURRENT PAPER:\n{current_paper}",
-        "\n---\n",
-        f"PROPOSED EDIT:\n",
-        f"Operation: {operation}\n",
-        f"Old String: {old_str_display}\n",
-        f"New String: {new_str_display}\n",
-        f"Reasoning: {reasoning}",
-        "\n---\n",
-        "Validate whether this edit should be accepted. Respond as JSON:"
-    ]
-    
-    return ''.join(parts)
-
+    return "".join(parts)
diff --git a/backend/compiler/prompts/outline_prompts.py b/backend/compiler/prompts/outline_prompts.py
index 55920f9..ffc4fbd 100644
--- a/backend/compiler/prompts/outline_prompts.py
+++ b/backend/compiler/prompts/outline_prompts.py
@@ -158,6 +158,11 @@ def get_outline_create_system_prompt() -> str:
 - Do NOT force coverage of every brainstorm/database entry
 - Do NOT ignore clearly crucial source material for the scope you choose
 
+DIRECT-ANSWER-FIRST PRINCIPLE:
+- Organize the paper around the strongest rigorous direct answer the paper can justify
+- Prefer sections that directly solve, partially solve, refute, or sharply constrain the user's question over broad background accumulation
+- Include background and preliminaries only to the extent needed to support the direct answer cleanly and rigorously
+
 - Produce a numbered outline with major sections and subsections
 - Incorporate the strongest helpful source ideas where appropriate
 - Flag gaps explicitly if the evidence is insufficient
@@ -185,6 +190,7 @@ def get_outline_create_system_prompt() -> str:
 - Required sections (Abstract, Introduction, Body, Conclusion) present with exact names
 - Sections follow logical mathematical progression (definitions → theorems → proofs)
 - The outline optimally serves the paper title and user's compiler-directing prompt
+- The outline is focused on the strongest rigorous direct answer available, without unnecessary detours
 - No further refinement would meaningfully improve the outline
 - You are confident this outline will guide excellent paper construction
 
@@ -218,6 +224,7 @@ def get_outline_create_system_prompt() -> str:
 - The outline should support a coherent, logical flow for the final document
 - Sections should build upon each other logically (definitions → theorems → proofs)
 - The outline should align with the user's compiler-directing prompt goals
+- The outline should prioritize the strongest direct rigorous route to answering the prompt
 - DO NOT include a separate References or Citations section in the outline
 - All content must be rooted in sound mathematical reasoning; aggregator/brainstorm material is optional support, not a mandatory checklist
 - NO unfounded claims or logical fallacies
@@ -308,11 +315,16 @@ def get_outline_update_system_prompt() -> str:
 - Do NOT force additions just because a brainstorm/database entry exists
 - Do NOT ignore clearly crucial source material for the scope you are keeping
 
+DIRECT-ANSWER-FIRST PRINCIPLE:
+- Update the outline when doing so materially strengthens the paper's most direct rigorous answer to the user's prompt
+- Do not add side sections that broaden scope without improving the direct answer, partial answer, impossibility result, or key constraint
+
 Decide if the outline requires updates. Consider:
 - Relevance to current source content when it helps the paper
 - Missing content that should be included in outline to better serve the user prompt
 - Structural issues in current outline
 - Alignment with document construction progress
+- Whether the outline still reflects the strongest direct-answer path revealed by the draft
 
 CRITICAL - NO PLACEHOLDER TEXT:
 You must NEVER include placeholder markers like "[HARD CODED PLACEHOLDER FOR...]" in your outline submissions.
@@ -348,6 +360,7 @@ def get_outline_update_system_prompt() -> str:
 - All added content must be rooted in sound mathematical reasoning; source database material is optional support, not a mandatory checklist
 - NO unfounded claims or logical fallacies
 - Focus on rigorous mathematical arguments
+- Prefer additions that materially strengthen the paper's direct answer rather than merely broadening coverage
 - NEVER change the names of Abstract, Introduction, or Conclusion sections
 - New body sections must be inserted between Introduction and Conclusion
 - DO NOT add unsupported numeric empirical claims in section or subsection headings
diff --git a/backend/compiler/prompts/review_prompts.py b/backend/compiler/prompts/review_prompts.py
index 0b700e8..0c2ca1b 100644
--- a/backend/compiler/prompts/review_prompts.py
+++ b/backend/compiler/prompts/review_prompts.py
@@ -74,6 +74,7 @@ def get_review_system_prompt() -> str:
 - Structural issues
 - Redundancy
 - Forward-looking structural previews
+- Places where the draft drifts away from the strongest direct answer to the user's prompt
 - Other improvements
 
 CRITICAL - SYSTEM-MANAGED MARKERS (NOT YOUR OUTPUT):
@@ -116,6 +117,7 @@ def get_review_system_prompt() -> str:
 - Unsupported empirical claims, unsupported artifact/code claims, or uncited literature claims
 - Numeric benchmark-style claims in narrative text that are not explicitly sourced
 - Statements implying experiments, measurements, or implementations that are not actually evidenced
+- Generic exploratory wording that obscures a stronger justified direct answer already present in the draft
 
 WHEN NOT TO MAKE AN EDIT:
 - Document is acceptable for a draft in progress
diff --git a/backend/compiler/prompts/rigor_prompts.py b/backend/compiler/prompts/rigor_prompts.py
index 5491eb6..37bb345 100644
--- a/backend/compiler/prompts/rigor_prompts.py
+++ b/backend/compiler/prompts/rigor_prompts.py
@@ -6,9 +6,11 @@
 
     Stage 1 - Theorem discovery (build_rigor_theorem_discovery_prompt):
         Using the full writing context, the submitter asks itself whether the
-        paper contains a theorem worth formalizing and proving in Lean 4 that
-        has not already been verified. Output is a candidate theorem JSON (or
-        a decline).
+        paper, outline, support context, or user prompt exposes a theorem worth
+        formalizing and proving in Lean 4. Candidate theorems may verify
+        existing paper claims or extend partial work when that helps the paper
+        construction / user prompt. Output is a candidate theorem JSON (or a
+        decline).
 
     Stage 2 - Placement (build_rigor_placement_prompt):
         Given a Lean-4-verified theorem, the submitter proposes an inline
@@ -57,29 +59,37 @@
 # STAGE 1: THEOREM DISCOVERY
 # =============================================================================
 
-_DISCOVERY_SYSTEM_PROMPT = f"""You are the rigor agent for a mathematical-paper compiler. Your job during the rigor loop is to look at the paper-in-progress together with the full research context and decide whether there is a theorem worth formalizing and proving in Lean 4.
+_DISCOVERY_SYSTEM_PROMPT = f"""You are the rigor agent for a mathematical-paper compiler. Your job during the rigor loop is to look at the paper-in-progress together with the full research context and decide whether there is a theorem worth formalizing and proving in Lean 4 because it helps answer, support, or advance the USER RESEARCH PROMPT and/or materially improves the paper under construction.
 
 {INTERNAL_CONTENT_WARNING}
 
 YOUR TASK - STAGE 1 (DISCOVERY)
 
 1. Read the current outline and the current paper text.
-2. Read the list of theorems that have ALREADY been verified by Lean 4 (EXISTING VERIFIED PROOFS block).
-3. Read the list of theorems that PREVIOUSLY FAILED Lean 4 verification (OPEN LEMMA TARGETS block, if present).
-4. Decide exactly one of:
-   (A) `needs_theorem_work=false` - no theorem worth trying right now. Good reasons: all interesting claims in the paper are already covered by existing verified proofs; the paper is in too early a state; there is no claim a Lean 4 proof could close usefully.
-   (B) `needs_theorem_work=true` - propose a single candidate theorem to formalize.
+2. Read the USER RESEARCH PROMPT and treat it as the relevance boundary for all theorem work.
+3. Read the list of theorems that have ALREADY been verified by Lean 4 (EXISTING VERIFIED PROOFS block).
+4. Read the list of theorems that PREVIOUSLY FAILED Lean 4 verification (OPEN LEMMA TARGETS block, if present).
+5. Decide exactly one of:
+   (A) `needs_theorem_work=false` - no prompt-relevant theorem worth trying right now. Good reasons: all useful claims for the user's prompt are already covered by existing verified proofs; the paper is in too early a state; there is no claim a Lean 4 proof could close usefully; or the only available claims are mathematically interesting but off-topic.
+   (B) `needs_theorem_work=true` - propose a single prompt-relevant candidate theorem to formalize.
 
 RULES FOR PROPOSING A THEOREM:
+- The theorem must directly help answer, support, or advance the USER RESEARCH PROMPT. Do not propose a theorem merely because it is non-trivial or mathematically interesting.
 - The theorem must be provable in Lean 4 with Mathlib.
 - You MUST NOT re-propose a theorem that is already in EXISTING VERIFIED PROOFS. Look for theorems that are DIFFERENT - new results, missed lemmas, or sharper versions that are not yet on the list.
-- You MAY retry a theorem from OPEN LEMMA TARGETS when the paper now gives you a better angle on it. When you do, set `retry_existing_failure_id` to the failed `theorem_id`.
+- You MAY retry a theorem from OPEN LEMMA TARGETS when it is still prompt-relevant and the paper now gives you a better angle on it. When you do, set `retry_existing_failure_id` to the failed `theorem_id`.
+- EXTENSION IS EXPLICITLY ALLOWED AND ENCOURAGED WHERE HELPFUL: you are NOT limited to exact claims already present in the current paper. You may construct a Lean-verifiable theorem by extending partial paper work, the current outline, supporting context, or the USER RESEARCH PROMPT when that theorem would materially help the paper construction and/or the user's requested goal.
+- Set `theorem_origin="existing_paper_claim"` only when the theorem directly formalizes a claim already present in the current paper text.
+- Set `theorem_origin="extension_from_partial_work"` when the theorem is constructed by extending the current paper, outline, or supporting context beyond the exact written claim.
+- Set `theorem_origin="extension_from_user_prompt"` when the theorem is prompted primarily by the USER RESEARCH PROMPT and helps the paper even if the current paper has not yet written the claim.
+- Extension-derived theorems (`extension_from_partial_work` or `extension_from_user_prompt`) MUST set `placement_preference="appendix_only"`. These proofs belong at the end of the paper in the Theorems Appendix, not inline in the main body.
+- Existing-paper-claim theorems may set `placement_preference="inline"` when a local body insertion would strengthen the existing argument, or `placement_preference="appendix_only"` when the proof is useful but would distract from the prose.
 - Prefer theorems whose statements are tight enough that Lean 4 can actually close them (arithmetic facts, concrete inequalities, specific algebraic identities, small group/ring/field lemmas, concrete combinatorial identities) over large open conjectures.
 - The `theorem_statement` is for a human reader. It should be precise, self-contained, and include the hypotheses.
-- The `formal_sketch` tells the formalization agent what tactics or lemmas look promising in Lean 4 / Mathlib. Keep it concrete.
-- The `source_excerpt` is 2-6 sentences of surrounding paper text that motivates why this theorem is a natural target here. It must be a direct paraphrase or quote from the current paper.
+- The `formal_sketch` tells the formalization agent what tactics or lemmas look promising in Lean 4 / Mathlib and why this theorem helps the user's prompt. Keep it concrete.
+- The `source_excerpt` is 2-6 sentences of motivating context. For `existing_paper_claim`, it must be a direct paraphrase or quote from the current paper. For extension-derived theorems, it may explain the partial paper work, outline item, supporting evidence, and/or user-prompt need that the theorem extends.
 
-If Stage 1 guesses wrong, Stage 2 cannot recover - 5 Lean 4 attempts will be spent on the wrong target. Prefer declining over a weak proposal.
+If Stage 1 guesses wrong, Stage 2 cannot recover - 5 Lean 4 attempts will be spent on the wrong target. Prefer declining over a weak or off-prompt proposal.
 
 Output your response ONLY as JSON in this exact format:
 {{{{
@@ -87,8 +97,10 @@
   "theorem_statement": "precise theorem statement with explicit hypotheses and conclusion (empty if needs_theorem_work=false)",
   "formal_sketch": "concrete sketch: what tactics / Mathlib lemmas you expect to work (empty if needs_theorem_work=false)",
   "source_excerpt": "2-6 sentences of surrounding paper text that motivates this theorem (empty if needs_theorem_work=false)",
+  "theorem_origin": "existing_paper_claim | extension_from_partial_work | extension_from_user_prompt (empty if needs_theorem_work=false)",
+  "placement_preference": "inline | appendix_only (empty if needs_theorem_work=false)",
   "retry_existing_failure_id": "theorem_id from OPEN LEMMA TARGETS if retrying a prior failure, empty string otherwise",
-  "reasoning": "why this theorem is the best target right now OR why no theorem should be attempted"
+  "reasoning": "why this theorem is the best prompt-relevant target right now OR why no theorem should be attempted"
 }}}}"""
 
 
@@ -98,6 +110,8 @@
   "theorem_statement": "string",
   "formal_sketch": "string",
   "source_excerpt": "string",
+  "theorem_origin": "existing_paper_claim OR extension_from_partial_work OR extension_from_user_prompt",
+  "placement_preference": "inline OR appendix_only",
   "retry_existing_failure_id": "string (may be empty)",
   "reasoning": "string"
 }
@@ -108,8 +122,22 @@
   "theorem_statement": "For every natural number n, the sum of the first n positive integers equals n*(n+1)/2.",
   "formal_sketch": "Induction on n. Base: n=0 both sides are 0. Step: use Finset.sum_range_succ and Nat.succ_mul; close with omega / ring. Mathlib has Finset.sum_range_id which may finish it outright.",
   "source_excerpt": "In Section 2 we reasoned about partial sums of the form 1 + 2 + ... + n...",
+  "theorem_origin": "existing_paper_claim",
+  "placement_preference": "inline",
   "retry_existing_failure_id": "",
-  "reasoning": "Section 2 relies on the closed form but currently presents it without a verified proof. Lean 4 can close this cleanly; it does not duplicate any existing verified proof."
+  "reasoning": "Section 2 uses this closed form to support the user's requested argument but currently presents it without a verified proof. Lean 4 can close this cleanly; it does not duplicate any existing verified proof."
+}
+
+Example (propose an extension theorem for the appendix):
+{
+  "needs_theorem_work": true,
+  "theorem_statement": "For every natural number n, n*(n+1) is even.",
+  "formal_sketch": "Use Nat.even_mul_succ_self or prove by parity cases / omega. This lemma can support a later divisibility argument about triangular numbers.",
+  "source_excerpt": "The outline asks for arithmetic constraints on triangular-number expressions, but the current paper has not yet isolated the parity lemma needed for the clean construction. This theorem extends the partial plan into a Lean-checkable support result.",
+  "theorem_origin": "extension_from_partial_work",
+  "placement_preference": "appendix_only",
+  "retry_existing_failure_id": "",
+  "reasoning": "This is not an exact written claim in the current paper; it extends the partial outline into a useful verified lemma. Because it is extension-derived, it should be stored in the Theorems Appendix rather than inserted inline."
 }
 
 Example (decline):
@@ -118,8 +146,10 @@
   "theorem_statement": "",
   "formal_sketch": "",
   "source_excerpt": "",
+  "theorem_origin": "",
+  "placement_preference": "",
   "retry_existing_failure_id": "",
-  "reasoning": "The paper currently contains only outline scaffolding and the one verified theorem (proof_002). Attempting another Lean 4 proof right now would either duplicate proof_002 or target claims that are too vague to formalize."
+  "reasoning": "The paper currently contains only outline scaffolding and the one verified theorem (proof_002). Attempting another Lean 4 proof right now would either duplicate proof_002, target claims that are too vague to formalize, or chase claims that do not help the user's prompt."
 }
 """
 
@@ -151,6 +181,7 @@
 
 PLACEMENT GUIDELINES:
 - Put the theorem where it strengthens the local argument. Prefer insertion points inside a relevant body section (near the discussion it closes) over dumping it in a new section.
+- The inline placement should make clear why this verified theorem helps the paper answer or advance the USER RESEARCH PROMPT.
 - The paper has a Theorems Appendix block already; do NOT try to edit the appendix directly.
 - Keep `old_string` short but unique (3-5 lines of surrounding context is usually enough).
 
diff --git a/backend/compiler/validation/compiler_validator.py b/backend/compiler/validation/compiler_validator.py
index 0afe2fa..c10b3b6 100644
--- a/backend/compiler/validation/compiler_validator.py
+++ b/backend/compiler/validation/compiler_validator.py
@@ -11,7 +11,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.models import CompilerSubmission, CompilerValidationResult
-from backend.shared.json_parser import parse_json
+from backend.shared.json_parser import parse_json, sanitize_model_output_for_retry_context
 from backend.shared.utils import count_tokens
 from backend.autonomous.memory.proof_database import proof_database
 from backend.aggregator.validation.json_validator import json_validator
@@ -477,11 +477,16 @@ async def _parse_json_with_retry(
                 logger.info("CompilerValidator: Already in retry, using fallback parser")
                 return self._fallback_parse(response)
             
-            # Build retry prompt asking for reformatted JSON
-            # Note: response is already truncated to 2000 chars in the prompt text
+            # Build retry prompt asking for reformatted JSON. Keep failed-output
+            # context, but sanitize it before any replay in prompt or assistant turn.
+            max_failed_output_chars = 2000  # ~500 tokens - enough for error context
+            failed_output_preview = sanitize_model_output_for_retry_context(
+                response,
+                max_chars=max_failed_output_chars,
+            )
             reparse_prompt = (
                 "Your previous response could not be parsed as valid JSON.\n\n"
-                f"YOUR PREVIOUS RESPONSE:\n{response[:2000]}{'...' if len(response) > 2000 else ''}\n\n"
+                f"YOUR PREVIOUS RESPONSE:\n{failed_output_preview}\n\n"
                 f"PARSE ERROR: {str(parse_error)}\n\n"
                 "Please provide the exact same validation decision in valid JSON format.\n"
                 "CRITICAL: Properly escape backslashes (use \\\\) and quotes (use \\\").\n"
@@ -492,13 +497,6 @@ async def _parse_json_with_retry(
             try:
                 retry_task_id = f"{self.get_current_task_id()}_retry"
                 
-                # CRITICAL FIX: Truncate failed output to prevent context overflow during retry
-                max_failed_output_chars = 2000  # ~500 tokens - enough for error context
-                if len(response) > max_failed_output_chars:
-                    failed_output_preview = response[:max_failed_output_chars] + "\n[...output truncated for retry...]"
-                else:
-                    failed_output_preview = response
-                
                 # Calculate if conversation fits in context window
                 from backend.shared.config import system_config, rag_config
                 prompt_tokens = count_tokens(original_prompt)
@@ -1295,6 +1293,9 @@ def _build_brainstorm_validation_prompt(
 
 You see ONLY the brainstorm database and the proposed operation. You do NOT see the paper or any paper edits. Your decision must be based solely on whether this operation improves the brainstorm database.
 
+PROTECTED LEAN 4 PROOFS:
+Lean 4 verified proof entries in the brainstorm database are immutable to paper-writing retroactive operations. If a proposed operation edits, deletes, annotates, or adds context to a Lean 4 verified proof, reject it. Only the normal brainstorm prune system may remove Lean 4 proof entries.
+
 OPERATION TYPE: {action.upper()}
 
 """
@@ -1561,6 +1562,7 @@ def _get_outline_validation_system_prompt(self, mode: str) -> str:
 - Do NOT reject solely because an outline does not explicitly use or cover database material
 - Do reject if the outline ignores clearly crucial source material in a way that makes its chosen scope weak, incoherent, or misaligned with the user prompt
 - Accept selective or divergent outline structures when they better serve the user's prompt and remain rigorous
+- Prefer outlines that organize the strongest rigorous direct answer to the user's prompt, rather than broad exploratory coverage
 
 YOUR TASK:
 Verify the submission meets ALL criteria above. Accept only if ALL criteria pass. Reject if ANY criterion fails.
@@ -1789,6 +1791,7 @@ def _get_paper_validation_system_prompt(self, mode: str) -> str:
 - The brainstorm database is optional support, not a mandatory checklist
 - Do NOT reject solely because the submission does not explicitly use brainstorm content or because it departs from brainstorm phrasing
 - Reject only if the submission ignores clearly necessary established content for its claimed scope, conflicts with the outline, or becomes weaker/less rigorous as a result
+- Prefer submissions that strengthen the paper's most direct rigorous answer to the prompt rather than adding indirect breadth
 
 YOUR TASK:
 Verify the submission meets ALL criteria above. If even ONE criterion fails, reject the submission.
@@ -2025,233 +2028,4 @@ def _parse_validation_response(self, response: str) -> Optional[dict]:
             
         except Exception as e:
             logger.error(f"Failed to parse validation response: {e}")
-            return None
-    
-    async def validate_rewrite_decision(
-        self,
-        decision_result: Dict,
-        user_prompt: str,
-        current_body: str,
-        current_outline: str,
-        current_title: str,
-        critique_feedback: str,
-        aggregator_db: str
-    ) -> bool:
-        """
-        Validate a rewrite vs continue decision made after critique phase.
-        
-        Args:
-            decision_result: The decision dict from critique submitter
-            user_prompt: User's compiler-directing prompt
-            current_body: Body section being evaluated
-            current_outline: Paper outline
-            current_title: Current paper title
-            critique_feedback: All accepted critiques (typically 1-3 out of 5 total attempts)
-            aggregator_db: Aggregator database content
-            
-        Returns:
-            True if decision is valid, False if should be retried
-        """
-        try:
-            logger.info("Validating rewrite decision...")
-            
-            # Import prompt builder
-            from backend.compiler.prompts.critique_prompts import build_rewrite_decision_validation_prompt
-            
-            # Build validation prompt
-            prompt = build_rewrite_decision_validation_prompt(
-                user_prompt=user_prompt,
-                current_body=current_body,
-                current_outline=current_outline,
-                current_title=current_title,
-                critique_feedback=critique_feedback,
-                decision_result=decision_result,
-                aggregator_db=aggregator_db
-            )
-            
-            # Generate task ID
-            task_id = self.get_current_task_id()
-            self.task_sequence += 1
-            
-            # Notify task started
-            if self.task_tracking_callback:
-                self.task_tracking_callback("started", task_id)
-            
-            # Call LLM
-            from backend.shared.config import system_config
-            response = await api_client_manager.generate_completion(
-                task_id=task_id,
-                role_id=self.role_id,
-                model=self.model_name,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=0.0,
-                max_tokens=system_config.compiler_validator_max_output_tokens
-            )
-            
-            # Notify task completed
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
-            
-            # Extract content from response (handles both 'content' and 'reasoning' fields)
-            message = response.get("choices", [{}])[0].get("message", {})
-            llm_output = message.get("content") or message.get("reasoning") or ""
-            
-            # Parse the extracted string
-            data = parse_json(llm_output)
-            
-            if data is None:
-                logger.error("Failed to parse rewrite decision validation response")
-                return False
-            
-            # Handle array responses
-            if isinstance(data, list):
-                logger.warning("Validator returned array instead of object - using first element")
-                if not data:
-                    return False
-                data = data[0]
-            
-            # Check decision
-            decision = data.get("decision", "").lower()
-            reasoning = data.get("reasoning", "")
-            
-            if decision == "accept":
-                logger.info(f"Rewrite decision VALIDATED: {reasoning[:200]}...")
-                return True
-            else:
-                logger.info(f"Rewrite decision REJECTED: {reasoning[:200]}...")
-                return False
-                
-        except FreeModelExhaustedError:
-            raise
-        except Exception as e:
-            logger.error(f"Error validating rewrite decision: {e}", exc_info=True)
-            return False
-    
-    async def validate_partial_revision_edit(
-        self,
-        edit_proposal: Dict,
-        current_paper: str,
-        current_outline: str,
-        critique_feedback: str
-    ) -> Tuple[bool, str]:
-        """
-        Validate a single edit proposed during iterative partial revision.
-        
-        This validates that an edit:
-        1. Uses exact string matching correctly
-        2. Addresses critique feedback appropriately
-        3. Maintains document coherence
-        4. Preserves mathematical rigor
-        
-        Args:
-            edit_proposal: Dict with operation, old_string, new_string, reasoning
-            current_paper: Current paper state
-            current_outline: Paper outline
-            critique_feedback: The accepted critique feedback being addressed
-            
-        Returns:
-            Tuple of (is_valid: bool, rejection_reason: str)
-        """
-        try:
-            logger.info("Validating partial revision edit...")
-            
-            operation = edit_proposal.get("operation", "")
-            old_string = edit_proposal.get("old_string", "")
-            new_string = edit_proposal.get("new_string", "")
-            reasoning = edit_proposal.get("reasoning", "")
-            
-            # CRITICAL: Ensure markers are intact BEFORE any old_string validation
-            # Partial revision operates on paper (not outline)
-            markers_repaired = await paper_memory.ensure_markers_intact()
-            if markers_repaired:
-                logger.info("Paper markers were missing and have been repaired during partial revision validation")
-                # Re-fetch paper after repair
-                current_paper = await paper_memory.get_paper()
-            
-            # Pre-validation: Check exact string match for non-full_content operations
-            if operation in ("replace", "insert_after", "delete"):
-                if not old_string:
-                    return False, "old_string cannot be empty for this operation"
-                
-                # Normalize and check
-                normalized_paper = normalize_unicode_hyphens(current_paper)
-                normalized_old = normalize_unicode_hyphens(old_string)
-                
-                if normalized_old not in normalized_paper:
-                    # Try to find similar text for better error message
-                    logger.warning(f"Exact string not found in document: '{old_string[:100]}...'")
-                    return False, f"EXACT_STRING_NOT_FOUND: The old_string was not found in the document. Ensure you use text that exists verbatim in CURRENT PAPER."
-                
-                # Check uniqueness
-                count = normalized_paper.count(normalized_old)
-                if count > 1:
-                    return False, f"STRING_NOT_UNIQUE: The old_string appears {count} times in the document. Include more context to make it unique."
-            
-            # Import prompt builder for LLM validation
-            from backend.compiler.prompts.critique_prompts import build_partial_revision_validation_prompt
-            
-            # Build validation prompt
-            prompt = build_partial_revision_validation_prompt(
-                current_paper=current_paper,
-                current_outline=current_outline,
-                critique_feedback=critique_feedback,
-                edit_proposal=edit_proposal
-            )
-            
-            # Generate task ID
-            task_id = self.get_current_task_id()
-            self.task_sequence += 1
-            
-            # Notify task started
-            if self.task_tracking_callback:
-                self.task_tracking_callback("started", task_id)
-            
-            # Call LLM
-            from backend.shared.config import system_config
-            response = await api_client_manager.generate_completion(
-                task_id=task_id,
-                role_id=self.role_id,
-                model=self.model_name,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=0.0,
-                max_tokens=system_config.compiler_validator_max_output_tokens
-            )
-            
-            # Notify task completed
-            if self.task_tracking_callback:
-                self.task_tracking_callback("completed", task_id)
-            
-            # Extract content from response
-            message = response.get("choices", [{}])[0].get("message", {})
-            llm_output = message.get("content") or message.get("reasoning") or ""
-            
-            # Parse the response
-            data = parse_json(llm_output)
-            
-            if data is None:
-                logger.error("Failed to parse partial revision validation response")
-                return False, "Failed to parse validation response"
-            
-            # Handle array responses
-            if isinstance(data, list):
-                logger.warning("Validator returned array - using first element")
-                if not data:
-                    return False, "Empty validation response"
-                data = data[0]
-            
-            # Check decision
-            decision = data.get("decision", "").lower()
-            val_reasoning = data.get("reasoning", "No reason provided")
-            
-            if decision == "accept":
-                logger.info(f"Partial revision edit VALIDATED: {val_reasoning[:150]}...")
-                return True, ""
-            else:
-                logger.info(f"Partial revision edit REJECTED: {val_reasoning[:150]}...")
-                return False, val_reasoning
-                
-        except FreeModelExhaustedError:
-            raise
-        except Exception as e:
-            logger.error(f"Error validating partial revision edit: {e}", exc_info=True)
-            return False, f"Validation error: {str(e)}"
\ No newline at end of file
+            return None
\ No newline at end of file
diff --git a/backend/leanoj/__init__.py b/backend/leanoj/__init__.py
new file mode 100644
index 0000000..b8f612a
--- /dev/null
+++ b/backend/leanoj/__init__.py
@@ -0,0 +1 @@
+"""LeanOJ proof-solver mode."""
diff --git a/backend/leanoj/core/__init__.py b/backend/leanoj/core/__init__.py
new file mode 100644
index 0000000..cbd5da7
--- /dev/null
+++ b/backend/leanoj/core/__init__.py
@@ -0,0 +1 @@
+"""Core orchestration for LeanOJ proof solving."""
diff --git a/backend/leanoj/core/leanoj_context.py b/backend/leanoj/core/leanoj_context.py
new file mode 100644
index 0000000..7c2465b
--- /dev/null
+++ b/backend/leanoj/core/leanoj_context.py
@@ -0,0 +1,829 @@
+"""LeanOJ proof-memory persistence and direct/RAG context allocation."""
+from __future__ import annotations
+
+import asyncio
+import hashlib
+import json
+import logging
+import re
+import shutil
+from dataclasses import dataclass, field
+from datetime import datetime
+from pathlib import Path
+from typing import Any
+
+import aiofiles
+
+from backend.aggregator.core.rag_manager import rag_manager
+from backend.shared.config import rag_config, system_config
+from backend.shared.utils import count_tokens
+
+logger = logging.getLogger(__name__)
+
+
+ARTIFACT_ACCEPTED_IDEAS = "accepted_ideas"
+ARTIFACT_RECURSIVE_TOPICS = "recursive_topics"
+ARTIFACT_VERIFIED_SUBPROOFS = "verified_subproofs"
+ARTIFACT_PARTIAL_PROOFS = "partial_proofs"
+ARTIFACT_FINAL_ATTEMPTS = "final_attempts"
+ARTIFACT_FINAL_CYCLE_PACKETS = "final_cycle_packets"
+ARTIFACT_FAILED_SUBPROOFS = "failed_subproofs"
+
+
+def _remove_attempt_count_language(value: Any) -> str:
+    """Return str(value) with failed-attempt-count phrases reworded count-free ("" if falsy)."""
+    text = str(value or "")
+    # Applied in order: a phrase must precede any shorter phrase contained in it, so
+    # "with exactly N failed attempts" has to run before the bare "failed attempts".
+    replacements = (
+        (r"\bfailed\s+\d+\s+consecutive\s+verification/edit\s+attempts?\b", "encountered repeated verification/edit failures"),
+        (r"\bfailed\s+\d+\s+consecutive\s+attempts?\b", "encountered repeated failures"),
+        (r"\bfailed\s+\d+\s+attempts?\b", "encountered repeated failures"),
+        (r"\bfailed\s+\d+\s+times\b", "encountered repeated failures"),
+        (r"\bwith\s+exactly\s+\d+\s+failed\s+attempts?\b", "with recent proof-check failures"),
+        (r"\bafter\s+failed\s+attempts\b", "after recent proof-check failures"),
+        (r"\bfailed\s+attempts\b", "proof-check failures"),
+        (r"\battempts\s+\d+\s*-\s*\d+\b", "recent final-loop feedback"),
+        (r"\bUse this exact failed-attempt count[^.]*\.", ""),
+        (r"\bfailed-attempt count\b", "failure context"),
+    )
+    for pattern, replacement in replacements:
+        text = re.sub(pattern, replacement, text, flags=re.IGNORECASE)
+    return re.sub(r" {2,}", " ", text).strip()
+
+USEFUL_ARTIFACTS = (
+    ARTIFACT_ACCEPTED_IDEAS,
+    ARTIFACT_RECURSIVE_TOPICS,
+    ARTIFACT_VERIFIED_SUBPROOFS,
+    ARTIFACT_PARTIAL_PROOFS,
+    ARTIFACT_FINAL_ATTEMPTS,
+    ARTIFACT_FINAL_CYCLE_PACKETS,
+    ARTIFACT_FAILED_SUBPROOFS,
+)
+
+
+@dataclass
+class LeanOJMemoryItem:
+    """One optional proof-memory source eligible for direct injection or RAG."""
+
+    artifact: str  # artifact label; listed in the allocation error when offloaded items cannot fit
+    title: str  # heading line; allocate_context formats an item as "{title}\n{text}"
+    text: str  # body placed under the title
+    priority: int  # NOTE(review): not read in the visible code; presumably an ordering key - confirm
+    source_name: str  # name recorded in direct_sources / rag_sources of the allocation
+    rag_only: bool = False  # True keeps the item out of direct injection (always offloaded)
+
+
+@dataclass
+class LeanOJContextAllocation:
+    """Context blocks, plus the names of their sources, consumed by LeanOJ prompt builders."""
+
+    direct_proof_context: str = ""
+    rag_evidence_context: str = ""
+    refuted_construction_warnings: str = ""
+    capped_rejection_feedback: str = ""
+    current_final_cycle_packet: str = ""
+    current_working_proof_attempt: str = ""
+    direct_sources: list[str] = field(default_factory=list)
+    rag_sources: list[str] = field(default_factory=list)
+
+    def as_prompt_blocks(self) -> dict[str, str]:
+        """Return the six text blocks keyed by field name; the source lists are left out."""
+        # Listed in field declaration order so the resulting dict keeps that ordering.
+        block_names = (
+            "direct_proof_context", "rag_evidence_context",
+            "refuted_construction_warnings", "capped_rejection_feedback",
+            "current_final_cycle_packet", "current_working_proof_attempt",
+        )
+        return {name: getattr(self, name) for name in block_names}
+
+
+class LeanOJContextManager:
+    """Session-scoped LeanOJ artifact storage and RAG/offload routing."""
+
+    def __init__(self) -> None:
+        self._indexed_hashes: dict[str, str] = {}  # NOTE(review): not used in the visible code; presumably source name -> content hash
+        self._index_locks: dict[str, asyncio.Lock] = {}  # NOTE(review): presumably one lock per indexed source - confirm
+        self._artifact_sync_counts: dict[tuple[str, str], int] = {}  # (session_id, artifact) -> record count; bumped by append_record
+        self._artifact_sync_digests: dict[tuple[str, str], str] = {}  # (session_id, artifact) -> digest; dropped by append_record
+
+    @staticmethod
+    def artifacts_base_dir() -> Path:  # "leanoj_artifacts" folder under the configured data dir
+        return Path(system_config.data_dir).joinpath("leanoj_artifacts")
+
+    def session_artifact_dir(self, session_id: str) -> Path:  # a falsy session id maps to the "latest" folder
+        return self.artifacts_base_dir().joinpath(session_id or "latest")
+
+    @staticmethod
+    def source_prefix(session_id: str) -> str:  # prefix shared by every source name of a session
+        return "leanoj_{}_".format(session_id or "latest")
+
+    def source_name(self, session_id: str, artifact: str) -> str:  # session prefix followed by the artifact name
+        return "{}{}".format(self.source_prefix(session_id), artifact)
+
+    def source_names_for_session(self, session_id: str) -> list[str]:  # one source name per USEFUL_ARTIFACTS entry, same order
+        return [self.source_name(session_id, artifact_name) for artifact_name in USEFUL_ARTIFACTS]
+
+    async def write_session_artifacts(
+        self,
+        *,
+        session_id: str,
+        accepted_ideas: list[str],
+        accepted_idea_records: list[dict[str, Any]] | None = None,
+        recursive_topics: list[str] | None = None,
+        verified_subproofs: list[dict[str, Any]],
+        partial_proofs: list[dict[str, Any]],
+        failed_subproofs: list[dict[str, Any]],
+        final_attempts: list[dict[str, Any]],
+        final_cycle_packets: list[dict[str, Any]],
+    ) -> None:
+        """Persist the full proof memory to per-artifact JSONL logs; does nothing without a session id."""
+        if not session_id:
+            return
+
+        base = self.session_artifact_dir(session_id)
+        base.mkdir(parents=True, exist_ok=True)
+        accepted_records = []  # structured records first, then idea strings not already recorded
+        for record in accepted_idea_records or []:
+            if isinstance(record, dict) and str(record.get("content") or "").strip():
+                accepted_records.append(dict(record))
+        recorded_contents = {str(record.get("content") or "") for record in accepted_records}
+        for item in accepted_ideas:
+            if str(item).strip() and str(item) not in recorded_contents:
+                accepted_records.append({"content": item})
+        if not accepted_records:
+            accepted_records = [{"content": item} for item in accepted_ideas]
+        for artifact, records in (
+            (ARTIFACT_ACCEPTED_IDEAS, accepted_records),
+            (ARTIFACT_RECURSIVE_TOPICS, [{"content": item} for item in (recursive_topics or [])]),
+            (ARTIFACT_VERIFIED_SUBPROOFS, verified_subproofs),
+            (ARTIFACT_PARTIAL_PROOFS, partial_proofs),
+            (ARTIFACT_FAILED_SUBPROOFS, failed_subproofs),
+            (ARTIFACT_FINAL_ATTEMPTS, final_attempts),
+            (ARTIFACT_FINAL_CYCLE_PACKETS, final_cycle_packets),
+        ):
+            await self._sync_jsonl(base / f"{artifact}.jsonl", session_id, artifact, records)
+
+    async def append_record(self, session_id: str, artifact: str, record: dict[str, Any]) -> None:
+        """Append one JSON record to a session's artifact log; does nothing without a session id."""
+        if not session_id:
+            return
+        path = self.session_artifact_dir(session_id) / f"{artifact}.jsonl"
+        path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(path, "a", encoding="utf-8") as f:
+            await f.write(json.dumps(record, ensure_ascii=False) + "\n")
+        key, counts = (session_id, artifact), self._artifact_sync_counts
+        counts[key] = (counts[key] if key in counts else self._count_jsonl_records(path) - 1) + 1  # count the file only for an unseen key
+        self._artifact_sync_digests.pop(key, None)
+
+    def load_session_artifacts(self, session_id: str) -> dict[str, list[Any]]:
+        """Read every artifact log of a session back from disk for resume."""
+        base = self.session_artifact_dir(session_id)
+        def read(artifact: str) -> list[Any]:
+            return self._read_jsonl(base / f"{artifact}.jsonl")
+        raw_only = (ARTIFACT_VERIFIED_SUBPROOFS, ARTIFACT_PARTIAL_PROOFS, ARTIFACT_FAILED_SUBPROOFS,
+                    ARTIFACT_FINAL_ATTEMPTS, ARTIFACT_FINAL_CYCLE_PACKETS)
+        return {
+            ARTIFACT_ACCEPTED_IDEAS: self._records_to_strings(read(ARTIFACT_ACCEPTED_IDEAS)),
+            "accepted_idea_records": read(ARTIFACT_ACCEPTED_IDEAS),
+            ARTIFACT_RECURSIVE_TOPICS: self._records_to_strings(read(ARTIFACT_RECURSIVE_TOPICS)),
+            **{artifact: read(artifact) for artifact in raw_only},
+        }
+
+    async def allocate_context(
+        self,
+        *,
+        session_id: str,
+        mode: str,
+        user_prompt: str,
+        lean_template: str,
+        task_request: str,
+        context_window: int,
+        max_output_tokens: int,
+        accepted_ideas: list[str],
+        recursive_topics: list[str] | None = None,
+        verified_subproofs: list[dict[str, Any]],
+        partial_proofs: list[dict[str, Any]],
+        failed_subproofs: list[dict[str, Any]],
+        final_attempts: list[dict[str, Any]],
+        final_cycle_packets: list[dict[str, Any]] | None = None,
+        refuted_constructions: list[dict[str, Any]] | None = None,
+        current_final_cycle_packet: dict[str, Any] | None = None,
+        current_working_proof_attempt: dict[str, Any] | None = None,
+        capped_rejection_feedback: str = "",
+    ) -> LeanOJContextAllocation:
+        """Allocate optional LeanOJ memory direct first, then through scoped RAG."""
+        normalized_mode = mode if mode in {"brainstorm", "recursive_brainstorm", "subproof", "final_solver"} else "brainstorm"
+        allocation = LeanOJContextAllocation(
+            capped_rejection_feedback=capped_rejection_feedback.strip(),
+            current_final_cycle_packet=self._format_final_cycle_packet(current_final_cycle_packet)
+            if current_final_cycle_packet
+            else "",
+            current_working_proof_attempt=self._format_working_proof_attempt(current_working_proof_attempt)
+            if current_working_proof_attempt
+            else "",
+            refuted_construction_warnings=self._format_refuted_construction_warnings(refuted_constructions or [])
+            if normalized_mode == "final_solver"
+            else "",
+        )
+
+        available_tokens = rag_config.get_available_input_tokens(context_window, max_output_tokens)
+        mandatory_tokens = count_tokens(user_prompt) + count_tokens(lean_template) + count_tokens(task_request)
+        mandatory_tokens += rag_config.get_prompt_assembly_overhead_estimate()
+        mandatory_tokens += count_tokens(allocation.current_final_cycle_packet)
+        mandatory_tokens += count_tokens(allocation.current_working_proof_attempt)
+        mandatory_tokens += count_tokens(allocation.refuted_construction_warnings)
+        mandatory_tokens += count_tokens(allocation.capped_rejection_feedback)
+        remaining_tokens = available_tokens - mandatory_tokens
+        if remaining_tokens < 0:
+            raise RuntimeError(
+                "LeanOJ mandatory context overflow before optional proof memory allocation. "
+                f"Mandatory tokens: {mandatory_tokens}. Available input tokens: {available_tokens}. "
+                f"Context mode: {normalized_mode}. Increase the role context window or reduce mandatory context."
+            )
+
+        direct_parts: list[str] = []
+        offloaded_items: list[LeanOJMemoryItem] = []
+        minimum_rag_reserve = min(5000, max(1000, int(available_tokens * 0.05)))
+
+        for item in self._memory_items(
+            session_id=session_id,
+            mode=normalized_mode,
+            accepted_ideas=accepted_ideas,
+            recursive_topics=recursive_topics or [],
+            verified_subproofs=verified_subproofs,
+            partial_proofs=partial_proofs,
+            failed_subproofs=failed_subproofs,
+            final_attempts=final_attempts,
+            final_cycle_packets=final_cycle_packets or [],
+            current_final_cycle_packet=current_final_cycle_packet,
+            has_current_working_proof_attempt=current_working_proof_attempt is not None,
+        ):
+            formatted = f"{item.title}\n{item.text}".strip()
+            tokens = count_tokens(formatted)
+            if (
+                not item.rag_only
+                and tokens <= remaining_tokens
+                and remaining_tokens - tokens >= minimum_rag_reserve
+            ):
+                direct_parts.append(formatted)
+                allocation.direct_sources.append(item.source_name)
+                remaining_tokens -= tokens
+            else:
+                offloaded_items.append(item)
+                allocation.rag_sources.append(item.source_name)
+
+        allocation.direct_proof_context = "\n\n".join(direct_parts).strip()
+
+        if offloaded_items and remaining_tokens <= 500:
+            offloaded_titles = ", ".join(item.artifact for item in offloaded_items)
+            raise RuntimeError(
+                "LeanOJ context allocation could not preserve useful proof memory. "
+                f"Mandatory context left only {remaining_tokens} tokens for RAG/offload; "
+                f"offloaded sources would be silently dropped: {offloaded_titles}."
+            )
+
+        if offloaded_items:
+            for item in offloaded_items:
+                await self._ensure_source_indexed(item.source_name, f"{item.title}\n{item.text}".strip())
+
+            rag_pack = await rag_manager.retrieve(
+                query="\n\n".join([user_prompt, lean_template, task_request]),
+                chunk_size=rag_config.validator_chunk_size,
+                max_tokens=max(0, remaining_tokens - 200),
+                exclude_sources=allocation.direct_sources or None,
+                include_sources=allocation.rag_sources,
+                include_source_prefixes=[self.source_prefix(session_id)],
+            )
+            allocation.rag_evidence_context = rag_pack.text or ""
+
+        return allocation
+
+    async def remove_session(self, session_id: str) -> None:
+        """Delete one session's artifact directory, sync bookkeeping, and RAG sources.
+
+        The on-disk directory is removed first (when it exists), then the cached
+        sync counters/digests for the session, and finally its RAG sources.
+        """
+        session_dir = self.session_artifact_dir(session_id)
+        if session_dir.exists():
+            shutil.rmtree(session_dir)
+        self._clear_sync_counts(session_id)
+        await self.remove_session_rag_sources(session_id)
+
+    async def clear_all(self) -> None:
+        """Wipe every LeanOJ artifact directory and every LeanOJ RAG source.
+
+        Session ids are collected from the artifact root before it is deleted so
+        that their RAG sources can still be enumerated afterwards.
+        """
+        artifacts_root = self.artifacts_base_dir()
+        session_ids: list[str] = []
+        if artifacts_root.exists():
+            session_ids = [entry.name for entry in artifacts_root.iterdir() if entry.is_dir()]
+            shutil.rmtree(artifacts_root)
+        self._artifact_sync_counts.clear()
+        self._artifact_sync_digests.clear()
+        await self.remove_all_leanoj_rag_sources(session_ids=session_ids)
+
+    async def remove_session_rag_sources(self, session_id: str) -> None:
+        """Remove every RAG source listed by ``source_names_for_session(session_id)``."""
+        await self._remove_rag_sources(self.source_names_for_session(session_id))
+
+    async def remove_all_leanoj_rag_sources(self, session_ids: list[str] | None = None) -> None:
+        """Remove all known LeanOJ RAG sources.
+
+        Every source name tracked in ``_indexed_hashes`` is always included.
+        When ``session_ids`` is given (even as an empty list) only those sessions
+        contribute additional source names; when it is ``None`` the artifact
+        directory is scanned and each sub-directory name is treated as a
+        session id.
+        """
+        doomed: set[str] = set(self._indexed_hashes)
+        if session_ids is None:
+            artifacts_root = self.artifacts_base_dir()
+            if artifacts_root.exists():
+                for entry in artifacts_root.iterdir():
+                    if entry.is_dir():
+                        doomed.update(self.source_names_for_session(entry.name))
+        else:
+            for known_session in session_ids:
+                doomed.update(self.source_names_for_session(known_session))
+        await self._remove_rag_sources(doomed)
+
+    async def _remove_rag_sources(self, sources: list[str] | set[str]) -> None:
+        """Best-effort removal of the given RAG sources.
+
+        Falsy names are ignored and duplicates collapse; names are processed in
+        sorted order. A failed removal is logged as a warning, and the cached
+        digest for the name is dropped either way.
+        """
+        unique_names = {name for name in sources if name}
+        for name in sorted(unique_names):
+            try:
+                await rag_manager.remove_document(name)
+            except Exception as exc:
+                logger.warning("Failed to remove LeanOJ RAG source %s: %s", name, exc)
+            self._indexed_hashes.pop(name, None)
+
+    async def _ensure_source_indexed(self, source_name: str, text: str) -> None:
+        """Index ``text`` under ``source_name`` unless an up-to-date copy is already indexed.
+
+        Blank text is ignored. Otherwise the SHA-256 of ``text`` is compared with
+        the digest remembered for ``source_name``; the source is re-indexed
+        (removed, then added again) when the digest differs or when no chunk for
+        the source is found at ``rag_config.validator_chunk_size``.
+        """
+        if not text.strip():
+            return
+        # One lock per source name so concurrent calls for the same source run one at a time.
+        lock = self._index_locks.setdefault(source_name, asyncio.Lock())
+        async with lock:
+            digest = hashlib.sha256(text.encode("utf-8")).hexdigest()
+            # A matching digest alone is not trusted: the chunks must also still be present.
+            has_chunks = any(
+                chunk.source_file == source_name
+                for chunk in rag_manager.chunks_by_size[rag_config.validator_chunk_size]
+            )
+            if self._indexed_hashes.get(source_name) == digest and has_chunks:
+                return
+
+            # Drop whatever is currently stored under this name before adding the new text.
+            await rag_manager.remove_document(source_name)
+
+            # NOTE(review): text is indexed at submitter_chunk_intervals while the freshness
+            # check above inspects validator_chunk_size - confirm that size is one of the
+            # intervals, otherwise has_chunks would stay False and every call would re-index.
+            await rag_manager.add_text(
+                text,
+                source_name,
+                chunk_sizes=rag_config.submitter_chunk_intervals,
+                is_permanent=False,
+            )
+            self._indexed_hashes[source_name] = digest
+
+    async def _sync_jsonl(
+        self,
+        path: Path,
+        session_id: str,
+        artifact: str,
+        records: list[Any],
+    ) -> None:
+        """Append new records; rewrite when records shrink or same-length content changes.
+
+        Bookkeeping is cached per ``(session_id, artifact)``: the number of
+        records believed to be on disk and a digest of the last synced records.
+        When no count is cached, the non-blank lines of ``path`` are counted.
+
+        Three cases, decided by comparing ``len(records)`` with the persisted count:
+        fewer records -> full rewrite; equal -> no-op if the digest matches,
+        otherwise full rewrite; more -> only ``records[persisted_count:]`` are
+        appended.
+        """
+        key = (session_id, artifact)
+        new_digest = self._records_digest(records)
+        persisted_count = self._artifact_sync_counts.get(key)
+        if persisted_count is None:
+            # Nothing cached for this artifact yet: fall back to what is on disk.
+            persisted_count = self._count_jsonl_records(path)
+
+        if len(records) < persisted_count:
+            # The in-memory list shrank, so the file can no longer be extended in place.
+            await self._write_jsonl(path, records)
+            self._artifact_sync_counts[key] = len(records)
+            self._artifact_sync_digests[key] = new_digest
+            return
+
+        if len(records) == persisted_count:
+            known_digest = self._artifact_sync_digests.get(key)
+            if known_digest == new_digest:
+                self._artifact_sync_counts[key] = persisted_count
+                return
+            # No cached digest: compare against the file itself before deciding to rewrite.
+            if known_digest is None and self._jsonl_digest(path) == new_digest:
+                self._artifact_sync_counts[key] = persisted_count
+                self._artifact_sync_digests[key] = new_digest
+                return
+            # Same length but different content: rewrite the whole file.
+            await self._write_jsonl(path, records)
+            self._artifact_sync_counts[key] = persisted_count
+            self._artifact_sync_digests[key] = new_digest
+            return
+
+        # Growth: only the tail is written. The first persisted_count records on disk are
+        # not compared with records[:persisted_count] here.
+        path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(path, "a", encoding="utf-8") as f:
+            for record in records[persisted_count:]:
+                await f.write(json.dumps(record, ensure_ascii=False) + "\n")
+        self._artifact_sync_counts[key] = len(records)
+        self._artifact_sync_digests[key] = new_digest
+
+    @staticmethod
+    def _records_digest(records: list[Any]) -> str:
+        """Return a SHA-256 hex digest over the canonical JSON form of ``records``.
+
+        Each record is dumped with sorted keys (non-serializable values fall back
+        to ``str``), the dumps are joined with newlines, and the UTF-8 bytes are
+        hashed. An empty list therefore hashes the empty byte string.
+        """
+        serialized = [
+            json.dumps(entry, ensure_ascii=False, sort_keys=True, default=str)
+            for entry in records
+        ]
+        payload = "\n".join(serialized).encode("utf-8")
+        return hashlib.sha256(payload).hexdigest()
+
+    def _jsonl_digest(self, path: Path) -> str:
+        """Return the records digest of the JSONL file at ``path``.
+
+        A missing file yields the digest of an empty record list. If reading the
+        records raises, a warning is logged and ``""`` is returned.
+        """
+        if path.exists():
+            try:
+                loaded = self._read_jsonl(path)
+            except Exception as exc:
+                logger.warning("Failed to digest LeanOJ artifact log %s: %s", path, exc)
+                return ""
+            return self._records_digest(loaded)
+        return self._records_digest([])
+
+    @staticmethod
+    def _count_jsonl_records(path: Path) -> int:
+        """Count the non-blank lines of ``path``.
+
+        Returns 0 when the file does not exist, and also when it cannot be read
+        (a warning is logged in that case). Lines are not parsed as JSON.
+        """
+        if not path.exists():
+            return 0
+        try:
+            content = path.read_text(encoding="utf-8")
+            return len([line for line in content.splitlines() if line.strip()])
+        except Exception as exc:
+            logger.warning("Failed to count LeanOJ artifact log %s: %s", path, exc)
+            return 0
+
+    def _clear_sync_counts(self, session_id: str) -> None:
+        """Forget cached sync counts and digests for every artifact of ``session_id``."""
+        # Snapshot the matching keys first; the dict is mutated while they are removed.
+        matching = tuple(
+            filter(lambda key: key[0] == session_id, self._artifact_sync_counts)
+        )
+        for key in matching:
+            self._artifact_sync_counts.pop(key, None)
+            self._artifact_sync_digests.pop(key, None)
+
+    def _memory_items(
+        self,
+        *,
+        session_id: str,
+        mode: str,
+        accepted_ideas: list[str],
+        recursive_topics: list[str] | None = None,
+        verified_subproofs: list[dict[str, Any]],
+        partial_proofs: list[dict[str, Any]],
+        failed_subproofs: list[dict[str, Any]],
+        final_attempts: list[dict[str, Any]],
+        final_cycle_packets: list[dict[str, Any]],
+        current_final_cycle_packet: dict[str, Any] | None,
+        has_current_working_proof_attempt: bool = False,
+    ) -> list[LeanOJMemoryItem]:
+        """Build the ordered list of optional memory items for one context mode.
+
+        Each artifact is formatted to text (using the ``*_for_final`` formatters
+        when ``mode == "final_solver"``), then emitted in the priority order for
+        ``mode``; unknown modes use the brainstorm order. Artifacts whose
+        formatted text is empty are skipped. ``priority`` is the artifact's index
+        in that order, and only final-cycle packets are marked ``rag_only``.
+
+        ``recursive_topics`` may be ``None`` and is treated as an empty list.
+        Only the last 10 failed subproofs are formatted.
+
+        NOTE(review): ``final_attempts`` and ``current_final_cycle_packet`` are
+        accepted but not read here, and recursive topics are formatted but do
+        not appear in any priority list below - confirm that is intended.
+        """
+        # The signature allows None, but the string formatters iterate their argument.
+        recursive_topics = recursive_topics or []
+        recent_failed_subproofs = failed_subproofs[-10:]
+        raw_items = {
+            ARTIFACT_FINAL_CYCLE_PACKETS: (
+                "HISTORICAL FINAL-CYCLE FAILURE PACKETS",
+                self._format_final_cycle_packets(final_cycle_packets),
+            ),
+            ARTIFACT_VERIFIED_SUBPROOFS: (
+                "VERIFIED SUBPROOFS / HELPER LEMMAS",
+                self._format_verified_subproofs_for_final(verified_subproofs)
+                if mode == "final_solver"
+                else self._format_verified_subproofs(verified_subproofs),
+            ),
+            ARTIFACT_PARTIAL_PROOFS: (
+                "LEAN-ACCEPTED PARTIAL PROOF SCAFFOLDS",
+                self._format_partial_proofs_for_final(partial_proofs)
+                if mode == "final_solver"
+                else self._format_partial_proofs(partial_proofs),
+            ),
+            ARTIFACT_ACCEPTED_IDEAS: (
+                "ACTIVE PROOF-PLAN NOTES" if mode == "final_solver" else "ACCEPTED BRAINSTORM IDEAS",
+                self._format_strings_for_final(accepted_ideas)
+                if mode == "final_solver"
+                else self._format_strings(accepted_ideas),
+            ),
+            ARTIFACT_RECURSIVE_TOPICS: (
+                "RECURSIVE PROOF-REPAIR TOPICS",
+                self._format_strings_for_final(recursive_topics)
+                if mode == "final_solver"
+                else self._format_strings(recursive_topics),
+            ),
+            ARTIFACT_FAILED_SUBPROOFS: (
+                "FAILED SUBPROOF FEEDBACK",
+                self._format_attempts(recent_failed_subproofs),
+            ),
+        }
+
+        brainstorm_priority = [
+            ARTIFACT_ACCEPTED_IDEAS,
+            ARTIFACT_PARTIAL_PROOFS,
+            ARTIFACT_VERIFIED_SUBPROOFS,
+            ARTIFACT_FINAL_CYCLE_PACKETS,
+        ]
+        if has_current_working_proof_attempt:
+            # With a working proof attempt present, proof artifacts rank ahead of ideas.
+            brainstorm_priority = [
+                ARTIFACT_PARTIAL_PROOFS,
+                ARTIFACT_VERIFIED_SUBPROOFS,
+                ARTIFACT_ACCEPTED_IDEAS,
+                ARTIFACT_FINAL_CYCLE_PACKETS,
+            ]
+
+        priority_by_mode = {
+            "final_solver": [
+                ARTIFACT_VERIFIED_SUBPROOFS,
+                ARTIFACT_ACCEPTED_IDEAS,
+            ],
+            "brainstorm": brainstorm_priority,
+            "recursive_brainstorm": brainstorm_priority,
+            "subproof": [
+                ARTIFACT_FAILED_SUBPROOFS,
+                ARTIFACT_VERIFIED_SUBPROOFS,
+                ARTIFACT_PARTIAL_PROOFS,
+                ARTIFACT_ACCEPTED_IDEAS,
+                ARTIFACT_FINAL_CYCLE_PACKETS,
+            ],
+        }
+        order = priority_by_mode.get(mode, priority_by_mode["brainstorm"])
+
+        items: list[LeanOJMemoryItem] = []
+        for priority, artifact in enumerate(order):
+            title, text = raw_items[artifact]
+            if not text:
+                continue
+            items.append(
+                LeanOJMemoryItem(
+                    artifact=artifact,
+                    title=title,
+                    text=text,
+                    priority=priority,
+                    source_name=self.source_name(session_id, artifact),
+                    rag_only=artifact == ARTIFACT_FINAL_CYCLE_PACKETS,
+                )
+            )
+        return items
+
+    @staticmethod
+    def _record_key(record: dict[str, Any] | None) -> str:
+        """Return a stable string key for ``record``.
+
+        Falsy records map to ``""``. Otherwise the key is the sorted-key JSON
+        dump (non-serializable values stringified); if dumping raises
+        ``TypeError`` the plain ``str()`` of the record is used instead.
+        """
+        if record:
+            try:
+                return json.dumps(record, sort_keys=True, default=str)
+            except TypeError:
+                return str(record)
+        return ""
+
+    @staticmethod
+    async def _write_jsonl(path: Path, records: list[Any]) -> None:
+        """Overwrite ``path`` with one JSON document per line for ``records``.
+
+        The parent directory is created when missing, so a rewrite succeeds even
+        if the artifact directory was removed after the sync count was cached.
+        Non-ASCII characters are written as-is (UTF-8).
+        """
+        path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(path, "w", encoding="utf-8") as f:
+            for record in records:
+                await f.write(json.dumps(record, ensure_ascii=False) + "\n")
+
+    @staticmethod
+    def _read_jsonl(path: Path) -> list[dict[str, Any]]:
+        """Load the dict records stored in the JSONL file at ``path``.
+
+        Returns an empty list when the file is missing or cannot be read. Blank
+        lines and JSON values that are not objects are ignored. A line that fails
+        to parse is logged and skipped on its own, so one corrupt line no longer
+        discards every valid record that follows it.
+        """
+        if not path.exists():
+            return []
+        try:
+            lines = path.read_text(encoding="utf-8").splitlines()
+        except Exception as exc:
+            logger.warning("Failed to load LeanOJ artifact log %s: %s", path, exc)
+            return []
+
+        records: list[dict[str, Any]] = []
+        for line_number, line in enumerate(lines, start=1):
+            if not line.strip():
+                continue
+            try:
+                item = json.loads(line)
+            except Exception as exc:
+                logger.warning(
+                    "Skipping malformed line %d in LeanOJ artifact log %s: %s",
+                    line_number,
+                    path,
+                    exc,
+                )
+                continue
+            if isinstance(item, dict):
+                records.append(item)
+        return records
+
+    @staticmethod
+    def _records_to_strings(records: list[dict[str, Any]]) -> list[str]:
+        """Collect the non-blank string ``content`` values of ``records``.
+
+        Records without a ``content`` key, or whose content is not a string or
+        is only whitespace, contribute nothing. Values are returned unstripped.
+        """
+        candidates = (record.get("content", record) for record in records)
+        return [
+            candidate
+            for candidate in candidates
+            if isinstance(candidate, str) and candidate.strip()
+        ]
+
+    @staticmethod
+    def _format_strings(values: list[str]) -> str:
+        """Render ``values`` as a 1-based numbered list, one entry per line.
+
+        Every value is stringified and stripped; entries that end up empty are
+        dropped before numbering.
+        """
+        stripped = (str(value).strip() for value in values)
+        numbered = [
+            f"{position}. {entry}"
+            for position, entry in enumerate(filter(None, stripped), start=1)
+        ]
+        return "\n".join(numbered)
+
+    @staticmethod
+    def _format_strings_for_final(values: list[str]) -> str:
+        """Render ``values`` as a numbered list after final-mode text cleanup.
+
+        Values whose stripped string form is empty are dropped; the rest are
+        passed through ``_final_mode_text`` and stripped before numbering.
+        """
+        cleaned_entries: list[str] = []
+        for value in values:
+            if not str(value).strip():
+                continue
+            cleaned_entries.append(LeanOJContextManager._final_mode_text(value).strip())
+        numbered = (
+            f"{position}. {entry}" for position, entry in enumerate(cleaned_entries, start=1)
+        )
+        return "\n".join(numbered)
+
+    @staticmethod
+    def _format_attempts(records: list[dict[str, Any]]) -> str:
+        """Render attempt records as numbered ``FEEDBACK ITEM`` blocks.
+
+        Each block lists the request, the error summary (falling back to
+        ``error_output``), the optional Lean pass feedback, and the Lean code
+        (or ``[not recorded]``), and ends with a ``---`` separator line. Free
+        text fields go through ``_remove_attempt_count_language``.
+        """
+        rendered: list[str] = []
+        for position, attempt in enumerate(records, start=1):
+            code = str(attempt.get("lean_code") or "").strip()
+            pass_feedback = _remove_attempt_count_language(attempt.get("lean_feedback") or "")
+            request_text = _remove_attempt_count_language(attempt.get('request', 'proof feedback'))
+            error_text = _remove_attempt_count_language(
+                attempt.get('error_summary', attempt.get('error_output', ''))
+            )
+            lines = [
+                f"FEEDBACK ITEM {position}: {request_text}",
+                f"Error summary: {error_text}",
+            ]
+            if pass_feedback:
+                lines.extend(("Lean pass feedback:", pass_feedback))
+            lines.extend(("Lean code:", code or "[not recorded]", "---"))
+            rendered.append("\n".join(lines))
+        return "\n".join(rendered)
+
+    @staticmethod
+    def _format_refuted_construction_warnings(
+        records: list[dict[str, Any]],
+        *,
+        limit: int = 5,
+        max_chars: int = 1500,
+    ) -> str:
+        """Compact final-mode warnings for failed routes, kept separate from proof evidence.
+
+        Only dict records are considered and only the last ``limit`` of them.
+        Each warning is the record's ``content`` (falling back to ``summary``,
+        then ``error_summary``) with an optional ``Reason:`` suffix, rendered as
+        a numbered list. Output longer than ``max_chars`` is cut and suffixed
+        with a ``[truncated]`` line.
+
+        A non-positive ``limit`` yields no warnings (``[-0:]`` would otherwise
+        select every record), and a ``max_chars`` below 20 keeps no body text
+        instead of producing a negative slice bound.
+        """
+        if limit <= 0:
+            return ""
+        clean_records = [record for record in records if isinstance(record, dict)]
+        blocks: list[str] = []
+        for record in clean_records[-limit:]:
+            content = str(record.get("content") or record.get("summary") or record.get("error_summary") or "").strip()
+            if not content:
+                continue
+            reason = str(
+                record.get("reasoning")
+                or record.get("validator_summary")
+                or record.get("validator_reasoning")
+                or record.get("edit_reasoning")
+                or ""
+            ).strip()
+            line = LeanOJContextManager._final_mode_text(content)
+            if reason:
+                line = f"{line} Reason: {LeanOJContextManager._final_mode_text(reason)}"
+            blocks.append(line)
+
+        if not blocks:
+            return ""
+
+        text = "\n".join(f"{index}. {block}" for index, block in enumerate(blocks, start=1))
+        if len(text) <= max_chars:
+            return text
+        # Leave headroom for the marker; clamp so tiny budgets never slice from the end.
+        keep = max(0, max_chars - 20)
+        return text[:keep].rstrip() + "\n[truncated]"
+
+    @staticmethod
+    def _format_final_cycle_packets(packets: list[dict[str, Any]]) -> str:
+        """Render historical final-cycle packets as numbered feedback blocks.
+
+        Each block carries the packet summary and the formatted dict entries of
+        its ``attempts`` list (non-list values count as no attempts), followed
+        by a ``---`` separator line.
+        """
+        rendered: list[str] = []
+        for position, packet in enumerate(packets, start=1):
+            raw_attempts = packet.get("attempts")
+            if isinstance(raw_attempts, list):
+                attempt_dicts = [dict(entry) for entry in raw_attempts if isinstance(entry, dict)]
+            else:
+                attempt_dicts = []
+            summary_line = f"Summary: {_remove_attempt_count_language(packet.get('summary', ''))}"
+            feedback_text = LeanOJContextManager._format_attempts(attempt_dicts)
+            lines = [
+                f"FINAL-CYCLE FEEDBACK {position}",
+                summary_line,
+                "Recent verification/edit feedback:",
+                feedback_text,
+                "---",
+            ]
+            rendered.append("\n".join(lines))
+        return "\n".join(rendered)
+
+    @staticmethod
+    def _format_verified_subproofs(subproofs: list[dict[str, Any]]) -> str:
+        """Render verified subproofs as numbered ``SUBPROOF`` blocks.
+
+        Each block lists the request, role, theorem/lemma, the optional Lean
+        verifier feedback, and the Lean code, and ends with a ``---`` line.
+        """
+        rendered: list[str] = []
+        for position, entry in enumerate(subproofs, start=1):
+            lines = [
+                f"SUBPROOF {position}: {entry.get('request', '')}",
+                f"Role: {entry.get('role', '')}",
+                f"Theorem/Lemma: {entry.get('theorem_or_lemma', '')}",
+            ]
+            verifier_notes = str(entry.get("lean_feedback") or "").strip()
+            if verifier_notes:
+                lines.extend(("Lean verifier feedback:", verifier_notes))
+            lines.extend(("Verified Lean 4 code:", str(entry.get("lean_code") or ""), "---"))
+            rendered.append("\n".join(lines))
+        return "\n".join(rendered)
+
+    @staticmethod
+    def _final_mode_text(value: Any) -> str:
+        """Rewrite brainstorm wording for final-solver context.
+
+        ``value`` is stringified (falsy values become ``""``), the substitutions
+        below are applied in order, and the result is passed through
+        ``_remove_attempt_count_language``.
+        """
+        # Order matters: the path-option token must be rewritten before the bare word.
+        substitutions = (
+            ("need_more_brainstorming", "additional proof context"),
+            ("Brainstorm", "Proof memory"),
+            ("brainstorm", "proof memory"),
+            ("BRAINSTORM", "PROOF MEMORY"),
+        )
+        cleaned = str(value or "")
+        for needle, replacement in substitutions:
+            cleaned = cleaned.replace(needle, replacement)
+        return _remove_attempt_count_language(cleaned)
+
+    @classmethod
+    def _format_verified_subproofs_for_final(cls, subproofs: list[dict[str, Any]]) -> str:
+        """Render verified subproofs for the final solver.
+
+        Same block layout as ``_format_verified_subproofs`` minus the ``Role``
+        line; request, theorem/lemma, and feedback go through
+        ``_final_mode_text`` while the Lean code is emitted untouched.
+        """
+        rendered: list[str] = []
+        for position, entry in enumerate(subproofs, start=1):
+            verifier_notes = cls._final_mode_text(entry.get("lean_feedback") or "").strip()
+            lines = [
+                f"SUBPROOF {position}: {cls._final_mode_text(entry.get('request', ''))}",
+                f"Theorem/Lemma: {cls._final_mode_text(entry.get('theorem_or_lemma', ''))}",
+            ]
+            if verifier_notes:
+                lines.extend(("Lean verifier feedback:", verifier_notes))
+            lines.extend(("Verified Lean 4 code:", str(entry.get("lean_code") or ""), "---"))
+            rendered.append("\n".join(lines))
+        return "\n".join(rendered)
+
+    @staticmethod
+    def _format_partial_proofs(partial_proofs: list[dict[str, Any]]) -> str:
+        """Render Lean-accepted partial proofs as numbered ``PARTIAL PROOF`` blocks.
+
+        Each block lists the request, target, placeholder tokens (``unknown``
+        when none are recorded), summary, and the scaffold code, and ends with
+        a ``---`` line.
+
+        Placeholder tokens are stringified before joining, and a single string
+        value is treated as one token rather than being split into characters.
+        """
+        blocks: list[str] = []
+        for index, proof in enumerate(partial_proofs, start=1):
+            raw_tokens = proof.get("placeholder_tokens") or []
+            if isinstance(raw_tokens, str):
+                raw_tokens = [raw_tokens]
+            placeholders = ", ".join(str(token) for token in raw_tokens) or "unknown"
+            blocks.append(
+                "\n".join(
+                    [
+                        f"PARTIAL PROOF {index}: {proof.get('request', '')}",
+                        f"Target: {proof.get('target', '')}; placeholders: {placeholders}",
+                        f"Summary: {proof.get('summary', '')}",
+                        "Lean-accepted incomplete scaffold:",
+                        str(proof.get("lean_code") or ""),
+                        "---",
+                    ]
+                )
+            )
+        return "\n".join(blocks)
+
+    @classmethod
+    def _format_partial_proofs_for_final(cls, partial_proofs: list[dict[str, Any]]) -> str:
+        """Render partial proofs for the final solver.
+
+        Each block lists the request, placeholder tokens (``unknown`` when none
+        are recorded), summary, and the scaffold code, and ends with a ``---``
+        line. Request and summary go through ``_final_mode_text``; the Lean code
+        is emitted untouched.
+
+        Placeholder tokens are stringified before joining, and a single string
+        value is treated as one token rather than being split into characters.
+        """
+        blocks: list[str] = []
+        for index, proof in enumerate(partial_proofs, start=1):
+            raw_tokens = proof.get("placeholder_tokens") or []
+            if isinstance(raw_tokens, str):
+                raw_tokens = [raw_tokens]
+            placeholders = ", ".join(str(token) for token in raw_tokens) or "unknown"
+            blocks.append(
+                "\n".join(
+                    [
+                        f"PARTIAL PROOF {index}: {cls._final_mode_text(proof.get('request', ''))}",
+                        f"Placeholders: {placeholders}",
+                        f"Summary: {cls._final_mode_text(proof.get('summary', ''))}",
+                        "Lean-accepted incomplete scaffold:",
+                        str(proof.get("lean_code") or ""),
+                        "---",
+                    ]
+                )
+            )
+        return "\n".join(blocks)
+
+    @staticmethod
+    def _format_final_cycle_packet(packet: dict[str, Any] | None) -> str:
+        """Render the current final-cycle packet as a feedback section.
+
+        A falsy packet yields ``""``. Otherwise the section contains the
+        formatted dict entries of ``attempts`` and of ``partial_proofs``
+        (``[none recorded]`` when no partial proof text is produced); non-list
+        values for either key count as empty.
+        """
+        if not packet:
+            return ""
+
+        raw_attempts = packet.get("attempts")
+        raw_partials = packet.get("partial_proofs")
+        attempt_dicts = (
+            [dict(entry) for entry in raw_attempts if isinstance(entry, dict)]
+            if isinstance(raw_attempts, list)
+            else []
+        )
+        partial_dicts = (
+            [dict(entry) for entry in raw_partials if isinstance(entry, dict)]
+            if isinstance(raw_partials, list)
+            else []
+        )
+
+        attempts_text = LeanOJContextManager._format_attempts(attempt_dicts)
+        scaffolds_text = LeanOJContextManager._format_partial_proofs(partial_dicts) or "[none recorded]"
+        section = [
+            "CURRENT FINAL-CYCLE FEEDBACK",
+            "This is the immediate final-loop feedback to use for repairing the current proof.",
+            attempts_text,
+            "Partial final scaffolds captured during this cycle:",
+            scaffolds_text,
+        ]
+        return "\n".join(section).strip()
+
+    @staticmethod
+    def _format_working_proof_attempt(packet: dict[str, Any] | None) -> str:
+        """Render the current working proof attempt packet as prompt text.
+
+        A falsy packet yields ``""``. The section lists trigger, requested path,
+        stuck reason, master-proof metadata and content, recent final-solver
+        feedback, reusable verified subproofs, and partial final scaffolds.
+        When ``old_attempt_before_redo`` is non-blank, a trailing reference
+        section describing the replaced attempt is appended.
+        """
+        if not packet:
+            return ""
+
+        def dict_entries(key: str) -> list[dict[str, Any]]:
+            # Only list-valued fields are used, and only their dict members are kept.
+            raw = packet.get(key)
+            if not isinstance(raw, list):
+                return []
+            return [dict(entry) for entry in raw if isinstance(entry, dict)]
+
+        helper_block = LeanOJContextManager._format_verified_subproofs(dict_entries("verified_subproofs"))
+        scaffold_block = LeanOJContextManager._format_partial_proofs(dict_entries("partial_final_proofs"))
+        metadata_line = (
+            "Master proof metadata: "
+            f"version={packet.get('master_proof_version', 0)}, "
+            f"lines={packet.get('master_proof_line_count', 0)}, "
+            f"sha256={packet.get('master_proof_hash', '')}"
+        )
+
+        sections = [
+            "CURRENT WORKING PROOF ATTEMPT",
+            "This is the proof attempt the next LeanOJ brainstorm must repair or complete directly.",
+            f"Trigger: {packet.get('trigger', '')}",
+            f"Requested path: {packet.get('requested_path', '')}",
+            f"Stuck reason: {_remove_attempt_count_language(packet.get('stuck_reason', ''))}",
+            metadata_line,
+            f"Last edit summary: {packet.get('master_proof_last_edit_summary', '')}",
+            "Latest master_proof.lean:",
+            str(packet.get("master_proof") or "[not initialized]").strip(),
+            "Recent final solver feedback:",
+            str(packet.get("recent_final_attempts") or "[none recorded]").strip(),
+            "Verified helper subproofs available to reuse:",
+            helper_block or "[none recorded]",
+            "Lean-accepted partial final scaffolds:",
+            scaffold_block or "[none recorded]",
+        ]
+
+        previous_attempt = str(packet.get("old_attempt_before_redo") or "").strip()
+        if previous_attempt:
+            redo_justification = str(
+                packet.get("old_attempt_before_redo_validator_justification") or ""
+            ).strip()
+            redo_issue = str(packet.get("old_attempt_before_redo_apparent_issue") or "").strip()
+            previous_metadata = (
+                "Old attempt metadata: "
+                f"lines={packet.get('old_attempt_before_redo_line_count', 0)}, "
+                f"chars={packet.get('old_attempt_before_redo_char_count', 0)}, "
+                f"sha256={packet.get('old_attempt_before_redo_hash', '')}"
+            )
+            sections.extend(
+                [
+                    "",
+                    "OLD ATTEMPT THE SUBMITTER DECIDED TO REDO (preserved for reference only; do NOT revert to this):",
+                    f"Original version: v{packet.get('old_attempt_before_redo_version', '?')}",
+                    previous_metadata,
+                    f"Summary: {packet.get('old_attempt_before_redo_summary', '')}",
+                    "WHY THE VALIDATOR ALLOWED THIS REDO/SHORTENING:",
+                    redo_justification or "[No validator justification was recorded.]",
+                    "APPARENT ISSUE WITH THIS OLD LONGER ATTEMPT:",
+                    redo_issue or "[No apparent issue was recorded.]",
+                    "Old proof content:",
+                    previous_attempt,
+                ]
+            )
+        return "\n".join(sections).strip()
+
+
+# Module-level LeanOJContextManager instance, created once at import time.
+leanoj_context_manager = LeanOJContextManager()
\ No newline at end of file
diff --git a/backend/leanoj/core/leanoj_coordinator.py b/backend/leanoj/core/leanoj_coordinator.py
new file mode 100644
index 0000000..52cc4e8
--- /dev/null
+++ b/backend/leanoj/core/leanoj_coordinator.py
@@ -0,0 +1,5084 @@
+"""Coordinator for the additive LeanOJ proof-solver mode."""
+from __future__ import annotations
+
+import asyncio
+import hashlib
+import json
+import logging
+import re
+import shutil
+import time
+import uuid
+from datetime import datetime
+from pathlib import Path
+from typing import Any, Awaitable, Callable, Optional
+
+import aiofiles
+
+from backend.leanoj.core.leanoj_context import (
+    ARTIFACT_ACCEPTED_IDEAS,
+    ARTIFACT_FAILED_SUBPROOFS,
+    ARTIFACT_FINAL_ATTEMPTS,
+    ARTIFACT_FINAL_CYCLE_PACKETS,
+    ARTIFACT_PARTIAL_PROOFS,
+    ARTIFACT_RECURSIVE_TOPICS,
+    ARTIFACT_VERIFIED_SUBPROOFS,
+    _remove_attempt_count_language,
+    leanoj_context_manager,
+)
+from backend.leanoj.prompts import (
+    build_brainstorm_batch_validation_prompt,
+    build_brainstorm_prompt,
+    build_brainstorm_prune_review_prompt,
+    build_brainstorm_prune_validation_prompt,
+    build_brainstorm_validation_prompt,
+    build_final_solution_review_prompt,
+    build_final_solver_prompt,
+    build_master_proof_edit_validation_prompt,
+    build_path_decision_prompt,
+    build_path_validation_prompt,
+    build_sufficiency_prompt,
+    build_topic_batch_validation_prompt,
+    build_topic_candidate_prompt,
+    build_topic_selection_prompt,
+    build_topic_validation_prompt,
+)
+from backend.autonomous.memory.autonomous_api_logger import autonomous_api_logger
+from backend.autonomous.memory.proof_database import proof_database
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.brainstorm_proof_gate import is_lean_proof_submission, verify_brainstorm_proof_candidate
+from backend.shared.config import rag_config, system_config
+from backend.shared.json_parser import parse_json
+from backend.shared.lean4_client import Lean4Result, get_lean4_client
+from backend.shared.lean_proof_integrity import strip_lean_comments_and_strings, validate_lean_proof_integrity
+from backend.shared.model_error_utils import is_non_retryable_model_error
+from backend.shared.models import (
+    LeanOJAttemptRecord,
+    LeanOJRoleConfig,
+    LeanOJStartRequest,
+    LeanOJState,
+    LeanOJSubproofRecord,
+    ModelConfig,
+    ProofAttemptFeedback,
+    ProofRecord,
+    WorkflowTask,
+)
+from backend.shared.token_tracker import token_tracker
+from backend.shared.utils import count_tokens
+
+logger = logging.getLogger(__name__)
+
+# Optional async callback taking a string and a dict payload.
+BroadcastFn = Optional[Callable[[str, dict[str, Any]], Awaitable[None]]]
+# Matches `sorry` / `admit` only as standalone tokens: not adjacent to identifier
+# characters or an apostrophe on either side.
+_LEAN_PLACEHOLDER_RE = re.compile(r"(?<![A-Za-z0-9_'])(sorry|admit)(?![A-Za-z0-9_'])")
+# Declaration keywords shared by the two declaration regexes below.
+_LEAN_TOP_LEVEL_DECL_KINDS = (
+    "abbrev",
+    "axiom",
+    "class",
+    "constant",
+    "def",
+    "example",
+    "inductive",
+    "instance",
+    "lemma",
+    "opaque",
+    "structure",
+    "theorem",
+)
+_LEAN_TOP_LEVEL_DECL_KIND_PATTERN = "|".join(_LEAN_TOP_LEVEL_DECL_KINDS)
+# Multiline: matches any line that begins (after optional whitespace) with an optional
+# `open Classical in`, optional `@[...]` attributes, optional modifiers, then a
+# declaration keyword.
+_LEAN_TOP_LEVEL_DECL_RE = re.compile(
+    r"(?m)^\s*(?:open\s+Classical\s+in\s+)?(?:@\[[^\]]+\]\s*)*(?:(?:private|protected|noncomputable|unsafe)\s+)*"
+    rf"(?:{_LEAN_TOP_LEVEL_DECL_KIND_PATTERN})\b"
+)
+# Same prefix as above but anchored at the start of the string (no multiline flag);
+# captures the declaration `kind` and, when present, its `name` (plain or «quoted»).
+_LEAN_DECL_KEY_RE = re.compile(
+    r"^\s*(?:open\s+Classical\s+in\s+)?(?:@\[[^\]]+\]\s*)*(?:(?:private|protected|noncomputable|unsafe)\s+)*"
+    rf"(?P<kind>{_LEAN_TOP_LEVEL_DECL_KIND_PATTERN})\s+(?P<name>[A-Za-z_][A-Za-z0-9_'.]*|«[^»]+»)?",
+    re.DOTALL,
+)
+_TERMINAL_PHASES = {"verified"}
+_ACTIVE_PHASES = {
+    "initial_topic_candidates",
+    "initial_brainstorm",
+    "path_decision",
+    "recursive_brainstorm",
+    "final_proof_loop",
+}
+# NOTE(review): "verified" has no entry here and rank 6 is unused - confirm lookups
+# for the terminal phase are handled by the code that reads this table.
+_PHASE_PROGRESS_RANK = {
+    "idle": 0,
+    "initial_topic_candidates": 1,
+    "initial_brainstorm": 2,
+    "recursive_brainstorm": 3,
+    "path_decision": 4,
+    "final_proof_loop": 5,
+    "error": 7,
+    "stopped": 7,
+}
+# Tuple keeps a fixed order; the set is for membership checks.
+_LEANOJ_PATH_OPTIONS = ("solve_final_now", "need_more_brainstorming")
+_LEANOJ_PATH_OPTIONS_SET = set(_LEANOJ_PATH_OPTIONS)
+_LEANOJ_PROOF_EDIT_ACTIONS = {"edit_proof"}
+_LEANOJ_PROOF_EDIT_OPERATIONS = {"full_content", "replace", "insert_after", "delete"}
+# Numeric limits for master-proof editing; their consumers are outside this section.
+_MASTER_PROOF_EDIT_LOG_COMPACT_RECORD_LIMIT = 500
+_MASTER_PROOF_EDIT_LOG_RECENT_RECORDS_TO_KEEP = 150
+_MASTER_PROOF_NO_PROGRESS_LIMIT = 8
+_MASTER_PROOF_STALE_EDIT_FAILURE_HANDOFF_COUNT = 3
+_MASTER_PROOF_EDIT_SUMMARY_LIMIT = 1000
+_MASTER_PROOF_SHORTENING_CHAR_THRESHOLD = 80
+_LEANOJ_CONTEXT_ROLES = {"active_plan", "verified_hint", "refuted_construction", "scratch"}
+_LEANOJ_FINAL_ACTIVE_CONTEXT_ROLES = {"active_plan"}
+# Lower-case phrases; presumably matched against text to classify it as a refuted
+# construction - TODO confirm against the code that reads this tuple.
+_LEANOJ_REFUTED_CONTEXT_TERMS = (
+    "counterexample",
+    "refuted",
+    "do not use",
+    "fails at",
+    "fails for",
+    "falsified",
+    "false construction",
+    "invalid construction",
+    "construction is invalid",
+    "candidate is invalid",
+)
+# Lower-case phrases; presumably matched against text to classify it as an active
+# plan - TODO confirm against the code that reads this tuple.
+_LEANOJ_ACTIVE_PLAN_CONTEXT_TERMS = (
+    "active proof plan",
+    "current proof route",
+    "chosen proof route",
+    "current chosen proof route",
+    "master proof route",
+    "next obligation",
+)
+
+
+class LeanOJConfigurationError(RuntimeError):
+    """Non-retryable LeanOJ configuration problem.
+
+    Subclasses ``RuntimeError``, so handlers that catch ``RuntimeError`` also
+    catch this exception.
+    """
+
+
+# Queue item shape: element 0 is the submitter index (the queue keys its per-submitter
+# counts on it); the string and dict elements are opaque to the queue itself.
+_BrainstormSubmission = tuple[int, str, dict[str, Any]]
+
+
+class _LeanOJBrainstormSubmissionQueue:
+    """LeanOJ-local pending queue with aggregator-style fairness accounting."""
+
+    def __init__(self, submitter_count: int) -> None:
+        """Create an empty, unbounded queue with per-submitter pending counters.
+
+        ``submitter_count`` is stored for the fairness check in
+        ``should_pause_submitter``.
+        """
+        self.queue: asyncio.Queue[_BrainstormSubmission] = asyncio.Queue()
+        self.submitter_count = submitter_count
+        # submitter index -> number of that submitter's items currently queued
+        self.pending_by_submitter: dict[int, int] = {}
+        # Pause flags start cleared; they are not modified by the methods shown here.
+        self.global_paused = False
+        self.paused_submitters: set[int] = set()
+
+    def qsize(self) -> int:
+        return self.queue.qsize()
+
+    def count_for_submitter(self, submitter_index: int) -> int:
+        return self.pending_by_submitter.get(submitter_index, 0)
+
+    def should_pause_submitter(self, submitter_index: int) -> bool:
+        if self.qsize() >= system_config.queue_overflow_threshold:
+            return True
+        if self.submitter_count <= 1:
+            return False
+        return (
+            self.count_for_submitter(submitter_index)
+            > system_config.per_submitter_queue_threshold
+        )
+
+    async def put(self, item: _BrainstormSubmission) -> None:
+        await self.queue.put(item)
+        submitter_index = item[0]
+        self.pending_by_submitter[submitter_index] = (
+            self.pending_by_submitter.get(submitter_index, 0) + 1
+        )
+
+    async def dequeue_batch(
+        self,
+        *,
+        max_count: int = 3,
+        timeout: float = 1.0,
+        collect_window: float = 0.25,
+    ) -> list[_BrainstormSubmission]:
+        try:
+            first = await asyncio.wait_for(self.queue.get(), timeout=timeout)
+        except asyncio.TimeoutError:
+            return []
+
+        batch = [first]
+        self._decrement_submitter(first[0])
+        deadline = time.monotonic() + collect_window
+        while len(batch) < max_count:
+            try:
+                item = self.queue.get_nowait()
+                batch.append(item)
+                self._decrement_submitter(item[0])
+                continue
+            except asyncio.QueueEmpty:
+                pass
+
+            remaining = deadline - time.monotonic()
+            if remaining <= 0:
+                break
+            try:
+                item = await asyncio.wait_for(self.queue.get(), timeout=remaining)
+                batch.append(item)
+                self._decrement_submitter(item[0])
+            except asyncio.TimeoutError:
+                break
+        return batch
+
+    def refresh_pause_transitions(self) -> dict[str, Any]:
+        queue_size = self.qsize()
+        next_global_paused = queue_size >= system_config.queue_overflow_threshold
+        next_paused_submitters = self._current_paused_submitters()
+
+        transitions = {
+            "queue_size": queue_size,
+            "global_paused": next_global_paused,
+            "global_changed": next_global_paused != self.global_paused,
+            "submitters_paused": next_paused_submitters - self.paused_submitters,
+            "submitters_resumed": self.paused_submitters - next_paused_submitters,
+        }
+        self.global_paused = next_global_paused
+        self.paused_submitters = next_paused_submitters
+        return transitions
+
+    def _current_paused_submitters(self) -> set[int]:
+        if self.submitter_count <= 1:
+            return set()
+        return {
+            submitter_index
+            for submitter_index, pending_count in self.pending_by_submitter.items()
+            if pending_count > system_config.per_submitter_queue_threshold
+        }
+
+    def _decrement_submitter(self, submitter_index: int) -> None:
+        pending_count = self.pending_by_submitter.get(submitter_index, 0)
+        if pending_count <= 1:
+            self.pending_by_submitter.pop(submitter_index, None)
+            return
+        self.pending_by_submitter[submitter_index] = pending_count - 1
+
+
+class LeanOJCoordinator:
+    """Run the proof-only LeanOJ workflow as an isolated third mode."""
+
+    def __init__(self) -> None:
+        """Create an idle coordinator with empty in-memory session state."""
+        # Run-control state: lifecycle flag, persisted state model, the last
+        # start request, the cooperative stop signal and the background task.
+        self._running = False
+        self._state = LeanOJState()
+        self._request: Optional[LeanOJStartRequest] = None
+        self._stop_event = asyncio.Event()
+        self._main_task: Optional[asyncio.Task] = None
+        self._broadcast_callback: BroadcastFn = None
+        self._task_sequences: dict[str, int] = {}
+
+        # Proof context accumulated over the session.
+        self._validated_topics: list[str] = []
+        self._recursive_topics: list[str] = []
+        self._accepted_ideas: list[str] = []
+        self._accepted_idea_records: list[dict[str, Any]] = []
+        self._failed_feedback: list[dict[str, Any]] = []
+        self._last_brainstorm_validation_decisions: list[dict[str, Any]] = []
+        self._final_attempts: list[dict[str, Any]] = []
+        self._final_context_events: list[dict[str, Any]] = []
+        self._partial_proofs: list[dict[str, Any]] = []
+        self._final_cycle_packets: list[dict[str, Any]] = []
+        self._current_final_cycle_packet: Optional[dict[str, Any]] = None
+        self._current_working_proof_attempt: Optional[dict[str, Any]] = None
+
+        # Workflow task tracking and master-proof progress counters.
+        self.workflow_tasks: list[WorkflowTask] = []
+        self.completed_task_ids: set[str] = set()
+        self.current_task_id: Optional[str] = None
+        self._restored_from_disk = False
+        self._master_proof_no_progress_count = 0
+        self._last_master_proof_edit_signature = ""
+
+    @property
+    def is_running(self) -> bool:
+        """Whether ``start()`` is currently executing the workflow."""
+        return self._running
+
+    @property
+    def is_active(self) -> bool:
+        """Whether a run is in progress or its background task is unfinished."""
+        task = self._main_task
+        task_pending = task is not None and not task.done()
+        return self._running or task_pending
+
+    def set_broadcast_callback(self, callback: Callable[[str, dict[str, Any]], Awaitable[None]]) -> None:
+        """Register the coroutine used to publish ``(event, data)`` updates."""
+        self._broadcast_callback = callback
+
+    async def _broadcast(self, event: str, data: Optional[dict[str, Any]] = None) -> None:
+        """Publish ``event`` through the registered callback, if there is one.
+
+        A missing or empty ``data`` is sent as an empty dict.
+        """
+        publish = self._broadcast_callback
+        if not publish:
+            return
+        await publish(event, data or {})
+
+    def get_state(self) -> LeanOJState:
+        """Return the coordinator's live state object (not a copy)."""
+        return self._state
+
+    def get_status(self) -> dict[str, Any]:
+        """Build the JSON-ready status payload for API and broadcast consumers.
+
+        Starts from the dumped state model and layers the in-memory session
+        collections on top; the longer histories are truncated to their most
+        recent entries (20, or 5 for final-cycle packets).
+        """
+        self._ensure_accepted_idea_records()
+        state = self._state
+        status = state.model_dump(mode="json")
+
+        status["validated_topics"] = list(self._validated_topics)
+        status["accepted_ideas"] = list(self._accepted_ideas)
+        status["accepted_idea_records"] = list(self._accepted_idea_records)
+        status["failed_feedback"] = list(self._failed_feedback[-20:])
+        status["final_attempts"] = list(self._final_attempts[-20:])
+        status["final_context_events"] = list(self._final_context_events[-20:])
+        status["partial_proofs"] = list(self._partial_proofs[-20:])
+        status["final_cycle_packets"] = list(self._final_cycle_packets[-5:])
+        status["current_final_cycle_packet"] = self._current_final_cycle_packet
+        status["current_working_proof_attempt"] = self._current_working_proof_attempt
+        status["workflow_tasks"] = [task.model_dump(mode="json") for task in self.workflow_tasks]
+
+        # Resumable only with a stored request, a non-terminal phase and no
+        # final solution yet.
+        can_resume = (
+            self._request is not None
+            and state.phase not in _TERMINAL_PHASES
+            and not state.final_solution
+        )
+        status["resume_available"] = can_resume
+        return status
+
+    async def restore_latest_session(self, *, auto_resume: bool = False) -> bool:
+        """Restore the latest saved LeanOJ session and optionally resume it.
+
+        Args:
+            auto_resume: When true, start the workflow in the background if the
+                restored session has a request, is not in a terminal phase and
+                has no final solution.
+
+        Returns:
+            True if a session was restored; False if the coordinator is active,
+            no state file exists, or the file could not be loaded.
+        """
+        if self.is_active:
+            return False
+
+        # Prefer a resumable session; otherwise fall back to the newest file.
+        state_file = self._find_best_resumable_state_file() or self._find_latest_state_file()
+        if state_file is None:
+            return False
+
+        try:
+            async with aiofiles.open(state_file, "r", encoding="utf-8") as f:
+                payload = json.loads(await f.read())
+            self._restore_from_payload(payload)
+        except Exception as exc:
+            # Best-effort: an unreadable or corrupt file must not break the caller.
+            logger.warning("Failed to restore LeanOJ session from %s: %s", state_file, exc)
+            return False
+
+        logger.info(
+            "Restored LeanOJ session %s (phase=%s, accepted=%s, final_attempts=%s)",
+            self._state.session_id,
+            self._state.phase,
+            len(self._accepted_ideas),
+            self._state.final_attempt_count,
+        )
+
+        if (
+            auto_resume
+            and self._request is not None
+            and self._state.phase not in _TERMINAL_PHASES
+            and not self._state.final_solution
+        ):
+            logger.info("Auto-resuming interrupted Proof Solver session %s", self._state.session_id)
+            self.start_in_background()
+
+        return True
+
+    async def initialize(self, request: LeanOJStartRequest) -> None:
+        """Validate ``request`` and reset the coordinator for a brand-new session.
+
+        Every in-memory session collection is cleared, a fresh ``LeanOJState``
+        with a new session id is created, roles are configured from the
+        request, and the empty state is persisted.
+
+        Raises:
+            RuntimeError: If a run is already active.
+            ValueError: If the prompt, the template, the brainstorm submitters
+                or any required role model is missing.
+        """
+        if self.is_active:
+            raise RuntimeError("Proof Solver is already running")
+        if not request.user_prompt.strip():
+            raise ValueError("Proof Solver user prompt is required")
+        if not request.lean_template.strip():
+            raise ValueError("Proof Solver template is required")
+        if not request.brainstorm_submitters:
+            raise ValueError("At least one Proof Solver brainstorm submitter is required")
+        missing_roles = self._missing_model_roles(request)
+        if missing_roles:
+            raise ValueError(
+                "Proof Solver role model configuration is incomplete. Missing model for: "
+                + ", ".join(missing_roles)
+            )
+
+        self._request = request
+        self._stop_event = asyncio.Event()
+        self._task_sequences = {}
+        self._validated_topics = []
+        # Reset these too: they are created in __init__ alongside the other
+        # session collections, and a new session must not inherit them.
+        self._recursive_topics = []
+        self._accepted_ideas = []
+        self._accepted_idea_records = []
+        self._failed_feedback = []
+        self._last_brainstorm_validation_decisions = []
+        self._final_attempts = []
+        self._final_context_events = []
+        self._partial_proofs = []
+        self._final_cycle_packets = []
+        self._current_final_cycle_packet = None
+        self._current_working_proof_attempt = None
+        self.workflow_tasks = []
+        self.completed_task_ids = set()
+        self.current_task_id = None
+        self._restored_from_disk = False
+        self._master_proof_no_progress_count = 0
+        self._last_master_proof_edit_signature = ""
+
+        self._state = LeanOJState(
+            is_running=False,
+            phase="idle",
+            session_id=f"leanoj_{datetime.utcnow().strftime('%Y%m%d_%H%M%S')}_{uuid.uuid4().hex[:8]}",
+        )
+
+        self._configure_roles(request)
+        await self._persist_state()
+
+    async def resume_or_initialize(self, request: LeanOJStartRequest) -> bool:
+        """Resume matching saved progress when possible, otherwise create a new run.
+
+        Returns:
+            True when a matching saved session was restored and prepared for
+            resume; False when a fresh session was initialized instead
+            (no match found, or the matching file failed to load).
+
+        Raises:
+            RuntimeError: If a run is already active.
+            ValueError: If the prompt, the template, the brainstorm submitters
+                or any required role model is missing.
+        """
+        if self.is_active:
+            raise RuntimeError("Proof Solver is already running")
+        if not request.user_prompt.strip():
+            raise ValueError("Proof Solver user prompt is required")
+        if not request.lean_template.strip():
+            raise ValueError("Proof Solver template is required")
+        if not request.brainstorm_submitters:
+            raise ValueError("At least one Proof Solver brainstorm submitter is required")
+        missing_roles = self._missing_model_roles(request)
+        if missing_roles:
+            raise ValueError(
+                "Proof Solver role model configuration is incomplete. Missing model for: "
+                + ", ".join(missing_roles)
+            )
+
+        matching_state_file = self._find_best_matching_state_file(request)
+        if matching_state_file is None:
+            await self.initialize(request)
+            return False
+
+        try:
+            async with aiofiles.open(matching_state_file, "r", encoding="utf-8") as f:
+                payload = json.loads(await f.read())
+            self._restore_from_payload(payload)
+        except Exception as exc:
+            # A broken saved session degrades to a clean start rather than an error.
+            logger.warning("Failed to restore matching LeanOJ session from %s: %s", matching_state_file, exc)
+            await self.initialize(request)
+            return False
+
+        # Keep accumulated proof context, but let the restarted run use the
+        # latest model/fallback settings from the UI.
+        self._request = request
+        self._stop_event = asyncio.Event()
+        self._configure_roles(request)
+        self._restored_from_disk = True
+        await self._persist_state()
+        logger.info(
+            "Prepared LeanOJ session %s for resume from %s",
+            self._state.session_id,
+            matching_state_file,
+        )
+        return True
+
+    def start_in_background(self) -> bool:
+        """Schedule ``start()`` as a background task.
+
+        Returns False without scheduling anything when a previous background
+        task is still unfinished; otherwise returns True.
+        """
+        existing = self._main_task
+        if existing is not None and not existing.done():
+            return False
+        task = asyncio.create_task(self.start())
+        self._main_task = task
+        task.add_done_callback(self._on_task_done)
+        return True
+
+    def _on_task_done(self, task: asyncio.Task) -> None:
+        """Done-callback for the background task: log its outcome and release it."""
+        try:
+            # result() re-raises whatever ended the task, so it can be logged.
+            task.result()
+        except asyncio.CancelledError:
+            logger.info("LeanOJ coordinator task cancelled")
+        except Exception:
+            logger.exception("LeanOJ coordinator task failed")
+        finally:
+            # Only drop the reference if no newer task has replaced this one.
+            if self._main_task is task:
+                self._main_task = None
+
+    def _enable_api_logging(self) -> None:
+        """Install a logger callback on ``api_client_manager`` for this workflow.
+
+        The callback forwards each API call record to ``autonomous_api_logger``
+        tagged with ``workflow="leanoj"``.
+        """
+        async def log_callback(
+            task_id,
+            role_id,
+            model,
+            provider,
+            prompt,
+            response,
+            tokens_used,
+            duration_ms,
+            success,
+            error,
+            phase,
+        ):
+            try:
+                await autonomous_api_logger.log_api_call(
+                    task_id=task_id,
+                    role_id=role_id,
+                    model=model,
+                    provider=provider,
+                    prompt=prompt,
+                    response_content=response,
+                    tokens_used=tokens_used,
+                    duration_ms=duration_ms,
+                    success=success,
+                    error=error,
+                    # Fall back to the coordinator's phase, then a fixed label.
+                    phase=phase or self._state.phase or "leanoj",
+                    workflow="leanoj",
+                )
+            except Exception as exc:
+                # Logging is best-effort and must never fail the API call itself.
+                logger.error("Failed to log LeanOJ API call: %s", exc)
+
+        api_client_manager.set_autonomous_logger_callback(log_callback)
+        logger.info("LeanOJ API logging enabled")
+
+    async def start(self) -> None:
+        """Run the workflow to completion, stop, or failure.
+
+        Does nothing if a run is already in progress. Workflow exceptions are
+        recorded on the state and broadcast as ``leanoj_error``; cancellation
+        is re-raised. ``leanoj_stopped`` is always broadcast on exit.
+
+        Raises:
+            RuntimeError: If no request has been set via initialize/restore.
+        """
+        if self._request is None:
+            raise RuntimeError("LeanOJ coordinator must be initialized before start")
+        if self._running:
+            return
+
+        self._running = True
+        self._state.is_running = True
+        # Choose the entry phase: fresh sessions begin with topic candidates,
+        # while stopped/errored sessions resume from an inferred phase.
+        if self._state.phase == "idle":
+            self._state.phase = "initial_topic_candidates"
+        elif self._state.phase in {"stopped", "error"}:
+            self._state.phase = self._infer_resume_phase()
+        self._remember_active_phase()
+        self._state.updated_at = datetime.now()
+        self._state.last_error = ""
+        token_tracker.reset()
+        token_tracker.start_timer()
+        self._enable_api_logging()
+        await self._persist_and_broadcast("leanoj_started")
+
+        try:
+            await self._run_workflow(self._request)
+        except asyncio.CancelledError:
+            raise
+        except Exception as exc:
+            logger.exception("LeanOJ workflow failed")
+            self._state.phase = "error"
+            self._state.last_error = str(exc)
+            await self._persist_and_broadcast("leanoj_error", {"message": str(exc)})
+        finally:
+            # Runs on normal exit, error and cancellation alike.
+            self._running = False
+            self._state.is_running = False
+            if self._state.phase not in {"verified", "error"}:
+                self._remember_active_phase()
+            self._state.updated_at = datetime.now()
+            token_tracker.stop_timer()
+            api_client_manager.set_autonomous_logger_callback(None)
+            await self._persist_and_broadcast("leanoj_stopped")
+
+    async def stop(self) -> None:
+        """Request a stop, waiting briefly for the background task to finish.
+
+        Sets the stop event, gives the task up to 5 seconds to exit on its
+        own, and cancels it if it has not finished by then.
+        """
+        if not self.is_active and not self._state.session_id:
+            return
+        self._stop_event.set()
+        task = self._main_task
+        if task and not task.done():
+            try:
+                # shield() keeps the timeout from cancelling the task itself;
+                # cancellation happens explicitly below only after the timeout.
+                await asyncio.wait_for(asyncio.shield(task), timeout=5)
+            except asyncio.TimeoutError:
+                task.cancel()
+                await asyncio.gather(task, return_exceptions=True)
+        if not self._running:
+            # NOTE(review): when a live task was awaited above, start()'s
+            # finally block has already emitted leanoj_stopped, so this looks
+            # like a second emission — confirm listeners tolerate it.
+            self._state.is_running = False
+            if self._state.phase not in {"verified", "error"}:
+                self._remember_active_phase()
+            await self._persist_and_broadcast("leanoj_stopped")
+
+    async def clear(self) -> None:
+        """Clear Proof Solver progress. This is the explicit reset path.
+
+        Stops any active run, deletes the saved sessions and partial-proof
+        directories, clears the LeanOJ context manager, resets every in-memory
+        field to its constructor default and broadcasts ``leanoj_cleared``.
+        """
+        if self.is_active:
+            await self.stop()
+        base = self._sessions_base_dir()
+        if base.exists():
+            shutil.rmtree(base)
+        partial_base = self._partial_proofs_base_dir()
+        if partial_base.exists():
+            shutil.rmtree(partial_base)
+        await leanoj_context_manager.clear_all()
+
+        self._running = False
+        self._state = LeanOJState()
+        self._request = None
+        self._stop_event = asyncio.Event()
+        self._main_task = None
+        self._task_sequences = {}
+        self._validated_topics = []
+        # Reset these too: they are created in __init__ alongside the other
+        # session collections, so a full clear must not leave them populated.
+        self._recursive_topics = []
+        self._accepted_ideas = []
+        self._accepted_idea_records = []
+        self._failed_feedback = []
+        self._last_brainstorm_validation_decisions = []
+        self._final_attempts = []
+        self._final_context_events = []
+        self._partial_proofs = []
+        self._final_cycle_packets = []
+        self._current_final_cycle_packet = None
+        self._current_working_proof_attempt = None
+        self.workflow_tasks = []
+        self.completed_task_ids = set()
+        self.current_task_id = None
+        self._restored_from_disk = False
+        self._master_proof_no_progress_count = 0
+        self._last_master_proof_edit_signature = ""
+        await self._broadcast("leanoj_cleared", self.get_status())
+
+    async def skip_brainstorm(self) -> None:
+        """Flag a skip-brainstorm request; the workflow consumes it later."""
+        self._state.skip_brainstorm_requested = True
+        await self._persist_and_broadcast("leanoj_skip_brainstorm_requested")
+
+    async def force_brainstorm(self) -> None:
+        """Flag a force-brainstorm request; the workflow consumes it later."""
+        self._state.force_brainstorm_requested = True
+        await self._persist_and_broadcast("leanoj_force_brainstorm_requested")
+
+    async def _consume_skip_brainstorm(self) -> bool:
+        """Apply a pending skip request by jumping to the final proof loop.
+
+        Returns:
+            True if a request was pending and has been applied, else False.
+        """
+        if not self._state.skip_brainstorm_requested:
+            return False
+        self._state.skip_brainstorm_requested = False
+        self._state.current_path_decision = "solve_final_now"
+        self._state.user_forced_final_cycle = True
+        self._state.phase = "final_proof_loop"
+        await self._persist_and_broadcast("leanoj_brainstorm_skipped")
+        return True
+
+    async def _consume_force_brainstorm(self) -> bool:
+        """Apply a pending force request by switching to recursive brainstorming.
+
+        Also cancels any pending skip request and any user-forced final cycle.
+
+        Returns:
+            True if a request was pending and has been applied, else False.
+        """
+        if not self._state.force_brainstorm_requested:
+            return False
+        self._state.force_brainstorm_requested = False
+        self._state.skip_brainstorm_requested = False
+        self._state.user_forced_final_cycle = False
+        self._state.current_path_decision = "need_more_brainstorming"
+        # A user-forced recursive brainstorm is a fresh acceptance window.
+        # Otherwise the recursive sufficiency modulo can reuse the prior cycle's
+        # start count and fire before five new accepted brainstorms arrive.
+        self._state.active_brainstorm_phase = ""
+        self._state.active_brainstorm_start_count = self._state.brainstorm_acceptance_events
+        await self._set_current_working_proof_attempt(
+            trigger="user_force_brainstorm",
+            requested_path="need_more_brainstorming",
+            stuck_reason="User requested recursive brainstorming while preserving the current master proof draft.",
+        )
+        # The phase is switched only after the working proof attempt is recorded.
+        self._state.phase = "recursive_brainstorm"
+        await self._persist_and_broadcast("leanoj_brainstorm_forced")
+        return True
+
+    async def _run_workflow(self, request: LeanOJStartRequest) -> None:
+        """Drive the phase state machine until verified or asked to stop.
+
+        The first section runs whichever phase the session is currently in
+        (which supports resuming mid-way); the loop below then alternates
+        between path decisions, brainstorming and the final proof loop.
+        """
+        if self._state.phase in {"idle", "initial_topic_candidates"}:
+            selected_topic = await self._initial_topic_phase(request)
+            if self._should_stop():
+                return
+            self._state.selected_topic = selected_topic
+
+        # A pending user force-brainstorm request takes priority over the
+        # initial brainstorm.
+        if await self._consume_force_brainstorm():
+            pass
+        elif self._state.phase == "initial_brainstorm" or (
+            self._state.phase == "initial_topic_candidates" and self._state.selected_topic
+        ):
+            await self._initial_brainstorm_phase(request)
+
+        if self._state.phase == "recursive_brainstorm":
+            await self._recursive_brainstorm_phase(request)
+
+        if self._state.phase == "proof_storm":
+            # Legacy sessions may resume from the removed proof-only brainstorm path.
+            # Continue with recursive brainstorming because verified proofs can now
+            # be generated directly inside any brainstorm phase.
+            await self._recursive_brainstorm_phase(request)
+
+        if self._state.phase == "final_proof_loop":
+            await self._final_proof_loop(request)
+
+        while not self._should_stop() and self._state.phase != "verified":
+            if await self._consume_force_brainstorm():
+                continue
+
+            if self._state.phase == "final_proof_loop" or self._state.user_forced_final_cycle:
+                await self._final_proof_loop(request)
+                continue
+
+            if self._state.phase == "recursive_brainstorm":
+                await self._recursive_brainstorm_phase(request)
+                continue
+
+            if self._state.phase == "proof_storm":
+                await self._recursive_brainstorm_phase(request)
+                continue
+
+            # No phase-specific work is pending: ask which path to take next.
+            decision = await self._path_decision_phase(request)
+            if self._should_stop():
+                return
+
+            # The user may have forced a brainstorm while the decision was running.
+            if await self._consume_force_brainstorm():
+                continue
+
+            if decision == "solve_final_now":
+                await self._final_proof_loop(request)
+            elif decision == "need_more_brainstorming":
+                await self._recursive_brainstorm_phase(request)
+            else:
+                logger.warning("Unknown Proof Solver path decision %s; falling back to recursive brainstorming", decision)
+                await self._recursive_brainstorm_phase(request)
+
+    async def _initial_topic_phase(self, request: LeanOJStartRequest) -> str:
+        """Collect validated topic candidates and pick the one to start with.
+
+        Returns:
+            The selected topic; a fixed fallback topic when no validated topic
+            is available; or an empty string when a stop was requested.
+        """
+        self._state.phase = "initial_topic_candidates"
+        await self._persist_and_broadcast("leanoj_phase_changed")
+
+        if not await self._collect_initial_topics(request, target_topics=5):
+            return "Direct Proof Solver proof solving from the user's template"
+
+        if self._should_stop():
+            return ""
+        if not self._validated_topics:
+            return "Direct Proof Solver proof solving from the user's template"
+
+        selected_raw = await self._call_json(
+            request.topic_generator,
+            "leanoj_topic",
+            "leanoj_topic_selector",
+            build_topic_selection_prompt(request.user_prompt, request.lean_template, self._validated_topics),
+        )
+        # Fall back to the first validated topic if the selector returns nothing
+        # or if its choice fails re-validation.
+        selected = str(selected_raw.get("topic") or "").strip() or self._validated_topics[0]
+        if not await self._validate_topic(request, selected):
+            selected = self._validated_topics[0]
+
+        await self._persist_and_broadcast("leanoj_initial_topic_selected", {"topic": selected})
+        return selected
+
+    async def _validate_topic(
+        self,
+        request: LeanOJStartRequest,
+        topic: str,
+        accepted_topics: Optional[list[str]] = None,
+    ) -> bool:
+        """Ask the topic validator about one topic and record its verdict.
+
+        ``accepted_topics`` defaults to the coordinator's validated topics.
+        The verdict (with reasoning and summary) replaces
+        ``_last_brainstorm_validation_decisions``.
+
+        Returns:
+            True only when the validator's decision is ``accept``.
+        """
+        prior_topics = self._validated_topics if accepted_topics is None else accepted_topics
+        prompt = build_topic_validation_prompt(
+            request.user_prompt,
+            request.lean_template,
+            topic,
+            prior_topics,
+        )
+        verdict = await self._call_json(
+            request.topic_validator,
+            "leanoj_topic_val",
+            "leanoj_topic_validator",
+            prompt,
+        )
+
+        def _text(key: str) -> str:
+            # Missing or falsy values normalise to an empty string.
+            return str(verdict.get(key) or "").strip()
+
+        is_accepted = _text("decision").lower() == "accept"
+        record = {
+            "accepted": is_accepted,
+            "reasoning": _text("reasoning"),
+            "summary": _text("summary"),
+        }
+        self._last_brainstorm_validation_decisions = [record]
+        return is_accepted
+
+    async def _validate_topic_batch(
+        self,
+        request: LeanOJStartRequest,
+        topics: list[str],
+        accepted_topics: Optional[list[str]] = None,
+    ) -> list[bool]:
+        """Validate several topics with one validator call.
+
+        A single topic is delegated to ``_validate_topic``. ``accepted_topics``
+        defaults to the coordinator's validated topics.
+
+        Returns:
+            One accept/reject flag per topic, in input order. The whole batch
+            is rejected when the validator's decision list is malformed, has
+            the wrong length, or is not numbered 1..N in order.
+        """
+        if not topics:
+            return []
+        if len(topics) == 1:
+            return [await self._validate_topic(request, topics[0], accepted_topics)]
+
+        raw = await self._call_json(
+            request.topic_validator,
+            "leanoj_topic_val",
+            "leanoj_topic_validator",
+            build_topic_batch_validation_prompt(
+                request.user_prompt,
+                request.lean_template,
+                topics,
+                accepted_topics if accepted_topics is not None else self._validated_topics,
+            ),
+        )
+        decisions = raw.get("decisions")
+        if not isinstance(decisions, list) or len(decisions) != len(topics):
+            logger.warning(
+                "LeanOJ topic batch validator returned %s decisions for %s topics",
+                len(decisions) if isinstance(decisions, list) else "non-list",
+                len(topics),
+            )
+            return [False for _ in topics]
+
+        accepted: list[bool] = []
+        for expected_number, decision_payload in enumerate(decisions, start=1):
+            if not isinstance(decision_payload, dict):
+                # A malformed entry rejects only its own topic.
+                accepted.append(False)
+                continue
+            # NOTE(review): the comparison is strict, so a validator that emits
+            # the number as a string (e.g. "1") is treated as out-of-order and
+            # rejects the whole batch — confirm that is intended.
+            if decision_payload.get("topic_number") != expected_number:
+                logger.warning(
+                    "LeanOJ topic batch validator returned out-of-order decision: expected %s, got %s",
+                    expected_number,
+                    decision_payload.get("topic_number"),
+                )
+                return [False for _ in topics]
+            accepted.append(str(decision_payload.get("decision") or "").strip().lower() == "accept")
+        return accepted
+
+    async def _collect_initial_topics(self, request: LeanOJStartRequest, *, target_topics: int) -> bool:
+        """Run the topic submitters in parallel until enough topics validate.
+
+        One submitter task is started per configured brainstorm submitter.
+        Candidates are drained from a bounded queue in batches of up to three
+        and validated; accepted ones are appended to ``_validated_topics``.
+
+        Returns:
+            False if a skip-brainstorm request is pending; otherwise whether at
+            least one topic has been validated.
+
+        Raises:
+            RuntimeError: If every submitter task has finished and at least one
+                of them ended with an exception.
+        """
+        if self._state.skip_brainstorm_requested:
+            await self._persist_and_broadcast("leanoj_brainstorm_skip_deferred")
+            return False
+
+        # Bounded queue, so submitters block in put() when validation lags behind.
+        topic_queue: asyncio.Queue[tuple[int, str]] = asyncio.Queue(
+            maxsize=max(3, len(request.brainstorm_submitters) * 2)
+        )
+        # Submitter indices are 1-based.
+        submitter_tasks = [
+            asyncio.create_task(
+                self._topic_submitter_loop(
+                    request,
+                    index,
+                    submitter,
+                    topic_queue,
+                    target_topics=target_topics,
+                )
+            )
+            for index, submitter in enumerate(request.brainstorm_submitters, start=1)
+        ]
+        logger.info(
+            "LeanOJ initial topic submitters started (submitters=%s, target_topics=%s)",
+            len(submitter_tasks),
+            target_topics,
+        )
+        await self._broadcast(
+            "leanoj_topic_submitters_started",
+            {
+                "submitter_count": len(submitter_tasks),
+                "target_topics": target_topics,
+            },
+        )
+
+        try:
+            while len(self._validated_topics) < target_topics and not self._should_stop():
+                if self._state.skip_brainstorm_requested:
+                    await self._persist_and_broadcast("leanoj_brainstorm_skip_deferred")
+                    return False
+
+                remaining_topics = target_topics - len(self._validated_topics)
+                batch = await self._dequeue_topic_batch(topic_queue, max_count=min(3, remaining_topics))
+                if not batch:
+                    # Nothing was dequeued this round. Give up only once every
+                    # submitter has finished; otherwise keep polling.
+                    if all(task.done() for task in submitter_tasks):
+                        errors = [
+                            task.exception()
+                            for task in submitter_tasks
+                            if task.done() and not task.cancelled() and task.exception() is not None
+                        ]
+                        if errors:
+                            raise RuntimeError(f"All LeanOJ topic submitters stopped: {errors[0]}")
+                        return bool(self._validated_topics)
+                    continue
+
+                topics = [topic for _, topic in batch]
+                logger.info(
+                    "LeanOJ topic batch validation started (batch_size=%s, submitters=%s)",
+                    len(batch),
+                    [submitter_index for submitter_index, _ in batch],
+                )
+                await self._broadcast(
+                    "leanoj_topic_batch_validation_started",
+                    {
+                        "batch_size": len(batch),
+                        "submitters": [submitter_index for submitter_index, _ in batch],
+                        "accepted_topics": len(self._validated_topics),
+                        "target_topics": target_topics,
+                    },
+                )
+                # The validator gets a snapshot of the accepted topics rather
+                # than the live list.
+                decisions = await self._validate_topic_batch(
+                    request,
+                    topics,
+                    accepted_topics=list(self._validated_topics),
+                )
+                for (submitter_index, topic), accepted in zip(batch, decisions):
+                    # Convert the 1-based submitter index back to a list position.
+                    submitter_config = request.brainstorm_submitters[submitter_index - 1]
+                    if accepted:
+                        self._validated_topics.append(topic)
+                        await self._persist_and_broadcast(
+                            "leanoj_topic_validated",
+                            {
+                                "topic": topic,
+                                "submitter": submitter_index,
+                                "submitter_id": submitter_index,
+                                "submitter_model": submitter_config.model_id,
+                                "submitter_provider": submitter_config.provider,
+                                "accepted_topics": len(self._validated_topics),
+                                "target_topics": target_topics,
+                            },
+                        )
+                    else:
+                        await self._broadcast(
+                            "leanoj_topic_rejected",
+                            {
+                                "topic": topic,
+                                "submitter": submitter_index,
+                                "submitter_id": submitter_index,
+                                "submitter_model": submitter_config.model_id,
+                                "submitter_provider": submitter_config.provider,
+                                "accepted_topics": len(self._validated_topics),
+                                "target_topics": target_topics,
+                            },
+                        )
+            return bool(self._validated_topics)
+        finally:
+            # Always stop the submitters, whichever way this method exits.
+            for task in submitter_tasks:
+                task.cancel()
+            await asyncio.gather(*submitter_tasks, return_exceptions=True)
+
+    async def _topic_submitter_loop(
+        self,
+        request: LeanOJStartRequest,
+        submitter_index: int,
+        submitter: LeanOJRoleConfig,
+        topic_queue: asyncio.Queue[tuple[int, str]],
+        *,
+        target_topics: int,
+    ) -> None:
+        """Produce topic candidates for one submitter until the run should stop.
+
+        Each iteration announces the attempt, asks ``submitter`` for a topic via
+        ``self._call_json`` and, when the reply carries a non-empty ``"topic"``,
+        puts ``(submitter_index, topic)`` on ``topic_queue``.
+
+        Args:
+            request: Supplies ``user_prompt`` and ``lean_template`` for the prompt.
+            submitter_index: Index used in the task/role ids and event payloads.
+            submitter: Role configuration handed to ``self._call_json``; its
+                ``model_id`` and ``provider`` are echoed in event payloads.
+            topic_queue: Destination for ``(submitter_index, topic)`` tuples.
+            target_topics: Cap applied to the reported ``topic_index``; also
+                echoed in the "generation started" payload.
+
+        Raises:
+            asyncio.CancelledError: Re-raised untouched.
+            LeanOJConfigurationError: Re-raised instead of being retried.
+        """
+        task_prefix = f"leanoj_topic_sub{submitter_index}"
+        role_id = f"leanoj_topic_submitter_{submitter_index}"
+        attempt = 0
+        while not self._should_stop():
+            try:
+                attempt += 1
+                # Reporting-only value: accepted + currently queued + 1, capped at
+                # target_topics. It is only used in the broadcast payload below.
+                topic_index = min(target_topics, len(self._validated_topics) + topic_queue.qsize() + 1)
+                await self._broadcast(
+                    "leanoj_topic_generation_started",
+                    {
+                        "attempt": attempt,
+                        "topic_index": topic_index,
+                        "target_topics": target_topics,
+                        "accepted_topics": len(self._validated_topics),
+                        "submitter": submitter_index,
+                        "submitter_id": submitter_index,
+                        "submitter_model": submitter.model_id,
+                        "submitter_provider": submitter.provider,
+                    },
+                )
+                # The already validated topics are passed into the prompt builder.
+                raw = await self._call_json(
+                    submitter,
+                    task_prefix,
+                    role_id,
+                    build_topic_candidate_prompt(
+                        request.user_prompt,
+                        request.lean_template,
+                        self._validated_topics,
+                    ),
+                    temperature=api_client_manager.parallel_brainstorm_submitter_temperature(submitter_index),
+                )
+
+                # A missing, falsy or whitespace-only "topic" counts as empty.
+                topic = str(raw.get("topic") or "").strip()
+                if not topic:
+                    await self._broadcast(
+                        "leanoj_topic_empty",
+                        {
+                            "attempt": attempt,
+                            "submitter": submitter_index,
+                            "submitter_id": submitter_index,
+                        },
+                    )
+                    # Try again immediately; nothing is queued for an empty reply.
+                    continue
+
+                await topic_queue.put((submitter_index, topic))
+                await self._broadcast(
+                    "leanoj_topic_candidate_queued",
+                    {
+                        "submitter": submitter_index,
+                        "submitter_id": submitter_index,
+                        "submitter_model": submitter.model_id,
+                        "submitter_provider": submitter.provider,
+                        "queue_size": topic_queue.qsize(),
+                        "topic_preview": self._summarize_error(topic, limit=220),
+                    },
+                )
+            except asyncio.CancelledError:
+                # Must not be swallowed by the generic handler below.
+                raise
+            except LeanOJConfigurationError:
+                # Configuration errors are not retried; they end this loop.
+                raise
+            except Exception as exc:
+                # Any other failure is reported and retried after a 2 second pause.
+                logger.warning("LeanOJ topic submitter %s failed: %s", submitter_index, exc)
+                await self._broadcast(
+                    "leanoj_topic_submitter_failed",
+                    {
+                        "submitter": submitter_index,
+                        "submitter_id": submitter_index,
+                        "message": str(exc),
+                    },
+                )
+                await asyncio.sleep(2)
+
+    async def _initial_brainstorm_phase(self, request: LeanOJStartRequest) -> None:
+        """Switch the run into the initial brainstorm phase and drive it.
+
+        Marks the phase on ``self._state``, opens the acceptance window for it,
+        announces ``leanoj_phase_changed`` and then runs the brainstorm loop
+        with a sufficiency check every 10 accepted events, capped by
+        ``request.max_initial_brainstorm_accepts``.
+        """
+        phase_name = "initial_brainstorm"
+        self._state.phase = phase_name
+        self._begin_brainstorm_acceptance_phase(phase_name)
+        await self._persist_and_broadcast("leanoj_phase_changed")
+
+        loop_options = {
+            "phase_key": phase_name,
+            "max_accepts": request.max_initial_brainstorm_accepts,
+            "sufficiency_interval": 10,
+            "force_after_max": True,
+        }
+        await self._brainstorm_until_path_check(request, **loop_options)
+
+    async def _recursive_brainstorm_phase(self, request: LeanOJStartRequest) -> None:
+        """Run (or resume) one recursive brainstorm cycle.
+
+        Returns immediately when a pending force- or skip-brainstorm request is
+        consumed. Otherwise the cycle counter is advanced unless the state is
+        already in the ``recursive_brainstorm`` phase (a resume), the phase
+        change and cycle start are announced, and the brainstorm loop runs with
+        a sufficiency check every 5 accepted events. When the run has not been
+        stopped, a completion event is emitted and, on every exit from the
+        guarded section, the current final-cycle packet is cleared.
+        """
+        phase_name = "recursive_brainstorm"
+
+        # Force is checked before skip; the second check only runs if the first is falsy.
+        if await self._consume_force_brainstorm() or await self._consume_skip_brainstorm():
+            return
+
+        is_resume = self._state.phase == phase_name
+        if is_resume:
+            start_label = "resumed"
+        else:
+            start_label = "started"
+            self._state.recursive_cycle_count += 1
+            self._state.active_brainstorm_phase = ""
+
+        self._state.phase = phase_name
+        self._begin_brainstorm_acceptance_phase(phase_name)
+        await self._persist_and_broadcast("leanoj_phase_changed")
+
+        # Baseline used to report how many acceptance events this cycle added.
+        baseline_events = self._state.brainstorm_acceptance_events
+        cycle_number = self._state.recursive_cycle_count
+        logger.info(
+            "LeanOJ recursive brainstorm cycle %s %s (accepted_events=%s)",
+            cycle_number,
+            start_label,
+            baseline_events,
+        )
+        started_payload = {
+            "cycle": cycle_number,
+            "resumed": is_resume,
+            "accepted_events": baseline_events,
+        }
+        await self._persist_and_broadcast("leanoj_recursive_brainstorm_started", started_payload)
+
+        try:
+            if await self._consume_skip_brainstorm():
+                return
+            await self._brainstorm_until_path_check(
+                request,
+                phase_key=phase_name,
+                max_accepts=request.max_recursive_brainstorm_accepts,
+                sufficiency_interval=5,
+                force_after_max=True,
+            )
+            if self._should_stop():
+                return
+
+            # State is re-read here because the loop above may have changed it.
+            finished_cycle = self._state.recursive_cycle_count
+            gained_events = self._state.brainstorm_acceptance_events - baseline_events
+            acceptance_total = self._state.accepted_brainstorm_count
+            logger.info(
+                "LeanOJ recursive brainstorm cycle %s completed (accepted_delta=%s, total_acceptances=%s)",
+                finished_cycle,
+                gained_events,
+                acceptance_total,
+            )
+            completed_payload = {
+                "cycle": finished_cycle,
+                "accepted_delta": gained_events,
+                "total_acceptances": acceptance_total,
+                "total_brainstorm_acceptance_events": self._state.brainstorm_acceptance_events,
+            }
+            await self._persist_and_broadcast("leanoj_recursive_brainstorm_completed", completed_payload)
+        finally:
+            if not self._should_stop():
+                self._clear_current_final_cycle_packet()
+
+    async def _brainstorm_until_path_check(
+        self,
+        request: LeanOJStartRequest,
+        *,
+        phase_key: str = "initial_brainstorm",
+        max_accepts: int,
+        sufficiency_interval: int,
+        force_after_max: bool,
+    ) -> None:
+        """Run the brainstorm produce/validate loop for one phase.
+
+        One submitter task is started per entry in
+        ``request.brainstorm_submitters``. This coroutine then repeatedly
+        dequeues batches of submissions, validates them and records each
+        result as accepted or rejected, until one of the exit conditions below
+        is met. Submitter tasks are always cancelled and awaited on exit.
+
+        Exit conditions:
+            * ``self._should_stop()`` becomes true;
+            * a force- or skip-brainstorm request is consumed (no exit review);
+            * ``force_after_max`` is set and the phase gained at least
+              ``max_accepts`` acceptance events;
+            * a periodic sufficiency check reports ``enough``;
+            * every submitter task has finished and the queue yields nothing.
+
+        Args:
+            request: Run configuration (submitters, validator, prompts).
+            phase_key: Phase label used in logs, events and recorded ideas.
+            max_accepts: Acceptance-event budget for this phase.
+            sufficiency_interval: Run a sufficiency check whenever the number
+                of acceptance events gained in this phase is a positive
+                multiple of this value. Must be non-zero (used as a modulus).
+            force_after_max: Whether reaching ``max_accepts`` ends the phase.
+
+        Raises:
+            RuntimeError: If all submitter tasks ended and at least one of
+                them ended with an exception.
+        """
+        # Baseline acceptance-event count for this phase, as supplied by the helper.
+        accepted_at_start = self._get_brainstorm_acceptance_start(phase_key)
+        # Set to True only on exits that should trigger the phase-exit prune
+        # review performed in the ``finally`` block.
+        run_exit_review = False
+        submission_queue = _LeanOJBrainstormSubmissionQueue(
+            submitter_count=len(request.brainstorm_submitters)
+        )
+        # Submitter indices are 1-based (enumerate start=1).
+        submitter_tasks = [
+            asyncio.create_task(
+                self._brainstorm_submitter_loop(request, index, submitter, submission_queue)
+            )
+            for index, submitter in enumerate(request.brainstorm_submitters, start=1)
+        ]
+        logger.info(
+            "LeanOJ brainstorm submitters started (phase=%s, submitters=%s, max_accepts=%s, accepted_at_start=%s)",
+            phase_key,
+            len(submitter_tasks),
+            max_accepts,
+            accepted_at_start,
+        )
+        await self._broadcast(
+            "leanoj_brainstorm_submitters_started",
+            {
+                "phase": phase_key,
+                "submitter_count": len(submitter_tasks),
+                "max_accepts": max_accepts,
+                "accepted_at_start": accepted_at_start,
+            },
+        )
+
+        try:
+            while not self._should_stop():
+                # Operator overrides end the phase without an exit review.
+                if await self._consume_force_brainstorm():
+                    run_exit_review = False
+                    return
+                if await self._consume_skip_brainstorm():
+                    run_exit_review = False
+                    return
+
+                accepted_delta = self._state.brainstorm_acceptance_events - accepted_at_start
+                # Budget check at the top of the loop (also covers a phase that
+                # is entered with the budget already used up).
+                if accepted_delta >= max_accepts and force_after_max:
+                    run_exit_review = True
+                    logger.info(
+                        "LeanOJ brainstorm phase limit reached (phase=%s, accepted_delta=%s, max_accepts=%s)",
+                        phase_key,
+                        accepted_delta,
+                        max_accepts,
+                    )
+                    await self._broadcast(
+                        "leanoj_brainstorm_phase_limit_reached",
+                        {
+                            "phase": phase_key,
+                            "accepted_delta": accepted_delta,
+                            "max_accepts": max_accepts,
+                            "total_acceptances": self._state.accepted_brainstorm_count,
+                        },
+                    )
+                    self._finish_brainstorm_acceptance_phase_for_path_decision()
+                    return
+                # Periodic sufficiency check. The "last check" marker keeps the
+                # same acceptance-event count from being checked twice while
+                # the loop spins without new acceptances.
+                if (
+                    accepted_delta > 0
+                    and accepted_delta % sufficiency_interval == 0
+                    and self._state.brainstorm_acceptance_events
+                    != self._state.active_brainstorm_last_sufficiency_check_count
+                ):
+                    self._state.active_brainstorm_last_sufficiency_check_count = (
+                        self._state.brainstorm_acceptance_events
+                    )
+                    logger.info(
+                        "LeanOJ brainstorm sufficiency check started (phase=%s, accepted_delta=%s)",
+                        phase_key,
+                        accepted_delta,
+                    )
+                    await self._broadcast(
+                        "leanoj_sufficiency_check_started",
+                        {
+                            "phase": phase_key,
+                            "accepted_delta": accepted_delta,
+                            "total_acceptances": self._state.accepted_brainstorm_count,
+                        },
+                    )
+                    enough = await self._sufficiency_check(request)
+                    await self._persist_and_broadcast("leanoj_sufficiency_checked", {"enough": enough})
+                    if enough:
+                        run_exit_review = True
+                        self._finish_brainstorm_acceptance_phase_for_path_decision()
+                        return
+
+                batch = await self._dequeue_brainstorm_batch(submission_queue)
+                # Dequeuing may change pause state; announce any transitions.
+                await self._sync_brainstorm_queue_pause_state(submission_queue, phase_key)
+                if not batch:
+                    # Nothing to validate. If no submitter is still running the
+                    # phase can never progress, so end it here.
+                    if all(task.done() for task in submitter_tasks):
+                        errors = [
+                            task.exception()
+                            for task in submitter_tasks
+                            if task.done() and not task.cancelled() and task.exception() is not None
+                        ]
+                        if errors:
+                            # Only the first collected error is included in the message.
+                            raise RuntimeError(f"All LeanOJ brainstorm submitters stopped: {errors[0]}")
+                        run_exit_review = True
+                        self._finish_brainstorm_acceptance_phase_for_path_decision()
+                        return
+                    continue
+
+                # Each batch entry is (submitter_index, submission, metadata).
+                submissions = [submission for _, submission, _ in batch]
+                logger.info(
+                    "LeanOJ brainstorm batch validation started (phase=%s, batch_size=%s, submitters=%s)",
+                    phase_key,
+                    len(batch),
+                    [submitter_index for submitter_index, _, _ in batch],
+                )
+                await self._broadcast(
+                    "leanoj_brainstorm_batch_validation_started",
+                    {
+                        "phase": phase_key,
+                        "batch_size": len(batch),
+                        "submitters": [submitter_index for submitter_index, _, _ in batch],
+                    },
+                )
+                decisions = await self._validate_brainstorm_batch(request, submissions)
+                # Copy of the per-item feedback stored on self; presumably filled
+                # in by the validation call above (verify against its definition).
+                validation_decisions = list(self._last_brainstorm_validation_decisions)
+                # NOTE(review): zip() stops at the shorter sequence, so batch
+                # entries without a matching decision are silently not processed.
+                for batch_index, ((submitter_index, submission, metadata), accepted) in enumerate(
+                    zip(batch, decisions)
+                ):
+                    # submitter_index is 1-based, the list is 0-based.
+                    submitter_config = request.brainstorm_submitters[submitter_index - 1]
+                    if accepted:
+                        await self._record_accepted_brainstorm_proof(request, submitter_index, metadata)
+                        # Fall back to an empty dict when no feedback entry exists
+                        # for this batch position.
+                        validation_feedback = (
+                            validation_decisions[batch_index]
+                            if batch_index < len(validation_decisions)
+                            else {}
+                        )
+                        self._record_accepted_brainstorm_idea(
+                            submission,
+                            submitter_index,
+                            phase_key,
+                            validation_feedback,
+                        )
+                        # The acceptance total mirrors the size of the idea list.
+                        self._state.accepted_brainstorm_count = len(self._accepted_ideas)
+                        submission_preview = self._summarize_error(submission, limit=220)
+                        logger.info(
+                            "LeanOJ brainstorm ACCEPTED: Submitter %s [%s] (phase=%s, total_acceptances=%s, event=%s) - %s",
+                            submitter_index,
+                            submitter_config.model_id,
+                            phase_key,
+                            self._state.accepted_brainstorm_count,
+                            self._state.brainstorm_acceptance_events,
+                            submission_preview,
+                        )
+                        await self._persist_and_broadcast(
+                            "leanoj_brainstorm_accepted",
+                            {
+                                "submitter": submitter_index,
+                                "submitter_id": submitter_index,
+                                "submitter_model": submitter_config.model_id,
+                                "submitter_provider": submitter_config.provider,
+                                "submission": submission,
+                                "submission_preview": submission_preview,
+                                "phase": phase_key,
+                                "total_acceptances": self._state.accepted_brainstorm_count,
+                                "total_brainstorm_acceptance_events": self._state.brainstorm_acceptance_events,
+                            },
+                        )
+                        accepted_delta = self._state.brainstorm_acceptance_events - accepted_at_start
+                        # Scheduled prune review every 7 acceptance events gained
+                        # in this phase, at most once per event count.
+                        if (
+                            accepted_delta > 0
+                            and accepted_delta % 7 == 0
+                            and self._state.brainstorm_acceptance_events
+                            != self._state.active_brainstorm_last_prune_review_count
+                        ):
+                            self._state.active_brainstorm_last_prune_review_count = (
+                                self._state.brainstorm_acceptance_events
+                            )
+                            await self._perform_brainstorm_prune_review(
+                                request,
+                                phase_key,
+                                reason=f"scheduled review after {accepted_delta} accepted brainstorm events",
+                            )
+                        # Budget reached mid-batch: stop right away. Remaining
+                        # entries of this batch are not recorded.
+                        if (
+                            force_after_max
+                            and self._state.brainstorm_acceptance_events - accepted_at_start >= max_accepts
+                        ):
+                            run_exit_review = True
+                            self._finish_brainstorm_acceptance_phase_for_path_decision()
+                            return
+                    else:
+                        validation_feedback = (
+                            validation_decisions[batch_index]
+                            if batch_index < len(validation_decisions)
+                            else {}
+                        )
+                        self._state.rejected_brainstorm_count += 1
+                        self._record_brainstorm_rejection_feedback(
+                            submitter_index,
+                            submission,
+                            validation_feedback,
+                        )
+                        submission_preview = self._summarize_error(submission, limit=220)
+                        # Prefer the validator summary, then its reasoning, then a
+                        # generic message.
+                        rejection_reason = self._summarize_error(
+                            validation_feedback.get("summary")
+                            or validation_feedback.get("reasoning")
+                            or "Rejected by brainstorm validator.",
+                            limit=220,
+                        )
+                        logger.info(
+                            "LeanOJ brainstorm REJECTED: Submitter %s [%s] (phase=%s, total_rejections=%s) - %s",
+                            submitter_index,
+                            submitter_config.model_id,
+                            phase_key,
+                            self._state.rejected_brainstorm_count,
+                            rejection_reason,
+                        )
+                        await self._persist_and_broadcast(
+                            "leanoj_brainstorm_rejected",
+                            {
+                                "submitter": submitter_index,
+                                "submitter_id": submitter_index,
+                                "submitter_model": submitter_config.model_id,
+                                "submitter_provider": submitter_config.provider,
+                                "submission": submission,
+                                "submission_preview": submission_preview,
+                                "validator_reasoning": validation_feedback.get("reasoning", ""),
+                                "validator_summary": validation_feedback.get("summary", ""),
+                                "rejection_reason": rejection_reason,
+                                "phase": phase_key,
+                                "total_acceptances": self._state.accepted_brainstorm_count,
+                                "total_rejections": self._state.rejected_brainstorm_count,
+                            },
+                        )
+        finally:
+            # Always stop the producers; gather with return_exceptions=True so
+            # their cancellation/errors do not mask the original exit reason.
+            for task in submitter_tasks:
+                task.cancel()
+            await asyncio.gather(*submitter_tasks, return_exceptions=True)
+            accepted_delta = self._state.brainstorm_acceptance_events - accepted_at_start
+            # Phase-exit prune review: only for exits that asked for it, only
+            # when the run is still active, only if this phase accepted
+            # something, and not if a review already ran at this event count.
+            if (
+                run_exit_review
+                and not self._should_stop()
+                and accepted_delta > 0
+                and self._state.brainstorm_acceptance_events
+                != self._state.active_brainstorm_last_prune_review_count
+            ):
+                self._state.active_brainstorm_last_prune_review_count = (
+                    self._state.brainstorm_acceptance_events
+                )
+                await self._perform_brainstorm_prune_review(
+                    request,
+                    phase_key,
+                    reason=f"phase-exit review after {accepted_delta} accepted brainstorm events",
+                )
+
+    async def _wait_for_brainstorm_queue_turn(
+        self,
+        submission_queue: _LeanOJBrainstormSubmissionQueue,
+        submitter_index: int,
+    ) -> None:
+        """Block while the queue asks ``submitter_index`` to pause.
+
+        Polls every 2 seconds, announcing pause-state transitions on each
+        pass, and stops waiting as soon as the run should stop or the queue no
+        longer wants this submitter paused. Transitions are announced once
+        more before returning.
+        """
+        while True:
+            if self._should_stop():
+                break
+            if not submission_queue.should_pause_submitter(submitter_index):
+                break
+            # The phase label is re-read on every pass; it may change while waiting.
+            current_phase = self._state.active_brainstorm_phase or self._state.phase
+            await self._sync_brainstorm_queue_pause_state(submission_queue, current_phase)
+            await asyncio.sleep(2)
+
+        current_phase = self._state.active_brainstorm_phase or self._state.phase
+        await self._sync_brainstorm_queue_pause_state(submission_queue, current_phase)
+
+    async def _sync_brainstorm_queue_pause_state(
+        self,
+        submission_queue: _LeanOJBrainstormSubmissionQueue,
+        phase_key: str,
+    ) -> None:
+        """Log and broadcast every pause/resume transition reported by the queue.
+
+        ``submission_queue.refresh_pause_transitions()`` is consulted once. A
+        change of the global pause flag is announced first, followed by the
+        per-submitter pauses and then the per-submitter resumes, each in
+        sorted submitter order.
+        """
+        report = submission_queue.refresh_pause_transitions()
+        pending_total = report["queue_size"]
+
+        if report["global_changed"]:
+            if report["global_paused"]:
+                global_message = "LeanOJ brainstorm queue size (%s) >= threshold (%s). Pausing all submitters."
+                global_event = "leanoj_brainstorm_submitters_paused"
+            else:
+                global_message = "LeanOJ brainstorm queue size (%s) < threshold (%s). Resuming all submitters."
+                global_event = "leanoj_brainstorm_submitters_resumed"
+            logger.info(global_message, pending_total, system_config.queue_overflow_threshold)
+            await self._broadcast(
+                global_event,
+                {
+                    "phase": phase_key,
+                    "queue_size": pending_total,
+                    "threshold": system_config.queue_overflow_threshold,
+                },
+            )
+
+        # (transition key, log template, event name); pauses are announced before resumes.
+        per_submitter_cases = (
+            (
+                "submitters_paused",
+                "LeanOJ brainstorm submitter %s paused for fairness (pending=%s, threshold=%s).",
+                "leanoj_brainstorm_submitter_paused",
+            ),
+            (
+                "submitters_resumed",
+                "LeanOJ brainstorm submitter %s resumed for fairness (pending=%s, threshold=%s).",
+                "leanoj_brainstorm_submitter_resumed",
+            ),
+        )
+        for report_key, message, event_name in per_submitter_cases:
+            for member in sorted(report[report_key]):
+                member_pending = submission_queue.count_for_submitter(member)
+                logger.info(
+                    message,
+                    member,
+                    member_pending,
+                    system_config.per_submitter_queue_threshold,
+                )
+                await self._broadcast(
+                    event_name,
+                    {
+                        "phase": phase_key,
+                        "queue_size": pending_total,
+                        "submitter": member,
+                        "submitter_id": member,
+                        "submitter_pending": member_pending,
+                        "threshold": system_config.per_submitter_queue_threshold,
+                    },
+                )
+
+    async def _brainstorm_submitter_loop(
+        self,
+        request: LeanOJStartRequest,
+        submitter_index: int,
+        submitter: LeanOJRoleConfig,
+        submission_queue: _LeanOJBrainstormSubmissionQueue,
+    ) -> None:
+        """Produce brainstorm submissions for one submitter until the run should stop.
+
+        Each iteration waits for the queue to allow this submitter to proceed,
+        builds the prompt context, asks ``submitter`` for an idea via
+        ``self._call_json`` and enqueues a non-empty ``"submission"`` as
+        ``(submitter_index, submission, metadata)``. Replies classified by
+        ``is_lean_proof_submission`` must first be accepted by
+        ``verify_brainstorm_proof_candidate``; rejected proofs are recorded as
+        failed feedback and never queued.
+
+        Args:
+            request: Run configuration (prompt, Lean template, validator role).
+            submitter_index: Index used in the task/role ids and event payloads.
+            submitter: Role configuration for this submitter.
+            submission_queue: Shared queue drained by the validation loop.
+
+        Raises:
+            asyncio.CancelledError: Re-raised untouched.
+            LeanOJConfigurationError: Re-raised instead of being retried.
+        """
+        task_prefix = f"leanoj_brainstorm_sub{submitter_index}"
+        role_id = f"leanoj_brainstorm_submitter_{submitter_index}"
+        while not self._should_stop():
+            try:
+                # Do not spend a model call while the queue wants this submitter paused.
+                await self._wait_for_brainstorm_queue_turn(submission_queue, submitter_index)
+                if self._should_stop():
+                    break
+                active_topic = self._active_brainstorm_topic()
+                prompt_failed_feedback = self._general_brainstorm_feedback_records()
+                context_blocks = await self._build_context_blocks(
+                    request,
+                    submitter,
+                    mode="brainstorm",
+                    task_request=(
+                        "Generate one concrete proof-solving brainstorm idea for the active LeanOJ topic: "
+                        f"{active_topic}"
+                    ),
+                    include_current_final_cycle_packet=True,
+                    capped_rejection_feedback=self._format_capped_rejection_feedback(
+                        "RECENT FAILED / REJECTION FEEDBACK SUMMARIES",
+                        prompt_failed_feedback,
+                        limit=10,
+                    ),
+                )
+                raw = await self._call_json(
+                    submitter,
+                    task_prefix,
+                    role_id,
+                    build_brainstorm_prompt(
+                        request.user_prompt,
+                        request.lean_template,
+                        active_topic,
+                        self._accepted_ideas,
+                        [item.model_dump(mode="json") for item in self._state.verified_subproofs],
+                        prompt_failed_feedback,
+                        context_blocks=context_blocks,
+                    ),
+                    temperature=api_client_manager.parallel_brainstorm_submitter_temperature(submitter_index),
+                )
+                # Stays empty for plain ideas; filled with proof details below.
+                metadata: dict[str, Any] = {}
+                if is_lean_proof_submission(raw):
+                    # Source context for the proof gate: template, topic, accepted
+                    # ideas and all non-empty context blocks, blank-line separated.
+                    source_context = "\n\n".join(
+                        part
+                        for part in [
+                            request.lean_template,
+                            active_topic,
+                            "\n\n".join(self._accepted_ideas),
+                            "\n\n".join(str(value) for value in context_blocks.values() if value),
+                        ]
+                        if part
+                    )
+                    gate_result = await verify_brainstorm_proof_candidate(
+                        parsed=raw,
+                        user_prompt=request.user_prompt,
+                        source_context=source_context,
+                        model_id=submitter.model_id,
+                        role_id=role_id,
+                        task_id_prefix=f"{task_prefix}_lean",
+                        max_tokens=submitter.max_output_tokens,
+                        validator_model=request.brainstorm_validator.model_id,
+                        validator_context=request.brainstorm_validator.context_window,
+                        validator_max_tokens=request.brainstorm_validator.max_output_tokens,
+                        validator_role_id="leanoj_brainstorm_validator",
+                        allowed_baseline=request.lean_template,
+                        max_attempts=5,
+                    )
+                    if not gate_result.accepted:
+                        # Keep the failure so it can be surfaced as feedback later;
+                        # the candidate itself is dropped.
+                        feedback = {
+                            "request": str(raw.get("theorem_statement") or raw.get("submission") or active_topic),
+                            "error_summary": self._summarize_error(gate_result.failure_feedback, limit=1200),
+                            "lean_code": gate_result.lean_code,
+                        }
+                        self._failed_feedback.append(feedback)
+                        await self._persist_and_broadcast(
+                            "leanoj_brainstorm_proof_failed",
+                            {
+                                "submitter": submitter_index,
+                                "submitter_id": submitter_index,
+                                "submitter_model": submitter.model_id,
+                                "submitter_provider": submitter.provider,
+                                "feedback": feedback,
+                            },
+                        )
+                        continue
+                    # Accepted proof: the gate's submission text replaces the
+                    # model's, and its reasoning wins when non-empty.
+                    raw = {
+                        **raw,
+                        "submission": gate_result.submission_content,
+                        "reasoning": gate_result.reasoning or raw.get("reasoning", ""),
+                    }
+                    metadata["brainstorm_lean_proof"] = {
+                        "theorem_statement": gate_result.theorem_statement,
+                        "theorem_name": gate_result.theorem_name,
+                        "formal_sketch": gate_result.formal_sketch,
+                        "lean_code": gate_result.lean_code,
+                        "lean_feedback": gate_result.lean_feedback,
+                        "reasoning": gate_result.reasoning,
+                        "attempts": [
+                            attempt.model_dump(mode="json")
+                            for attempt in (gate_result.attempts or [])
+                        ],
+                        "attempt_count": len(gate_result.attempts or []),
+                    }
+                submission = str(raw.get("submission") or "").strip()
+                if submission:
+                    # Pause state is checked again right before enqueueing.
+                    await self._wait_for_brainstorm_queue_turn(submission_queue, submitter_index)
+                    if self._should_stop():
+                        break
+                    await submission_queue.put((submitter_index, submission, metadata))
+                    await self._sync_brainstorm_queue_pause_state(
+                        submission_queue,
+                        self._state.active_brainstorm_phase or self._state.phase,
+                    )
+                    logger.info(
+                        "LeanOJ brainstorm submission queued (phase=%s, submitter=%s, queue_size=%s)",
+                        self._state.active_brainstorm_phase or self._state.phase,
+                        submitter_index,
+                        submission_queue.qsize(),
+                    )
+                    await self._broadcast(
+                        "leanoj_brainstorm_submission_queued",
+                        {
+                            "phase": self._state.active_brainstorm_phase or self._state.phase,
+                            "submitter": submitter_index,
+                            "submitter_id": submitter_index,
+                            "submitter_model": submitter.model_id,
+                            "submitter_provider": submitter.provider,
+                            "queue_size": submission_queue.qsize(),
+                            "submission_preview": self._summarize_error(submission, limit=220),
+                        },
+                    )
+            except asyncio.CancelledError:
+                # Must not be swallowed by the generic handler below.
+                raise
+            except LeanOJConfigurationError:
+                # Configuration errors are not retried; they end this loop.
+                raise
+            except Exception as exc:
+                # Any other failure is reported and retried after a 2 second pause.
+                logger.warning("LeanOJ brainstorm submitter %s failed: %s", submitter_index, exc)
+                # Carry both "submitter" and "submitter_id", like every other
+                # submitter-scoped event (e.g. leanoj_topic_submitter_failed).
+                await self._broadcast(
+                    "leanoj_brainstorm_submitter_failed",
+                    {
+                        "submitter": submitter_index,
+                        "submitter_id": submitter_index,
+                        "message": str(exc),
+                    },
+                )
+                await asyncio.sleep(2)
+
+    async def _dequeue_brainstorm_batch(
+        self,
+        submission_queue: _LeanOJBrainstormSubmissionQueue,
+        *,
+        max_count: int = 3,
+    ) -> list[_BrainstormSubmission]:
+        """Return the next batch from ``submission_queue``.
+
+        Delegates to ``submission_queue.dequeue_batch`` with ``max_count``
+        (3 by default) and returns its result unchanged.
+        """
+        next_batch = await submission_queue.dequeue_batch(max_count=max_count)
+        return next_batch
+
+    async def _dequeue_topic_batch(
+        self,
+        topic_queue: asyncio.Queue[tuple[int, str]],
+        *,
+        max_count: int = 3,
+    ) -> list[tuple[int, str]]:
+        """Collect up to ``max_count`` queued topic candidates.
+
+        Waits at most 1 second for the first item and returns ``[]`` if none
+        arrives. After the first item, further items are taken for up to
+        0.25 seconds, or until the batch is full.
+        """
+        try:
+            head = await asyncio.wait_for(topic_queue.get(), timeout=1.0)
+        except asyncio.TimeoutError:
+            return []
+
+        collected = [head]
+        cutoff = time.monotonic() + 0.25
+        while len(collected) < max_count:
+            try:
+                # Prefer items that are already waiting; no timer involved.
+                candidate = topic_queue.get_nowait()
+            except asyncio.QueueEmpty:
+                time_left = cutoff - time.monotonic()
+                if time_left <= 0:
+                    break
+                try:
+                    candidate = await asyncio.wait_for(topic_queue.get(), timeout=time_left)
+                except asyncio.TimeoutError:
+                    break
+            collected.append(candidate)
+        return collected
+
+    def _topic_validation_context(self) -> list[str]:
+        topics: list[str] = []
+        seen: set[str] = set()
+        for topic in self._validated_topics:
+            normalized = topic.strip()
+            if not normalized or normalized in seen:
+                continue
+            topics.append(normalized)
+            seen.add(normalized)
+        return topics
+
+    async def _record_accepted_brainstorm_proof(
+        self,
+        request: LeanOJStartRequest,
+        submitter_index: int,
+        metadata: dict[str, Any],
+    ) -> None:
+        proof_payload = (metadata or {}).get("brainstorm_lean_proof")
+        if not isinstance(proof_payload, dict):
+            return
+
+        theorem_statement = str(proof_payload.get("theorem_statement") or "").strip()
+        lean_code = str(proof_payload.get("lean_code") or "").strip()
+        if not theorem_statement or not lean_code:
+            return
+
+        subproof_id = f"brainstorm_proof_{self._state.brainstorm_acceptance_events + 1}_{uuid.uuid4().hex[:6]}"
+        lean_feedback = str(proof_payload.get("lean_feedback") or "").strip()
+        proof_attempts = [
+            item if isinstance(item, ProofAttemptFeedback) else ProofAttemptFeedback.model_validate(item)
+            for item in (proof_payload.get("attempts") or [])
+        ]
+        proof_record: Optional[ProofRecord] = None
+        try:
+            proof_record = await self._register_verified_leanoj_proof(
+                request,
+                proof_kind="subproof",
+                theorem_statement=theorem_statement,
+                theorem_name=str(proof_payload.get("theorem_name") or subproof_id),
+                lean_code=lean_code,
+                attempt_count=int(proof_payload.get("attempt_count") or 1),
+                formal_sketch=str(proof_payload.get("formal_sketch") or "LeanOJ brainstorm proof candidate"),
+                theorem_id=subproof_id,
+                source_title=f"LeanOJ brainstorm proof from submitter {submitter_index}",
+                verification_notes=(
+                    lean_feedback
+                    or "Proof Solver verified this brainstorm subproof with Lean 4 and template/device checks."
+                ),
+                attempts=proof_attempts,
+            )
+        except Exception as exc:
+            logger.warning("LeanOJ accepted brainstorm proof registration failed: %s", exc, exc_info=True)
+            await self._broadcast(
+                "leanoj_brainstorm_proof_registration_failed",
+                {
+                    "subproof_id": subproof_id,
+                    "submitter": submitter_index,
+                    "error": str(exc),
+                },
+            )
+
+        record = LeanOJSubproofRecord(
+            subproof_id=subproof_id,
+            request=theorem_statement,
+            role="Verified during brainstorm before validator acceptance.",
+            theorem_or_lemma=str(proof_payload.get("theorem_name") or theorem_statement),
+            verified=True,
+            lean_code=lean_code,
+            lean_feedback=lean_feedback,
+            attempts_used=int(proof_payload.get("attempt_count") or 1),
+            proof_id=proof_record.proof_id if proof_record else "",
+            novel=proof_record.novel if proof_record else False,
+            novelty_tier=proof_record.novelty_tier if proof_record else "not_novel",
+            novelty_reasoning=proof_record.novelty_reasoning if proof_record else "",
+        )
+        self._state.verified_subproofs.append(record)
+        await self._persist_and_broadcast(
+            "leanoj_brainstorm_proof_verified",
+            {
+                "subproof": record.model_dump(mode="json"),
+                "submitter": submitter_index,
+                "submitter_id": submitter_index,
+            },
+        )
+
+    async def _validate_brainstorm(self, request: LeanOJStartRequest, submission: str) -> bool:
+        raw = await self._call_json(
+            request.brainstorm_validator,
+            "leanoj_brainstorm_val",
+            "leanoj_brainstorm_validator",
+            build_brainstorm_validation_prompt(
+                request.user_prompt,
+                request.lean_template,
+                submission,
+                self._accepted_ideas,
+                context_blocks=await self._build_context_blocks(
+                    request,
+                    request.brainstorm_validator,
+                    mode="brainstorm",
+                    task_request="Validate whether a LeanOJ brainstorm submission is useful and non-redundant.",
+                    include_current_final_cycle_packet=True,
+                ),
+            ),
+        )
+        accepted = str(raw.get("decision") or "").strip().lower() == "accept"
+        self._last_brainstorm_validation_decisions = [
+            {
+                "accepted": accepted,
+                "context_role": self._normalize_brainstorm_context_role(raw, submission),
+                "reasoning": str(raw.get("reasoning") or "").strip(),
+                "summary": str(raw.get("summary") or "").strip(),
+            }
+        ]
+        return accepted
+
+    async def _validate_brainstorm_batch(self, request: LeanOJStartRequest, submissions: list[str]) -> list[bool]:
+        if not submissions:
+            self._last_brainstorm_validation_decisions = []
+            return []
+        if len(submissions) == 1:
+            return [await self._validate_brainstorm(request, submissions[0])]
+
+        raw = await self._call_json(
+            request.brainstorm_validator,
+            "leanoj_brainstorm_val",
+            "leanoj_brainstorm_validator",
+            build_brainstorm_batch_validation_prompt(
+                request.user_prompt,
+                request.lean_template,
+                submissions,
+                self._accepted_ideas,
+                context_blocks=await self._build_context_blocks(
+                    request,
+                    request.brainstorm_validator,
+                    mode="brainstorm",
+                    task_request="Batch-validate LeanOJ brainstorm submissions for usefulness and redundancy.",
+                    include_current_final_cycle_packet=True,
+                ),
+            ),
+        )
+        decisions = raw.get("decisions")
+        if not isinstance(decisions, list) or len(decisions) != len(submissions):
+            logger.warning(
+                "LeanOJ brainstorm batch validator returned %s decisions for %s submissions",
+                len(decisions) if isinstance(decisions, list) else "non-list",
+                len(submissions),
+            )
+            self._last_brainstorm_validation_decisions = [
+                {
+                    "accepted": False,
+                    "reasoning": "Brainstorm validator returned malformed decision payload.",
+                    "summary": "Validator did not return one ordered decision per submission.",
+                }
+                for _ in submissions
+            ]
+            return [False for _ in submissions]
+
+        accepted: list[bool] = []
+        validation_decisions: list[dict[str, Any]] = []
+        for expected_number, decision_payload in enumerate(decisions, start=1):
+            if not isinstance(decision_payload, dict):
+                accepted.append(False)
+                validation_decisions.append(
+                    {
+                        "accepted": False,
+                        "reasoning": "Decision payload was not an object.",
+                        "summary": "Validator returned a malformed decision entry.",
+                    }
+                )
+                continue
+            if decision_payload.get("submission_number") != expected_number:
+                logger.warning(
+                    "LeanOJ brainstorm batch validator returned out-of-order decision: expected %s, got %s",
+                    expected_number,
+                    decision_payload.get("submission_number"),
+                )
+                self._last_brainstorm_validation_decisions = [
+                    {
+                        "accepted": False,
+                        "reasoning": "Brainstorm validator returned out-of-order decisions.",
+                        "summary": "Validator decisions could not be matched to submissions.",
+                    }
+                    for _ in submissions
+                ]
+                return [False for _ in submissions]
+            is_accepted = str(decision_payload.get("decision") or "").strip().lower() == "accept"
+            accepted.append(is_accepted)
+            validation_decisions.append(
+                {
+                    "accepted": is_accepted,
+                    "context_role": self._normalize_brainstorm_context_role(decision_payload, submissions[expected_number - 1]),
+                    "reasoning": str(decision_payload.get("reasoning") or "").strip(),
+                    "summary": str(decision_payload.get("summary") or "").strip(),
+                }
+            )
+        self._last_brainstorm_validation_decisions = validation_decisions
+        return accepted
+
+    def _record_brainstorm_rejection_feedback(
+        self,
+        submitter_index: int,
+        submission: str,
+        validation_feedback: dict[str, Any],
+    ) -> None:
+        summary = str(validation_feedback.get("summary") or "").strip()
+        reasoning = str(validation_feedback.get("reasoning") or "").strip()
+        feedback_parts = [
+            "VALIDATOR REJECTED BRAINSTORM SUBMISSION",
+            f"Summary: {summary}" if summary else "",
+            f"Reasoning: {reasoning}" if reasoning else "",
+            f"Rejected submission: {self._summarize_error(submission, limit=500)}",
+        ]
+        error_summary = "\n".join(part for part in feedback_parts if part)
+        self._failed_feedback.append(
+            {
+                "request": f"brainstorm submitter {submitter_index} rejected submission",
+                "error_summary": self._summarize_error(error_summary, limit=1200),
+                "submission": self._summarize_error(submission, limit=500),
+                "submitter_index": submitter_index,
+                "source": "brainstorm_validator",
+            }
+        )
+
+    def _record_accepted_brainstorm_idea(
+        self,
+        submission: str,
+        submitter_index: int,
+        phase_key: str,
+        validation_feedback: dict[str, Any] | None = None,
+    ) -> None:
+        validation_feedback = validation_feedback or {}
+        context_role = self._normalize_brainstorm_context_role(validation_feedback, submission)
+        self._accepted_ideas.append(submission)
+        self._state.brainstorm_acceptance_events += 1
+        self._accepted_idea_records.append(
+            {
+                "content": submission,
+                "context_role": context_role,
+                "submitter_index": submitter_index,
+                "phase": phase_key,
+                "validator_summary": str(validation_feedback.get("summary") or "").strip(),
+                "validator_reasoning": str(validation_feedback.get("reasoning") or "").strip(),
+                "created_at": datetime.now().isoformat(),
+                "acceptance_event": self._state.brainstorm_acceptance_events,
+            }
+        )
+
+    def _ensure_accepted_idea_records(self) -> None:
+        """Rebuild ``self._accepted_idea_records`` to mirror ``self._accepted_ideas``.
+
+        Afterwards there is exactly one record per accepted idea, in idea
+        order. An existing record is reused when its content matches: first
+        the record at the same position, otherwise the earliest unused record
+        with equal content. Ideas without a match get a synthetic record
+        flagged ``legacy``. Every record's ``content`` and ``context_role`` are
+        refreshed.
+        """
+        # Copies of the usable existing records (dicts with non-blank content).
+        existing = [
+            dict(record)
+            for record in self._accepted_idea_records
+            if isinstance(record, dict) and str(record.get("content") or "").strip()
+        ]
+        # Positions in ``existing`` that have already been assigned to an idea.
+        used_existing_indices: set[int] = set()
+        # content -> [(position in ``existing``, record)], in original order.
+        existing_by_content: dict[str, list[tuple[int, dict[str, Any]]]] = {}
+        for record_index, record in enumerate(existing):
+            existing_by_content.setdefault(str(record.get("content") or ""), []).append((record_index, record))
+
+        def take_existing_record(content: str) -> dict[str, Any] | None:
+            # Consume candidates front to back, skipping any already claimed.
+            candidates = existing_by_content.get(content, [])
+            while candidates:
+                record_index, record = candidates.pop(0)
+                if record_index not in used_existing_indices:
+                    used_existing_indices.add(record_index)
+                    return dict(record)
+            return None
+
+        records: list[dict[str, Any]] = []
+        for index, idea in enumerate(self._accepted_ideas):
+            content = str(idea)
+            # Prefer the record sitting at the same position when it matches.
+            aligned_record = (
+                existing[index]
+                if index < len(existing)
+                and str(existing[index].get("content") or "") == content
+                and index not in used_existing_indices
+                else None
+            )
+            if aligned_record is not None:
+                used_existing_indices.add(index)
+                record = dict(aligned_record)
+            else:
+                record = take_existing_record(content) or {}
+            if not record:
+                # No stored metadata for this idea: synthesize a placeholder.
+                record = {
+                    "content": content,
+                    "submitter_index": 1,
+                    "phase": "legacy",
+                    "created_at": "",
+                    "acceptance_event": index + 1,
+                    "legacy": True,
+                }
+            record["content"] = content
+            record["context_role"] = self._normalize_brainstorm_context_role(record, idea)
+            records.append(record)
+        self._accepted_idea_records = records
+
+    @staticmethod
+    def _normalize_brainstorm_context_role(record: dict[str, Any] | None, text: str = "") -> str:
+        role = str((record or {}).get("context_role") or "").strip().lower()
+        if role in _LEANOJ_CONTEXT_ROLES:
+            return role
+
+        combined = " ".join(
+            part.lower()
+            for part in [
+                text,
+                str((record or {}).get("content") or ""),
+                str((record or {}).get("summary") or ""),
+                str((record or {}).get("reasoning") or ""),
+                str((record or {}).get("validator_summary") or ""),
+                str((record or {}).get("validator_reasoning") or ""),
+            ]
+            if part
+        )
+        if any(term in combined for term in _LEANOJ_REFUTED_CONTEXT_TERMS):
+            return "refuted_construction"
+        if "[lean 4 verified brainstorm proof]" in combined:
+            return "verified_hint"
+        if any(term in combined for term in _LEANOJ_ACTIVE_PLAN_CONTEXT_TERMS):
+            return "active_plan"
+        return "scratch"
+
+    def _final_solver_active_plan_items(self) -> list[str]:
+        self._ensure_accepted_idea_records()
+        return [
+            str(record.get("content") or "").strip()
+            for record in self._accepted_idea_records
+            if str(record.get("context_role") or "") in _LEANOJ_FINAL_ACTIVE_CONTEXT_ROLES
+            and str(record.get("content") or "").strip()
+        ]
+
+    def _final_solver_refuted_construction_records(self) -> list[dict[str, Any]]:
+        self._ensure_accepted_idea_records()
+        accepted_refutations = [
+            record
+            for record in self._accepted_idea_records
+            if str(record.get("context_role") or "") == "refuted_construction"
+        ]
+        verified_refutations = [
+            {
+                "content": record.get("request", record.get("theorem_or_lemma", "")),
+                "reasoning": record.get("theorem_or_lemma", record.get("role", "")),
+                "source": "verified_subproof",
+            }
+            for record in self._verified_subproof_dicts()
+            if self._record_mentions_refuted_construction(record)
+        ]
+        failure_refutations = [
+            {
+                "content": record.get("error_summary", record.get("summary", "")),
+                "reasoning": record.get("reasoning", record.get("lean_feedback", "")),
+                "source": record.get("request", "failure feedback"),
+            }
+            for record in [*self._failed_feedback, *self._failed_context_dicts(), *self._final_attempts]
+            if self._record_mentions_refuted_construction(record)
+        ]
+        return self._dedupe_dict_records([*accepted_refutations, *verified_refutations, *failure_refutations])
+
+    def _final_solver_verified_subproof_dicts(self) -> list[dict[str, Any]]:
+        return [
+            record
+            for record in self._verified_subproof_dicts()
+            if not self._record_mentions_refuted_construction(record)
+        ]
+
+    @staticmethod
+    def _record_mentions_refuted_construction(record: dict[str, Any]) -> bool:
+        combined = " ".join(
+            str(record.get(key) or "").lower()
+            for key in (
+                "request",
+                "theorem_or_lemma",
+                "role",
+                "error_summary",
+                "summary",
+                "reasoning",
+                "lean_feedback",
+                "submission",
+            )
+        )
+        return any(term in combined for term in _LEANOJ_REFUTED_CONTEXT_TERMS)
+
+    def _active_brainstorm_topic(self, phase_key: str = "") -> str:
+        phase = phase_key or self._state.phase
+        if phase == "recursive_brainstorm":
+            if self._current_working_proof_attempt:
+                summary = _remove_attempt_count_language(
+                    self._current_working_proof_attempt.get("summary") or ""
+                ).strip()
+                base = "Repair and complete the current Proof Solver master proof attempt."
+                return f"{base} {summary}".strip() if summary else base
+            return "Continue the recursive Proof Solver brainstorm from the current proof state and accepted proof memory."
+        if phase == "initial_brainstorm":
+            return self._state.selected_topic or "Solve the user's Proof Solver template."
+        return self._state.selected_topic or "Solve the user's Proof Solver template."
+
+    def _select_brainstorm_prune_reviewer(
+        self,
+        request: LeanOJStartRequest,
+        phase_key: str,
+    ) -> tuple[LeanOJRoleConfig, int]:
+        self._ensure_accepted_idea_records()
+        phase_records = [
+            record
+            for record in self._accepted_idea_records
+            if str(record.get("phase") or "") == phase_key
+        ]
+        submitter_index = 1
+        if phase_records:
+            try:
+                submitter_index = int(phase_records[-1].get("submitter_index") or 1)
+            except (TypeError, ValueError):
+                submitter_index = 1
+        submitter_index = max(1, min(submitter_index, len(request.brainstorm_submitters)))
+        return request.brainstorm_submitters[submitter_index - 1], submitter_index
+
+    async def _perform_brainstorm_prune_review(
+        self,
+        request: LeanOJStartRequest,
+        phase_key: str,
+        *,
+        reason: str,
+    ) -> None:
+        """Run one reviewer-proposed, validator-approved prune of the accepted ideas.
+
+        Does nothing when no ideas have been accepted. Otherwise a reviewer
+        proposes a single operation, the brainstorm validator accepts or
+        rejects it, and an accepted operation is applied. Each outcome is
+        persisted and broadcast under its own event name. Cancellation and
+        ``LeanOJConfigurationError`` propagate; any other exception is logged
+        and reported as ``leanoj_brainstorm_prune_error``.
+        """
+        if not self._accepted_ideas:
+            return
+        # Counted as soon as a review starts, whatever its outcome.
+        self._state.brainstorm_prune_reviews_performed += 1
+        reviewer, reviewer_index = self._select_brainstorm_prune_reviewer(request, phase_key)
+        active_topic = self._active_brainstorm_topic(phase_key)
+        try:
+            # Step 1: the reviewer proposes at most one prune operation.
+            context_blocks = await self._build_context_blocks(
+                request,
+                reviewer,
+                mode="brainstorm",
+                task_request=f"Review LeanOJ brainstorm memory for one conservative prune operation: {reason}.",
+                include_current_final_cycle_packet=True,
+            )
+            raw = await self._call_json(
+                reviewer,
+                "leanoj_brainstorm_prune",
+                f"leanoj_brainstorm_prune_reviewer_{reviewer_index}",
+                build_brainstorm_prune_review_prompt(
+                    request.user_prompt,
+                    request.lean_template,
+                    active_topic,
+                    self._accepted_ideas,
+                    context_blocks=context_blocks,
+                ),
+            )
+            operation = self._normalize_brainstorm_prune_operation(raw)
+            if operation["action"] == "none":
+                await self._persist_and_broadcast(
+                    "leanoj_brainstorm_prune_review_complete",
+                    {"action": "none", "reason": reason, "reviewer": reviewer_index},
+                )
+                return
+
+            # Step 2: the brainstorm validator must accept the proposal.
+            validator_context = await self._build_context_blocks(
+                request,
+                request.brainstorm_validator,
+                mode="brainstorm",
+                task_request="Validate one proposed LeanOJ brainstorm prune operation.",
+                include_current_final_cycle_packet=True,
+            )
+            validation = await self._call_json(
+                request.brainstorm_validator,
+                "leanoj_brainstorm_prune_val",
+                "leanoj_brainstorm_validator",
+                build_brainstorm_prune_validation_prompt(
+                    request.user_prompt,
+                    request.lean_template,
+                    active_topic,
+                    self._accepted_ideas,
+                    operation,
+                    context_blocks=validator_context,
+                ),
+            )
+            if str(validation.get("decision") or "").strip().lower() != "accept":
+                await self._persist_and_broadcast(
+                    "leanoj_brainstorm_prune_rejected",
+                    {
+                        "operation": operation,
+                        "reasoning": validation.get("reasoning", ""),
+                        "reviewer": reviewer_index,
+                    },
+                )
+                return
+            # Step 3: apply the accepted operation and report whether it took effect.
+            applied = self._apply_brainstorm_prune_operation(operation, reviewer_index, phase_key)
+            await self._persist_and_broadcast(
+                "leanoj_brainstorm_prune_applied" if applied else "leanoj_brainstorm_prune_apply_failed",
+                {
+                    "operation": operation,
+                    "reasoning": validation.get("reasoning", ""),
+                    "reviewer": reviewer_index,
+                },
+            )
+        except asyncio.CancelledError:
+            raise
+        except LeanOJConfigurationError:
+            raise
+        except Exception as exc:
+            # Any other failure is reported instead of raised.
+            logger.warning("LeanOJ brainstorm prune review failed: %s", exc, exc_info=True)
+            await self._persist_and_broadcast(
+                "leanoj_brainstorm_prune_error",
+                {"message": str(exc), "reason": reason},
+            )
+
+    def _normalize_brainstorm_prune_operation(self, raw: dict[str, Any]) -> dict[str, Any]:
+        action = str(raw.get("action") or "none").strip().lower()
+        if action not in {"none", "delete", "edit", "add"}:
+            action = "none"
+        idea_index: Optional[int] = None
+        try:
+            if raw.get("idea_index") is not None:
+                idea_index = int(raw.get("idea_index"))
+        except (TypeError, ValueError):
+            idea_index = None
+        new_content = str(raw.get("new_content") or "").strip()
+        reasoning = str(raw.get("reasoning") or "").strip()
+        if action in {"delete", "edit"} and (idea_index is None or idea_index < 1 or idea_index > len(self._accepted_ideas)):
+            action = "none"
+            reasoning = f"Invalid idea_index for prune operation. {reasoning}".strip()
+        if action in {"edit", "add"} and not new_content:
+            action = "none"
+            reasoning = f"Missing new_content for prune operation. {reasoning}".strip()
+        return {
+            "action": action,
+            "idea_index": idea_index,
+            "new_content": new_content,
+            "reasoning": reasoning,
+        }
+
+    def _apply_brainstorm_prune_operation(self, operation: dict[str, Any], reviewer_index: int, phase_key: str) -> bool:
+        self._ensure_accepted_idea_records()
+        action = operation["action"]
+        idea_index = operation.get("idea_index")
+        if action == "delete":
+            if not isinstance(idea_index, int) or idea_index < 1 or idea_index > len(self._accepted_ideas):
+                return False
+            del self._accepted_ideas[idea_index - 1]
+            del self._accepted_idea_records[idea_index - 1]
+        elif action == "edit":
+            if not isinstance(idea_index, int) or idea_index < 1 or idea_index > len(self._accepted_ideas):
+                return False
+            self._accepted_ideas[idea_index - 1] = operation["new_content"]
+            self._accepted_idea_records[idea_index - 1]["content"] = operation["new_content"]
+            self._accepted_idea_records[idea_index - 1]["context_role"] = self._normalize_brainstorm_context_role(
+                {"reasoning": operation.get("reasoning", "")},
+                operation["new_content"],
+            )
+            self._accepted_idea_records[idea_index - 1]["edited_at"] = datetime.now().isoformat()
+            self._accepted_idea_records[idea_index - 1]["edit_reasoning"] = operation.get("reasoning", "")
+        elif action == "add":
+            self._accepted_ideas.append(operation["new_content"])
+            self._accepted_idea_records.append(
+                {
+                    "content": operation["new_content"],
+                    "context_role": self._normalize_brainstorm_context_role(
+                        {"reasoning": operation.get("reasoning", "")},
+                        operation["new_content"],
+                    ),
+                    "submitter_index": reviewer_index,
+                    "phase": phase_key,
+                    "created_at": datetime.now().isoformat(),
+                    "acceptance_event": self._state.brainstorm_acceptance_events,
+                    "prune_add": True,
+                    "reasoning": operation.get("reasoning", ""),
+                }
+            )
+        else:
+            return False
+        self._state.accepted_brainstorm_count = len(self._accepted_ideas)
+        self._state.brainstorm_prune_operations_applied += 1
+        return True
+
+    async def _sufficiency_check(self, request: LeanOJStartRequest) -> bool:
+        raw = await self._call_json(
+            request.brainstorm_validator,
+            "leanoj_sufficiency",
+            "leanoj_brainstorm_validator",
+            build_sufficiency_prompt(
+                request.user_prompt,
+                request.lean_template,
+                self._accepted_ideas,
+                [item.model_dump(mode="json") for item in self._state.verified_subproofs],
+                context_blocks=await self._build_context_blocks(
+                    request,
+                    request.brainstorm_validator,
+                    mode="brainstorm",
+                    task_request="Decide whether the accumulated Proof Solver context is sufficient for the final loop.",
+                    include_current_final_cycle_packet=True,
+                ),
+            ),
+        )
+        return bool(raw.get("enough"))
+
+    async def _path_decision_phase(self, request: LeanOJStartRequest) -> str:
+        self._state.phase = "path_decision"
+        await self._persist_and_broadcast("leanoj_phase_changed")
+        decision_actor, decision_role_id = self._path_decision_actor(request)
+        prompt_failed_feedback = self._general_brainstorm_feedback_records()
+        raw = await self._call_json(
+            decision_actor,
+            "leanoj_path",
+            decision_role_id,
+            build_path_decision_prompt(
+                request.user_prompt,
+                request.lean_template,
+                self._accepted_ideas,
+                [item.model_dump(mode="json") for item in self._state.verified_subproofs],
+                prompt_failed_feedback,
+                context_blocks=await self._build_context_blocks(
+                    request,
+                    decision_actor,
+                    mode="brainstorm",
+                    task_request="Choose the next LeanOJ path after reviewing accumulated proof memory.",
+                    include_current_final_cycle_packet=True,
+                    capped_rejection_feedback=self._format_capped_rejection_feedback(
+                        "RECENT FAILED / REJECTION FEEDBACK SUMMARIES",
+                        prompt_failed_feedback,
+                        limit=10,
+                    ),
+                ),
+            ),
+        )
+        decision = str(raw.get("path") or "").strip()
+        if decision not in _LEANOJ_PATH_OPTIONS_SET:
+            decision = "need_more_brainstorming"
+        path_valid, corrected_path = await self._validate_path_decision(request, decision, str(raw.get("reasoning") or ""))
+        if not path_valid:
+            decision = corrected_path or "need_more_brainstorming"
+        self._state.current_path_decision = decision
+        await self._persist_and_broadcast("leanoj_path_decided", {"decision": decision, "reasoning": raw.get("reasoning", "")})
+        return decision
+
+    @staticmethod
+    def _path_decision_actor(
+        request: LeanOJStartRequest,
+        valid_paths: tuple[str, ...] = _LEANOJ_PATH_OPTIONS,
+    ) -> tuple[LeanOJRoleConfig, str]:
+        if "solve_final_now" in valid_paths:
+            return request.final_solver, "leanoj_final_solver"
+        return request.topic_generator, "leanoj_topic_generator"
+
+    async def _validate_path_decision(self, request: LeanOJStartRequest, decision: str, reasoning: str) -> tuple[bool, str]:
+        raw = await self._call_json(
+            request.topic_validator,
+            "leanoj_path_val",
+            "leanoj_path_validator",
+            build_path_validation_prompt(
+                request.user_prompt,
+                request.lean_template,
+                decision,
+                reasoning,
+                self._accepted_ideas,
+                [item.model_dump(mode="json") for item in self._state.verified_subproofs],
+                context_blocks=await self._build_context_blocks(
+                    request,
+                    request.topic_validator,
+                    mode="brainstorm",
+                    task_request="Validate the proposed LeanOJ path decision.",
+                    include_current_final_cycle_packet=True,
+                ),
+            ),
+        )
+        accepted = str(raw.get("decision") or "").strip().lower() == "accept"
+        corrected_path = str(raw.get("corrected_path") or "").strip()
+        if corrected_path not in _LEANOJ_PATH_OPTIONS_SET:
+            corrected_path = ""
+        await self._persist_and_broadcast(
+            "leanoj_path_validated",
+            {
+                "decision": decision,
+                "validated": accepted,
+                "corrected_path": corrected_path,
+                "reasoning": raw.get("reasoning", ""),
+            },
+        )
+        return accepted, corrected_path
+
+    async def _register_verified_leanoj_proof(
+        self,
+        request: LeanOJStartRequest,
+        *,
+        proof_kind: str,
+        theorem_statement: str,
+        theorem_name: str,
+        lean_code: str,
+        attempt_count: int,
+        formal_sketch: str = "",
+        theorem_id: str = "",
+        source_title: str = "",
+        verification_notes: str = "",
+        attempts: Optional[list[ProofAttemptFeedback]] = None,
+    ) -> Optional[ProofRecord]:
+        """Register a Proof Solver verified proof in the shared proof database."""
+        if not request.topic_validator.model_id:
+            raise LeanOJConfigurationError("Proof Solver proof novelty validator model is unavailable")
+
+        source_type = "leanoj_final" if proof_kind == "final" else "leanoj_subproof"
+        task_id = self._next_task_id(f"leanoj_{proof_kind}_novelty")
+        self.current_task_id = task_id
+        self._refresh_workflow_tasks(f"leanoj_{proof_kind}_novelty", "Proof Novelty Validator")
+        api_client_manager.set_autonomous_phase(self._state.phase or "leanoj")
+        try:
+            # Lazy import avoids pulling autonomous coordinator into LeanOJ module load.
+            from backend.autonomous.core.proof_registration import register_verified_lean_proof
+
+            registration = await register_verified_lean_proof(
+                proof_database=proof_database,
+                user_prompt=request.user_prompt,
+                theorem_statement=theorem_statement,
+                lean_code=lean_code,
+                validator_model=request.topic_validator.model_id,
+                validator_context=request.topic_validator.context_window,
+                validator_max_tokens=request.topic_validator.max_output_tokens,
+                task_id=task_id,
+                role_id="leanoj_proof_novelty",
+                source_type=source_type,
+                source_id=self._state.session_id,
+                source_title=source_title or self._state.selected_topic or request.user_prompt,
+                theorem_id=theorem_id,
+                theorem_name=theorem_name,
+                formal_sketch=formal_sketch,
+                solver="Proof Solver",
+                verification_notes=(
+                    verification_notes
+                    or "Proof Solver verified this proof with Lean 4 and template/device checks."
+                ),
+                attempt_count=attempt_count,
+                attempts=attempts,
+                broadcast_fn=self._broadcast,
+                base_event={
+                    "source_type": source_type,
+                    "source_id": self._state.session_id,
+                    "source_title": source_title or self._state.selected_topic or request.user_prompt,
+                    "trigger": "leanoj_verified",
+                },
+            )
+            self.completed_task_ids.add(task_id)
+            return registration.record
+        except Exception as exc:
+            logger.warning("Proof Solver proof registration failed for %s: %s", proof_kind, exc)
+            raise
+        finally:
+            self.current_task_id = None
+            self._refresh_workflow_tasks(f"leanoj_{proof_kind}_novelty", "Proof Novelty Validator")
+
+    async def _check_proof_and_capture_partial(
+        self,
+        request: LeanOJStartRequest,
+        lean_code: str,
+        *,
+        target: str,
+        attempt_number: int,
+        proof_request: str,
+        reasoning: str,
+        theorem_or_lemma: str = "",
+    ) -> Lean4Result:
+        placeholder_tokens = self._placeholder_tokens(lean_code)
+        if not placeholder_tokens:
+            return await get_lean4_client().check_proof(lean_code, timeout=system_config.lean4_proof_timeout)
+
+        lean_result = await get_lean4_client().check_proof(
+            lean_code,
+            timeout=system_config.lean4_proof_timeout,
+            allow_placeholders=True,
+        )
+        if not lean_result.success:
+            return lean_result
+
+        device_error = self._validate_no_new_declaration_devices(
+            request.lean_template,
+            lean_code,
+            target=f"partial {target}",
+        )
+        if device_error:
+            return Lean4Result(
+                success=False,
+                error_output=device_error,
+                goal_states=lean_result.goal_states,
+                raw_stderr=lean_result.raw_stderr,
+            )
+        if target == "final":
+            template_error = self._validate_final_solution_integrity(
+                request.lean_template,
+                lean_code,
+            )
+            if template_error:
+                return Lean4Result(
+                    success=False,
+                    error_output=template_error,
+                    goal_states=lean_result.goal_states,
+                    raw_stderr=lean_result.raw_stderr,
+                )
+
+        partial_record = {
+            "session_id": self._state.session_id,
+            "attempt": attempt_number,
+            "target": target,
+            "request": proof_request,
+            "theorem_or_lemma": theorem_or_lemma,
+            "placeholder_tokens": sorted(set(placeholder_tokens)),
+            "lean_code": lean_code,
+            "reasoning": reasoning,
+            "high_value_scaffold": False,
+            "master_seed_eligible": False,
+            "created_at": datetime.now().isoformat(),
+            "summary": (
+                "Lean accepted this incomplete scaffold with placeholders. "
+                "It is stored for future reference, but it is not a verified proof and is not eligible "
+                "to seed the master proof unless a validator explicitly marks it high-value."
+            ),
+        }
+        await self._record_partial_proof(partial_record)
+        return Lean4Result(
+            success=False,
+            error_output=(
+                "PARTIAL PROOF SAVED: Lean accepted this scaffold with placeholder token(s) "
+                f"{', '.join(partial_record['placeholder_tokens'])}. It has been stored in the "
+                "LeanOJ partial-proof database for future reference, but final verification must "
+                "continue until every `sorry`/`admit` is replaced by a complete proof."
+            ),
+            goal_states=lean_result.goal_states,
+            raw_stderr=lean_result.raw_stderr,
+        )
+
+    async def _record_partial_proof(self, partial_record: dict[str, Any]) -> None:
+        self._partial_proofs.append(partial_record)
+        await self._append_partial_proof_database(partial_record)
+        await self._persist_and_broadcast(
+            "leanoj_partial_proof_saved",
+            {"partial_proof": partial_record},
+        )
+
+    async def _append_partial_proof_database(self, partial_record: dict[str, Any]) -> None:
+        path = self._partial_proof_database_path()
+        path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(path, "a", encoding="utf-8") as f:
+            await f.write(json.dumps(partial_record, ensure_ascii=False) + "\n")
+        await leanoj_context_manager.append_record(
+            self._state.session_id,
+            ARTIFACT_PARTIAL_PROOFS,
+            partial_record,
+        )
+
+    @staticmethod
+    def _placeholder_tokens(lean_code: str) -> list[str]:
+        stripped = strip_lean_comments_and_strings(lean_code or "")
+        return [match.group(1) for match in _LEAN_PLACEHOLDER_RE.finditer(stripped)]
+
+    @staticmethod
+    def _partial_proofs_base_dir() -> Path:
+        return Path(system_config.data_dir) / "leanoj_partial_proofs"
+
+    def _partial_proof_database_path(self, session_id: str = "") -> Path:
+        return self._partial_proofs_base_dir() / f"{session_id or self._state.session_id or 'latest'}.jsonl"
+
+    def _load_partial_proof_database(self, session_id: str) -> list[dict[str, Any]]:
+        path = self._partial_proof_database_path(session_id)
+        if not path.exists():
+            return []
+        records: list[dict[str, Any]] = []
+        try:
+            for line in path.read_text(encoding="utf-8").splitlines():
+                if not line.strip():
+                    continue
+                item = json.loads(line)
+                if isinstance(item, dict):
+                    records.append(item)
+        except Exception as exc:
+            logger.warning("Failed to load LeanOJ partial proof database from %s: %s", path, exc)
+        return records
+
+    @staticmethod
+    def _dedupe_partial_proofs(records: list[dict[str, Any]]) -> list[dict[str, Any]]:
+        deduped: list[dict[str, Any]] = []
+        seen: set[tuple[str, str, str, str, str]] = set()
+        for record in records:
+            key = (
+                str(record.get("session_id") or ""),
+                str(record.get("target") or ""),
+                str(record.get("attempt") or ""),
+                str(record.get("request") or ""),
+                str(record.get("lean_code") or ""),
+            )
+            if key in seen:
+                continue
+            seen.add(key)
+            deduped.append(record)
+        return deduped
+
+    @staticmethod
+    def _dedupe_strings(records: list[str]) -> list[str]:
+        deduped: list[str] = []
+        seen: set[str] = set()
+        for record in records:
+            value = str(record).strip()
+            if not value or value in seen:
+                continue
+            seen.add(value)
+            deduped.append(value)
+        return deduped
+
+    @staticmethod
+    def _dedupe_dict_records(records: list[dict[str, Any]]) -> list[dict[str, Any]]:
+        deduped: list[dict[str, Any]] = []
+        seen: set[str] = set()
+        for record in records:
+            key = LeanOJCoordinator._dict_record_key(record)
+            if key in seen:
+                continue
+            seen.add(key)
+            deduped.append(record)
+        return deduped
+
+    @staticmethod
+    def _dict_record_key(record: dict[str, Any]) -> str:
+        try:
+            return json.dumps(record, sort_keys=True, default=str)
+        except TypeError:
+            return str(record)
+
+    def _verified_subproof_dicts(self) -> list[dict[str, Any]]:
+        return [item.model_dump(mode="json") for item in self._state.verified_subproofs]
+
+    def _failed_context_dicts(self) -> list[dict[str, Any]]:
+        return self._dedupe_dict_records(
+            [
+                *[item.model_dump(mode="json") for item in self._state.failed_subproofs],
+                *self._failed_feedback,
+            ]
+        )
+
+    @staticmethod
+    def _is_subproof_or_final_failure_feedback(record: dict[str, Any]) -> bool:
+        request = str(record.get("request") or "").lower()
+        return bool(record.get("lean_code")) or "subproof" in request or "final proof solver" in request
+
+    def _general_brainstorm_feedback_records(self) -> list[dict[str, Any]]:
+        if self._state.phase == "recursive_brainstorm":
+            return []
+        return [
+            record
+            for record in self._failed_feedback
+            if isinstance(record, dict) and not self._is_subproof_or_final_failure_feedback(record)
+        ]
+
+    async def _build_context_blocks(
+        self,
+        request: LeanOJStartRequest,
+        role_config: LeanOJRoleConfig,
+        *,
+        mode: str,
+        task_request: str,
+        include_current_final_cycle_packet: bool = False,
+        capped_rejection_feedback: str = "",
+        context_scope: str = "",
+    ) -> dict[str, str]:
+        resolved_scope = context_scope or self._infer_context_scope(mode)
+        current_packet = self._current_final_cycle_packet if include_current_final_cycle_packet else None
+        working_proof_attempt = None
+        if resolved_scope == "recursive_brainstorm":
+            working_proof_attempt = await self._working_proof_attempt_context_packet()
+            capped_rejection_feedback = ""
+        include_failed_subproofs = resolved_scope == "subproof"
+        accepted_context = (
+            self._final_solver_active_plan_items()
+            if resolved_scope == "final_solver"
+            else self._accepted_ideas
+        )
+        refuted_constructions = (
+            self._final_solver_refuted_construction_records()
+            if resolved_scope == "final_solver"
+            else []
+        )
+        allocation = await leanoj_context_manager.allocate_context(
+            session_id=self._state.session_id,
+            mode=resolved_scope,
+            user_prompt=request.user_prompt,
+            lean_template=request.lean_template,
+            task_request=task_request,
+            context_window=role_config.context_window,
+            max_output_tokens=role_config.max_output_tokens,
+            accepted_ideas=accepted_context,
+            recursive_topics=self._recursive_topics,
+            verified_subproofs=(
+                self._final_solver_verified_subproof_dicts()
+                if resolved_scope == "final_solver"
+                else self._verified_subproof_dicts()
+            ),
+            partial_proofs=self._partial_proofs,
+            failed_subproofs=self._failed_context_dicts() if include_failed_subproofs else [],
+            final_attempts=self._final_attempts[-5:] if resolved_scope == "final_solver" else [],
+            final_cycle_packets=[],
+            refuted_constructions=refuted_constructions,
+            current_final_cycle_packet=current_packet,
+            current_working_proof_attempt=working_proof_attempt,
+            capped_rejection_feedback=capped_rejection_feedback,
+        )
+        return allocation.as_prompt_blocks()
+
+    def _infer_context_scope(self, mode: str) -> str:
+        if mode == "final_solver":
+            return "final_solver"
+        if mode == "subproof":
+            return "subproof"
+        if self._state.phase == "recursive_brainstorm" or self._current_working_proof_attempt:
+            return "recursive_brainstorm"
+        return "brainstorm"
+
+    async def _set_current_working_proof_attempt(
+        self,
+        *,
+        trigger: str,
+        requested_path: str,
+        stuck_reason: str,
+    ) -> None:
+        master_proof = await self._read_master_proof()
+        if master_proof:
+            self._set_master_proof_metadata(master_proof)
+        prompt_safe_stuck_reason = _remove_attempt_count_language(
+            stuck_reason or self._state.master_proof_last_stuck_reason or "Final proof needs more context."
+        )
+        summary = self._summarize_error(
+            f"{trigger}: {prompt_safe_stuck_reason}",
+            limit=500,
+        )
+        self._current_working_proof_attempt = {
+            "session_id": self._state.session_id,
+            "trigger": trigger,
+            "requested_path": requested_path,
+            "stuck_reason": self._summarize_error(prompt_safe_stuck_reason, limit=1200),
+            "summary": summary,
+            "master_proof_version": self._state.master_proof_version,
+            "master_proof_hash": self._state.master_proof_hash,
+            "master_proof_line_count": self._state.master_proof_line_count,
+            "master_proof_char_count": self._state.master_proof_char_count,
+            "master_proof_last_edit_summary": self._state.master_proof_last_edit_summary,
+            "created_at": datetime.now().isoformat(),
+        }
+
+    async def _working_proof_attempt_context_packet(self) -> Optional[dict[str, Any]]:
+        if not self._current_working_proof_attempt:
+            return None
+        master_proof = await self._read_master_proof()
+        if master_proof:
+            self._set_master_proof_metadata(master_proof)
+        old_attempt_before_redo = await self._read_master_proof_old_attempt_before_redo()
+        packet = dict(self._current_working_proof_attempt)
+        packet.update(
+            {
+                "master_proof": master_proof,
+                "master_proof_version": self._state.master_proof_version,
+                "master_proof_hash": self._state.master_proof_hash,
+                "master_proof_line_count": self._state.master_proof_line_count,
+                "master_proof_char_count": self._state.master_proof_char_count,
+                "master_proof_last_edit_summary": self._state.master_proof_last_edit_summary,
+                "old_attempt_before_redo": old_attempt_before_redo,
+                "old_attempt_before_redo_version": self._state.master_proof_old_attempt_before_redo_version,
+                "old_attempt_before_redo_hash": self._state.master_proof_old_attempt_before_redo_hash,
+                "old_attempt_before_redo_line_count": self._state.master_proof_old_attempt_before_redo_line_count,
+                "old_attempt_before_redo_char_count": self._state.master_proof_old_attempt_before_redo_char_count,
+                "old_attempt_before_redo_summary": self._state.master_proof_old_attempt_before_redo_summary,
+                "old_attempt_before_redo_validator_justification": (
+                    self._state.master_proof_old_attempt_before_redo_validator_justification
+                ),
+                "old_attempt_before_redo_apparent_issue": (
+                    self._state.master_proof_old_attempt_before_redo_apparent_issue
+                ),
+                "recent_final_attempts": leanoj_context_manager._format_attempts(self._final_attempts[-10:]),
+                "verified_subproofs": self._verified_subproof_dicts(),
+                "partial_final_proofs": [
+                    proof for proof in self._partial_proofs[-10:] if str(proof.get("target") or "") == "final"
+                ],
+            }
+        )
+        return packet
+
+    def _clear_current_final_cycle_packet(self) -> None:
+        """Clear one-shot direct final-cycle context after its next phase has completed."""
+        self._current_final_cycle_packet = None
+
+    @staticmethod
+    def _format_capped_rejection_feedback(
+        title: str,
+        records: list[dict[str, Any]],
+        *,
+        limit: int,
+    ) -> str:
+        visible = [record for record in records[-limit:] if isinstance(record, dict)]
+        if not visible:
+            return ""
+        lines = [title]
+        for index, record in enumerate(visible, start=1):
+            lines.append(
+                f"{index}. {_remove_attempt_count_language(record.get('request', 'proof feedback'))} :: "
+                f"{_remove_attempt_count_language(record.get('error_summary', record.get('error_output', '')))}"
+            )
+            lean_feedback = _remove_attempt_count_language(record.get("lean_feedback") or "")
+            if lean_feedback:
+                lines.append(f"   Lean feedback: {lean_feedback}")
+        return "\n".join(lines)
+
+    @staticmethod
+    def _is_final_prompt_feedback_safe(record: dict[str, Any]) -> bool:
+        text = "\n".join(
+            str(record.get(key) or "")
+            for key in ("request", "error_summary", "error_output", "lean_feedback", "reasoning")
+        ).lower()
+        if not text.strip():
+            return False
+        blocked_terms = (
+            "brainstorm",
+            "need_more_brainstorming",
+            "stuck_needs_brainstorm",
+            "final proof solver proof cycle",
+            "failed-attempt count",
+            "failed attempts",
+        )
+        if not any(term in text for term in blocked_terms):
+            return True
+        concrete_terms = (
+            "old_string",
+            "unexpected token",
+            "missing cases",
+            "unsolved goals",
+            "error:",
+            "rejected",
+            "invalid",
+            "json",
+            "max_tokens",
+            "lean",
+            "verification",
+            "watchdog",
+        )
+        return any(term in text for term in concrete_terms)
+
+    def _record_final_context_event(
+        self,
+        event_type: str,
+        *,
+        request: str,
+        error_summary: str = "",
+        lean_feedback: str = "",
+        reasoning: str = "",
+    ) -> None:
+        record = {
+            "event_type": event_type,
+            "request": self._summarize_error(request, limit=300),
+            "error_summary": self._summarize_error(error_summary, limit=1200),
+            "lean_feedback": self._summarize_error(lean_feedback, limit=1200),
+            "reasoning": self._summarize_error(reasoning, limit=800),
+            "created_at": datetime.now().isoformat(),
+        }
+        self._final_context_events.append(record)
+        self._final_context_events = self._final_context_events[-50:]
+
+    def _final_solver_failure_window(self) -> list[dict[str, Any]]:
+        recent_events = [
+            event
+            for event in self._final_context_events[-5:]
+            if isinstance(event, dict)
+        ]
+        return [
+            event
+            for event in recent_events
+            if event.get("event_type") == "failure" and self._is_final_prompt_feedback_safe(event)
+        ]
+
+    def _master_proof_path(self, session_id: str = "") -> Path:
+        resolved_session_id = session_id or self._state.session_id or "latest"
+        return self._sessions_base_dir() / resolved_session_id / "master_proof.lean"
+
+    def _master_proof_old_attempt_before_redo_path(self, session_id: str = "") -> Path:
+        resolved_session_id = session_id or self._state.session_id or "latest"
+        return self._sessions_base_dir() / resolved_session_id / "master_proof_old_attempt_before_redo.lean"
+
+    def _master_proof_edit_log_path(self, session_id: str = "") -> Path:
+        resolved_session_id = session_id or self._state.session_id or "latest"
+        return self._sessions_base_dir() / resolved_session_id / "master_proof_edits.jsonl"
+
+    def _master_proof_snapshot_log_path(self, session_id: str = "") -> Path:
+        resolved_session_id = session_id or self._state.session_id or "latest"
+        return self._sessions_base_dir() / resolved_session_id / "master_proof_snapshots.jsonl"
+
+    @staticmethod
+    def _hash_master_proof(content: str) -> str:
+        return hashlib.sha256((content or "").encode("utf-8")).hexdigest() if content else ""
+
+    def _set_master_proof_metadata(
+        self,
+        content: str,
+        *,
+        summary: str = "",
+        increment_version: bool = False,
+    ) -> None:
+        if increment_version:
+            self._state.master_proof_version += 1
+        self._state.master_proof_initialized = bool((content or "").strip())
+        self._state.master_proof_hash = self._hash_master_proof(content)
+        self._state.master_proof_char_count = len(content or "")
+        self._state.master_proof_line_count = len((content or "").splitlines()) if content else 0
+        if summary:
+            self._state.master_proof_last_edit_summary = self._summarize_error(summary, limit=500)
+
+    async def _read_master_proof(self) -> str:
+        path = self._master_proof_path()
+        if not path.exists():
+            return ""
+        try:
+            async with aiofiles.open(path, "r", encoding="utf-8") as f:
+                return await f.read()
+        except Exception as exc:
+            logger.warning("Failed to read Proof Solver master proof from %s: %s", path, exc)
+            return ""
+
+    async def _write_master_proof(self, content: str, *, summary: str = "") -> None:
+        path = self._master_proof_path()
+        path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(path, "w", encoding="utf-8") as f:
+            await f.write(content or "")
+        self._set_master_proof_metadata(content or "", summary=summary, increment_version=True)
+
+    async def _read_master_proof_old_attempt_before_redo(self) -> str:
+        path = self._master_proof_old_attempt_before_redo_path()
+        if not path.exists():
+            return ""
+        try:
+            async with aiofiles.open(path, "r", encoding="utf-8") as f:
+                return await f.read()
+        except Exception as exc:
+            logger.warning("Failed to read Proof Solver old attempt before redo from %s: %s", path, exc)
+            return ""
+
+    async def _write_master_proof_old_attempt_before_redo(self, content: str) -> None:
+        path = self._master_proof_old_attempt_before_redo_path()
+        path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(path, "w", encoding="utf-8") as f:
+            await f.write(content or "")
+
+    async def _append_master_proof_edit(self, record: dict[str, Any]) -> None:
+        path = self._master_proof_edit_log_path()
+        path.parent.mkdir(parents=True, exist_ok=True)
+        payload = {
+            "session_id": self._state.session_id,
+            "master_proof_version": self._state.master_proof_version,
+            "created_at": datetime.now().isoformat(),
+            **record,
+        }
+        async with aiofiles.open(path, "a", encoding="utf-8") as f:
+            await f.write(json.dumps(payload, ensure_ascii=False) + "\n")
+        await self._compact_master_proof_edit_log_if_needed()
+
+    async def get_master_proof_draft(self) -> dict[str, Any]:
+        content = await self._read_master_proof()
+        if content:
+            self._set_master_proof_metadata(content)
+        return {
+            "session_id": self._state.session_id,
+            "exists": bool(content.strip()),
+            "content": content,
+            "metadata": self._master_proof_metadata_payload(),
+        }
+
+    async def get_master_proof_edit_summaries(self, *, limit: int = 50) -> dict[str, Any]:
+        safe_limit = max(1, min(500, int(limit or 50)))
+        records = self._read_master_proof_edit_records()
+        visible = records[-safe_limit:]
+        return {
+            "session_id": self._state.session_id,
+            "total_edits": len(records),
+            "limit": safe_limit,
+            "edits": [self._summarize_master_proof_edit_record(record) for record in visible],
+            "metadata": self._master_proof_metadata_payload(),
+        }
+
+    def _master_proof_metadata_payload(self) -> dict[str, Any]:
+        return {
+            "initialized": self._state.master_proof_initialized,
+            "version": self._state.master_proof_version,
+            "sha256": self._state.master_proof_hash,
+            "line_count": self._state.master_proof_line_count,
+            "char_count": self._state.master_proof_char_count,
+            "last_edit_summary": self._state.master_proof_last_edit_summary,
+            "last_stuck_reason": self._state.master_proof_last_stuck_reason,
+        }
+
+    def _read_master_proof_edit_records(self, session_id: str = "") -> list[dict[str, Any]]:
+        path = self._master_proof_edit_log_path(session_id)
+        if not path.exists():
+            return []
+        records: list[dict[str, Any]] = []
+        try:
+            for line in path.read_text(encoding="utf-8").splitlines():
+                if not line.strip():
+                    continue
+                item = json.loads(line)
+                if isinstance(item, dict):
+                    records.append(item)
+        except Exception as exc:
+            logger.warning("Failed to read Proof Solver master proof edit log %s: %s", path, exc)
+        return records
+
+    def _summarize_master_proof_edit_record(self, record: dict[str, Any]) -> dict[str, Any]:
+        summary_keys = [
+            "session_id",
+            "master_proof_version",
+            "created_at",
+            "action",
+            "operation",
+            "accepted",
+            "needs_more_time",
+            "requested_path",
+            "master_proof_hash",
+            "master_proof_line_count",
+            "master_proof_char_count",
+        ]
+        summary = {key: record.get(key) for key in summary_keys if key in record}
+        for key in ("reasoning", "stuck_reason", "error_summary", "validator_feedback", "validator_reasoning"):
+            if record.get(key):
+                summary[key] = self._summarize_error(str(record.get(key)), limit=500)
+        if isinstance(record.get("shortening_metrics"), dict):
+            summary["shortening_metrics"] = record.get("shortening_metrics")
+        if record.get("old_string"):
+            summary["old_string_preview"] = self._summarize_error(str(record.get("old_string")), limit=240)
+        if record.get("new_string"):
+            summary["new_string_preview"] = self._summarize_error(str(record.get("new_string")), limit=240)
+            summary["new_string_char_count"] = len(str(record.get("new_string") or ""))
+        return summary
+
+    async def _compact_master_proof_edit_log_if_needed(self) -> None:
+        path = self._master_proof_edit_log_path()
+        records = self._read_master_proof_edit_records()
+        if len(records) <= _MASTER_PROOF_EDIT_LOG_COMPACT_RECORD_LIMIT:
+            return
+
+        keep_count = min(_MASTER_PROOF_EDIT_LOG_RECENT_RECORDS_TO_KEEP, len(records))
+        retained = records[-keep_count:]
+        compacted_count = len(records) - len(retained)
+        current_proof = await self._read_master_proof()
+        snapshot = {
+            "session_id": self._state.session_id,
+            "created_at": datetime.now().isoformat(),
+            "snapshot_kind": "master_proof_edit_log_compaction",
+            "compacted_edit_count": compacted_count,
+            "retained_edit_count": len(retained),
+            "master_proof_version": self._state.master_proof_version,
+            "master_proof_hash": self._hash_master_proof(current_proof),
+            "master_proof_line_count": len(current_proof.splitlines()) if current_proof else 0,
+            "master_proof_char_count": len(current_proof or ""),
+            "first_compacted_edit": self._summarize_master_proof_edit_record(records[0]),
+            "last_compacted_edit": self._summarize_master_proof_edit_record(records[compacted_count - 1]),
+        }
+        snapshot_path = self._master_proof_snapshot_log_path()
+        snapshot_path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(snapshot_path, "a", encoding="utf-8") as f:
+            await f.write(json.dumps(snapshot, ensure_ascii=False) + "\n")
+        await self._write_jsonl_records(path, retained)
+
+    @staticmethod
+    async def _write_jsonl_records(path: Path, records: list[dict[str, Any]]) -> None:
+        path.parent.mkdir(parents=True, exist_ok=True)
+        async with aiofiles.open(path, "w", encoding="utf-8") as f:
+            for record in records:
+                await f.write(json.dumps(record, ensure_ascii=False) + "\n")
+
+    def _select_master_proof_seed(self, request: LeanOJStartRequest) -> str:
+        """Choose the text that seeds a brand-new master proof.
+
+        Final-target partial proofs are scanned newest-first, then final attempts newest-first. The
+        first candidate that passes its eligibility check and yields no final-solution integrity
+        error wins; when none qualifies, the stripped Lean template is returned.
+        """
+        template = request.lean_template
+        # Pass 1: partial proofs captured for the final target.
+        for partial in reversed(self._partial_proofs):
+            if str(partial.get("target") or "") == "final":
+                code = str(partial.get("lean_code") or "").strip()
+                eligible = bool(code) and self._is_high_value_master_seed_partial(request, partial, code)
+                if eligible and not self._validate_final_solution_integrity(template, code):
+                    return code
+        # Pass 2: earlier final attempts that pass the explicit seed-candidate check.
+        for attempt in reversed(self._final_attempts):
+            code = str(attempt.get("lean_code") or "").strip()
+            eligible = bool(code) and self._is_explicit_master_seed_candidate(request, attempt, code)
+            if eligible and not self._validate_final_solution_integrity(template, code):
+                return code
+        return template.strip()
+
+    def _is_high_value_master_seed_partial(
+        self,
+        request: LeanOJStartRequest,
+        proof: dict[str, Any],
+        lean_code: str,
+    ) -> bool:
+        """Return whether a captured partial proof may seed the durable master proof.
+
+        Delegates to the explicit seed-candidate check and additionally requires that the
+        partial's Lean code still contains placeholder tokens.
+        """
+        verdict = self._is_explicit_master_seed_candidate(request, proof, lean_code, require_placeholders=True)
+        return verdict
+
+    def _is_explicit_master_seed_candidate(
+        self,
+        request: LeanOJStartRequest,
+        record: dict[str, Any],
+        lean_code: str,
+        *,
+        require_placeholders: bool = False,
+    ) -> bool:
+        """Decide whether a stored proof record is allowed to seed the master proof.
+
+        The record must carry `high_value_scaffold` or `master_seed_eligible` set to exactly True and
+        hold non-blank Lean code that differs from the Lean template after normalization; with
+        `require_placeholders` the code must also still contain placeholder tokens. A record whose
+        request/reasoning/error_summary text contains a blocked phrase is refused.
+        """
+        flagged = any(record.get(flag) is True for flag in ("high_value_scaffold", "master_seed_eligible"))
+        if not flagged or not lean_code.strip():
+            return False
+        if require_placeholders and not self._placeholder_tokens(lean_code):
+            return False
+        normalize = self._normalize_lean_for_template_check
+        if normalize(lean_code) == normalize(request.lean_template):
+            return False
+        # Case-insensitive scan of the record's free-text fields for any blocked phrase.
+        haystack = " ".join(str(record.get(field) or "").lower() for field in ("request", "reasoning", "error_summary"))
+        for phrase in (
+            "template unchanged", "minimal scaffold", "best achievable",
+            "infeasible", "cannot be completed", "sorry placeholders",
+        ):
+            if phrase in haystack:
+                return False
+        return True
+
+    async def _ensure_master_proof_initialized(self, request: LeanOJStartRequest) -> str:
+        """Return the stored master proof, creating and logging a seeded draft when none exists yet."""
+        existing = await self._read_master_proof()
+        if existing.strip():
+            self._set_master_proof_metadata(existing)
+            return existing
+        # No non-blank draft stored yet: seed one, record the seeding edit, then persist and broadcast.
+        seed = self._select_master_proof_seed(request)
+        init_record = {
+            "action": "initialize_master_proof",
+            "operation": "full_content",
+            "reasoning": "Seeded the durable master proof draft from existing Proof Solver context.",
+            "new_string": seed,
+        }
+        await self._write_master_proof(seed, summary="Initialized Proof Solver master proof draft")
+        await self._append_master_proof_edit(init_record)
+        await self._persist_and_broadcast("leanoj_master_proof_initialized")
+        return seed
+
+    @staticmethod
+    def _normalize_final_solver_edit(raw: dict[str, Any]) -> dict[str, Any]:
+        """Coerce a raw final-solver JSON reply into the canonical master-proof edit dict.
+
+        `needs_more_time` is parsed textually when it arrives as a string, because bool("false") is True.
+        """
+        if raw.get("lean_code") and not raw.get("action"):
+            return {
+                "action": "edit_proof", "operation": "full_content", "old_string": "",
+                "new_string": str(raw.get("lean_code") or ""), "needs_more_time": False,
+                "reasoning": str(raw.get("reasoning") or "Legacy whole-file final proof response."),
+            }
+        flag = raw.get("needs_more_time")
+        if isinstance(flag, str):  # only an explicit affirmative string counts as True
+            flag = flag.strip().lower() in ("true", "yes", "1")
+        action = str(raw.get("action") or "").strip()
+        return {
+            "action": action or ("edit_proof" if raw.get("operation") else ""),
+            "operation": str(raw.get("operation") or "").strip(),
+            "old_string": str(raw.get("old_string") or ""),
+            "new_string": str(raw.get("new_string") or ""),
+            "needs_more_time": bool(flag),
+            "reasoning": str(raw.get("reasoning") or raw.get("summary") or "").strip(),
+            "stuck_reason": str(raw.get("stuck_reason") or raw.get("reasoning") or "").strip(),
+            "requested_path": str(raw.get("requested_path") or raw.get("path") or "").strip(),
+        }
+
+    def _apply_master_proof_edit(self, current_proof: str, edit: dict[str, Any]) -> tuple[Optional[str], str]:
+        """Apply one normalized final-solver edit to the master proof text.
+
+        Returns `(updated_proof, "")` on success, or `(None, error_message)` when the action or operation is
+        unknown, a required string is missing, or `old_string` does not occur exactly once. `insert_after`
+        keeps the indentation of the inserted text and of the line after it (Lean 4 is layout-sensitive).
+        """
+        action = str(edit.get("action") or "").strip()
+        if action not in _LEANOJ_PROOF_EDIT_ACTIONS:
+            return None, (
+                f"Invalid final solver action `{action}`. Final proof mode accepts only `edit_proof`; "
+                "phase transitions are selected by the separate path-decision mode."
+            )
+        operation = str(edit.get("operation") or "").strip()
+        old_string = str(edit.get("old_string") or "")
+        new_string = str(edit.get("new_string") or "")
+        if operation not in _LEANOJ_PROOF_EDIT_OPERATIONS:
+            return None, f"Invalid master proof edit operation `{operation}`. Use full_content, replace, insert_after, or delete."
+        if operation == "full_content":
+            if not new_string.strip():
+                return None, "full_content requires non-empty new_string Lean code."
+            return new_string.strip(), ""
+
+        if not current_proof.strip():
+            return None, f"Master proof is empty; operation `{operation}` must be full_content."
+        if not old_string:
+            return None, f"Operation `{operation}` requires a non-empty old_string copied from the current master proof."
+        match_count = current_proof.count(old_string)
+        if match_count == 0:
+            return None, "old_string was not found verbatim in the current master proof."
+        if match_count > 1:
+            return None, f"old_string appears {match_count} times in the current master proof; include more context."
+
+        if operation == "replace":
+            return current_proof.replace(old_string, new_string, 1), ""
+        if operation == "insert_after":
+            if not new_string.strip():
+                return None, "insert_after requires non-empty new_string Lean code."
+            def drop_blank_head(text: str) -> str:
+                # Remove leading blank lines only; the first content line keeps its own indentation.
+                body_start = len(text) - len(text.lstrip())
+                return text[text.rfind("\n", 0, body_start) + 1:] if body_start < len(text) else ""
+            insert_pos = current_proof.find(old_string) + len(old_string)
+            head, tail = current_proof[:insert_pos].rstrip(), drop_blank_head(current_proof[insert_pos:])
+            return f"{head}\n\n{drop_blank_head(new_string).rstrip()}\n\n{tail}", ""
+        if operation == "delete":
+            updated = current_proof.replace(old_string, "", 1)
+            while "\n\n\n" in updated:
+                updated = updated.replace("\n\n\n", "\n\n")
+            return updated, ""
+
+        return None, f"Unsupported master proof edit operation `{operation}`."
+
+    @classmethod
+    def _master_proof_shortening_metrics(cls, before_proof: str, after_proof: str) -> dict[str, Any]:
+        """Measure how an edit changed the proof's character, line, and placeholder counts.
+
+        Removed/added deltas are clamped at zero; the char ratio is 1.0 when the old proof is empty.
+        """
+        old_text, new_text = before_proof or "", after_proof or ""
+        old_chars, new_chars = len(old_text), len(new_text)
+        old_lines, new_lines = len(old_text.splitlines()), len(new_text.splitlines())
+        old_holes, new_holes = len(cls._placeholder_tokens(old_text)), len(cls._placeholder_tokens(new_text))
+        return {
+            "before_char_count": old_chars,
+            "after_char_count": new_chars,
+            "char_delta_removed": max(0, old_chars - new_chars),
+            "before_line_count": old_lines,
+            "after_line_count": new_lines,
+            "line_delta_removed": max(0, old_lines - new_lines),
+            "before_placeholder_count": old_holes,
+            "after_placeholder_count": new_holes,
+            "placeholder_delta_added": max(0, new_holes - old_holes),
+            "after_to_before_char_ratio": round(new_chars / old_chars, 4) if old_chars else 1.0,
+        }
+
+    @staticmethod
+    def _should_validate_master_proof_shortening_edit(edit: dict[str, Any], metrics: dict[str, Any]) -> bool:
+        """Tell whether an edit removed enough material to need the shortening validator.
+
+        Never true unless characters were removed; then any lost line, a removal at or above the char
+        threshold, any added placeholder, or a `delete` operation triggers validation.
+        """
+        removed_chars = int(metrics.get("char_delta_removed") or 0)
+        removed_lines = int(metrics.get("line_delta_removed") or 0)
+        added_placeholders = int(metrics.get("placeholder_delta_added") or 0)
+        if removed_chars <= 0:
+            return False
+        is_delete = str(edit.get("operation") or "").strip() == "delete"
+        return removed_lines > 0 or removed_chars >= _MASTER_PROOF_SHORTENING_CHAR_THRESHOLD or added_placeholders > 0 or is_delete
+
+    async def _validate_master_proof_shortening_edit(
+        self,
+        request: LeanOJStartRequest,
+        edit: dict[str, Any],
+        before_proof: str,
+        after_proof: str,
+        metrics: dict[str, Any],
+    ) -> tuple[bool, str, str, str, str]:
+        """Ask the brainstorm validator model whether a proof-shortening edit may stand.
+
+        Broadcasts a validation-started event, sends the before/after proofs together with the edit
+        and its metrics to the validator, and interprets the JSON reply. Only a `decision` equal to
+        "accept" (after trimming and lower-casing) approves the edit.
+
+        Returns:
+            `(accepted, feedback, reasoning, approval_justification, apparent_issue)`. The last two
+            are "" on rejection; blank reply fields fall back to the default wording below.
+        """
+        started_payload = {
+            "master_proof_version": self._state.master_proof_version,
+            "operation": str(edit.get("operation") or ""),
+            "char_delta_removed": metrics.get("char_delta_removed", 0),
+            "line_delta_removed": metrics.get("line_delta_removed", 0),
+        }
+        await self._broadcast("leanoj_master_proof_edit_validation_started", started_payload)
+        prompt = build_master_proof_edit_validation_prompt(
+            request.user_prompt, request.lean_template, before_proof, after_proof, edit, metrics
+        )
+        raw = await self._call_json(
+            request.brainstorm_validator,
+            "leanoj_master_proof_edit_val",
+            "leanoj_master_proof_edit_validator",
+            prompt,
+        )
+
+        def pick(*keys: str, default: str = "") -> str:
+            # First truthy reply value among `keys`, else `default`; always returned as a stripped string.
+            return str(next((raw[key] for key in keys if raw.get(key)), default)).strip()
+
+        decision = str(raw.get("decision") or "").strip().lower()
+        reasoning = pick("reasoning", "summary")
+        feedback = pick("feedback_to_submitter", "summary", default=reasoning)
+        approval_justification = pick("shortening_approval_justification", "approval_justification", default=reasoning)
+        apparent_issue = pick("apparent_issue_with_old_attempt", "old_attempt_apparent_issue", "old_attempt_issue")
+        if decision != "accept":
+            return (
+                False,
+                feedback or "Restore the deleted proof progress or replace it with an equivalent stronger proof before shortening.",
+                reasoning or "Master proof edit validator rejected the shortening as non-progressive.",
+                "",
+                "",
+            )
+        accepted_reasoning = reasoning or "Master proof edit validator accepted the shortening as progressive."
+        return (
+            True,
+            feedback,
+            accepted_reasoning,
+            approval_justification or accepted_reasoning,
+            apparent_issue
+            or "Validator judged the removed material redundant, superseded, or less progressive than the shorter edit.",
+        )
+
+    def _build_master_proof_direct_context(
+        self,
+        master_proof: str,
+        request: LeanOJStartRequest,
+        context_blocks: dict[str, str] | None,
+    ) -> tuple[str, dict[str, Any]]:
+        """Return the whole proof for direct prompt injection plus token metadata, or fail if it cannot fit.
+
+        The proof budget is the final solver's available input tokens minus the tokens of the user prompt,
+        Lean template and joined context blocks, the prompt-assembly overhead estimate, and a fixed 2500.
+
+        Raises:
+            LeanOJConfigurationError: the proof (the Lean template when `master_proof` is empty) is over budget.
+        """
+        solver = request.final_solver
+        proof = master_proof or request.lean_template
+        proof_tokens = count_tokens(proof)
+        available_input = rag_config.get_available_input_tokens(solver.context_window, solver.max_output_tokens)
+        joined_blocks = "\n\n".join(str(value) for value in (context_blocks or {}).values() if value)
+        nonproof_tokens = sum(count_tokens(part) for part in (request.user_prompt, request.lean_template, joined_blocks))
+        nonproof_tokens += rag_config.get_prompt_assembly_overhead_estimate() + 2500
+        proof_token_budget = available_input - nonproof_tokens
+        if proof_tokens <= proof_token_budget:
+            return proof, {
+                "direct_context_mode": "full_mandatory",
+                "master_proof_tokens": proof_tokens,
+                "mandatory_direct_proof_token_budget": proof_token_budget,
+            }
+        raise LeanOJConfigurationError(
+            "PROOF SOLVER MANDATORY DIRECT CONTEXT OVERFLOW: The full master proof is mandatory direct-inject "
+            "context and cannot be truncated, summarized, windowed, or RAG-substituted. "
+            f"Full master proof tokens: {proof_tokens}. Available mandatory direct-inject proof budget after "
+            f"user prompt, Lean template, proof memory, schema, and output reserve: {proof_token_budget}. "
+            f"Configured final-solver context window: {solver.context_window}. "
+            f"Configured final-solver max output tokens: {solver.max_output_tokens}. "
+            "Increase the final solver context window or reduce other mandatory prompt context before resuming."
+        )
+
+    @classmethod
+    def _normalize_master_proof_for_progress(cls, content: str) -> str:  # form compared by the no-progress watchdog; falsy content counts as ""
+        return cls._normalize_lean_for_template_check(strip_lean_comments_and_strings(content or ""))
+
+    def _record_master_proof_progress(
+        self,
+        edit: dict[str, Any],
+        before_proof: str,
+        after_proof: str,
+    ) -> str:
+        """Update the no-progress watchdog for one applied edit; return a handoff reason once it trips.
+
+        A step counts as "no progress" when the proof hash is unchanged, the progress-normalized proof
+        text is unchanged, or the edit signature equals the previous step's signature. Any other step
+        resets the counter. Returns "" while the counter is below `_MASTER_PROOF_NO_PROGRESS_LIMIT`;
+        otherwise returns a "; "-joined sentence describing what the latest step failed to change.
+        """
+        same_hash = self._hash_master_proof(before_proof) == self._hash_master_proof(after_proof)
+        normalize = self._normalize_master_proof_for_progress
+        same_code = normalize(before_proof) == normalize(after_proof)
+        signature = self._master_proof_edit_signature(edit)
+        same_region = bool(signature and signature == self._last_master_proof_edit_signature)
+
+        stalled = same_hash or same_code or same_region
+        self._master_proof_no_progress_count = (self._master_proof_no_progress_count + 1) if stalled else 0
+        # Remember this signature so the next step can be compared against it.
+        self._last_master_proof_edit_signature = signature
+        if self._master_proof_no_progress_count < _MASTER_PROOF_NO_PROGRESS_LIMIT:
+            return ""
+
+        # Limit reached: build the explanation from the latest step's flags.
+        clauses = [f"LeanOJ final solver made {_MASTER_PROOF_NO_PROGRESS_LIMIT} consecutive edit-only steps"]
+        if same_code:
+            clauses.append("without changing non-comment Lean code")
+        elif same_hash:
+            clauses.append("without changing the master proof hash")
+        if same_region:
+            clauses.append("while repeatedly editing/inserting at the same proof region")
+        clauses.append("so the run is returning to recursive brainstorming for fresh context instead of looping indefinitely.")
+        return "; ".join(clauses)
+
+    def _reset_master_proof_progress_watchdog(self) -> None:
+        """Clear the no-progress counter and the remembered edit signature."""
+        self._master_proof_no_progress_count, self._last_master_proof_edit_signature = 0, ""
+
+    @classmethod
+    def _master_proof_edit_signature(cls, edit: dict[str, Any]) -> str:
+        """Build an `operation:sha256` key for an edit so consecutive edits to the same text can be detected."""
+        operation = str(edit.get("operation") or "")
+        if operation == "full_content":
+            # Whole-file edits are keyed on the first 1000 normalized characters of the new content.
+            basis = cls._normalize_master_proof_for_progress(str(edit.get("new_string") or ""))[:1000]
+        elif anchor := str(edit.get("old_string") or ""):
+            basis = cls._normalize_master_proof_for_progress(anchor)
+        else:
+            return operation
+        return f"{operation}:{hashlib.sha256(basis.encode('utf-8')).hexdigest()}"
+
+    @staticmethod
+    def _final_cycle_should_handoff_to_recursive(cycle_attempts: list[dict[str, Any]]) -> bool:
+        """Report whether this cycle's attempts warrant handing off to recursive brainstorming.
+
+        True when any attempt's `request` is the progress-watchdog marker, or when the number of
+        "old_string was not found verbatim" failures reaches the stale-edit handoff count.
+        """
+        watchdog_request = "final Proof Solver master proof progress watchdog"
+        for attempt in cycle_attempts:
+            if str(attempt.get("request") or "") == watchdog_request:
+                return True
+        stale_hits = [a for a in cycle_attempts if "old_string was not found verbatim" in str(a.get("error_summary") or "")]
+        return len(stale_hits) >= _MASTER_PROOF_STALE_EDIT_FAILURE_HANDOFF_COUNT
+
+    @staticmethod
+    def _format_lean_success_feedback(lean_result: Lean4Result) -> str:
+        """Render a Lean result's diagnostics (or raw stderr) and goal states as feedback text."""
+        # Missing or falsy attributes read as empty strings.
+        def field(name: str) -> str:
+            return str(getattr(lean_result, name, "") or "").strip()
+
+        diagnostics = field("diagnostic_output") or field("raw_stderr")
+        goal_states = field("goal_states")
+        sections = [diagnostics] if diagnostics else []
+        sections += [f"Goal state output:\n{goal_states}"] if goal_states else []
+        return "\n\n".join(sections).strip() or "Lean 4 accepted with no diagnostics."
+
+    async def _review_final_solution_completion(
+        self,
+        request: LeanOJStartRequest,
+        *,
+        lean_code: str,
+        final_solver_reasoning: str,
+        lean_result: Lean4Result,
+    ) -> tuple[bool, str, str]:
+        """Have the final solver model judge whether Lean-accepted code really solves the problem.
+
+        Returns:
+            `(solved, message, lean_feedback)`. `message` is the review reasoning when solved, otherwise the
+            continuation feedback (falling back to the reasoning, then to default wording). `lean_feedback`
+            is the formatted Lean output that was passed to the review prompt. A non-boolean `solved`
+            reply counts as solved only when its text is "true" (case-insensitive).
+        """
+        lean_feedback = self._format_lean_success_feedback(lean_result)
+        review_prompt = build_final_solution_review_prompt(
+            request.user_prompt, request.lean_template, lean_code, final_solver_reasoning, lean_feedback
+        )
+        raw = await self._call_json(request.final_solver, "leanoj_final_review", "leanoj_final_solver", review_prompt)
+
+        verdict = raw.get("solved")
+        if not isinstance(verdict, bool):
+            verdict = str(verdict).strip().lower() == "true"
+        reasoning = str(raw.get("reasoning") or raw.get("summary") or "").strip()
+        continuation_feedback = str(raw.get("continuation_feedback") or "").strip()
+
+        if not verdict:
+            fallback = "Final solver review rejected this Lean-accepted code as not complete."
+            return False, continuation_feedback or reasoning or fallback, lean_feedback
+        return True, reasoning or "Final solver review accepted the Lean-verified solution.", lean_feedback
+
+    async def _check_master_proof_edit_before_persist(
+        self,
+        request: LeanOJStartRequest,
+        *,
+        lean_code: str,
+        needs_more_time: bool,
+        attempt_number: int,
+        reasoning: str,
+        final_solver_metadata: dict[str, Any],
+    ) -> tuple[Lean4Result, str]:
+        """Run Lean (and, for finished proofs, the follow-up gates) on an edited master proof.
+
+        With `needs_more_time` set, the code is checked with placeholders allowed and only the
+        final-solution integrity check is applied afterwards. Otherwise the code goes through
+        `_check_proof_and_capture_partial`, then the integrity check, the final-answer adequacy
+        check, and finally the final solver's own completion review.
+
+        Any gate that objects flips `lean_result.success` to False and stores its message in
+        `lean_result.error_output`. A rejected completion review is additionally appended to
+        `self._failed_feedback` and broadcast as `leanoj_final_solution_review_rejected`.
+
+        Returns:
+            `(lean_result, lean_pass_feedback)`, where the feedback is "" when Lean itself failed
+            and otherwise the formatted output of the successful Lean run.
+        """
+        if needs_more_time:
+            lean_result = await get_lean4_client().check_proof(
+                lean_code,
+                timeout=system_config.lean4_proof_timeout,
+                allow_placeholders=True,
+            )
+        else:
+            lean_result = await self._check_proof_and_capture_partial(
+                request,
+                lean_code,
+                target="final",
+                attempt_number=attempt_number,
+                proof_request="final Proof Solver solution",
+                reasoning=reasoning,
+            )
+        if not lean_result.success:
+            return lean_result, ""
+
+        lean_pass_feedback = self._format_lean_success_feedback(lean_result)
+        # Integrity always applies; adequacy is only checked when the proof is submitted as finished.
+        gate_error = self._validate_final_solution_integrity(request.lean_template, lean_code)
+        if not gate_error and not needs_more_time:
+            gate_error = self._validate_final_answer_adequacy(request.lean_template, lean_code)
+        if gate_error:
+            lean_result.success = False
+            lean_result.error_output = gate_error
+        if needs_more_time or gate_error:
+            return lean_result, lean_pass_feedback
+
+        review_solved, review_feedback, lean_pass_feedback = await self._review_final_solution_completion(
+            request,
+            lean_code=lean_code,
+            final_solver_reasoning=reasoning,
+            lean_result=lean_result,
+        )
+        if review_solved:
+            return lean_result, lean_pass_feedback
+
+        lean_result.success = False
+        lean_result.error_output = (
+            "PROOF SOLVER FINAL SOLUTION REVIEW REJECTED: Lean 4 accepted the code, but the "
+            "Final Proof Solver judged that it does not yet solve the actual Proof Solver problem. "
+            f"Continuation feedback: {review_feedback}"
+        )
+        rejection_record = {
+            "request": "final Proof Solver solution semantic review",
+            "error_summary": self._summarize_error(lean_result.error_output, limit=1200),
+            "lean_feedback": self._summarize_error(lean_pass_feedback, limit=1200),
+            "lean_code": lean_code,
+        }
+        self._failed_feedback.append(rejection_record)
+        rejection_event = {
+            "attempt": attempt_number,
+            "continuation_feedback": self._summarize_error(review_feedback, limit=1200),
+            "lean_feedback": self._summarize_error(lean_pass_feedback, limit=1200),
+            **final_solver_metadata,
+        }
+        await self._persist_and_broadcast("leanoj_final_solution_review_rejected", rejection_event)
+        return lean_result, lean_pass_feedback
+
+    async def _final_proof_loop(self, request: LeanOJStartRequest) -> None:
+        if await self._consume_force_brainstorm():
+            return
+
+        self._state.phase = "final_proof_loop"
+        await self._persist_and_broadcast("leanoj_phase_changed")
+
+        await self._ensure_master_proof_initialized(request)
+        final_solver_metadata = {
+            "solver_model": request.final_solver.model_id,
+            "solver_provider": request.final_solver.provider,
+        }
+        failed_attempts_this_cycle = 0
+        cycle_start_attempt = self._state.final_attempt_count + 1
+        max_failed_attempts = max(1, request.final_attempts_per_cycle)
+        while not self._should_stop() and failed_attempts_this_cycle < max_failed_attempts:
+            if await self._consume_force_brainstorm():
+                return
+
+            current_master_proof = await self._read_master_proof()
+            self._set_master_proof_metadata(current_master_proof)
+            final_prompt_feedback = self._final_solver_failure_window()
+            await self._broadcast(
+                "leanoj_master_proof_edit_started",
+                {
+                    "next_verification_attempt": self._state.final_attempt_count + 1,
+                    "master_proof_version": self._state.master_proof_version,
+                },
+            )
+            try:
+                context_blocks = await self._build_context_blocks(
+                    request,
+                    request.final_solver,
+                    mode="final_solver",
+                    task_request="Edit the durable Proof Solver master proof and decide whether it is ready for Lean verification.",
+                    capped_rejection_feedback=self._format_capped_rejection_feedback(
+                        "RECENT PROOF FEEDBACK SUMMARIES",
+                        final_prompt_feedback,
+                        limit=10,
+                    ),
+                )
+                master_proof_direct_context, direct_context_metadata = self._build_master_proof_direct_context(
+                    current_master_proof,
+                    request,
+                    context_blocks,
+                )
+                raw = await self._call_json(
+                    request.final_solver,
+                    "leanoj_final",
+                    "leanoj_final_solver",
+                    build_final_solver_prompt(
+                        request.user_prompt,
+                        request.lean_template,
+                        master_proof_direct_context,
+                        {
+                            "version": self._state.master_proof_version,
+                            "line_count": self._state.master_proof_line_count,
+                            "char_count": self._state.master_proof_char_count,
+                            "sha256": self._state.master_proof_hash,
+                            "last_edit_summary": self._state.master_proof_last_edit_summary,
+                            "last_shortening_approval_justification": (
+                                self._state.master_proof_last_shortening_approval_justification
+                            ),
+                            "last_shortening_apparent_issue": self._state.master_proof_last_shortening_apparent_issue,
+                            **direct_context_metadata,
+                        },
+                        self._final_solver_active_plan_items(),
+                        self._final_solver_verified_subproof_dicts(),
+                        self._partial_proofs,
+                        final_prompt_feedback,
+                        self._final_attempts[-5:],
+                        context_blocks=context_blocks,
+                    ),
+                )
+            except asyncio.CancelledError:
+                raise
+            except LeanOJConfigurationError:
+                raise
+            except Exception as exc:
+                attempt_number = self._state.final_attempt_count + 1
+                self._state.final_attempt_count = attempt_number
+                failed_attempts_this_cycle += 1
+                error_text = f"Final solver failed before Lean verification: {type(exc).__name__}: {exc}"
+                attempt = LeanOJAttemptRecord(
+                    attempt=attempt_number,
+                    target="final",
+                    request="final Proof Solver master proof edit",
+                    success=False,
+                    error_output=error_text,
+                    reasoning="Model/API output could not be parsed or generated; retrying in the final loop.",
+                )
+                self._final_attempts.append(
+                    {
+                        "request": "final Proof Solver master proof edit",
+                        "error_summary": self._summarize_error(error_text, limit=1200),
+                        "lean_code": current_master_proof,
+                    }
+                )
+                self._record_final_context_event(
+                    "failure",
+                    request="final Proof Solver master proof edit",
+                    error_summary=error_text,
+                )
+                await self._persist_and_broadcast(
+                    "leanoj_final_attempt_failed",
+                    {"attempt": attempt.model_dump(mode="json"), **final_solver_metadata},
+                )
+                continue
+
+            edit = self._normalize_final_solver_edit(raw)
+            action = str(edit.get("action") or "")
+            reasoning = str(edit.get("reasoning") or "")
+            updated_master_proof, edit_error = self._apply_master_proof_edit(current_master_proof, edit)
+            if edit_error or updated_master_proof is None:
+                attempt_number = self._state.final_attempt_count + 1
+                self._state.final_attempt_count = attempt_number
+                failed_attempts_this_cycle += 1
+                error_text = f"MASTER PROOF EDIT REJECTED: {edit_error}"
+                attempt = LeanOJAttemptRecord(
+                    attempt=attempt_number,
+                    target="final",
+                    request="final Proof Solver master proof edit",
+                    lean_code=current_master_proof,
+                    success=False,
+                    error_output=error_text,
+                    reasoning=reasoning,
+                )
+                self._final_attempts.append(
+                    {
+                        "request": "final Proof Solver master proof edit",
+                        "error_summary": self._summarize_error(error_text, limit=1200),
+                        "lean_code": current_master_proof,
+                    }
+                )
+                self._record_final_context_event(
+                    "failure",
+                    request="final Proof Solver master proof edit",
+                    error_summary=error_text,
+                    reasoning=reasoning,
+                )
+                await self._append_master_proof_edit(
+                    {
+                        **edit,
+                        "accepted": False,
+                        "error_summary": self._summarize_error(error_text, limit=1200),
+                    }
+                )
+                await self._persist_and_broadcast(
+                    "leanoj_final_attempt_failed",
+                    {"attempt": attempt.model_dump(mode="json"), **final_solver_metadata},
+                )
+                continue
+
+            shortening_metrics = self._master_proof_shortening_metrics(current_master_proof, updated_master_proof)
+            shortening_approval_justification = ""
+            old_attempt_apparent_issue = ""
+            if self._should_validate_master_proof_shortening_edit(edit, shortening_metrics):
+                (
+                    edit_valid,
+                    validator_feedback,
+                    validator_reasoning,
+                    shortening_approval_justification,
+                    old_attempt_apparent_issue,
+                ) = await self._validate_master_proof_shortening_edit(
+                    request,
+                    edit,
+                    current_master_proof,
+                    updated_master_proof,
+                    shortening_metrics,
+                )
+                if not edit_valid:
+                    attempt_number = self._state.final_attempt_count + 1
+                    self._state.final_attempt_count = attempt_number
+                    failed_attempts_this_cycle += 1
+                    error_text = (
+                        "MASTER PROOF EDIT VALIDATOR REJECTED SHORTENING: "
+                        f"{validator_feedback}"
+                    )
+                    error_summary = self._summarize_error(error_text, limit=1200)
+                    self._failed_feedback.append(
+                        {
+                            "request": "final Proof Solver master proof edit validator",
+                            "error_summary": error_summary,
+                            "reasoning": self._summarize_error(validator_reasoning, limit=1200),
+                        }
+                    )
+                    attempt = LeanOJAttemptRecord(
+                        attempt=attempt_number,
+                        target="final",
+                        request="final Proof Solver master proof edit validator",
+                        lean_code=current_master_proof,
+                        success=False,
+                        error_output=error_text,
+                        reasoning=reasoning,
+                    )
+                    self._final_attempts.append(
+                        {
+                            "request": "final Proof Solver master proof edit validator",
+                            "error_summary": error_summary,
+                            "lean_code": current_master_proof,
+                            "validator_feedback": self._summarize_error(validator_feedback, limit=1200),
+                            "validator_reasoning": self._summarize_error(validator_reasoning, limit=1200),
+                        }
+                    )
+                    self._record_final_context_event(
+                        "failure",
+                        request="final Proof Solver master proof edit validator",
+                        error_summary=error_summary,
+                        reasoning=validator_reasoning,
+                    )
+                    await self._append_master_proof_edit(
+                        {
+                            **edit,
+                            "accepted": False,
+                            "error_summary": error_summary,
+                            "validator_feedback": self._summarize_error(validator_feedback, limit=1200),
+                            "validator_reasoning": self._summarize_error(validator_reasoning, limit=1200),
+                            "shortening_metrics": shortening_metrics,
+                        }
+                    )
+                    await self._persist_and_broadcast(
+                        "leanoj_master_proof_edit_rejected",
+                        {
+                            "attempt": attempt_number,
+                            "error_summary": error_summary,
+                            "validator_feedback": self._summarize_error(validator_feedback, limit=1200),
+                            "validator_reasoning": self._summarize_error(validator_reasoning, limit=1200),
+                            "shortening_metrics": shortening_metrics,
+                            **final_solver_metadata,
+                        },
+                    )
+                    await self._persist_and_broadcast(
+                        "leanoj_final_attempt_failed",
+                        {"attempt": attempt.model_dump(mode="json"), **final_solver_metadata},
+                    )
+                    continue
+
+            needs_more_time = bool(edit.get("needs_more_time"))
+            lean_code = updated_master_proof.strip()
+            attempt_number = self._state.final_attempt_count + 1
+            if not needs_more_time:
+                await self._broadcast(
+                    "leanoj_final_attempt_started",
+                    {"attempt": attempt_number, **final_solver_metadata},
+                )
+            lean_result, lean_pass_feedback = await self._check_master_proof_edit_before_persist(
+                request,
+                lean_code=lean_code,
+                needs_more_time=needs_more_time,
+                attempt_number=attempt_number,
+                reasoning=reasoning,
+                final_solver_metadata=final_solver_metadata,
+            )
+            if not lean_result.success:
+                self._state.final_attempt_count = attempt_number
+                failed_attempts_this_cycle += 1
+                failure_request = (
+                    "final Proof Solver master proof edit Lean gate"
+                    if needs_more_time
+                    else "final Proof Solver solution from master proof"
+                )
+                error_summary = self._summarize_error(lean_result.error_output, limit=1200)
+                attempt = LeanOJAttemptRecord(
+                    attempt=attempt_number,
+                    target="final",
+                    request=failure_request,
+                    lean_code=lean_code,
+                    success=False,
+                    error_output=lean_result.error_output,
+                    reasoning=reasoning,
+                )
+                failure = {
+                    "request": failure_request,
+                    "error_summary": error_summary,
+                    "lean_code": lean_code,
+                }
+                if lean_pass_feedback:
+                    failure["lean_feedback"] = self._summarize_error(lean_pass_feedback, limit=1200)
+                lean_diagnostics = {
+                    key: self._summarize_error(str(value), limit=1200)
+                    for key, value in {
+                        "diagnostic_output": getattr(lean_result, "diagnostic_output", ""),
+                        "goal_states": getattr(lean_result, "goal_states", ""),
+                        "raw_stderr": getattr(lean_result, "raw_stderr", ""),
+                    }.items()
+                    if str(value or "").strip()
+                }
+                failure.update(lean_diagnostics)
+                self._final_attempts.append(failure)
+                self._record_final_context_event(
+                    "failure",
+                    request=failure_request,
+                    error_summary=error_summary,
+                    lean_feedback=str(failure.get("lean_feedback") or ""),
+                    reasoning=reasoning,
+                )
+                await self._append_master_proof_edit(
+                    {
+                        **edit,
+                        "accepted": False,
+                        "error_summary": error_summary,
+                        "lean_code": lean_code,
+                        **lean_diagnostics,
+                        **({"lean_feedback": failure["lean_feedback"]} if "lean_feedback" in failure else {}),
+                    }
+                )
+                await self._persist_and_broadcast(
+                    "leanoj_master_proof_edit_rejected",
+                    {
+                        "attempt": attempt_number,
+                        "error_summary": error_summary,
+                        **lean_diagnostics,
+                        **({"lean_feedback": failure["lean_feedback"]} if "lean_feedback" in failure else {}),
+                        **final_solver_metadata,
+                    },
+                )
+                await self._persist_and_broadcast(
+                    "leanoj_final_attempt_failed",
+                    {"attempt": attempt.model_dump(mode="json"), **final_solver_metadata},
+                )
+                continue
+
+            if shortening_approval_justification or old_attempt_apparent_issue:
+                self._state.master_proof_last_shortening_approval_justification = self._summarize_error(
+                    shortening_approval_justification,
+                    limit=1200,
+                )
+                self._state.master_proof_last_shortening_apparent_issue = self._summarize_error(
+                    old_attempt_apparent_issue,
+                    limit=1200,
+                )
+                old_char_count = len(current_master_proof or "")
+                stored_old_char_count = self._state.master_proof_old_attempt_before_redo_char_count
+                if old_char_count > stored_old_char_count:
+                    await self._write_master_proof_old_attempt_before_redo(current_master_proof)
+                    self._state.master_proof_old_attempt_before_redo_version = self._state.master_proof_version
+                    self._state.master_proof_old_attempt_before_redo_hash = self._hash_master_proof(current_master_proof)
+                    self._state.master_proof_old_attempt_before_redo_line_count = (
+                        len(current_master_proof.splitlines()) if current_master_proof else 0
+                    )
+                    self._state.master_proof_old_attempt_before_redo_char_count = old_char_count
+                    self._state.master_proof_old_attempt_before_redo_summary = (
+                        f"Submitter chose to redo/shorten this v{self._state.master_proof_version} attempt "
+                        f"({old_char_count} chars, "
+                        f"{self._state.master_proof_old_attempt_before_redo_line_count} lines)."
+                    )
+                    self._state.master_proof_old_attempt_before_redo_validator_justification = (
+                        self._summarize_error(shortening_approval_justification, limit=1200)
+                    )
+                    self._state.master_proof_old_attempt_before_redo_apparent_issue = self._summarize_error(
+                        old_attempt_apparent_issue,
+                        limit=1200,
+                    )
+
+            edit_summary = reasoning or f"Applied {edit.get('operation')} edit to Proof Solver master proof."
+            if shortening_approval_justification or old_attempt_apparent_issue:
+                edit_summary = " ".join(
+                    part
+                    for part in (
+                        edit_summary,
+                        (
+                            f"Validator allowed shortening because: {shortening_approval_justification}"
+                            if shortening_approval_justification
+                            else ""
+                        ),
+                        (
+                            f"Apparent issue with old longer attempt: {old_attempt_apparent_issue}"
+                            if old_attempt_apparent_issue
+                            else ""
+                        ),
+                    )
+                    if part
+                )
+            shortening_audit = {}
+            if shortening_approval_justification:
+                shortening_audit["shortening_approval_justification"] = self._summarize_error(
+                    shortening_approval_justification,
+                    limit=1200,
+                )
+            if old_attempt_apparent_issue:
+                shortening_audit["old_attempt_apparent_issue"] = self._summarize_error(
+                    old_attempt_apparent_issue,
+                    limit=1200,
+                )
+            await self._write_master_proof(updated_master_proof, summary=edit_summary)
+            await self._append_master_proof_edit(
+                {
+                    **edit,
+                    "accepted": True,
+                    "master_proof_hash": self._state.master_proof_hash,
+                    "master_proof_line_count": self._state.master_proof_line_count,
+                    "master_proof_char_count": self._state.master_proof_char_count,
+                    **shortening_audit,
+                }
+            )
+            await self._persist_and_broadcast(
+                "leanoj_master_proof_edit_applied",
+                {
+                    "master_proof_version": self._state.master_proof_version,
+                    "needs_more_time": needs_more_time,
+                    "reasoning": self._summarize_error(edit_summary, limit=500),
+                },
+            )
+            self._record_final_context_event(
+                "acceptance",
+                request="final Proof Solver master proof edit accepted",
+                reasoning=edit_summary,
+            )
+
+            if needs_more_time:
+                watchdog_reason = self._record_master_proof_progress(edit, current_master_proof, updated_master_proof)
+                if watchdog_reason:
+                    self._state.master_proof_last_stuck_reason = self._summarize_error(watchdog_reason, limit=500)
+                    self._failed_feedback.append(
+                        {
+                            "request": "final Proof Solver master proof progress watchdog",
+                            "error_summary": self._summarize_error(watchdog_reason, limit=1200),
+                        }
+                    )
+                    await self._append_master_proof_edit(
+                        {
+                            "action": "progress_watchdog",
+                            "reasoning": watchdog_reason,
+                            "master_proof_hash": self._state.master_proof_hash,
+                            "master_proof_line_count": self._state.master_proof_line_count,
+                            "master_proof_char_count": self._state.master_proof_char_count,
+                        }
+                    )
+                    self._reset_master_proof_progress_watchdog()
+                    attempt_number = self._state.final_attempt_count + 1
+                    self._state.final_attempt_count = attempt_number
+                    failed_attempts_this_cycle += 1
+                    self._final_attempts.append(
+                        {
+                            "request": "final Proof Solver master proof progress watchdog",
+                            "error_summary": self._summarize_error(watchdog_reason, limit=1200),
+                            "lean_code": updated_master_proof,
+                        }
+                    )
+                    self._record_final_context_event(
+                        "failure",
+                        request="final Proof Solver master proof progress watchdog",
+                        error_summary=watchdog_reason,
+                        reasoning=reasoning,
+                    )
+                    await self._persist_and_broadcast(
+                        "leanoj_final_attempt_failed",
+                        {
+                            "attempt": LeanOJAttemptRecord(
+                                attempt=attempt_number,
+                                target="final",
+                                request="final Proof Solver master proof progress watchdog",
+                                lean_code=updated_master_proof,
+                                success=False,
+                                error_output=watchdog_reason,
+                                reasoning=reasoning,
+                            ).model_dump(mode="json"),
+                            **final_solver_metadata,
+                        },
+                    )
+                    await self._persist_and_broadcast(
+                        "leanoj_master_proof_progress_watchdog",
+                        {
+                            "reasoning": watchdog_reason,
+                            "continuing_final_cycle": (
+                                failed_attempts_this_cycle < max_failed_attempts
+                                and self._state.user_forced_final_cycle
+                            ),
+                        },
+                    )
+                    if failed_attempts_this_cycle < max_failed_attempts and self._state.user_forced_final_cycle:
+                        logger.info(
+                            "LeanOJ final cycle continuing after progress watchdog",
+                        )
+                        self._state.phase = "final_proof_loop"
+                        self._state.current_path_decision = "solve_final_now"
+                        continue
+                    break
+                continue
+            self._reset_master_proof_progress_watchdog()
+
+            self._state.final_attempt_count = attempt_number
+            attempt = LeanOJAttemptRecord(
+                attempt=attempt_number,
+                target="final",
+                request="final Proof Solver solution from master proof",
+                lean_code=lean_code,
+                success=lean_result.success,
+                error_output=lean_result.error_output,
+                reasoning=reasoning,
+            )
+
+            try:
+                proof_record = await self._register_verified_leanoj_proof(
+                    request,
+                    proof_kind="final",
+                    theorem_statement=request.user_prompt,
+                    theorem_name="Final Proof Solver Submission",
+                    lean_code=lean_code,
+                    attempt_count=attempt_number,
+                    formal_sketch="Final Proof Solver solution for the user's template.",
+                    theorem_id=f"{self._state.session_id}_final",
+                    source_title=self._state.selected_topic or request.user_prompt,
+                )
+            except Exception as exc:
+                if self._is_non_retryable_model_error(exc):
+                    raise LeanOJConfigurationError(str(exc)) from exc
+                lean_result.success = False
+                lean_result.error_output = f"PROOF SOLVER PROOF REGISTRATION FAILED: {exc}"
+                attempt.success = False
+                attempt.error_output = lean_result.error_output
+
+            if lean_result.success:
+                self._state.phase = "verified"
+                self._state.user_forced_final_cycle = False
+                self._state.final_solution = lean_code
+                self._state.final_proof_id = proof_record.proof_id if proof_record else ""
+                self._state.final_novel = proof_record.novel if proof_record else False
+                self._state.final_novelty_tier = proof_record.novelty_tier if proof_record else "not_novel"
+                self._state.final_novelty_reasoning = proof_record.novelty_reasoning if proof_record else ""
+                self._current_final_cycle_packet = None
+                self._current_working_proof_attempt = None
+                await self._persist_and_broadcast(
+                    "leanoj_final_verified",
+                    {"attempt": attempt.model_dump(mode="json"), **final_solver_metadata},
+                )
+                return
+
+            failure = {
+                "request": "final Proof Solver solution from master proof",
+                "error_summary": self._summarize_error(lean_result.error_output, limit=1200),
+                "lean_code": lean_code,
+            }
+            if lean_pass_feedback:
+                failure["lean_feedback"] = self._summarize_error(lean_pass_feedback, limit=1200)
+            self._final_attempts.append(failure)
+            self._record_final_context_event(
+                "failure",
+                request=str(failure.get("request") or "final Proof Solver solution from master proof"),
+                error_summary=str(failure.get("error_summary") or ""),
+                lean_feedback=str(failure.get("lean_feedback") or ""),
+                reasoning=reasoning,
+            )
+            failed_attempts_this_cycle += 1
+            await self._persist_and_broadcast(
+                "leanoj_final_attempt_failed",
+                {"attempt": attempt.model_dump(mode="json"), **final_solver_metadata},
+            )
+
+        if self._should_stop() or self._state.phase == "verified":
+            return
+
+        cycle_end_attempt = self._state.final_attempt_count
+        last_error = ""
+        if self._final_attempts:
+            last_error = str(self._final_attempts[-1].get("error_summary") or "")
+        cycle_summary = (
+            "The final master proof loop did not verify yet. "
+            f"Latest blocker: {last_error or 'No final attempt error was recorded.'} "
+            "Use the concrete Lean/edit feedback to choose the next proof action."
+        )
+        cycle_attempts = list(self._final_attempts[-failed_attempts_this_cycle:])
+        cycle_partials = [
+            proof
+            for proof in self._partial_proofs
+            if str(proof.get("target") or "") == "final"
+            and cycle_start_attempt <= int(proof.get("attempt") or 0) <= cycle_end_attempt
+        ]
+        cycle_packet = {
+            "session_id": self._state.session_id,
+            "cycle_start_attempt": cycle_start_attempt,
+            "cycle_end_attempt": cycle_end_attempt,
+            "failed_attempt_count": failed_attempts_this_cycle,
+            "attempts": cycle_attempts,
+            "partial_proofs": cycle_partials,
+            "created_at": datetime.now().isoformat(),
+            "summary": self._summarize_error(cycle_summary, limit=1200),
+        }
+        self._final_cycle_packets.append(cycle_packet)
+        self._current_final_cycle_packet = cycle_packet
+        self._failed_feedback.append(
+            {
+                "request": "final Proof Solver proof cycle",
+                "error_summary": self._summarize_error(cycle_summary, limit=1200),
+            }
+        )
+        handoff_to_recursive = self._final_cycle_should_handoff_to_recursive(cycle_attempts)
+        self._state.user_forced_final_cycle = False
+        self._state.phase = "recursive_brainstorm" if handoff_to_recursive else "path_decision"
+        self._state.current_path_decision = "need_more_brainstorming"
+        await self._set_current_working_proof_attempt(
+            trigger="final_attempt_cycle_exhausted",
+            requested_path="need_more_brainstorming",
+            stuck_reason=cycle_summary,
+        )
+        await self._persist_and_broadcast(
+            "leanoj_final_attempt_cycle_exhausted",
+            {
+                "attempts_in_cycle": failed_attempts_this_cycle,
+                "cycle_start_attempt": cycle_start_attempt,
+                "cycle_end_attempt": cycle_end_attempt,
+                "message": self._summarize_error(cycle_summary, limit=500),
+            },
+        )
+
+    @staticmethod
+    def _normalize_lean_for_template_check(code: str) -> str:  # whitespace-insensitive form used by the template comparisons
+        return " ".join((code or "").split())  # falsy input -> ""; every whitespace run becomes one space, ends trimmed
+
+    @classmethod
+    def _validate_final_solution_integrity(cls, lean_template: str, lean_code: str) -> str:
+        device_error = cls._validate_no_new_declaration_devices(lean_template, lean_code, target="solution")
+        if device_error:
+            return device_error
+        template_error = cls._validate_final_solution_matches_template(lean_template, lean_code)
+        if template_error:
+            return template_error
+        return ""
+
+    @classmethod
+    def _validate_final_answer_adequacy(cls, lean_template: str, lean_code: str) -> str:
+        """Return a rejection message when a filled-in `def answer` appears to restate the extremal target, else ""."""
+        if cls._placeholder_tokens(lean_code):  # presumably unfinished code (placeholders remain); skipped here - confirm helper
+            return ""
+        template_answer = cls._find_declaration_block(lean_template, "def answer")
+        if not template_answer or not cls._declaration_has_placeholder(template_answer):  # only a template `def answer` hole is checked
+            return ""
+        candidate_answer = cls._find_declaration_block(lean_code, "def answer")
+        if not candidate_answer:  # candidate has no `def answer` block to inspect
+            return ""
+
+        body = cls._normalize_lean_for_semantic_scan(cls._lean_declaration_body(candidate_answer))  # lowercased, whitespace-collapsed text after `:=`
+        if not body:
+            return ""
+
+        extremal_markers = (  # lowercase substrings, because `body` was lowercased above
+            "ssup",
+            "csup",
+            "nat.ssup",
+            "sup ",
+            "isgreatest",
+            "bddabove",
+            "upperbounds",
+        )
+        self_reference_markers = (  # substrings taken as a sign the body refers back to the problem's own set
+            "s n",
+            "set ",
+            "finset",
+            "card",
+            "exists",
+            "u in",
+            "v in",
+            "divides",
+            " ∣ ",  # any body containing this also contains the bare entry below
+            "∣",
+        )
+        if any(marker in body for marker in extremal_markers) and any(  # plain substring tests; both groups must hit
+            marker in body for marker in self_reference_markers
+        ):
+            return (
+                "PROOF SOLVER ANSWER ADEQUACY REJECTED: Lean accepted the final code, but `answer` is defined "
+                "using an extremal/supremum construction over the same feasible-cardinality problem instead "
+                "of determining the requested largest size in terms of n. This may remain in the durable "
+                "master proof as intermediate context, but it is not final-ready. Continue the Proof Solver loop, "
+                "derive an explicit formula for `answer n`, and then prove `IsGreatest (S n)` for that formula."
+            )
+        return ""  # no marker combination matched: nothing to reject
+
+    @classmethod
+    def _validate_no_new_declaration_devices(cls, lean_template: str, lean_code: str, *, target: str) -> str:
+        integrity = validate_lean_proof_integrity(
+            lean_code=lean_code,
+            allowed_baseline=lean_template,
+        )
+        if integrity.valid:
+            return ""
+        return (
+            "PROOF SOLVER FORBIDDEN PROOF DEVICE: Lean accepted the submitted code, but the "
+            f"{target} introduced new axiom/constant/opaque declarations not present in the original template: "
+            f"{', '.join(integrity.introduced_devices[:8])}. Do not solve Proof Solver problems by adding fake assumptions; "
+            "preserve the template and fill the proof using constructive Lean/Mathlib proof terms or tactics."
+        )
+
+    @classmethod
+    def _validate_final_solution_matches_template(cls, lean_template: str, lean_code: str) -> str:
+        """Return an error message when a compiling final answer does not solve the template, else ""."""
+        template = lean_template or ""
+        candidate = lean_code or ""
+        hole_aware_error = cls._validate_final_solution_matches_template_declarations(template, candidate)  # declaration-level check first
+        if hole_aware_error is not None:  # "" (pass) or a message (fail) is final; None means it could not decide
+            return hole_aware_error
+
+        template_parts = [  # fallback: normalized template text found between placeholder matches
+            cls._normalize_lean_for_template_check(part)
+            for part in _LEAN_PLACEHOLDER_RE.split(template)
+            if part not in {"sorry", "admit"}  # presumably drops placeholder words split() yields for a capture group - confirm
+        ]
+        significant_parts = [part for part in template_parts if len(part) >= 12]  # shorter fragments are ignored
+        normalized_candidate = cls._normalize_lean_for_template_check(candidate)
+
+        if not significant_parts:  # no usable fragment: require the whole normalized template as a substring
+            normalized_template = cls._normalize_lean_for_template_check(template)
+            if normalized_template and normalized_template not in normalized_candidate:
+                return (
+                    "PROOF SOLVER TEMPLATE MISMATCH: Lean accepted the submitted code, but the code does not preserve "
+                    "the user's original Proof Solver template/declaration. Return the complete original template with "
+                    "only the proof holes filled unless a template change is explicitly required."
+                )
+            return ""
+
+        search_from = 0  # fragments must occur in template order and must not overlap
+        for part in significant_parts:
+            found_at = normalized_candidate.find(part, search_from)
+            if found_at < 0:  # fragment missing at or after the end of the previous fragment
+                return (
+                    "PROOF SOLVER TEMPLATE MISMATCH: Lean accepted the submitted code, but the code does not contain "
+                    "the original Proof Solver template structure around the proof hole. Do not replace the task with "
+                    "an unrelated theorem; preserve the user's declarations and fill the required proof."
+                )
+            search_from = found_at + len(part)  # resume the search just past this fragment
+        return ""
+
+    @classmethod
+    def _validate_final_solution_matches_template_declarations(cls, lean_template: str, lean_code: str) -> Optional[str]:
+        """Validate LeanOJ submissions by preserving declarations while allowing hole bodies to change; None means undecided."""
+        template_decls = cls._lean_declaration_blocks(lean_template)
+        candidate_decls = cls._lean_declaration_blocks(lean_code)
+        if not template_decls or not candidate_decls:  # nothing parsed on one side: this check cannot decide
+            return None
+
+        candidate_by_key: dict[str, str] = {}  # "<kind> <name>" -> declaration text
+        for declaration in candidate_decls:
+            key = cls._lean_declaration_key(declaration)
+            if key and key not in candidate_by_key:  # the first declaration with a given key wins
+                candidate_by_key[key] = declaration
+
+        candidate_imports = set(cls._lean_imports(lean_code))
+        for import_line in cls._lean_imports(lean_template):  # each stripped template import line must reappear exactly
+            if import_line not in candidate_imports:
+                return (
+                    "PROOF SOLVER TEMPLATE MISMATCH: Lean accepted the submitted code, but the code removed an "
+                    f"original Proof Solver import required by the template: {import_line}. Preserve original imports; "
+                    "additional imports are allowed when Lean needs them."
+                )
+
+        for template_decl in template_decls:
+            key = cls._lean_declaration_key(template_decl)
+            if not key:  # template blocks without a recognizable key are not enforced
+                continue
+            candidate_decl = candidate_by_key.get(key)
+            if not candidate_decl:  # the candidate has no declaration with this key
+                return (
+                    "PROOF SOLVER TEMPLATE MISMATCH: Lean accepted the submitted code, but it does not preserve "
+                    f"the original Proof Solver declaration `{key}`. Do not replace the task with unrelated declarations."
+                )
+
+            if cls._declaration_has_placeholder(template_decl):  # hole declaration: only the header before `:=` must match
+                template_header = cls._normalize_lean_declaration_header(template_decl)
+                candidate_header = cls._normalize_lean_declaration_header(candidate_decl)
+                if template_header != candidate_header:
+                    return (
+                        "PROOF SOLVER TEMPLATE MISMATCH: Lean accepted the submitted code, but it changed the "
+                        f"signature/target of original declaration `{key}`. Fill only the `sorry`/`admit` body."
+                    )
+                continue  # the body of a hole declaration is free to change
+
+            normalized_template_decl = cls._normalize_lean_for_template_check(template_decl)  # fixed declaration: compare the whole block
+            normalized_candidate_decl = cls._normalize_lean_for_template_check(candidate_decl)
+            if normalized_template_decl != normalized_candidate_decl:  # equality is modulo whitespace only
+                return (
+                    "PROOF SOLVER TEMPLATE MISMATCH: Lean accepted the submitted code, but it changed a fixed "
+                    f"non-hole declaration `{key}` from the original template. Preserve fixed definitions exactly."
+                )
+
+        return ""  # every import and keyed template declaration was preserved
+
+    @staticmethod
+    def _lean_imports(code: str) -> list[str]:
+        return [
+            line.strip()
+            for line in (code or "").splitlines()
+            if line.strip().startswith("import ")
+        ]
+
+    @staticmethod
+    def _lean_declaration_blocks(code: str) -> list[str]:
+        matches = list(_LEAN_TOP_LEVEL_DECL_RE.finditer(code or ""))
+        blocks: list[str] = []
+        for index, match in enumerate(matches):
+            end = matches[index + 1].start() if index + 1 < len(matches) else len(code or "")
+            block = (code or "")[match.start() : end].strip()
+            if block:
+                blocks.append(block)
+        return blocks
+
+    @staticmethod
+    def _lean_declaration_key(declaration: str) -> str:
+        match = _LEAN_DECL_KEY_RE.search(declaration or "")
+        if not match:
+            return ""
+        kind = match.group("kind") or ""
+        name = match.group("name") or ""
+        return f"{kind} {name}".strip()
+
+    @classmethod
+    def _find_declaration_block(cls, code: str, declaration_key: str) -> str:
+        for declaration in cls._lean_declaration_blocks(code):
+            if cls._lean_declaration_key(declaration) == declaration_key:
+                return declaration
+        return ""
+
+    @staticmethod
+    def _lean_declaration_body(declaration: str) -> str:
+        if ":=" not in (declaration or ""):
+            return ""
+        return (declaration or "").split(":=", 1)[1].strip()
+
+    @classmethod
+    def _normalize_lean_for_semantic_scan(cls, code: str) -> str:  # scan form: helper-stripped, whitespace-collapsed, lowercased
+        return cls._normalize_lean_for_template_check(strip_lean_comments_and_strings(code or "")).lower()  # falsy code reaches the helper as ""
+
+    @staticmethod
+    def _declaration_has_placeholder(declaration: str) -> bool:  # True when the placeholder regex matches the helper-stripped text
+        return bool(_LEAN_PLACEHOLDER_RE.search(strip_lean_comments_and_strings(declaration or "")))  # presumably ignores placeholders inside comments/strings - confirm helper
+
+    @classmethod
+    def _normalize_lean_declaration_header(cls, declaration: str) -> str:
+        header = (declaration or "").split(":=", 1)[0]
+        normalized = cls._normalize_lean_for_template_check(header)
+        while True:
+            previous = normalized
+            normalized = re.sub(r"^open\s+Classical\s+in\s+", "", normalized)
+            normalized = re.sub(r"^(?:@\[[^\]]+\]\s*)+", "", normalized)
+            normalized = re.sub(r"^(?:(?:private|protected|noncomputable|unsafe)\s+)+", "", normalized)
+            normalized = normalized.strip()
+            if normalized == previous:
+                break
+        return normalized.strip()
+
+    @staticmethod
+    def _json_retry_schema_hint(role_id: str) -> str:
+        if role_id.startswith("leanoj_brainstorm_submitter_"):
+            return (
+                "ROLE-SPECIFIC COMPACT RETRY CONTRACT:\n"
+                "- For this retry, use the normal idea schema only; do not choose `lean_proof`.\n"
+                "- Return exactly: "
+                "{\"submission_type\":\"idea\",\"submission\":\"...\",\"reasoning\":\"...\"}\n"
+                "- Keep `submission` under 600 characters and `reasoning` under 200 characters.\n"
+                "- Do not quote the Lean template, prior proof, accepted ideas, or failure log."
+            )
+        if role_id == "leanoj_brainstorm_validator":
+            return (
+                "ROLE-SPECIFIC COMPACT RETRY CONTRACT:\n"
+                "- If the original prompt requested batch validation, return exactly one compact "
+                "`decisions` entry per submission in the original order.\n"
+                "- If the original prompt requested single validation, return one compact "
+                "`decision` object.\n"
+                "- Keep every `reasoning` and `summary` string under 160 characters.\n"
+                "- Do not quote submissions, Lean code, accepted ideas, or proof context."
+            )
+        if role_id == "leanoj_topic_validator":
+            return (
+                "ROLE-SPECIFIC COMPACT RETRY CONTRACT:\n"
+                "- Keep every topic, reasoning, and summary field under 200 characters.\n"
+                "- Do not quote the Lean template or prior topics."
+            )
+        return (
+            "ROLE-SPECIFIC COMPACT RETRY CONTRACT:\n"
+            "- Keep every string field short; do not quote large context blocks or code."
+        )
+
+    @classmethod
+    def _summarize_model_call_result(
+        cls,
+        role_id: str,
+        task_id: str,
+        parsed: dict[str, Any],
+        *,
+        limit: int = 700,
+    ) -> str:
+        """Return a compact outcome summary for live logs and INFO output.
+
+        The first matching shape of ``parsed`` wins, checked in this order:
+        a ``decisions`` list (batch validation), an ``enough`` key, ``path``,
+        ``decision``, ``action``/``operation``, ``topic``, ``submission``,
+        ``theorem_statement``, a ``solved`` key, then any generic text field,
+        and finally just the names of the JSON fields that were returned.
+
+        Args:
+            role_id: Role that produced the result; used in the last-resort message.
+            task_id: Task id, used in the last-resort message when ``role_id`` is falsy.
+            parsed: Parsed model response. A non-dict value is stringified and
+                summarized as-is.
+            limit: Limit forwarded to ``_summarize_error`` for the final text.
+
+        Returns:
+            A one-line, human-readable summary string.
+        """
+        if not isinstance(parsed, dict):
+            return cls._summarize_error(str(parsed), limit=limit)
+
+        def clean(value: Any, text_limit: int = 320) -> str:
+            # Stringify (falsy values become "") and compact through the shared summarizer.
+            return cls._summarize_error(str(value or ""), limit=text_limit)
+
+        def first_text(*keys: str, text_limit: int = 320) -> str:
+            # First truthy value among ``keys`` in ``parsed``, cleaned; "" if none.
+            for key in keys:
+                value = parsed.get(key)
+                if value:
+                    return clean(value, text_limit)
+            return ""
+
+        # Batch validation: count verdicts and quote at most two sample reasons.
+        decisions = parsed.get("decisions")
+        if isinstance(decisions, list):
+            accepted = 0
+            rejected = 0
+            samples: list[str] = []
+            for index, decision in enumerate(decisions, start=1):
+                if not isinstance(decision, dict):
+                    continue
+                verdict = clean(decision.get("decision") or decision.get("verdict"), 40).lower()
+                # Only exact "accept"/"reject" verdicts are counted; anything else is ignored.
+                if verdict == "accept":
+                    accepted += 1
+                elif verdict == "reject":
+                    rejected += 1
+                reason = clean(
+                    decision.get("summary") or decision.get("reasoning") or decision.get("feedback"),
+                    160,
+                )
+                if reason and len(samples) < 2:
+                    samples.append(f"{index}: {verdict or 'decision'} - {reason}")
+            prefix = f"batch result: {accepted} accepted, {rejected} rejected"
+            return cls._summarize_error(
+                f"{prefix}; {'; '.join(samples)}" if samples else prefix,
+                limit=limit,
+            )
+
+        # Sufficiency check: keyed on presence of "enough", so a false value still matches.
+        if "enough" in parsed:
+            status = "ready for path decision" if bool(parsed.get("enough")) else "continue brainstorming"
+            reason = first_text("reasoning", "summary", "feedback", text_limit=260)
+            return cls._summarize_error(
+                f"sufficiency result: {status}{f' - {reason}' if reason else ''}",
+                limit=limit,
+            )
+
+        # Path decision.
+        if parsed.get("path"):
+            reason = first_text("reasoning", "summary", text_limit=300)
+            return cls._summarize_error(
+                f"path result: {clean(parsed.get('path'), 80)}{f' - {reason}' if reason else ''}",
+                limit=limit,
+            )
+
+        # Single validation decision.
+        if parsed.get("decision"):
+            reason = first_text("summary", "reasoning", "feedback_to_submitter", text_limit=300)
+            return cls._summarize_error(
+                f"decision: {clean(parsed.get('decision'), 80)}{f' - {reason}' if reason else ''}",
+                limit=limit,
+            )
+
+        # Action/operation result; a missing action is labelled with the literal "action".
+        if parsed.get("action") or parsed.get("operation"):
+            action = clean(parsed.get("action") or "action", 80)
+            operation = clean(parsed.get("operation"), 80)
+            reason = first_text("reasoning", "summary", "stuck_reason", text_limit=300)
+            label = f"{action}{f'/{operation}' if operation else ''}"
+            return cls._summarize_error(
+                f"action result: {label}{f' - {reason}' if reason else ''}",
+                limit=limit,
+            )
+
+        # Topic proposal.
+        if parsed.get("topic"):
+            reason = first_text("reasoning", "summary", text_limit=220)
+            return cls._summarize_error(
+                f"topic: {clean(parsed.get('topic'), 360)}{f' - {reason}' if reason else ''}",
+                limit=limit,
+            )
+
+        # Submission; the label defaults to "idea" when no submission_type is given.
+        if parsed.get("submission"):
+            submission_type = clean(parsed.get("submission_type") or "idea", 60)
+            reason = first_text("reasoning", "formal_sketch", text_limit=220)
+            return cls._summarize_error(
+                f"{submission_type}: {clean(parsed.get('submission'), 420)}{f' - {reason}' if reason else ''}",
+                limit=limit,
+            )
+
+        # Lean proof payload: prefer the theorem name over the full statement.
+        if parsed.get("theorem_statement"):
+            theorem = clean(parsed.get("theorem_name") or parsed.get("theorem_statement"), 360)
+            sketch = first_text("formal_sketch", "reasoning", text_limit=220)
+            return cls._summarize_error(
+                f"lean proof: {theorem}{f' - {sketch}' if sketch else ''}",
+                limit=limit,
+            )
+
+        # Solver review: keyed on presence of "solved", so a false value still matches.
+        if "solved" in parsed:
+            reason = first_text("reasoning", "summary", "continuation_feedback", text_limit=320)
+            return cls._summarize_error(
+                f"solver review: {'solved' if bool(parsed.get('solved')) else 'not solved'}{f' - {reason}' if reason else ''}",
+                limit=limit,
+            )
+
+        # Generic fallback: first available free-text field.
+        # NOTE(review): unlike the branches above, the two fallbacks below are not
+        # passed through ``limit`` - confirm that is intended.
+        summary = first_text(
+            "summary",
+            "reasoning",
+            "feedback",
+            "message",
+            "answer",
+            text_limit=500,
+        )
+        if summary:
+            return summary
+
+        # Last resort: list up to eight field names, sorted alphabetically.
+        keys = ", ".join(sorted(str(key) for key in parsed.keys())[:8])
+        return f"{role_id or task_id} returned JSON fields: {keys or 'none'}"
+
+    async def _call_json(
+        self,
+        config: LeanOJRoleConfig,
+        task_prefix: str,
+        role_id: str,
+        prompt: str,
+        temperature: float = 0.0,
+    ) -> dict[str, Any]:
+        """Call the role's model and return its response parsed as a JSON object.
+
+        The call is repeated, with no attempt cap, until a JSON object is
+        obtained or ``_should_stop()`` becomes true. After each retryable
+        failure the prompt is rebuilt from the ORIGINAL ``prompt`` plus a
+        rejection notice and the role-specific retry contract, so retry
+        notices do not accumulate.
+
+        Args:
+            config: Model settings for the role (model id, provider, token limits).
+            task_prefix: Prefix used to mint a fresh task id for every attempt.
+            role_id: Role identifier passed to the API client and used in events/logs.
+            prompt: Full user prompt for the first attempt.
+            temperature: Sampling temperature forwarded to the completion call.
+
+        Returns:
+            The parsed JSON object. If the model returns a JSON list, its first
+            element is used (an empty list becomes ``{}``).
+
+        Raises:
+            LeanOJConfigurationError: No model is configured, the prompt exceeds
+                the available input budget, or the model error is classified as
+                non-retryable.
+            asyncio.CancelledError: A stop was requested.
+        """
+        if not config.model_id:
+            raise LeanOJConfigurationError(f"Proof Solver role {role_id} has no configured model")
+        current_prompt = prompt
+        attempt_index = 0
+        while not self._should_stop():
+            attempt_index += 1
+            if self._should_stop():
+                raise asyncio.CancelledError()
+            # Every attempt gets its own task id and is published as the active workflow task.
+            task_id = self._next_task_id(task_prefix)
+            self.current_task_id = task_id
+            self._refresh_workflow_tasks(task_prefix, role_id)
+            api_client_manager.set_autonomous_phase(self._state.phase or "leanoj")
+            started = time.monotonic()
+            # Base payload shared by the completed/failed events for this attempt.
+            call_payload = {
+                "role_id": role_id,
+                "task_id": task_id,
+                "phase": self._state.phase or "leanoj",
+                "attempt": attempt_index,
+                "provider": config.provider,
+                "model": config.model_id,
+                "context_window": config.context_window,
+                "max_output_tokens": config.max_output_tokens,
+                "temperature": temperature,
+            }
+            logger.debug(
+                "Proof Solver model call started (role=%s, task=%s, phase=%s, provider=%s, model=%s, attempt=%s)",
+                role_id,
+                task_id,
+                call_payload["phase"],
+                config.provider,
+                config.model_id,
+                attempt_index,
+            )
+            try:
+                # Refuse to send a prompt that cannot fit; this is raised as a
+                # configuration error, which is re-raised below without retrying.
+                prompt_tokens = count_tokens(current_prompt)
+                max_input_tokens = rag_config.get_available_input_tokens(
+                    config.context_window,
+                    config.max_output_tokens,
+                )
+                call_payload["prompt_tokens"] = prompt_tokens
+                call_payload["max_input_tokens"] = max_input_tokens
+                if prompt_tokens > max_input_tokens:
+                    raise LeanOJConfigurationError(
+                        "PROOF SOLVER PROMPT CONTEXT OVERFLOW: assembled prompt exceeds the configured "
+                        f"input budget for role {role_id}. Prompt tokens: {prompt_tokens}. "
+                        f"Available input tokens: {max_input_tokens}. Context window: {config.context_window}. "
+                        f"Max output tokens: {config.max_output_tokens}."
+                    )
+                response = await api_client_manager.generate_completion(
+                    task_id=task_id,
+                    role_id=role_id,
+                    model=config.model_id,
+                    messages=[{"role": "user", "content": current_prompt}],
+                    max_tokens=config.max_output_tokens,
+                    temperature=temperature,
+                )
+                # The task counts as completed once the API call returns, even if
+                # the response later fails to parse.
+                self.completed_task_ids.add(task_id)
+
+                choices = response.get("choices") or []
+                content = ""
+                if choices:
+                    message = choices[0].get("message") or {}
+                    # Fall back to the "reasoning" field when "content" is empty.
+                    content = message.get("content") or message.get("reasoning") or ""
+                parsed = parse_json(content)
+                if isinstance(parsed, list):
+                    parsed = parsed[0] if parsed else {}
+                if isinstance(parsed, dict):
+                    duration_ms = round((time.monotonic() - started) * 1000)
+                    result_summary = self._summarize_model_call_result(role_id, task_id, parsed)
+                    logger.info(
+                        "Proof Solver model call result (role=%s, task=%s, phase=%s, duration_ms=%s, response_chars=%s): %s",
+                        role_id,
+                        task_id,
+                        call_payload["phase"],
+                        duration_ms,
+                        len(content),
+                        result_summary,
+                    )
+                    await self._broadcast(
+                        "leanoj_model_call_completed",
+                        {
+                            **call_payload,
+                            "duration_ms": duration_ms,
+                            "response_chars": len(content),
+                            "result_summary": result_summary,
+                        },
+                    )
+                    return parsed
+                # Anything that is not a dict goes through the retry path below.
+                raise ValueError("Proof Solver role returned JSON that was not an object.")
+            except asyncio.CancelledError:
+                raise
+            except LeanOJConfigurationError:
+                raise
+            except Exception as exc:
+                duration_ms = round((time.monotonic() - started) * 1000)
+                if self._is_non_retryable_model_error(exc):
+                    logger.error(
+                        "Proof Solver model call failed with non-retryable error (role=%s, task=%s, phase=%s, duration_ms=%s): %s",
+                        role_id,
+                        task_id,
+                        call_payload["phase"],
+                        duration_ms,
+                        exc,
+                    )
+                    await self._broadcast(
+                        "leanoj_model_call_failed",
+                        {
+                            **call_payload,
+                            "duration_ms": duration_ms,
+                            "retryable": False,
+                            "message": self._summarize_error(str(exc), limit=700),
+                        },
+                    )
+                    # Surface non-retryable failures as configuration errors.
+                    raise LeanOJConfigurationError(str(exc)) from exc
+                logger.warning(
+                    "Proof Solver role %s task %s failed to produce valid JSON on retryable attempt %s: %s",
+                    role_id,
+                    task_id,
+                    attempt_index,
+                    exc,
+                )
+                error_summary = self._summarize_error(
+                    f"Proof Solver role {role_id} returned unusable JSON on retryable attempt {attempt_index}: "
+                    f"{type(exc).__name__}: {exc}",
+                    limit=1200,
+                )
+                await self._broadcast(
+                    "leanoj_model_call_failed",
+                    {
+                        **call_payload,
+                        "duration_ms": duration_ms,
+                        "retryable": True,
+                        "message": error_summary,
+                    },
+                )
+                # Record failure feedback only on the first attempt and every third one.
+                if attempt_index == 1 or attempt_index % 3 == 0:
+                    self._failed_feedback.append(
+                        {
+                            "request": f"{role_id} JSON generation",
+                            "error_summary": error_summary,
+                            "role_id": role_id,
+                            "attempt": attempt_index,
+                        }
+                    )
+                await self._persist_and_broadcast(
+                    "leanoj_role_json_retrying",
+                    {
+                        "role_id": role_id,
+                        "task_id": task_id,
+                        "attempt": attempt_index,
+                        "message": error_summary,
+                    },
+                )
+                # Rebuild from the original prompt so rejection notices do not pile up.
+                current_prompt = (
+                    f"{prompt}\n\n"
+                    "IMPORTANT - YOUR PREVIOUS RESPONSE WAS REJECTED BY THE JSON PARSER:\n"
+                    "REJECTION REASON: INVALID_OR_TRUNCATED_JSON\n"
+                    f"ISSUE: {type(exc).__name__}: {self._summarize_error(str(exc), limit=700)}\n"
+                    "FIX REQUIRED:\n"
+                    "- Return raw JSON only, with no markdown fences, commentary, or analysis.\n"
+                    "- Start with `{` and end with `}`.\n"
+                    "- Keep every string field concise enough to finish before max_tokens.\n"
+                    "- Preserve the requested schema exactly.\n"
+                    "- Escape Lean/LaTeX backslashes so the result is valid JSON.\n\n"
+                    f"{self._json_retry_schema_hint(role_id)}"
+                )
+                # Back off on every third failure: 0.5s per group of three, capped at 5s.
+                if attempt_index % 3 == 0:
+                    await asyncio.sleep(min(5.0, 0.5 * (attempt_index // 3)))
+            finally:
+                # Runs on success, retry, and error alike: clear the active task marker.
+                self.current_task_id = None
+                self._refresh_workflow_tasks(task_prefix, role_id)
+
+        # The loop only exits without returning when a stop was requested.
+        raise asyncio.CancelledError()
+
+    @staticmethod
+    def _missing_model_roles(request: LeanOJStartRequest) -> list[str]:
+        role_configs: list[tuple[str, LeanOJRoleConfig]] = [
+            ("topic_generator", request.topic_generator),
+            ("topic_validator", request.topic_validator),
+            ("brainstorm_validator", request.brainstorm_validator),
+            ("final_solver", request.final_solver),
+        ]
+        role_configs.extend(
+            (f"brainstorm_submitter_{index}", submitter)
+            for index, submitter in enumerate(request.brainstorm_submitters, start=1)
+        )
+        return [role_name for role_name, config in role_configs if not (config.model_id or "").strip()]
+
+    def _next_task_id(self, prefix: str) -> str:
+        current = self._task_sequences.get(prefix, 0)
+        self._task_sequences[prefix] = current + 1
+        return f"{prefix}_{current:03d}"
+
+    def _refresh_workflow_tasks(self, active_prefix: str = "leanoj_topic", active_role: str = "LeanOJ") -> None:
+        submitter_count = max(1, len(self._request.brainstorm_submitters) if self._request else 1)
+        brainstorm_submitter_patterns = [
+            (f"leanoj_brainstorm_sub{index}", f"Brainstorm Submitter {index}", "Cumulative Brainstorm")
+            for index in range(1, submitter_count + 1)
+        ]
+        pattern = [
+            ("leanoj_topic", "Topic Generator", "Topic Selection"),
+            ("leanoj_topic_val", "Topic Validator", "Topic Validation"),
+            *brainstorm_submitter_patterns,
+            ("leanoj_brainstorm_val", "Brainstorm Validator", "Brainstorm Validation"),
+            ("leanoj_brainstorm_prune", "Brainstorm Prune Reviewer", "Brainstorm Pruning"),
+            ("leanoj_brainstorm_prune_val", "Brainstorm Prune Validator", "Brainstorm Pruning"),
+            ("leanoj_path", "Final Proof Solver", "Path Decision"),
+            ("leanoj_path_val", "Path Validator", "Path Validation"),
+            ("leanoj_final", "Final Solver", "Final Lean Loop"),
+            ("leanoj_master_proof_edit_val", "Master Proof Edit Validator", "Final Lean Loop"),
+            ("leanoj_final_review", "Final Solver Review", "Final Lean Loop"),
+        ]
+        tasks: list[WorkflowTask] = []
+        start_seq = sum(self._task_sequences.values())
+        for offset in range(20):
+            prefix, role, mode = pattern[offset % len(pattern)]
+            seq = self._task_sequences.get(prefix, 0) + offset
+            task_id = f"{prefix}_{seq:03d}"
+            tasks.append(
+                WorkflowTask(
+                    task_id=task_id,
+                    sequence_number=start_seq + offset + 1,
+                    role=active_role if prefix == active_prefix else role,
+                    mode=mode,
+                    provider="lm_studio",
+                    active=prefix == active_prefix,
+                    completed=task_id in self.completed_task_ids,
+                )
+            )
+        self.workflow_tasks = tasks
+
+    def _configure_roles(self, request: LeanOJStartRequest) -> None:
+        self._configure_role("leanoj_topic_generator", request.topic_generator)
+        self._configure_role("leanoj_topic_selector", request.topic_generator)
+        self._configure_role("leanoj_topic_validator", request.topic_validator)
+        self._configure_role("leanoj_path_validator", request.topic_validator)
+        self._configure_role("leanoj_proof_novelty", request.topic_validator)
+        self._configure_role("leanoj_brainstorm_validator", request.brainstorm_validator)
+        self._configure_role("leanoj_master_proof_edit_validator", request.brainstorm_validator)
+        self._configure_role("leanoj_final_solver", request.final_solver)
+        for index, submitter in enumerate(request.brainstorm_submitters, start=1):
+            self._configure_role(f"leanoj_topic_submitter_{index}", submitter)
+            self._configure_role(f"leanoj_brainstorm_submitter_{index}", submitter)
+            self._configure_role(f"leanoj_brainstorm_prune_reviewer_{index}", submitter)
+
+    @staticmethod
+    def _configure_role(role_id: str, config: LeanOJRoleConfig) -> None:
+        api_client_manager.configure_role(
+            role_id,
+            ModelConfig(
+                provider=config.provider,
+                model_id=config.model_id,
+                openrouter_model_id=config.model_id if config.provider == "openrouter" else None,
+                openrouter_provider=config.openrouter_provider,
+                openrouter_reasoning_effort=config.openrouter_reasoning_effort,
+                lm_studio_fallback_id=config.lm_studio_fallback_id,
+                context_window=config.context_window,
+                max_output_tokens=config.max_output_tokens,
+                supercharge_enabled=config.supercharge_enabled,
+            ),
+        )
+
+    async def _persist_and_broadcast(self, event: str, data: Optional[dict[str, Any]] = None) -> None:
+        """Stamp the state, persist it, then broadcast ``event`` and a status update.
+
+        Args:
+            event: Name of the event to broadcast after persisting.
+            data: Payload for ``event``. When ``None`` or empty, the current
+                status from ``get_status()`` is sent instead.
+        """
+        self._state.updated_at = datetime.now()
+        self._remember_active_phase()
+        # Persist before broadcasting so the saved state is written first.
+        await self._persist_state()
+        await self._broadcast(event, data or self.get_status())
+        # Always follow up with a full status snapshot.
+        await self._broadcast("leanoj_status_updated", self.get_status())
+
+    async def _persist_state(self) -> None:
+        """Write the session artifacts and ``state.json`` for the current session.
+
+        ``state.json`` holds ``get_status()`` plus the original request (when
+        one is set), the per-prefix task counters, and the completed task ids.
+        """
+        session_dir = self._session_dir()
+        session_dir.mkdir(parents=True, exist_ok=True)
+        self._ensure_accepted_idea_records()
+        payload = self.get_status()
+        if self._request is not None:
+            payload["request"] = self._request.model_dump(mode="json")
+        payload["task_sequences"] = dict(self._task_sequences)
+        # Sets are not JSON-serializable; store the ids as a sorted list.
+        payload["completed_task_ids"] = sorted(self.completed_task_ids)
+        await leanoj_context_manager.write_session_artifacts(
+            session_id=self._state.session_id,
+            accepted_ideas=self._accepted_ideas,
+            accepted_idea_records=self._accepted_idea_records,
+            recursive_topics=self._recursive_topics,
+            verified_subproofs=self._verified_subproof_dicts(),
+            partial_proofs=self._partial_proofs,
+            failed_subproofs=self._failed_context_dicts(),
+            final_attempts=self._final_attempts,
+            final_cycle_packets=self._final_cycle_packets,
+        )
+        # NOTE(review): state.json is overwritten in place (no temp file + rename).
+        async with aiofiles.open(session_dir / "state.json", "w", encoding="utf-8") as f:
+            await f.write(json.dumps(payload, indent=2))
+
+    def _session_dir(self) -> Path:
+        session_id = self._state.session_id or "latest"
+        return self._sessions_base_dir() / session_id
+
+    @staticmethod
+    def _sessions_base_dir() -> Path:
+        return Path(system_config.data_dir) / "leanoj_sessions"
+
+    def _find_latest_state_file(self) -> Optional[Path]:
+        base = self._sessions_base_dir()
+        if not base.exists():
+            return None
+        state_files = [path for path in base.glob("*/state.json") if path.is_file()]
+        if not state_files:
+            return None
+        return max(state_files, key=lambda path: path.stat().st_mtime)
+
+    def _find_best_resumable_state_file(self) -> Optional[Path]:
+        """Prefer the most valuable interrupted session after process restart.
+
+        Delegates to ``_find_best_state_file`` without a request filter, so
+        saved sessions for any problem are considered.
+        """
+        return self._find_best_state_file()
+
+    def _find_best_matching_state_file(self, request: LeanOJStartRequest) -> Optional[Path]:
+        """Prefer the most-progressed saved session for this exact Proof Solver problem.
+
+        Delegates to ``_find_best_state_file`` with ``request`` as the filter.
+        """
+        return self._find_best_state_file(request)
+
+    def _find_best_state_file(self, request: Optional[LeanOJStartRequest] = None) -> Optional[Path]:
+        base = self._sessions_base_dir()
+        if not base.exists():
+            return None
+
+        candidates: list[tuple[tuple[int, int, int, int, int, int, int, float], Path]] = []
+        for path in base.glob("*/state.json"):
+            if not path.is_file():
+                continue
+            try:
+                payload = json.loads(path.read_text(encoding="utf-8"))
+            except Exception:
+                continue
+            if request is not None and not self._payload_matches_request(payload, request):
+                continue
+            if payload.get("final_solution"):
+                continue
+            phase = str(payload.get("phase") or "")
+            if phase in _TERMINAL_PHASES:
+                continue
+            candidates.append((self._payload_progress_score(payload, path), path))
+
+        if not candidates:
+            return None
+        return max(candidates, key=lambda item: item[0])[1]
+
+    @staticmethod
+    def _payload_matches_request(payload: dict[str, Any], request: LeanOJStartRequest) -> bool:
+        request_payload = payload.get("request")
+        if not isinstance(request_payload, dict):
+            return False
+        return (
+            str(request_payload.get("user_prompt") or "").strip() == request.user_prompt.strip()
+            and str(request_payload.get("lean_template") or "").strip() == request.lean_template.strip()
+        )
+
+    @staticmethod
+    def _payload_progress_score(payload: dict[str, Any], path: Path) -> tuple[int, int, int, int, int, int, int, float]:
+        verified_subproofs = payload.get("verified_subproofs") or []
+        validated_topics = payload.get("validated_topics") or []
+        failed_subproofs = payload.get("failed_subproofs") or []
+        accepted_count = int(payload.get("accepted_brainstorm_count") or 0)
+        topic_count = len(validated_topics) if isinstance(validated_topics, list) else 0
+        final_attempt_count = int(payload.get("final_attempt_count") or 0)
+        master_proof_version = int(payload.get("master_proof_version") or 0)
+        return (
+            LeanOJCoordinator._payload_phase_rank(payload),
+            master_proof_version,
+            final_attempt_count,
+            len(verified_subproofs) if isinstance(verified_subproofs, list) else 0,
+            accepted_count,
+            topic_count,
+            len(failed_subproofs) if isinstance(failed_subproofs, list) else 0,
+            path.stat().st_mtime,
+        )
+
+    @staticmethod
+    def _payload_phase_rank(payload: dict[str, Any]) -> int:
+        phase = str(payload.get("phase") or "")
+        if phase in {"stopped", "error"}:
+            last_active_phase = str(payload.get("last_active_phase") or "")
+            inferred_rank = LeanOJCoordinator._infer_payload_phase_rank(payload)
+            last_active_rank = _PHASE_PROGRESS_RANK.get(last_active_phase, 0)
+            return max(inferred_rank, last_active_rank)
+        return _PHASE_PROGRESS_RANK.get(phase, 0)
+
+    @staticmethod
+    def _infer_payload_phase_rank(payload: dict[str, Any]) -> int:
+        if payload.get("master_proof_initialized") or int(payload.get("master_proof_version") or 0) > 0:
+            return _PHASE_PROGRESS_RANK["final_proof_loop"]
+        if int(payload.get("final_attempt_count") or 0) > 0 or payload.get("final_attempts"):
+            return _PHASE_PROGRESS_RANK["final_proof_loop"]
+        if payload.get("current_path_decision") == "solve_final_now":
+            return _PHASE_PROGRESS_RANK["final_proof_loop"]
+        if payload.get("verified_subproofs") or payload.get("failed_subproofs"):
+            return _PHASE_PROGRESS_RANK["path_decision"]
+        if int(payload.get("accepted_brainstorm_count") or 0) > 0 or payload.get("accepted_ideas"):
+            return _PHASE_PROGRESS_RANK["initial_brainstorm"]
+        if payload.get("selected_topic"):
+            return _PHASE_PROGRESS_RANK["initial_brainstorm"]
+        if payload.get("validated_topics"):
+            return _PHASE_PROGRESS_RANK["initial_topic_candidates"]
+        return _PHASE_PROGRESS_RANK["idle"]
+
+    def _restore_from_payload(self, payload: dict[str, Any]) -> None:
+        request_payload = payload.get("request")
+        restored_request = LeanOJStartRequest.model_validate(request_payload) if request_payload else None
+
+        self._state = LeanOJState.model_validate(payload)
+        self._state.is_running = False
+        master_proof_path = self._master_proof_path(self._state.session_id)
+        if master_proof_path.exists():
+            try:
+                self._set_master_proof_metadata(master_proof_path.read_text(encoding="utf-8"))
+            except Exception as exc:
+                logger.warning("Failed to restore Proof Solver master proof metadata from %s: %s", master_proof_path, exc)
+        artifacts = leanoj_context_manager.load_session_artifacts(self._state.session_id)
+        self._validated_topics = [str(item) for item in payload.get("validated_topics") or []]
+        restored_accepted_ideas = [
+            *[str(item) for item in payload.get("accepted_ideas") or []],
+            *[str(item) for item in artifacts.get(ARTIFACT_ACCEPTED_IDEAS, [])],
+        ]
+        self._accepted_idea_records = [
+            dict(item) for item in (payload.get("accepted_idea_records") or []) if isinstance(item, dict)
+        ]
+        artifact_idea_records = [
+            dict(item)
+            for item in artifacts.get("accepted_idea_records", [])
+            if isinstance(item, dict)
+        ]
+        if artifact_idea_records:
+            record_keys = {
+                self._dict_record_key(record)
+                for record in self._accepted_idea_records
+            }
+            for record in artifact_idea_records:
+                content = str(record.get("content") or "")
+                record_key = self._dict_record_key(record)
+                if content.strip() and record_key not in record_keys:
+                    self._accepted_idea_records.append(record)
+                    record_keys.add(record_key)
+        if self._accepted_idea_records:
+            self._accepted_ideas = [
+                str(record.get("content") or "")
+                for record in self._accepted_idea_records
+                if str(record.get("content") or "").strip()
+            ]
+            recorded_contents = set(self._accepted_ideas)
+            self._accepted_ideas.extend(
+                idea
+                for idea in restored_accepted_ideas
+                if str(idea).strip() and idea not in recorded_contents
+            )
+        else:
+            self._accepted_ideas = self._dedupe_strings(restored_accepted_ideas)
+        self._ensure_accepted_idea_records()
+        if self._state.brainstorm_acceptance_events < len(self._accepted_ideas):
+            self._state.brainstorm_acceptance_events = max(
+                int(payload.get("brainstorm_acceptance_events") or 0),
+                len(self._accepted_ideas),
+            )
+        self._failed_feedback = [
+            dict(item) for item in (payload.get("failed_feedback") or []) if isinstance(item, dict)
+        ]
+        self._failed_feedback = self._dedupe_dict_records(
+            [
+                *self._failed_feedback,
+                *[
+                    dict(item)
+                    for item in artifacts.get(ARTIFACT_FAILED_SUBPROOFS, [])
+                    if isinstance(item, dict)
+                ],
+            ]
+        )
+        self._final_attempts = [
+            dict(item) for item in (payload.get("final_attempts") or []) if isinstance(item, dict)
+        ]
+        self._final_attempts = self._dedupe_dict_records(
+            [
+                *[
+                    dict(item)
+                    for item in artifacts.get(ARTIFACT_FINAL_ATTEMPTS, [])
+                    if isinstance(item, dict)
+                ],
+                *self._final_attempts,
+            ]
+        )
+        self._final_context_events = [
+            dict(item)
+            for item in payload.get("final_context_events") or []
+            if isinstance(item, dict)
+        ][-50:]
+        partial_proofs = [
+            dict(item) for item in (payload.get("partial_proofs") or []) if isinstance(item, dict)
+        ]
+        persisted_partial_proofs = self._load_partial_proof_database(self._state.session_id)
+        self._partial_proofs = self._dedupe_partial_proofs(
+            [
+                *partial_proofs,
+                *persisted_partial_proofs,
+                *[
+                    dict(item)
+                    for item in artifacts.get(ARTIFACT_PARTIAL_PROOFS, [])
+                    if isinstance(item, dict)
+                ],
+            ]
+        )
+        verified_records = self._dedupe_dict_records(
+            [
+                *[item.model_dump(mode="json") for item in self._state.verified_subproofs],
+                *[
+                    dict(item)
+                    for item in artifacts.get(ARTIFACT_VERIFIED_SUBPROOFS, [])
+                    if isinstance(item, dict)
+                ],
+            ]
+        )
+        self._state.verified_subproofs = [
+            LeanOJSubproofRecord.model_validate(item)
+            for item in verified_records
+        ]
+        self._final_cycle_packets = self._dedupe_dict_records(
+            [
+                *[
+                    dict(item)
+                    for item in artifacts.get(ARTIFACT_FINAL_CYCLE_PACKETS, [])
+                    if isinstance(item, dict)
+                ],
+                *[
+                    dict(item)
+                    for item in payload.get("final_cycle_packets") or []
+                    if isinstance(item, dict)
+                ],
+            ]
+        )
+        current_packet = payload.get("current_final_cycle_packet")
+        self._current_final_cycle_packet = dict(current_packet) if isinstance(current_packet, dict) else None
+        working_packet = payload.get("current_working_proof_attempt")
+        self._current_working_proof_attempt = dict(working_packet) if isinstance(working_packet, dict) else None
+        self._task_sequences = {
+            str(key): int(value)
+            for key, value in (payload.get("task_sequences") or {}).items()
+            if isinstance(value, int) or str(value).isdigit()
+        }
+        self.completed_task_ids = {str(item) for item in payload.get("completed_task_ids") or []}
+        self.workflow_tasks = []
+        self.current_task_id = None
+        self._stop_event = asyncio.Event()
+        self._request = restored_request
+        self._running = False
+        self._restored_from_disk = True
+        self._reset_master_proof_progress_watchdog()
+
+        if self._request is not None:
+            self._configure_roles(self._request)
+
+    def _should_stop(self) -> bool:
+        """Return ``True`` once the coordinator's stop event has been set."""
+        stop_requested = self._stop_event.is_set()
+        return stop_requested
+
+    def _begin_brainstorm_acceptance_phase(self, phase_key: str) -> None:
+        """Start tracking a brainstorm acceptance phase unless it is already active.
+
+        When ``phase_key`` differs from the active phase, the phase is switched,
+        the start count is snapshotted from the current acceptance-event total,
+        and both per-phase review counters are reset to zero. Calling again
+        with the already-active key leaves the state untouched.
+        """
+        state = self._state
+        if state.active_brainstorm_phase == phase_key:
+            return
+        state.active_brainstorm_phase = phase_key
+        state.active_brainstorm_start_count = state.brainstorm_acceptance_events
+        state.active_brainstorm_last_sufficiency_check_count = 0
+        state.active_brainstorm_last_prune_review_count = 0
+
+    def _get_brainstorm_acceptance_start(self, phase_key: str) -> int:
+        """Return the acceptance-event count recorded at the start of ``phase_key``.
+
+        Begins the phase first if it is not the active one, and lowers the stored
+        start count to the current event total whenever it exceeds that total.
+        """
+        state = self._state
+        if state.active_brainstorm_phase != phase_key:
+            self._begin_brainstorm_acceptance_phase(phase_key)
+        total_events = state.brainstorm_acceptance_events
+        if total_events < state.active_brainstorm_start_count:
+            # Never report a start point beyond the events actually recorded.
+            state.active_brainstorm_start_count = total_events
+        return state.active_brainstorm_start_count
+
+    def _finish_brainstorm_acceptance_phase_for_path_decision(self) -> None:
+        """Close the active brainstorm acceptance phase and move to ``path_decision``.
+
+        Clears the active phase key, re-bases the start count on the current
+        acceptance-event total, and zeroes both per-phase review counters.
+        """
+        state = self._state
+        state.phase = "path_decision"
+        state.active_brainstorm_phase = ""
+        state.active_brainstorm_start_count = state.brainstorm_acceptance_events
+        for counter_name in (
+            "active_brainstorm_last_sufficiency_check_count",
+            "active_brainstorm_last_prune_review_count",
+        ):
+            setattr(state, counter_name, 0)
+
+    @staticmethod
+    def _is_non_retryable_model_error(exc: Exception) -> bool:
+        """Delegate to the module-level ``is_non_retryable_model_error`` helper."""
+        verdict = is_non_retryable_model_error(exc)
+        return verdict
+
+    def _remember_active_phase(self) -> None:
+        """Store the current phase as ``last_active_phase`` when it is in ``_ACTIVE_PHASES``."""
+        current_phase = self._state.phase
+        if current_phase not in _ACTIVE_PHASES:
+            return
+        self._state.last_active_phase = current_phase
+
+    def _infer_resume_phase(self) -> str:
+        """Pick the phase to resume in, checking the most advanced evidence first.
+
+        Order of precedence:
+        1. Any sign of final-proof work (working attempt, initialized or versioned
+           master proof, recorded final attempts, or a ``solve_final_now``
+           path decision) resumes in ``final_proof_loop``.
+        2. A remembered ``last_active_phase`` that is still in ``_ACTIVE_PHASES``.
+        3. Verified or failed subproofs resume in ``path_decision``.
+        4. Accepted ideas, a positive accepted-brainstorm count, or a selected
+           topic resume in ``initial_brainstorm``.
+        5. Otherwise ``initial_topic_candidates``.
+        """
+        state = self._state
+        has_final_loop_evidence = (
+            self._current_working_proof_attempt
+            or state.master_proof_initialized
+            or state.master_proof_version > 0
+            or state.final_attempt_count > 0
+            or self._final_attempts
+            or state.current_path_decision == "solve_final_now"
+        )
+        if has_final_loop_evidence:
+            return "final_proof_loop"
+
+        remembered_phase = state.last_active_phase
+        if remembered_phase in _ACTIVE_PHASES:
+            return remembered_phase
+
+        if state.verified_subproofs or state.failed_subproofs:
+            return "path_decision"
+
+        has_brainstorm_progress = (
+            self._accepted_ideas
+            or state.accepted_brainstorm_count > 0
+            or state.selected_topic
+        )
+        if has_brainstorm_progress:
+            return "initial_brainstorm"
+
+        # NOTE(review): this branch returns the same phase as the fallthrough
+        # below, so the check currently has no effect on the result.
+        if self._validated_topics:
+            return "initial_topic_candidates"
+        return "initial_topic_candidates"
+
+    @staticmethod
+    def _summarize_error(error_text: str, limit: int = 800) -> str:
+        """Collapse all whitespace runs to single spaces and cap the text at ``limit``.
+
+        A falsy ``error_text`` is treated as empty. When the collapsed text is
+        longer than ``limit`` characters it is cut there and ``...`` is appended.
+        """
+        collapsed = " ".join((error_text or "").split())
+        if len(collapsed) > limit:
+            return collapsed[:limit] + "..."
+        return collapsed
+
+
+# Module-level coordinator instance, created once when this module is imported.
+leanoj_coordinator = LeanOJCoordinator()
diff --git a/backend/leanoj/prompts.py b/backend/leanoj/prompts.py
new file mode 100644
index 0000000..e4e9ad5
--- /dev/null
+++ b/backend/leanoj/prompts.py
@@ -0,0 +1,1009 @@
+"""Prompt builders for the LeanOJ proof-solver mode."""
+from __future__ import annotations
+
+import re
+from typing import Any, Iterable
+
+
+# Output-format instruction interpolated near the end of the prompt templates
+# in this module, immediately before each "JSON format" example.
+JSON_RULES = (
+    "Respond with ONLY valid JSON. Do not use markdown fences. "
+    "Escape Lean backslashes and newlines correctly for JSON strings."
+)
+
+# Shared guardrail text interpolated into the prompt templates in this module,
+# right after the LEANOJ TEMPLATE section. It is prompt content, so edits here
+# change what every one of those prompts tells the model.
+LEANOJ_FORMALIZATION_GUARDRAILS = """LEANOJ FORMALIZATION GUARDRAILS:
+- Treat the LeanOJ template as the source of truth for formal semantics. Do not silently reinterpret template operations to match informal olympiad intuition. For example, in a template over `Nat`, `a - b` is truncated natural subtraction, not signed integer subtraction.
+- Before committing to a closed-form `answer`, test proposed formulas and constructions against the exact Lean predicate on small cases when feasible. Counterexamples to the exact template override informal expectations.
+- Lean acceptance is necessary but not sufficient for final success. A Lean-verified file proves the formal statement it encodes; it does not automatically prove the user's informal problem statement if the template or chosen definitions exploit or mismatch the natural-language task.
+- If the template semantics and informal statement appear to conflict, make the mismatch explicit in reasoning and do not claim that a Lean-verified template proof settles the informal statement unless that correspondence has also been justified."""
+
+
+def _format_items(items: Iterable[Any], *, empty: str = "[none]") -> str:
+    """Render ``items`` as a 1-based numbered list, one entry per line.
+
+    Each item is converted with ``str`` and stripped; entries that end up
+    blank are dropped. ``empty`` is returned when nothing remains (including
+    when ``items`` itself is falsy).
+    """
+    cleaned = []
+    for raw in items or []:
+        text = str(raw).strip()
+        if text:
+            cleaned.append(text)
+    if cleaned:
+        return "\n".join(f"{number}. {text}" for number, text in enumerate(cleaned, start=1))
+    return empty
+
+
+def _format_brainstorm(ideas: list[str], limit: int = 80) -> str:
+    """Render the most recent accepted brainstorm ideas as a numbered list.
+
+    Only the last ``limit`` ideas are shown, renumbered from 1. When older
+    ideas were left out, a header line states how many of the total are shown.
+    """
+    if not ideas:
+        return "[No accepted brainstorm ideas yet.]"
+    recent = ideas[-limit:]
+    header = ""
+    if len(recent) != len(ideas):
+        header = f"[Showing most recent {len(recent)} of {len(ideas)} accepted ideas.]\n"
+    numbered = [f"{position}. {idea}" for position, idea in enumerate(recent, start=1)]
+    return header + "\n".join(numbered)
+
+
+def _final_mode_text(value: Any) -> str:
+    """Rephrase brainstorm-phase vocabulary for use in final-proof prompts.
+
+    ``value`` is coerced with ``str(value or "")``. The ``need_more_brainstorming``
+    token and the three casings of "brainstorm" are replaced in a fixed order,
+    then attempt-count phrasing is removed via ``_remove_attempt_count_language``.
+    """
+    rewritten = str(value or "")
+    # Order matters: the full token must be replaced before the bare word.
+    substitutions = (
+        ("need_more_brainstorming", "additional proof context"),
+        ("Brainstorm", "Proof memory"),
+        ("brainstorm", "proof memory"),
+        ("BRAINSTORM", "PROOF MEMORY"),
+    )
+    for needle, substitute in substitutions:
+        rewritten = rewritten.replace(needle, substitute)
+    return _remove_attempt_count_language(rewritten)
+
+
+def _remove_attempt_count_language(value: Any) -> str:
+    """Rewrite attempt-count phrasing into count-free wording.
+
+    ``value`` is coerced with ``str(value or "")``. Each rule is applied
+    case-insensitively, in order; afterwards runs of spaces are collapsed to
+    one and surrounding whitespace is stripped.
+
+    Rule order matters: a phrase-specific rule has to run before any generic
+    rule that matches part of the same phrase. Otherwise the generic rule
+    rewrites that part first and the specific rule can no longer match,
+    leaving the numeric count in the output.
+    """
+    text = str(value or "")
+    replacements = (
+        (
+            r"\bfailed\s+\d+\s+consecutive\s+verification/edit\s+attempts?\b",
+            "encountered repeated verification/edit failures",
+        ),
+        (r"\bfailed\s+\d+\s+consecutive\s+attempts?\b", "encountered repeated failures"),
+        (r"\bfailed\s+\d+\s+attempts?\b", "encountered repeated failures"),
+        (r"\bfailed\s+\d+\s+times\b", "encountered repeated failures"),
+        # Must precede the generic "failed attempts" rules below; if it ran after
+        # them, "with exactly 3 failed attempts" would keep its count.
+        (r"\bwith\s+exactly\s+\d+\s+failed\s+attempts?\b", "with recent proof-check failures"),
+        (r"\bafter\s+failed\s+attempts\b", "after recent proof-check failures"),
+        (r"\bfailed\s+attempts\b", "proof-check failures"),
+        (r"\battempts\s+\d+\s*-\s*\d+\b", "recent final-loop feedback"),
+        (r"\bUse this exact failed-attempt count[^.]*\.", ""),
+        (r"\bfailed-attempt count\b", "failure context"),
+    )
+    for pattern, replacement in replacements:
+        text = re.sub(pattern, replacement, text, flags=re.IGNORECASE)
+    return re.sub(r" {2,}", " ", text).strip()
+
+
+def _format_proof_memory_notes(ideas: list[str], limit: int = 80) -> str:
+    """Render the most recent accepted ideas as numbered proof-memory notes.
+
+    Only the last ``limit`` ideas are shown, renumbered from 1, and each one
+    is passed through ``_final_mode_text``. A header line is added when older
+    ideas were left out.
+    """
+    if not ideas:
+        return "[No accepted proof memory notes yet.]"
+    recent = ideas[-limit:]
+    header = ""
+    if len(recent) != len(ideas):
+        header = f"[Showing most recent {len(recent)} accepted proof memory notes.]\n"
+    numbered = [
+        f"{position}. {_final_mode_text(note)}"
+        for position, note in enumerate(recent, start=1)
+    ]
+    return header + "\n".join(numbered)
+
+
+def _format_verified_subproofs(subproofs: list[dict[str, Any]]) -> str:
+    """Render verified subproof records as newline-joined text blocks.
+
+    Each block lists the request, role, theorem/lemma, optional Lean verifier
+    feedback (only when non-blank), the Lean code, and a ``---`` separator.
+    Returns a placeholder line when ``subproofs`` is empty.
+    """
+    if not subproofs:
+        return "[No verified subproofs yet.]"
+    rendered = []
+    for number, record in enumerate(subproofs, start=1):
+        feedback = str(record.get("lean_feedback") or "").strip()
+        lines = [
+            f"SUBPROOF {number}: {record.get('request', '')}",
+            f"Role: {record.get('role', '')}",
+            f"Theorem/Lemma: {record.get('theorem_or_lemma', '')}",
+        ]
+        if feedback:
+            lines.extend(("Lean verifier feedback:", feedback))
+        lines.extend(("Verified Lean 4 code:", record.get("lean_code", ""), "---"))
+        rendered.append("\n".join(lines))
+    return "\n".join(rendered)
+
+
+def _format_verified_subproofs_for_final(subproofs: list[dict[str, Any]]) -> str:
+    """Render verified subproofs for final-proof prompts.
+
+    Same block layout as the general subproof formatter but without the role
+    line, and with the request, theorem/lemma and Lean feedback passed through
+    ``_final_mode_text``. The Lean code itself is emitted unchanged.
+    """
+    if not subproofs:
+        return "[No verified subproofs yet.]"
+    rendered = []
+    for number, record in enumerate(subproofs, start=1):
+        feedback = _final_mode_text(record.get("lean_feedback") or "").strip()
+        lines = [
+            f"SUBPROOF {number}: {_final_mode_text(record.get('request', ''))}",
+            f"Theorem/Lemma: {_final_mode_text(record.get('theorem_or_lemma', ''))}",
+        ]
+        if feedback:
+            lines.extend(("Lean verifier feedback:", feedback))
+        lines.extend(("Verified Lean 4 code:", record.get("lean_code", ""), "---"))
+        rendered.append("\n".join(lines))
+    return "\n".join(rendered)
+
+
+def _format_partial_proofs(partial_proofs: list[dict[str, Any]], limit: int = 8) -> str:
+    """Render the most recent partial proof scaffolds as newline-joined blocks.
+
+    Only the last ``limit`` records are shown, renumbered from 1. Placeholder
+    tokens are comma-joined, falling back to ``unknown`` when none are listed.
+    Returns a placeholder line when ``partial_proofs`` is empty.
+    """
+    if not partial_proofs:
+        return "[No accepted partial proof scaffolds yet.]"
+    rendered = []
+    for number, record in enumerate(partial_proofs[-limit:], start=1):
+        token_list = ", ".join(record.get("placeholder_tokens") or [])
+        placeholders = token_list or "unknown"
+        lines = (
+            f"PARTIAL PROOF {number}: {record.get('request', '')}",
+            f"Target: {record.get('target', '')}; placeholders: {placeholders}",
+            f"Summary: {record.get('summary', '')}",
+            "Lean-accepted incomplete scaffold:",
+            record.get("lean_code", ""),
+            "---",
+        )
+        rendered.append("\n".join(lines))
+    return "\n".join(rendered)
+
+
+def _format_partial_proofs_for_final(partial_proofs: list[dict[str, Any]], limit: int = 8) -> str:
+    """Render the most recent partial proof scaffolds for final-proof prompts.
+
+    Only the last ``limit`` records are shown, renumbered from 1. The request
+    and summary are passed through ``_final_mode_text``; the target is not
+    included, and the Lean code is emitted unchanged.
+    """
+    if not partial_proofs:
+        return "[No accepted partial proof scaffolds yet.]"
+    rendered = []
+    for number, record in enumerate(partial_proofs[-limit:], start=1):
+        token_list = ", ".join(record.get("placeholder_tokens") or [])
+        placeholders = token_list or "unknown"
+        lines = (
+            f"PARTIAL PROOF {number}: {_final_mode_text(record.get('request', ''))}",
+            f"Placeholders: {placeholders}",
+            f"Summary: {_final_mode_text(record.get('summary', ''))}",
+            "Lean-accepted incomplete scaffold:",
+            record.get("lean_code", ""),
+            "---",
+        )
+        rendered.append("\n".join(lines))
+    return "\n".join(rendered)
+
+
+def _format_failures(failures: list[dict[str, Any]], limit: int = 10) -> str:
+    """Render the most recent failure records as a numbered list.
+
+    Only the last ``limit`` records are shown, renumbered from 1. Each entry
+    is ``<request> :: <error summary>`` with attempt-count phrasing removed,
+    followed by an indented Lean feedback line when that field is non-blank.
+    """
+    if not failures:
+        return "[No useful failed proof feedback yet.]"
+    rendered = []
+    for position, record in enumerate(failures[-limit:], start=1):
+        request_text = _remove_attempt_count_language(record.get("request", "final proof"))
+        summary_text = _remove_attempt_count_language(record.get("error_summary", ""))
+        headline = f"{position}. {request_text} :: {summary_text}"
+        feedback = str(record.get("lean_feedback") or "").strip()
+        detail = (
+            f"\n   Lean feedback: {_remove_attempt_count_language(feedback)}"
+            if feedback
+            else ""
+        )
+        rendered.append(headline + detail)
+    return "\n".join(rendered)
+
+
+def _format_feedback_notes(failures: list[dict[str, Any]], limit: int = 10) -> str:
+    """Render recent failure records as unnumbered feedback notes.
+
+    Only the last ``limit`` records are considered. A record that mentions a
+    brainstorm phase marker is skipped unless its text also contains concrete
+    execution feedback. Surviving notes contain the error summary (falling
+    back to ``error_output``) and, when present, a Lean feedback line, both
+    passed through ``_final_mode_text``. Notes are separated by ``---`` rules.
+    """
+    no_feedback = "[No recent proof feedback available.]"
+    if not failures:
+        return no_feedback
+    notes = []
+    for record in failures[-limit:]:
+        request = str(record.get("request") or "").strip()
+        error_summary = str(record.get("error_summary") or record.get("error_output") or "").strip()
+        lean_feedback = str(record.get("lean_feedback") or "").strip()
+        # The request is only used for noise detection; it is not echoed back.
+        haystack = "\n".join(filter(None, (request, error_summary, lean_feedback))).lower()
+        is_phase_noise = (
+            "need_more_brainstorming" in haystack or "stuck_needs_brainstorm" in haystack
+        )
+        if is_phase_noise and not _has_concrete_execution_feedback(haystack):
+            continue
+        note_lines = []
+        summary_text = _final_mode_text(error_summary)
+        if summary_text:
+            note_lines.append(summary_text)
+        if lean_feedback:
+            note_lines.append(f"Lean feedback: {_final_mode_text(lean_feedback)}")
+        if note_lines:
+            notes.append("\n".join(note_lines))
+    if not notes:
+        return no_feedback
+    return "\n\n---\n\n".join(notes)
+
+
+def _has_concrete_execution_feedback(text: str) -> bool:
+    """Return ``True`` when ``text`` contains any known concrete-feedback term.
+
+    Matching is a case-insensitive substring check; a falsy ``text`` is
+    treated as empty and yields ``False``.
+    """
+    haystack = str(text or "").lower()
+    for marker in (
+        "old_string",
+        "unexpected token",
+        "missing cases",
+        "unsolved goals",
+        "error:",
+        "rejected",
+        "invalid",
+        "json",
+        "max_tokens",
+        "lean",
+        "verification",
+        "watchdog",
+    ):
+        if marker in haystack:
+            return True
+    return False
+
+
+def _clip_prompt_field(value: Any, limit: int = 1200) -> str:
+    """Normalize ``value`` with ``_final_mode_text`` and clip it to about ``limit`` characters.
+
+    Text no longer than ``limit`` is returned stripped and otherwise unchanged.
+    Longer text is cut at ``limit - 20`` characters, right-stripped, and
+    suffixed with a truncation marker.
+    """
+    cleaned = _final_mode_text(value).strip()
+    fits = len(cleaned) <= limit
+    if fits:
+        return cleaned
+    head = cleaned[: limit - 20].rstrip()
+    return head + " ... [truncated]"
+
+
+def _format_recent_final_attempts(attempts: list[dict[str, Any]], limit: int = 5) -> str:
+    """Render the most recent final-attempt records as feedback items.
+
+    The last ``limit`` entries are taken first and non-dict entries are then
+    discarded. Each field is clipped with ``_clip_prompt_field``; lines for
+    blank fields are omitted. Items are separated by ``---`` rules.
+    """
+    recent = [entry for entry in (attempts or [])[-limit:] if isinstance(entry, dict)]
+    if not recent:
+        return "[No recent final feedback recorded.]"
+    items = []
+    for number, entry in enumerate(recent, start=1):
+        request = _clip_prompt_field(entry.get("request") or "final proof feedback", limit=300)
+        error_summary = _clip_prompt_field(
+            entry.get("error_summary") or entry.get("error_output") or "",
+            limit=1400,
+        )
+        lean_feedback = _clip_prompt_field(entry.get("lean_feedback") or "", limit=1000)
+        reasoning = _clip_prompt_field(entry.get("reasoning") or "", limit=800)
+        optional_lines = (
+            f"Result/error: {error_summary}" if error_summary else "",
+            f"Lean feedback: {lean_feedback}" if lean_feedback else "",
+            f"Prior solver reasoning: {reasoning}" if reasoning else "",
+        )
+        item_lines = [f"FEEDBACK ITEM {number}: {request}"]
+        item_lines.extend(line for line in optional_lines if line)
+        items.append("\n".join(item_lines))
+    return "\n\n---\n\n".join(items)
+
+
+def _format_context_blocks(context_blocks: dict[str, str] | None, fallback: str) -> str:
+    """Assemble the allocated context sections into one prompt block.
+
+    Sections are emitted in a fixed order and separated by blank lines. The
+    working proof attempt and current final-cycle packet are included as-is;
+    the remaining sections get a heading. Blank or missing sections are
+    skipped, and ``fallback`` is returned when ``context_blocks`` is falsy or
+    every section is blank.
+    """
+    if not context_blocks:
+        return fallback
+
+    def _stripped(key: str) -> str:
+        return (context_blocks.get(key) or "").strip()
+
+    working_proof = _stripped("current_working_proof_attempt")
+    current_packet = _stripped("current_final_cycle_packet")
+    direct_context = _stripped("direct_proof_context")
+    rag_context = _stripped("rag_evidence_context")
+    refuted_warnings = _stripped("refuted_construction_warnings")
+    capped_feedback = _stripped("capped_rejection_feedback")
+
+    candidates = (
+        working_proof,
+        current_packet,
+        f"DIRECT PROOF CONTEXT:\n{direct_context}" if direct_context else "",
+        f"RETRIEVED LEANOJ RAG EVIDENCE:\n{rag_context}" if rag_context else "",
+        (
+            "REFUTED CONSTRUCTIONS - DO NOT USE AS PROOF EVIDENCE:\n"
+            f"{refuted_warnings}"
+        )
+        if refuted_warnings
+        else "",
+        f"CAPPED REJECTION FEEDBACK:\n{capped_feedback}" if capped_feedback else "",
+    )
+    sections = [section for section in candidates if section]
+    if not sections:
+        return fallback
+    return "\n\n".join(sections)
+
+
+def build_topic_candidate_prompt(user_prompt: str, lean_template: str, prior_topics: list[str]) -> str:
+    """Build the prompt that asks for one candidate root foundation topic.
+
+    Args:
+        user_prompt: Problem text inserted under ``USER PROBLEM``.
+        lean_template: Lean template inserted under ``LEANOJ TEMPLATE``.
+        prior_topics: Already validated topics, rendered as a numbered list
+            under ``PRIOR VALIDATED TOPICS``.
+
+    Returns:
+        The full prompt text, ending with the JSON rules and the expected
+        ``{"topic", "reasoning"}`` response shape.
+    """
+    # NOTE(review): the obligations list hard-codes `answer n` and
+    # `IsGreatest (S n) (answer n)`; confirm every template has that shape.
+    return f"""You are generating one candidate root foundation question for a LeanOJ proof-solving run.
+
+The system must solve the user's Lean 4 template completely. Propose a broad initial foundation question that can guide the entire session before recursive brainstorms add details. This is not a local sublemma target: it should set the durable direction for finding the complete solution.
+
+The topic must address ALL major solution obligations:
+- Determine an explicit formula/value for `answer n`.
+- Find or verify the extremal lower-bound construction.
+- Prove the matching upper bound.
+- Respect the exact LeanOJ template semantics, including Lean/Nat behavior.
+- Identify a Mathlib-compatible Lean 4 formalization route for `IsGreatest (S n) (answer n)`.
+
+Reject narrow framing in your own generation. Do not return a topic that is only about one lemma, one tactic, one bound, one construction, small-case testing alone, or repairing a current proof attempt.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+PRIOR VALIDATED TOPICS:
+{_format_items(prior_topics)}
+
+Return a new non-duplicative broad foundation topic. It should read like a general question that addresses the whole problem and can remain locked as the initial session foundation. If prior topics already cover the same root framing, choose a distinct foundation angle that still covers all obligations, such as exact-template semantics first, extremal-combinatorics first, or Lean-formalization architecture first.
+
+Correct topic style:
+{{"topic": "Determine a complete Lean 4 solution strategy for the exact LeanOJ template, including the explicit answer formula, extremal construction, upper-bound proof, template-semantics checks, and Mathlib formalization route.", "reasoning": "This covers every obligation needed for the final LeanOJ proof."}}
+
+Wrong topic style:
+{{"topic": "Find a useful divisibility lemma for complex numbers.", "reasoning": "This is too narrow because it targets only one possible lemma and does not address the full solution foundation."}}
+
+{JSON_RULES}
+JSON format:
+{{"topic": "broad foundation topic", "reasoning": "why this topic sets the best foundation for solving the whole Lean template"}}
+"""
+
+
+def build_topic_validation_prompt(user_prompt: str, lean_template: str, topic: str, accepted_topics: list[str]) -> str:
+    """Build the prompt that validates a single proposed foundation topic.
+
+    Args:
+        user_prompt: Problem text inserted under ``USER PROBLEM``.
+        lean_template: Lean template inserted under ``LEANOJ TEMPLATE``.
+        topic: The proposed topic, inserted verbatim under ``PROPOSED TOPIC``.
+        accepted_topics: Topics accepted so far, rendered as a numbered list
+            under ``ACCEPTED TOPICS``.
+
+    Returns:
+        The full prompt text, ending with the JSON rules and the expected
+        ``{"decision", "reasoning", "summary"}`` response shape.
+    """
+    return f"""You are validating a proposed LeanOJ initial foundation topic.
+
+Accept only if the topic is relevant to solving the user's exact Lean 4 template, non-duplicative, and broad enough to serve as the locked initial session foundation.
+
+The topic must address ALL major solution obligations:
+- An explicit formula/value for `answer n`.
+- A lower-bound construction.
+- A matching upper-bound proof.
+- Exact LeanOJ template semantics, including Lean/Nat behavior.
+- A Lean 4 / Mathlib formalization route for `IsGreatest (S n) (answer n)`.
+
+Reject topics that are narrow, partial, or local: one sublemma, one tactic, one bound, one construction, small-case testing alone, or current-proof repair. Those belong in recursive brainstorms after the foundation exists, not in initial topic selection.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ACCEPTED TOPICS:
+{_format_items(accepted_topics)}
+
+PROPOSED TOPIC:
+{topic}
+
+Correct acceptance target:
+{{"decision": "accept", "reasoning": "The topic covers answer formula, construction, upper bound, template semantics, and Lean formalization.", "summary": "Broad foundation topic."}}
+
+Required rejection target for narrow topics:
+{{"decision": "reject", "reasoning": "The topic asks for one divisibility lemma.", "summary": "Invalid because this is a narrow sublemma topic, not a whole-problem foundation."}}
+
+{JSON_RULES}
+JSON format:
+{{"decision": "accept or reject", "reasoning": "brief validation reasoning", "summary": "short feedback if rejected"}}
+"""
+
+
+def build_topic_batch_validation_prompt(
+    user_prompt: str,
+    lean_template: str,
+    topics: list[str],
+    accepted_topics: list[str],
+) -> str:
+    """Build the prompt that validates several proposed foundation topics at once.
+
+    Args:
+        user_prompt: Problem text inserted under ``USER PROBLEM``.
+        lean_template: Lean template inserted under ``LEANOJ TEMPLATE``.
+        topics: Proposed topics; each is labelled ``TOPIC <n>`` (1-based) and
+            the entries are separated by ``---`` rules.
+        accepted_topics: Topics accepted so far, rendered as a numbered list
+            under ``CURRENT ACCEPTED TOPICS``.
+
+    Returns:
+        The full prompt text, ending with the JSON rules and the expected
+        ``{"decisions": [...]}`` response shape.
+    """
+    # Number the topics so the validator can refer back via "topic_number".
+    formatted_topics = "\n\n---\n\n".join(
+        f"TOPIC {index}:\n{topic}"
+        for index, topic in enumerate(topics, start=1)
+    )
+    return f"""You are the single validator for cumulative LeanOJ initial foundation topics.
+
+Evaluate EACH proposed topic independently against the current accepted topic context, then check accepted topics for intra-batch redundancy. Accept only topics that are relevant to solving the user's exact Lean 4 template, non-duplicative, and broad enough to serve as the locked initial session foundation.
+
+Each accepted topic must address ALL major solution obligations:
+- An explicit formula/value for `answer n`.
+- A lower-bound construction.
+- A matching upper-bound proof.
+- Exact LeanOJ template semantics, including Lean/Nat behavior.
+- A Lean 4 / Mathlib formalization route for `IsGreatest (S n) (answer n)`.
+
+CRITICAL:
+- Judge each topic against CURRENT ACCEPTED TOPICS first, not against the other topics in this batch.
+- Only after independent decisions, compare independently accepted topics against each other.
+- If two accepted topics are redundant with each other, keep the stronger/more concrete one and reject the weaker one with an intra-batch redundancy summary.
+- Reject narrow or partial initial topics even if they would be useful later: one sublemma, one tactic, one bound, one construction, small-case testing alone, or current-proof repair.
+- Return exactly one decision object per topic, in the same order.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+CURRENT ACCEPTED TOPICS:
+{_format_items(accepted_topics)}
+
+TOPICS TO VALIDATE:
+{formatted_topics}
+
+Correct acceptance target:
+{{"topic_number": 1, "decision": "accept", "reasoning": "The topic covers the full answer formula, construction, upper bound, exact template semantics, and Lean formalization route.", "summary": "Broad foundation topic."}}
+
+Required rejection target for narrow topics:
+{{"topic_number": 1, "decision": "reject", "reasoning": "The topic asks for one useful tactic or helper lemma.", "summary": "Invalid because this is too narrow for initial topic selection."}}
+
+{JSON_RULES}
+JSON format:
+{{"decisions": [{{"topic_number": 1, "decision": "accept or reject", "reasoning": "validation reasoning", "summary": "short rejection or acceptance summary"}}]}}
+"""
+
+
+def build_topic_selection_prompt(user_prompt: str, lean_template: str, topics: list[str]) -> str:
+    """Build the prompt that selects the locked initial foundation topic.
+
+    Args:
+        user_prompt: Problem text inserted under ``USER PROBLEM``.
+        lean_template: Lean template inserted under ``LEANOJ TEMPLATE``.
+        topics: Validated topics to choose from, rendered as a numbered list
+            under ``VALIDATED TOPICS``.
+
+    Returns:
+        The full prompt text, ending with the JSON rules and the expected
+        ``{"topic", "reasoning"}`` response shape. The prompt also allows the
+        model to propose a replacement topic instead of picking one.
+    """
+    return f"""You are selecting the locked initial foundation topic for a LeanOJ proof-solving run.
+
+Choose exactly one of the validated topics below, or propose a clearly better replacement topic. The chosen topic must maximize the chance of solving the Lean 4 template by setting a broad root direction for the whole session.
+
+The selected topic will be treated as the initial frozen foundation that recursive brainstorms build on. It must not be a narrow sublemma, tactic-only investigation, one-bound-only question, one-construction-only question, small-case-only check, or current-proof repair target.
+
+The selected topic must address ALL major solution obligations:
+- Determine an explicit formula/value for `answer n`.
+- Establish the extremal lower-bound construction.
+- Prove the matching upper bound.
+- Respect exact LeanOJ template semantics, including Lean/Nat behavior.
+- Set a Mathlib-compatible Lean 4 formalization route for `IsGreatest (S n) (answer n)`.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+VALIDATED TOPICS:
+{_format_items(topics)}
+
+Correct selected-topic style:
+{{"topic": "Determine a complete Lean 4 solution strategy for the exact LeanOJ template, including the explicit answer formula, extremal construction, upper-bound proof, template-semantics checks, and Mathlib formalization route.", "reasoning": "This is broad enough to anchor the session and leaves recursive brainstorms to fill in details."}}
+
+Wrong selected-topic style:
+{{"topic": "Prove one helper divisibility lemma.", "reasoning": "This is too narrow because it cannot serve as the locked foundation for the whole problem."}}
+
+{JSON_RULES}
+JSON format:
+{{"topic": "selected or improved broad foundation topic", "reasoning": "why this is the best locked initial foundation for solving the whole Lean template"}}
+"""
+
+
+def build_brainstorm_prompt(
+    user_prompt: str,
+    lean_template: str,
+    active_topic: str,
+    accepted_ideas: list[str],
+    verified_subproofs: list[dict[str, Any]],
+    failed_feedback: list[dict[str, Any]],
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    """Build the brainstorm-submitter prompt for one idea or Lean proof candidate.
+
+    Args:
+        user_prompt: Problem text inserted under ``USER PROBLEM``.
+        lean_template: Lean template inserted under ``LEANOJ TEMPLATE``.
+        active_topic: Topic inserted verbatim under ``ACTIVE TOPIC``.
+        accepted_ideas: Accepted ideas; used only in the fallback context.
+        verified_subproofs: Verified subproof records; fallback context only.
+        failed_feedback: Failure records; fallback context only.
+        context_blocks: Optional pre-allocated context sections. When at least
+            one section is non-blank they replace the fallback context.
+
+    Returns:
+        The full prompt text, ending with the JSON rules and the two accepted
+        response shapes (``idea`` and ``lean_proof``).
+    """
+    # Built unconditionally; only used when context_blocks yields no sections.
+    fallback_context = f"""ACCEPTED BRAINSTORM CONTEXT:
+{_format_brainstorm(accepted_ideas)}
+
+VERIFIED SUBPROOFS:
+{_format_verified_subproofs(verified_subproofs)}
+
+USEFUL FAILED PROOF FEEDBACK:
+{_format_failures(failed_feedback)}"""
+    return f"""You are a LeanOJ proof brainstorm submitter. Generate one concrete idea that helps solve the user's Lean 4 template.
+
+Focus on exact Lean tactics, Mathlib lemmas, theorem-shaping, induction/cases structure, or mathematical transformations. If a current working proof attempt is provided, treat ACTIVE TOPIC as that exact proof-repair target. Brainstorm only information that directly helps complete or repair it; if a direct solution is unavailable, give the nearest concrete step that works toward solving that exact proof.
+
+If you can produce a complete Lean 4 proof for a useful sublemma or proof fragment, you may choose `submission_type: "lean_proof"`. The system will run Lean 4 first, give you up to 5 repair attempts with Lean feedback, and only then send the Lean-verified proof to the normal brainstorm validator. Do not use `sorry`, `admit`, or fake `axiom`/`constant`/`opaque` devices.
+
+Do not write a whole final proof unless the idea is directly useful as context. Final template solving still happens in the final loop.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ACTIVE TOPIC:
+{active_topic}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+{JSON_RULES}
+JSON format for a normal idea:
+{{"submission_type": "idea", "submission": "one concrete proof-solving idea", "reasoning": "why it advances the LeanOJ solution"}}
+
+JSON format for a Lean proof candidate:
+{{"submission_type": "lean_proof", "theorem_statement": "natural-language statement proved", "formal_sketch": "why this proof fragment helps the LeanOJ template", "theorem_name": "optional Lean declaration name", "lean_code": "complete Lean 4 code", "reasoning": "why this verified proof would help"}}
+"""
+
+
+def build_brainstorm_validation_prompt(
+    user_prompt: str,
+    lean_template: str,
+    submission: str,
+    accepted_ideas: list[str],
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    """Build the prompt that validates a single brainstorm submission.
+
+    Args:
+        user_prompt: Problem text inserted under ``USER PROBLEM``.
+        lean_template: Lean template inserted under ``LEANOJ TEMPLATE``.
+        submission: The submission text, inserted verbatim under ``SUBMISSION``.
+        accepted_ideas: Accepted ideas; used only in the fallback context.
+        context_blocks: Optional pre-allocated context sections. When at least
+            one section is non-blank they replace the fallback context.
+
+    Returns:
+        The full prompt text, ending with the JSON rules and the expected
+        ``{"decision", "context_role", "reasoning", "summary"}`` response shape.
+    """
+    # Built unconditionally; only used when context_blocks yields no sections.
+    fallback_context = f"CURRENT ACCEPTED IDEAS:\n{_format_brainstorm(accepted_ideas)}"
+    return f"""You are the single validator for a cumulative LeanOJ proof-solving brainstorm.
+
+Accept the submission only if it adds useful, non-redundant information for solving the exact Lean template. Reject vague encouragement, duplicate ideas, or claims unrelated to Lean verification.
+
+If the submission contains [LEAN 4 VERIFIED BRAINSTORM PROOF], Lean 4 and MOTO integrity checks already accepted the code. Your job is still to decide whether the verified proof is useful, relevant, and non-redundant for this LeanOJ brainstorm. Do not re-prove Lean correctness, and do not accept irrelevant/trivial proofs merely because Lean verified them.
+
+Classify accepted submissions for later final-proof context:
+- active_plan: a concrete current proof route, decomposition plan, or next obligation that should guide `master_proof.lean`.
+- verified_hint: a reusable verified lemma or exact Lean tactic fact.
+- refuted_construction: a failed construction/counterexample/route warning. This is useful only as "do not use" feedback and must not be treated as proof evidence.
+- scratch: useful exploratory context that should not be direct final-proof context.
+
+Use `scratch` unless the submission clearly fits one of the narrower roles. Do not default to `active_plan`.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+SUBMISSION:
+{submission}
+
+{JSON_RULES}
+JSON format:
+{{"decision": "accept", "context_role": "scratch", "reasoning": "validation reasoning", "summary": "short rejection or acceptance summary"}}
+"""
+
+
+def build_brainstorm_batch_validation_prompt(  # Build the prompt for validating a batch of brainstorm submissions in one model call.
+    user_prompt: str,
+    lean_template: str,
+    submissions: list[str],
+    accepted_ideas: list[str],
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    formatted_submissions = "\n\n---\n\n".join(  # 1-based labels, like the submission_number in the JSON format below
+        f"SUBMISSION {index}:\n{submission}"
+        for index, submission in enumerate(submissions, start=1)
+    )
+    fallback_context = f"CURRENT ACCEPTED IDEAS:\n{_format_brainstorm(accepted_ideas)}"  # handed to _format_context_blocks together with context_blocks
+    return f"""You are the single validator for a cumulative LeanOJ proof-solving brainstorm.
+
+Evaluate EACH submission independently against the current accepted brainstorm context, then check accepted submissions for intra-batch redundancy. Accept only submissions that add useful, non-redundant information for solving the exact Lean template. Reject vague encouragement, duplicate ideas, or claims unrelated to Lean verification.
+
+If a submission contains [LEAN 4 VERIFIED BRAINSTORM PROOF], Lean 4 and MOTO integrity checks already accepted the code. Still decide whether that verified proof is useful, relevant, and non-redundant for this LeanOJ brainstorm.
+
+For each accepted submission, classify how it may be used later:
+- active_plan: a concrete current proof route, decomposition plan, or next obligation that should guide `master_proof.lean`.
+- verified_hint: a reusable verified lemma or exact Lean tactic fact.
+- refuted_construction: a failed construction/counterexample/route warning. This is useful only as "do not use" feedback and must not be treated as proof evidence.
+- scratch: useful exploratory context that should not be direct final-proof context.
+
+Use `scratch` unless the submission clearly fits one of the narrower roles. Do not default to `active_plan`.
+
+CRITICAL:
+- Judge each submission against CURRENT ACCEPTED IDEAS first, not against the other submissions in this batch.
+- Only after independent decisions, compare independently accepted submissions against each other.
+- If two accepted submissions are redundant with each other, keep the stronger/more concrete one and reject the weaker one with an intra-batch redundancy summary.
+- Return exactly one decision object per submission, in the same order.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+SUBMISSIONS TO VALIDATE:
+{formatted_submissions}
+
+{JSON_RULES}
+JSON format:
+{{"decisions": [{{"submission_number": 1, "decision": "accept", "context_role": "scratch", "reasoning": "validation reasoning", "summary": "short rejection or acceptance summary"}}]}}
+"""
+
+
+def build_brainstorm_prune_review_prompt(  # Build the prompt asking for at most one prune operation (none/delete/edit/add) on the accepted ideas.
+    user_prompt: str,
+    lean_template: str,
+    active_topic: str,
+    accepted_ideas: list[str],  # rendered twice: inside fallback_context and under "ACCEPTED BRAINSTORM IDEAS TO REVIEW"
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    fallback_context = f"CURRENT ACCEPTED IDEAS:\n{_format_brainstorm(accepted_ideas)}"  # handed to _format_context_blocks together with context_blocks
+    return f"""You are checking whether any LeanOJ brainstorm memory should be removed or updated because it is outdated, redundant, wrong, harmful, superseded, or missing proof-solving information.
+
+You may propose AT MOST ONE operation. Do not force a removal: choose "none" unless one operation clearly improves the proof-solving database.
+
+Allowed actions:
+- "none": no change is needed.
+- "delete": remove one accepted idea that is outdated, wrong, harmful, redundant with stronger retained context, or now superseded.
+- "edit": replace one accepted idea with a more accurate version, especially when it removes outdated or redundant content while preserving unique proof-solving value.
+- "add": add one compact corrective insight that is now clearly needed.
+
+Do not prune merely for style. Keep any idea that still provides unique proof-solving value. The question is whether any single idea should be removed or updated due to being outdated, redundant, wrong, harmful, or superseded; if not, return "none".
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ACTIVE TOPIC:
+{active_topic}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+ACCEPTED BRAINSTORM IDEAS TO REVIEW:
+{_format_brainstorm(accepted_ideas)}
+
+{JSON_RULES}
+JSON format:
+{{"action": "none", "idea_index": null, "new_content": "", "reasoning": "why no prune is needed or why this one operation improves the database"}}
+"""
+
+
+def build_brainstorm_prune_validation_prompt(  # Build the validator prompt that accepts or rejects one proposed prune operation.
+    user_prompt: str,
+    lean_template: str,
+    active_topic: str,
+    accepted_ideas: list[str],  # rendered twice: inside fallback_context and under "CURRENT ACCEPTED IDEAS"
+    operation: dict[str, Any],  # interpolated as-is, so the prompt shows the dict's default string form, not JSON
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    fallback_context = f"CURRENT ACCEPTED IDEAS:\n{_format_brainstorm(accepted_ideas)}"  # handed to _format_context_blocks together with context_blocks
+    return f"""You are the single validator for a proposed LeanOJ brainstorm prune operation.
+
+Validate ONLY whether this operation improves the proof-solving brainstorm database for the exact Lean template and active topic. Use a conservative default: reject if uncertain.
+
+ACCEPT delete only if the selected idea is outdated, wrong, harmful, redundant with stronger retained context, or superseded by stronger retained context.
+ACCEPT edit only if the replacement is materially more accurate and still useful, including when it removes outdated or redundant content while preserving unique proof-solving value.
+ACCEPT add only if the new content is concrete, non-redundant, and directly useful for the proof.
+REJECT vague, stylistic, speculative, or risky changes.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ACTIVE TOPIC:
+{active_topic}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+CURRENT ACCEPTED IDEAS:
+{_format_brainstorm(accepted_ideas)}
+
+PROPOSED OPERATION:
+{operation}
+
+{JSON_RULES}
+JSON format:
+{{"decision": "reject", "reasoning": "why this prune operation should be accepted or rejected"}}
+"""
+
+
+def build_sufficiency_prompt(  # Build the prompt asking whether the accumulated context is enough to start the final proof loop.
+    user_prompt: str,
+    lean_template: str,
+    accepted_ideas: list[str],
+    verified_subproofs: list[dict[str, Any]],
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    fallback_context = f"""ACCEPTED BRAINSTORM CONTEXT:
+{_format_brainstorm(accepted_ideas)}
+
+VERIFIED SUBPROOFS:
+{_format_verified_subproofs(verified_subproofs)}"""  # handed to _format_context_blocks together with context_blocks
+    return f"""You are deciding whether there is enough context to attempt solving the user's LeanOJ template now.
+
+This is not final proof validation. Lean 4 will validate the actual proof. Decide whether the accumulated context is likely sufficient to start the final proof loop.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+{JSON_RULES}
+JSON format:
+{{"enough": true, "reasoning": "why the final loop should or should not start"}}
+"""
+
+
+def build_path_decision_prompt(  # Build the prompt that picks the next state: solve_final_now or need_more_brainstorming.
+    user_prompt: str,
+    lean_template: str,
+    accepted_ideas: list[str],
+    verified_subproofs: list[dict[str, Any]],
+    failed_feedback: list[dict[str, Any]],
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    fallback_context = f"""ACCEPTED BRAINSTORM CONTEXT:
+{_format_brainstorm(accepted_ideas)}
+
+VERIFIED SUBPROOFS:
+{_format_verified_subproofs(verified_subproofs)}
+
+USEFUL FAILED PROOF FEEDBACK:
+{_format_failures(failed_feedback)}"""  # handed to _format_context_blocks together with context_blocks
+    return f"""You are choosing the next path in a LeanOJ proof-solving state machine.
+
+There is no give-up state. Choose one:
+- solve_final_now: the system should attempt the final full Lean 4 solution.
+- need_more_brainstorming: more cumulative brainstorm context is needed.
+
+When solve_final_now is available, make this decision from the final proof solver's perspective: decide whether the dominant next move toward a solution is to enter the final Lean proof loop now. Since Lean-verified subproofs can now be generated during any brainstorm, defer only to more brainstorming when the final proof path is not yet the strongest next move.
+
+If the current proof memory includes a recent final-cycle packet or working-proof attempt caused by repeated stale `old_string` edits, no-progress watchdog feedback, placeholder/comment churn, or an unresolved missing lemma, choose `need_more_brainstorming` unless the allocated memory already contains fresh concrete proof content that directly resolves that blocker.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+{JSON_RULES}
+JSON format:
+{{"path": "solve_final_now", "reasoning": "why this path is required", "remaining_questions": ["optional missing questions"]}}
+"""
+
+
+def build_path_validation_prompt(  # Build the validator prompt that accepts or rejects a proposed path decision.
+    user_prompt: str,
+    lean_template: str,
+    proposed_path: str,  # shown verbatim under "PROPOSED PATH"
+    proposed_reasoning: str,  # shown verbatim under "PROPOSED REASONING"
+    accepted_ideas: list[str],
+    verified_subproofs: list[dict[str, Any]],
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    fallback_context = f"""ACCEPTED BRAINSTORM CONTEXT:
+{_format_brainstorm(accepted_ideas)}
+
+VERIFIED SUBPROOFS:
+{_format_verified_subproofs(verified_subproofs)}"""  # handed to _format_context_blocks together with context_blocks
+    return f"""You are validating a LeanOJ path decision.
+
+Accept only if the proposed path is justified by the current proof-solving context. Reject decisions that try the final proof too early or request more brainstorming when the next proof action is already clear.
+
+VALID PATHS:
+- solve_final_now
+- need_more_brainstorming
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+PROPOSED PATH:
+{proposed_path}
+
+PROPOSED REASONING:
+{proposed_reasoning}
+
+{JSON_RULES}
+JSON format:
+{{"decision": "accept", "reasoning": "validation reasoning", "summary": "short rejection feedback if rejected", "corrected_path": "solve_final_now or need_more_brainstorming if rejected"}}
+"""
+
+def build_final_solver_prompt(  # Build the prompt for one edit step of the final master-proof editing loop.
+    user_prompt: str,
+    lean_template: str,
+    current_master_proof: str,  # when empty/falsy, the prompt shows lean_template in its place
+    master_proof_metadata: dict[str, Any],
+    accepted_ideas: list[str],
+    verified_subproofs: list[dict[str, Any]],
+    partial_proofs: list[dict[str, Any]],  # NOTE(review): never referenced in this function body
+    failed_feedback: list[dict[str, Any]],
+    final_attempts: list[dict[str, Any]],
+    context_blocks: dict[str, str] | None = None,
+) -> str:
+    metadata_lines = "\n".join(  # one "- key: value" line per entry; None and "" values are skipped
+        f"- {key}: {value}"
+        for key, value in (master_proof_metadata or {}).items()
+        if value not in (None, "")
+    ) or "[No master proof metadata available.]"
+    recent_final_feedback = _format_recent_final_attempts(final_attempts, limit=5)  # formatter is called with limit=5
+    fallback_context = f"""ACTIVE PROOF-PLAN NOTES:
+{_format_proof_memory_notes(accepted_ideas)}
+
+VERIFIED SUBPROOFS:
+{_format_verified_subproofs_for_final(verified_subproofs)}
+
+RECENT EXECUTION FEEDBACK - USE TO CHOOSE THE NEXT EDIT; DO NOT TREAT FAILED CODE AS PROVEN:
+{_format_feedback_notes(failed_feedback)}"""  # handed to _format_context_blocks together with context_blocks
+    return f"""You are in the final LeanOJ master-proof editing loop.
+
+Your task is to edit the durable master Lean 4 proof like a paper draft. Preserve the original imports and declarations unless changing them is necessary and allowed by the problem template. Replace required `sorry` holes with real Lean proofs over as many edit prompts as needed.
+
+Master proof route discipline:
+- `master_proof.lean` must contain the current chosen proof route only.
+- Do not append multiple competing constructions or abandoned approaches into the master proof.
+- If a route is refuted or superseded, replace it with the chosen route instead of keeping both.
+- Failed constructions may appear only as compact comments when they directly explain an active invariant; otherwise keep them out of the Lean file.
+- Use verified standalone lemmas and active proof-plan notes as positive context. Treat refuted-construction warnings only as "do not use" constraints, never as evidence for a proof route.
+
+Correction priority:
+- Required corrections take priority over new additions. Treat recent final feedback, Lean errors, exact-string edit rejections, edit-validator feedback, and semantic-review continuation feedback as the next correction targets.
+- If any correction is pending, your next edit must address that correction before attempting unrelated new lemmas, fresh proof routes, or speculative additions.
+- New additions are allowed only when they directly implement the required correction or provide helper code needed for that correction.
+- In your reasoning, name the correction you addressed. If no correction is pending, state which next unsolved proof obligation your edit advances.
+
+You must choose exactly one action: edit_proof.
+This final mode cannot request phase transitions, cannot delegate to planning, and cannot stop early. If the proof is incomplete, make the best concrete edit available and set "needs_more_time": true.
+
+Binary verification gate:
+- The system runs Lean after every proposed master proof edit before accepting it into the durable master proof.
+- If your edit is useful but the proof still needs more editing time, set "needs_more_time": true. Lean will check the edited file with placeholders allowed, and syntax/type errors will reject the edit.
+- If your edit should make the current master proof final-ready, set "needs_more_time": false. Lean will check the edited file with no placeholders allowed, then final integrity/review checks will run.
+- A master proof edit is not accepted merely because the string edit applies; it must pass the appropriate Lean gate first.
+- A Lean-accepted loophole may be useful intermediate progress, but it is not final-ready. For LeanOJ `answer` definitions, do not terminate with `answer` defined as `sSup`, `csSup`, `Nat.sSup`, `Sup`, or an equivalent maximum over the same feasible set. Final readiness requires an explicit formula/value for `answer n` and a proof that this formula is greatest.
+- A continuing edit must change non-comment Lean proof content in a way that discharges, splits, or materially advances an obligation. Do not spend an edit only rewriting comments, TODOs, placeholders, or "prepare for next edit" wording.
+
+Exact-string editing rules:
+- Use operation "full_content" only when replacing the whole master proof.
+- Use operation "replace", "insert_after", or "delete" for targeted edits.
+- For targeted edits, old_string must be copied verbatim from the CURRENT FULL MASTER PROOF and must appear exactly once in that full master proof.
+- Include enough surrounding Lean lines in old_string to make the match unique.
+- new_string must contain the replacement/insertion Lean code, except delete uses an empty new_string.
+- Never introduce fake `axiom`, `constant`, or `opaque` proof devices.
+- Final verification requires no `sorry`/`admit`, but intermediate master proof edits may preserve placeholders while you continue working.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE TO SOLVE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+CURRENT MASTER PROOF METADATA:
+{metadata_lines}
+
+RECENT FINAL FEEDBACK (USE TO AVOID REPEATING FAILED EDITS):
+{recent_final_feedback}
+
+CURRENT FULL MASTER PROOF TO EDIT (MANDATORY DIRECT-INJECT CONTEXT; NEVER TRUNCATED):
+{current_master_proof or lean_template}
+
+ALLOCATED LEANOJ PROOF MEMORY:
+{_format_context_blocks(context_blocks, fallback_context)}
+
+{JSON_RULES}
+JSON format for continuing edits:
+{{"action": "edit_proof", "needs_more_time": true, "operation": "replace", "old_string": "exact unique text from CURRENT MASTER PROOF", "new_string": "updated Lean code", "reasoning": "why this edit advances the proof and what remains"}}
+
+JSON format for final verification after this edit:
+{{"action": "edit_proof", "needs_more_time": false, "operation": "replace", "old_string": "exact unique text from CURRENT MASTER PROOF", "new_string": "updated Lean code expected to verify", "reasoning": "why the edited master proof should now pass Lean"}}
+"""
+
+
+def build_master_proof_edit_validation_prompt(  # Build the validator prompt that judges an edit which shortens the master proof.
+    user_prompt: str,
+    lean_template: str,
+    current_master_proof: str,  # shown under "CURRENT MASTER PROOF BEFORE EDIT"
+    proposed_master_proof: str,  # shown under "PROPOSED MASTER PROOF AFTER EDIT"
+    edit: dict[str, Any],  # read with .get for operation, needs_more_time, reasoning, old_string, new_string
+    metrics: dict[str, Any],
+) -> str:
+    metrics_lines = "\n".join(  # one "- key: value" line per entry; None and "" values are skipped
+        f"- {key}: {value}"
+        for key, value in (metrics or {}).items()
+        if value not in (None, "")
+    ) or "[No shortening metrics available.]"
+    return f"""You are the independent LeanOJ master-proof edit validator.
+
+The final Proof Solver proposed an edit that shortens the durable master proof. Your job is to decide whether this shortening is real proof progress or whether it deletes useful work because the solver is stuck, frustrated, restarting, or giving up.
+
+Accept only if the proposed shorter proof is genuinely progressive for solving the exact LeanOJ template:
+- It preserves or strengthens useful solved Lean content, definitions, lemmas, and proof structure.
+- It replaces removed material with equivalent or stronger proof content, or removes only clearly redundant/noisy material.
+- It still moves toward a complete Lean 4 proof of the original template.
+
+Reject if the edit goes backward:
+- It deletes useful proof progress, helper lemmas, explicit formulas, or developed argument structure without a stronger replacement.
+- It replaces concrete work with `sorry`, `admit`, comments, vague plans, or a reset toward the original template.
+- It looks like abandonment, frustration, a restart, or an attempt to make the file shorter by discarding hard obligations.
+- It bloats the master proof by accumulating multiple competing/refuted proof routes instead of maintaining one current chosen route.
+- It ignores a required correction in the proof and instead prioritizes unrelated new additions, fresh routes, or speculative helper material.
+
+If you reject, give precise feedback to the proof submitter. Name the content that must be restored or the exact kind of progressive replacement required.
+If corrections are required, your feedback must say that those corrections must be fixed before any new addition attempts. New additions are acceptable only when they directly implement the required correction.
+
+If you accept, give a clear justification that can be shown later alongside the old longer proof. This justification must explain:
+- WHY the validator allowed the shortening instead of requiring the longer attempt to be restored.
+- What the apparent issue was with the old longer attempt, such as redundant code, noisy scaffolding, a weaker route, or content replaced by stronger proof structure.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+PROPOSED EDIT:
+- operation: {edit.get("operation", "")}
+- needs_more_time: {edit.get("needs_more_time", "")}
+- solver_reasoning: {edit.get("reasoning", "")}
+- old_string:
+{edit.get("old_string", "")}
+
+- new_string:
+{edit.get("new_string", "")}
+
+SHORTENING METRICS:
+{metrics_lines}
+
+CURRENT MASTER PROOF BEFORE EDIT:
+{current_master_proof}
+
+PROPOSED MASTER PROOF AFTER EDIT:
+{proposed_master_proof}
+
+{JSON_RULES}
+JSON format if this shortening is progressive:
+{{"decision": "accept", "reasoning": "why this shorter edit preserves or improves proof progress", "shortening_approval_justification": "clear reason the validator allowed this shortening", "apparent_issue_with_old_attempt": "what was apparently wrong, redundant, noisy, or superseded in the old longer attempt", "feedback_to_submitter": ""}}
+
+JSON format if this shortening goes backward:
+{{"decision": "reject", "reasoning": "why this deletes progress or gives up", "feedback_to_submitter": "precise correction for the final solver"}}
+"""
+
+
+def build_final_solution_review_prompt(  # Build the prompt for the semantic review of a file that Lean has already accepted.
+    user_prompt: str,
+    lean_template: str,
+    lean_code: str,  # shown under "LEAN-ACCEPTED FINAL CODE"
+    final_solver_reasoning: str,  # an empty value renders as "[No final solver reasoning provided.]"
+    lean_feedback: str,  # an empty value renders as "Lean 4 accepted with no diagnostics."
+) -> str:
+    return f"""You are the final LeanOJ proof checker for a Lean-accepted submission.
+
+Lean 4 has already checked the code. Your job is NOT to re-run Lean or act as a planning validator. Your job is to decide whether this Lean-accepted file actually solves the user's LeanOJ problem prompt and template in the intended sense.
+
+Lean acceptance is necessary but not sufficient. Reject loopholes that satisfy the weak formal theorem while evading the natural-language task, such as defining an answer by taking a maximum/supremum over the same feasible set instead of determining the requested value in terms of n.
+
+Accept only if the code:
+- Preserves and solves the user's LeanOJ template.
+- Fully addresses the actual problem prompt, not merely a different formal statement.
+- Uses an answer/formulation that genuinely determines the requested object when the problem asks for an explicit value or formula.
+- Contains no placeholder proof devices or semantic shortcuts that should remain continuation context instead of the final stop condition.
+
+USER PROBLEM:
+{user_prompt}
+
+LEANOJ TEMPLATE:
+{lean_template}
+
+{LEANOJ_FORMALIZATION_GUARDRAILS}
+
+LEAN 4 FEEDBACK FROM THE ACCEPTED RUN:
+{lean_feedback or "Lean 4 accepted with no diagnostics."}
+
+FINAL SOLVER REASONING BEFORE LEAN CHECK:
+{final_solver_reasoning or "[No final solver reasoning provided.]"}
+
+LEAN-ACCEPTED FINAL CODE:
+{lean_code}
+
+{JSON_RULES}
+JSON format if this is truly solved:
+{{"solved": true, "reasoning": "why this Lean-accepted code completely solves the LeanOJ problem prompt and template"}}
+
+JSON format if this is not done:
+{{"solved": false, "continuation_feedback": "specific feedback explaining what is missing and what the next final solver attempt should fix", "reasoning": "why Lean acceptance is not enough here"}}
+"""
diff --git a/backend/shared/api_client_manager.py b/backend/shared/api_client_manager.py
index cfbbe7e..57cd383 100644
--- a/backend/shared/api_client_manager.py
+++ b/backend/shared/api_client_manager.py
@@ -9,6 +9,7 @@
 4. Per-task Toggle - Task ID based (legacy)
 """
 import asyncio
+import json
 import logging
 import time
 from typing import Dict, Any, List, Optional, Callable
@@ -26,18 +27,43 @@
 from backend.shared.config import rag_config, system_config
 from backend.shared.fastembed_provider import FASTEMBED_MODEL_NAME, FastEmbedProvider
 from backend.shared.free_model_manager import free_model_manager
+from backend.shared.json_parser import sanitize_model_output_for_retry_context
 from backend.shared.models import ModelConfig
 from backend.shared.token_tracker import token_tracker
 
 logger = logging.getLogger(__name__)
 
 
+def _response_shape_for_logging(response: Any) -> str:
+    """Describe only the structure of an upstream response for logs, never its provider/model text."""
+    if isinstance(response, list):
+        return f"type=list, length={len(response)}"
+    if not isinstance(response, dict):
+        return f"type={type(response).__name__}"
+    usage_field = response.get("usage")
+    usage_keys = sorted(str(name) for name in usage_field.keys()) if isinstance(usage_field, dict) else []
+    top_level_keys = sorted(str(name) for name in response.keys())
+    choices_present, error_present = bool(response.get("choices")), "error" in response
+    shape = f"type=dict, keys={top_level_keys}, choices_present={choices_present}, "
+    return shape + f"error_present={error_present}, usage_keys={usage_keys}"
+
+
 class APIClientManager:
     """
     Central manager for routing API calls to OpenRouter or LM Studio.
     Handles fallback on credit exhaustion and boost integration.
     """
     CALL_METADATA_KEY = "_moto_call_metadata"
+    # Supercharge intentionally breaks the default 0.0 temperature policy for
+    # candidate attempts so parallel completions produce meaningfully different answers.
+    SUPERCHARGE_ATTEMPT_TEMPERATURES = (0.0, 0.2, 0.4, 0.8)
+    SUPERCHARGE_CANDIDATE_MAX_CHARS = 20000
+    # Parallel brainstorm submitters use a lane-based ladder: submitter 1 stays
+    # deterministic, later lanes get increasing exploration pressure.
+    PARALLEL_BRAINSTORM_SUBMITTER_TEMPERATURES = (
+        0.0, 0.1, 0.2, 0.3, 0.4,
+        0.5, 0.6, 0.7, 0.8, 0.9,
+    )
     
     def __init__(self):
         self._openrouter_client: Optional[OpenRouterClient] = None
@@ -60,10 +86,11 @@ def __init__(self):
         # Signature: async callback(model_id: str)
         self._model_tracking_callback: Optional[Callable] = None
         
-        # Autonomous API logger callback
-        # Called after each API call (success or failure) with full details
-        # Signature: async callback(task_id, role_id, model, provider, prompt, response, duration_ms, success, error, phase)
-        self._autonomous_logger_callback: Optional[Callable] = None
+        # API logger callback. Workflows can override this to add namespace-specific
+        # metadata; otherwise the manager still logs every model call by default.
+        # Signature: async callback(task_id, role_id, model, provider, prompt, response,
+        #                           tokens_used, duration_ms, success, error, phase)
+        self._autonomous_logger_callback: Optional[Callable] = self._default_api_logger_callback
         
         # Current autonomous phase (set by autonomous coordinator)
         self._current_autonomous_phase: str = "unknown"
@@ -73,6 +100,17 @@ def __init__(self):
         
         # Lock for thread-safe state updates
         self._state_lock = asyncio.Lock()
+
+    @classmethod
+    def parallel_brainstorm_submitter_temperature(cls, submitter_index: int) -> float:
+        """Return the ladder temperature for a 1-based submitter lane; bad or < 1 indexes use lane 1, lanes past the ladder reuse its last entry."""
+        try:
+            index = int(submitter_index)
+        except (TypeError, ValueError, OverflowError):  # OverflowError: int(float("inf")) must also fall back
+            index = 1
+        index = max(1, index)
+        ladder_index = min(index - 1, len(cls.PARALLEL_BRAINSTORM_SUBMITTER_TEMPERATURES) - 1)
+        return cls.PARALLEL_BRAINSTORM_SUBMITTER_TEMPERATURES[ladder_index]
     
     def set_broadcast_callback(self, callback: Callable) -> None:
         """Set callback for broadcasting WebSocket events."""
@@ -136,6 +174,78 @@ def set_model_tracking_callback(self, callback: Optional[Callable]) -> None:
         else:
             logger.info("Model tracking callback cleared")
     
+    @staticmethod
+    def _infer_api_log_workflow(task_id: str, role_id: str) -> str:
+        """Pick the shared log tab namespace: "leanoj" when either id starts with leanoj_, else "autonomous"."""
+        normalized_ids = ((role_id or "").strip().lower(), (task_id or "").strip().lower())
+        for normalized in normalized_ids:
+            if normalized.startswith("leanoj_"):
+                return "leanoj"
+        return "autonomous"
+
+    @staticmethod
+    def _prompt_for_logging(messages: Optional[List[Dict[str, Any]]]) -> str:
+        """Build the loggable prompt text from the last message only.
+
+        Tool-role messages become a redaction marker (tool name, whether a
+        tool_call_id exists, content length). String content is returned as-is;
+        any other content is JSON-encoded, falling back to ``str`` if that fails.
+        """
+        if not messages:
+            return ""
+        last_message = messages[-1]
+        payload = last_message.get("content", "")
+        payload_is_text = isinstance(payload, str)
+        if str(last_message.get("role") or "") != "tool":
+            if payload_is_text:
+                return payload
+            try:
+                return json.dumps(payload, ensure_ascii=False)
+            except Exception:
+                return str(payload or "")
+        name_label = str(last_message.get("name") or "") or "unknown"
+        has_call_id = bool(str(last_message.get("tool_call_id") or ""))
+        payload_size = len(payload) if payload_is_text else len(str(payload or ""))
+        return (
+            "[tool message redacted for API logging; "
+            f"name={name_label}, tool_call_id_present={has_call_id}, content_length={payload_size}]"
+        )
+
+    async def _default_api_logger_callback(
+        self,
+        task_id,
+        role_id,
+        model,
+        provider,
+        prompt,
+        response,
+        tokens_used,
+        duration_ms,
+        success,
+        error,
+        phase,
+    ) -> None:
+        """Best-effort default logger: forward one API call to autonomous_api_logger and never raise to the caller."""
+        try:
+            from backend.autonomous.memory.autonomous_api_logger import autonomous_api_logger  # function-scope import (presumably avoids an import cycle; confirm)
+
+            await autonomous_api_logger.log_api_call(
+                task_id=task_id,
+                role_id=role_id,
+                model=model,
+                provider=provider,
+                prompt=prompt,
+                response_content=response,
+                tokens_used=tokens_used,
+                duration_ms=duration_ms,
+                success=success,
+                error=error,
+                phase=phase or self._current_autonomous_phase,  # fall back to the manager's current phase
+                workflow=self._infer_api_log_workflow(task_id, role_id),
+            )
+        except Exception as e:
+            logger.exception("Failed to log API call in default logger: %s", e)  # keeps the traceback
+
     def set_autonomous_logger_callback(self, callback: Optional[Callable]) -> None:
         """
         Set callback for autonomous API logging.
@@ -143,16 +253,16 @@ def set_autonomous_logger_callback(self, callback: Optional[Callable]) -> None:
         The callback is called after each API call with full details for logging.
         
         Args:
-            callback: Async function with signature: 
+            callback: Async function with signature:
                       callback(task_id, role_id, model, provider, prompt, response, 
-                               duration_ms, success, error, phase)
-                      or None to disable
+                               tokens_used, duration_ms, success, error, phase)
+                      or None to restore default all-call logging
         """
-        self._autonomous_logger_callback = callback
+        self._autonomous_logger_callback = callback or self._default_api_logger_callback
         if callback:
             logger.info("Autonomous API logger callback set")
         else:
-            logger.info("Autonomous API logger callback cleared")
+            logger.info("Autonomous API logger callback restored to default")
     
     def set_autonomous_phase(self, phase: str) -> None:
         """
@@ -189,6 +299,7 @@ def _annotate_response_with_call_metadata(
         boosted: bool,
         boost_mode: Optional[str] = None,
         openrouter_provider: Optional[str] = None,
+        openrouter_reasoning_effort: Optional[str] = None,
     ) -> Dict[str, Any]:
         """Attach effective routing details to a successful API response."""
         if not isinstance(response, dict):
@@ -205,6 +316,7 @@ def _annotate_response_with_call_metadata(
             "boosted": boosted,
             "boost_mode": boost_mode,
             "openrouter_provider": openrouter_provider,
+            "openrouter_reasoning_effort": openrouter_reasoning_effort,
         }
         return response
 
@@ -249,6 +361,27 @@ def configure_role(self, role_id: str, config: ModelConfig) -> None:
             config: Model configuration (includes provider, model_id, openrouter_model_id, 
                     lm_studio_fallback_id, and optionally openrouter_provider)
         """
+        if system_config.generic_mode:
+            if config.provider != "openrouter":
+                logger.warning(
+                    "Generic mode is OpenRouter-only. Normalizing role '%s' from provider=%s to OpenRouter.",
+                    role_id,
+                    config.provider,
+                )
+                config = config.model_copy(
+                    update={
+                        "provider": "openrouter",
+                        "openrouter_model_id": config.openrouter_model_id or config.model_id,
+                        "lm_studio_fallback_id": None,
+                    }
+                )
+            elif config.lm_studio_fallback_id:
+                logger.warning(
+                    "Generic mode is OpenRouter-only. Dropping LM Studio fallback for role '%s'.",
+                    role_id,
+                )
+                config = config.model_copy(update={"lm_studio_fallback_id": None})
+
         self._role_model_configs[role_id] = config
         
         # Set initial fallback state based on provider
@@ -294,7 +427,7 @@ def _determine_boost_mode(self, task_id: str) -> Optional[str]:
             return "task_id"
         
         return None
-    
+
     async def generate_completion(
         self,
         task_id: str,
@@ -307,6 +440,184 @@ async def generate_completion(
         tools: Optional[List[Dict[str, Any]]] = None,
         tool_choice: Optional[Any] = None,
         **kwargs
+    ) -> Dict[str, Any]:
+        """Generate a completion, optionally wrapping the role with Supercharge."""
+        async with self._state_lock:
+            role_config = self._role_model_configs.get(role_id)
+
+        supercharge_enabled = bool(getattr(role_config, "supercharge_enabled", False))
+        # Tool-call conversations need exact assistant/tool turn pairing, so keep them single-shot.
+        if not supercharge_enabled or tools or tool_choice is not None:
+            return await self._generate_completion_once(
+                task_id=task_id,
+                role_id=role_id,
+                model=model,
+                messages=messages,
+                temperature=temperature,
+                max_tokens=max_tokens,
+                response_format=response_format,
+                tools=tools,
+                tool_choice=tool_choice,
+                **kwargs
+            )
+
+        return await self._generate_supercharged_completion(
+            task_id=task_id,
+            role_id=role_id,
+            model=model,
+            messages=messages,
+            temperature=temperature,
+            max_tokens=max_tokens,
+            response_format=response_format,
+            **kwargs
+        )
+
+    @staticmethod
+    def _response_text(response: Dict[str, Any]) -> str:
+        """Return the first choice's ``content`` (else ``reasoning``) text, or an empty string."""
+        if not isinstance(response, dict) or not response.get("choices"):
+            return ""
+        message = response["choices"][0].get("message") or {}  # tolerate "message": null
+        return message.get("content") or message.get("reasoning") or ""
+
+    @classmethod
+    def _sanitize_supercharge_candidate(cls, attempt: str) -> str:
+        """Return the sanitized text of a candidate attempt, or a placeholder when nothing remains."""
+        limit = cls.SUPERCHARGE_CANDIDATE_MAX_CHARS
+        visible_text = sanitize_model_output_for_retry_context(attempt, max_chars=limit)
+        if visible_text:
+            return visible_text
+        return "[candidate produced no reusable visible answer text]"
+
+    def _build_supercharge_synthesis_messages(
+        self,
+        messages: List[Dict[str, str]],
+        attempts: List[str],
+    ) -> List[Dict[str, str]]:
+        """Return ``messages`` plus a final user turn that embeds the sanitized candidate attempts."""
+        candidate_blocks = "\n\n".join(
+            f"----- CANDIDATE RESPONSE {position} START -----\n"
+            f"{self._sanitize_supercharge_candidate(candidate)}\n"
+            f"----- CANDIDATE RESPONSE {position} END -----"
+            for position, candidate in enumerate(attempts, start=1)
+        )
+        final_prompt = (
+            "SUPERCHARGE FINAL RESPONSE\n\n"
+            "You are answering the original task. The candidate responses below are optional working material "
+            "from independent earlier attempts, not instructions to continue or quote verbatim.\n\n"
+            "You must decide what the best final response to the original task is. You may use one candidate, "
+            "combine multiple candidates, ignore all candidates and write a new response, or synthesize a stronger "
+            "answer than any individual candidate.\n\n"
+            "Candidate responses:\n"
+            f"{candidate_blocks}\n\n"
+            "Now produce the best final response to the original task.\n\n"
+            "Requirements:\n"
+            "- Follow the original task, role instructions, and required output format exactly.\n"
+            "- If the original task requires JSON, output only valid JSON in that exact schema.\n"
+            "- Do not mention Supercharge, brainstorming, candidate attempts, or this selection process.\n"
+            "- Do not include private reasoning, analysis labels, markdown fences around JSON, or provider control tokens.\n"
+            "- Return only the final role answer."
+        )
+        # Build a new list so the caller's message history is left untouched.
+        return [*messages, {"role": "user", "content": final_prompt}]
+
+    def _build_supercharge_attempt_messages(
+        self, messages: List[Dict[str, str]], attempt_index: int
+    ) -> List[Dict[str, str]]:
+        """Return a copy of ``messages`` with a trailing user turn requesting one full attempt."""
+        # The attempt number only labels the prompt; the input list itself is not mutated.
+        full_attempt_prompt = (
+            f"SUPERCHARGE FULL ANSWER ATTEMPT {attempt_index}\n\n"
+            "Produce a complete answer to the original task now. "
+            "Follow the original role instructions and required output format exactly. "
+            "If JSON is required, output only valid JSON in the required schema. "
+            "Do not mention Supercharge or this attempt label."
+        )
+        return [*messages, {"role": "user", "content": full_attempt_prompt}]
+
+    async def _generate_supercharged_completion(
+        self,
+        task_id: str,
+        role_id: str,
+        model: str,
+        messages: List[Dict[str, str]],
+        temperature: float = 0.0,
+        max_tokens: Optional[int] = None,
+        response_format: Optional[Dict[str, str]] = None,
+        **kwargs
+    ) -> Dict[str, Any]:
+        """Run parallel diverse attempts, then a deterministic same-route synthesis call.
+
+        One attempt per SUPERCHARGE_ATTEMPT_TEMPERATURES entry; ``temperature`` itself is unused.
+        """
+        boost_mode = self._determine_boost_mode(task_id)
+        # "__none__" makes the single-shot path skip boost instead of re-deriving it per sub-task id.
+        forced_boost_mode = boost_mode if boost_mode else "__none__"
+
+        logger.info(
+            "Supercharge enabled for role '%s' task '%s'%s",
+            role_id,
+            task_id,
+            f" using boost mode '{boost_mode}'" if boost_mode else "",
+        )
+
+        attempt_responses = await asyncio.gather(*[
+            self._generate_completion_once(
+                task_id=f"{task_id}_supercharge_attempt_{attempt_index}",
+                role_id=role_id,
+                model=model,
+                messages=self._build_supercharge_attempt_messages(messages, attempt_index),
+                temperature=attempt_temperature,
+                max_tokens=max_tokens,
+                response_format=response_format,
+                _moto_force_boost_mode=forced_boost_mode,
+                _moto_consume_boost_count=False,
+                _moto_strict_boost=bool(boost_mode),
+                **kwargs
+            )
+            for attempt_index, attempt_temperature in enumerate(self.SUPERCHARGE_ATTEMPT_TEMPERATURES, start=1)
+        ])
+        attempts = [self._response_text(response) for response in attempt_responses]
+
+        synthesis_response = await self._generate_completion_once(
+            task_id=f"{task_id}_supercharge_final",
+            role_id=role_id,
+            model=model,
+            messages=self._build_supercharge_synthesis_messages(messages, attempts),
+            temperature=0.0,
+            max_tokens=max_tokens,
+            response_format=response_format,
+            _moto_force_boost_mode=forced_boost_mode,
+            _moto_consume_boost_count=False,
+            _moto_strict_boost=bool(boost_mode),
+            **kwargs
+        )
+
+        metadata = self.extract_call_metadata(synthesis_response)
+        if boost_mode == "next_count" and metadata.get("boosted"):
+            await boost_manager.consume_boost_count()
+
+        if isinstance(synthesis_response, dict):
+            synthesis_response[self.CALL_METADATA_KEY] = {
+                **metadata,
+                "supercharged": True,
+                "supercharge_attempts": len(attempts),
+                "supercharge_attempt_temperatures": list(self.SUPERCHARGE_ATTEMPT_TEMPERATURES),
+            }
+        return synthesis_response
+
+    async def _generate_completion_once(
+        self,
+        task_id: str,
+        role_id: str,
+        model: str,
+        messages: List[Dict[str, str]],
+        temperature: float = 0.0,
+        max_tokens: Optional[int] = None,
+        response_format: Optional[Dict[str, str]] = None,
+        tools: Optional[List[Dict[str, Any]]] = None,
+        tool_choice: Optional[Any] = None,
+        **kwargs
     ) -> Dict[str, Any]:
         """
         Generate a completion using the appropriate API.
@@ -331,13 +642,21 @@ async def generate_completion(
         Returns:
             API response dict
         """
+        forced_boost_mode = kwargs.pop("_moto_force_boost_mode", None)
+        consume_boost_count = kwargs.pop("_moto_consume_boost_count", True)
+        strict_boost = kwargs.pop("_moto_strict_boost", False)
         requested_model = model
         async with self._state_lock:
             initial_role_config = self._role_model_configs.get(role_id)
         configured_provider = initial_role_config.provider if initial_role_config else None
 
         # Check if task should use boost (unified check for all boost modes)
-        boost_mode = self._determine_boost_mode(task_id)
+        if forced_boost_mode == "__none__":
+            boost_mode = None
+        elif forced_boost_mode is not None:
+            boost_mode = forced_boost_mode
+        else:
+            boost_mode = self._determine_boost_mode(task_id)
         
         if boost_mode and boost_manager.boost_config:
             boost_model = boost_manager.boost_config.boost_model_id
@@ -348,8 +667,8 @@ async def generate_completion(
             # Get prompt preview for logging
             prompt_preview = ""
             if messages:
-                last_message = messages[-1].get("content", "")
-                prompt_preview = last_message[:500] if last_message else ""
+                last_message = self._prompt_for_logging(messages)
+                prompt_preview = last_message or ""
             
             start_time = time.time()
             
@@ -373,6 +692,7 @@ async def generate_completion(
                             max_tokens=max_tokens or boost_manager.boost_config.boost_max_output_tokens,
                             response_format=response_format,
                             provider=boost_provider,
+                            reasoning_effort=boost_manager.boost_config.boost_reasoning_effort,
                             tools=tools,
                             tool_choice=tool_choice,
                         ),
@@ -386,9 +706,11 @@ async def generate_completion(
                     
                     # Check for missing choices (upstream provider timeout/error)
                     if not result.get("choices"):
-                        import json as _json
-                        raw_response = _json.dumps(result)[:2000]
-                        logger.error(f"OpenRouter boost response missing 'choices' after {duration_ms:.0f}ms - raw: {raw_response}")
+                        logger.error(
+                            "OpenRouter boost response missing 'choices' after %.0fms - %s",
+                            duration_ms,
+                            _response_shape_for_logging(result),
+                        )
                         
                         # Log as failure
                         await boost_logger.log_boost_call(
@@ -433,6 +755,7 @@ async def generate_completion(
                         boosted=True,
                         boost_mode=boost_mode,
                         openrouter_provider=boost_provider,
+                        openrouter_reasoning_effort=boost_manager.boost_config.boost_reasoning_effort,
                     )
                     
                     # Log the boost call
@@ -450,7 +773,7 @@ async def generate_completion(
                     
                     # Log to autonomous API logger if callback set
                     if self._autonomous_logger_callback:
-                        full_prompt = messages[-1].get("content", "") if messages else ""
+                        full_prompt = self._prompt_for_logging(messages)
                         await self._autonomous_logger_callback(
                             task_id=task_id,
                             role_id=role_id,
@@ -469,7 +792,7 @@ async def generate_completion(
                     await self._track_model_usage(boost_model)
                     
                     # Consume boost count if using next_count mode
-                    if boost_mode == "next_count":
+                    if boost_mode == "next_count" and consume_boost_count:
                         await boost_manager.consume_boost_count()
                     
                     return result
@@ -493,7 +816,7 @@ async def generate_completion(
                 
                 # Log to autonomous API logger if callback set
                 if self._autonomous_logger_callback:
-                    full_prompt = messages[-1].get("content", "") if messages else ""
+                    full_prompt = self._prompt_for_logging(messages)
                     await self._autonomous_logger_callback(
                         task_id=task_id,
                         role_id=role_id,
@@ -519,6 +842,8 @@ async def generate_completion(
                 
                 # Fall through to primary model (boost has no fallback concept)
                 logger.info(f"Boost rate limited, using primary model for task {task_id}")
+                if strict_boost:
+                    raise RuntimeError(f"Strict boost call failed for task {task_id}: {e}") from e
             
             except OpenRouterPrivacyPolicyError as e:
                 # Privacy policy error - log and crash (boost has no fallback concept)
@@ -537,7 +862,7 @@ async def generate_completion(
                 
                 # Log to autonomous API logger if callback set
                 if self._autonomous_logger_callback:
-                    full_prompt = messages[-1].get("content", "") if messages else ""
+                    full_prompt = self._prompt_for_logging(messages)
                     await self._autonomous_logger_callback(
                         task_id=task_id,
                         role_id=role_id,
@@ -597,7 +922,7 @@ async def generate_completion(
                 
                 # Log to autonomous API logger if callback set
                 if self._autonomous_logger_callback:
-                    full_prompt = messages[-1].get("content", "") if messages else ""
+                    full_prompt = self._prompt_for_logging(messages)
                     await self._autonomous_logger_callback(
                         task_id=task_id,
                         role_id=role_id,
@@ -618,6 +943,8 @@ async def generate_completion(
                     "task_id": task_id,
                     "message": "Boost credits exhausted, falling back to primary model"
                 })
+                if strict_boost:
+                    raise RuntimeError(f"Strict boost call credits exhausted for task {task_id}: {e}") from e
                 # Continue to primary model routing below
                 
             except Exception as e:
@@ -637,7 +964,7 @@ async def generate_completion(
                 
                 # Log to autonomous API logger if callback set
                 if self._autonomous_logger_callback:
-                    full_prompt = messages[-1].get("content", "") if messages else ""
+                    full_prompt = self._prompt_for_logging(messages)
                     await self._autonomous_logger_callback(
                         task_id=task_id,
                         role_id=role_id,
@@ -653,12 +980,23 @@ async def generate_completion(
                     )
                 
                 logger.error(f"Boost API error for task {task_id}: {e}, using primary model")
+                if strict_boost:
+                    raise RuntimeError(f"Strict boost call failed for task {task_id}: {e}") from e
                 # Fall through to primary model
         
         # Check role fallback state
         async with self._state_lock:
             fallback_state = self._role_fallback_state.get(role_id, "lm_studio")
             role_config = self._role_model_configs.get(role_id)
+
+            if system_config.generic_mode and role_config and fallback_state != "openrouter":
+                logger.warning(
+                    "Generic mode reset role '%s' fallback state from %s to OpenRouter.",
+                    role_id,
+                    fallback_state,
+                )
+                fallback_state = "openrouter"
+                self._role_fallback_state[role_id] = "openrouter"
         
         # If OpenRouter configured and not fallen back, try OpenRouter
         if fallback_state == "openrouter" and role_config:
@@ -719,6 +1057,7 @@ async def generate_completion(
                             max_tokens=max_tokens or role_config.max_output_tokens,
                             response_format=response_format,
                             provider=openrouter_provider,
+                            reasoning_effort=role_config.openrouter_reasoning_effort,
                             tools=tools,
                             tool_choice=tool_choice,
                         ),
@@ -732,9 +1071,11 @@ async def generate_completion(
                     
                     # Check for missing choices (upstream provider timeout/error)
                     if not result.get("choices"):
-                        import json as _json
-                        raw_response = _json.dumps(result)[:2000]
-                        logger.error(f"OpenRouter response missing 'choices' after {duration_ms:.0f}ms - raw: {raw_response}")
+                        logger.error(
+                            "OpenRouter response missing 'choices' after %.0fms - %s",
+                            duration_ms,
+                            _response_shape_for_logging(result),
+                        )
                         raise ValueError(f"OpenRouter response missing 'choices' after {duration_ms:.0f}ms (upstream provider timeout)")
                     
                     response_content = ""
@@ -761,11 +1102,12 @@ async def generate_completion(
                         boosted=False,
                         boost_mode=None,
                         openrouter_provider=openrouter_provider,
+                        openrouter_reasoning_effort=role_config.openrouter_reasoning_effort,
                     )
                     
                     # Log to autonomous API logger if callback set
                     if self._autonomous_logger_callback:
-                        full_prompt = messages[-1].get("content", "") if messages else ""
+                        full_prompt = self._prompt_for_logging(messages)
                         await self._autonomous_logger_callback(
                             task_id=task_id,
                             role_id=role_id,
@@ -790,7 +1132,7 @@ async def generate_completion(
                     duration_ms = (time.time() - start_time) * 1000
                     
                     if self._autonomous_logger_callback:
-                        full_prompt = messages[-1].get("content", "") if messages else ""
+                        full_prompt = self._prompt_for_logging(messages)
                         await self._autonomous_logger_callback(
                             task_id=task_id,
                             role_id=role_id,
@@ -827,6 +1169,9 @@ async def generate_completion(
                         temperature=temperature,
                         max_tokens=max_tokens or role_config.max_output_tokens,
                         response_format=response_format,
+                        reasoning_effort=role_config.openrouter_reasoning_effort,
+                        tools=tools,
+                        tool_choice=tool_choice,
                     )
                     if rotated_result is not None:
                         free_model_manager.clear_failed_models()  # Success - clear failures
@@ -852,7 +1197,7 @@ async def generate_completion(
                     
                     # Log to autonomous API logger if callback set
                     if self._autonomous_logger_callback:
-                        full_prompt = messages[-1].get("content", "") if messages else ""
+                        full_prompt = self._prompt_for_logging(messages)
                         await self._autonomous_logger_callback(
                             task_id=task_id,
                             role_id=role_id,
@@ -918,7 +1263,7 @@ async def generate_completion(
                     
                     # Log to autonomous API logger if callback set
                     if self._autonomous_logger_callback:
-                        full_prompt = messages[-1].get("content", "") if messages else ""
+                        full_prompt = self._prompt_for_logging(messages)
                         await self._autonomous_logger_callback(
                             task_id=task_id,
                             role_id=role_id,
@@ -979,7 +1324,7 @@ async def generate_completion(
                     
                     # Log to autonomous API logger if callback set
                     if self._autonomous_logger_callback:
-                        full_prompt = messages[-1].get("content", "") if messages else ""
+                        full_prompt = self._prompt_for_logging(messages)
                         await self._autonomous_logger_callback(
                             task_id=task_id,
                             role_id=role_id,
@@ -1010,6 +1355,12 @@ async def generate_completion(
                         )
                         raise
         
+        if system_config.generic_mode:
+            raise RuntimeError(
+                f"Generic mode is OpenRouter-only; role '{role_id}' cannot use LM Studio. "
+                "Configure the role with provider='openrouter' and a valid OpenRouter model/key."
+            )
+
         # Use LM Studio (either configured as primary or fallen back)
         logger.debug(f"Role {role_id} using LM Studio: {model}")
         start_time = time.time()
@@ -1036,13 +1387,17 @@ async def generate_completion(
             
             # Check for missing choices
             if not result.get("choices"):
-                import json as _json
-                raw_response = _json.dumps(result)[:2000]
-                logger.error(f"LM Studio response missing 'choices' after {duration_ms:.0f}ms - raw: {raw_response}")
+                logger.error(
+                    "LM Studio response missing 'choices' after %.0fms - %s",
+                    duration_ms,
+                    _response_shape_for_logging(result),
+                )
                 raise ValueError(f"LM Studio response missing 'choices' after {duration_ms:.0f}ms")
             
             response_content = ""
             tokens_used = None
+            lm_routing_metadata = lm_studio_client.extract_routing_metadata(result)
+            actual_lm_studio_model = lm_routing_metadata.get("actual_model") or model
             if result.get("choices"):
                 message = result["choices"][0].get("message", {})
                 response_content = message.get("content") or message.get("reasoning") or ""
@@ -1051,7 +1406,7 @@ async def generate_completion(
                 _pt = result["usage"].get("prompt_tokens")
                 _ct = result["usage"].get("completion_tokens")
                 if _pt is not None and _ct is not None:
-                    token_tracker.track(model, _pt, _ct)
+                    token_tracker.track(actual_lm_studio_model, _pt, _ct)
                     await self._broadcast("token_usage_updated", token_tracker.get_stats())
 
             result = self._annotate_response_with_call_metadata(
@@ -1059,7 +1414,7 @@ async def generate_completion(
                 task_id=task_id,
                 role_id=role_id,
                 configured_model=requested_model,
-                actual_model=model,
+                actual_model=actual_lm_studio_model,
                 configured_provider=role_config.provider if role_config else configured_provider or "lm_studio",
                 actual_provider="lm_studio",
                 boosted=False,
@@ -1068,11 +1423,11 @@ async def generate_completion(
             
             # Log to autonomous API logger if callback set
             if self._autonomous_logger_callback:
-                full_prompt = messages[-1].get("content", "") if messages else ""
+                full_prompt = self._prompt_for_logging(messages)
                 await self._autonomous_logger_callback(
                     task_id=task_id,
                     role_id=role_id,
-                    model=model,
+                    model=actual_lm_studio_model,
                     provider="lm_studio",
                     prompt=full_prompt,
                     response=response_content,
@@ -1084,7 +1439,7 @@ async def generate_completion(
                 )
             
             # Track model usage for Tier 3
-            await self._track_model_usage(model)
+            await self._track_model_usage(actual_lm_studio_model)
             
             return result
             
@@ -1092,7 +1447,7 @@ async def generate_completion(
             # Log LM Studio error to autonomous logger if callback set
             duration_ms = (time.time() - start_time) * 1000
             if self._autonomous_logger_callback:
-                full_prompt = messages[-1].get("content", "") if messages else ""
+                full_prompt = self._prompt_for_logging(messages)
                 await self._autonomous_logger_callback(
                     task_id=task_id,
                     role_id=role_id,
@@ -1120,6 +1475,9 @@ async def _try_free_model_rotation(
         temperature: float,
         max_tokens: int,
         response_format: Optional[Dict[str, str]],
+        reasoning_effort: Optional[str] = None,
+        tools: Optional[List[Dict[str, Any]]] = None,
+        tool_choice: Optional[Any] = None,
     ) -> Optional[Dict[str, Any]]:
         """
         Attempt free model rotation chain: looping -> auto-selector.
@@ -1153,6 +1511,7 @@ async def _try_free_model_rotation(
                             temperature=temperature,
                             max_tokens=max_tokens,
                             response_format=response_format,
+                            reasoning_effort=reasoning_effort,
                             tools=tools,
                             tool_choice=tool_choice,
                         ),
@@ -1177,6 +1536,7 @@ async def _try_free_model_rotation(
                         actual_provider="openrouter",
                         boosted=False,
                         boost_mode=None,
+                        openrouter_reasoning_effort=reasoning_effort,
                     )
                     if free_model_manager.is_account_exhausted():
                         free_model_manager.clear_account_exhaustion()
@@ -1204,6 +1564,7 @@ async def _try_free_model_rotation(
                         temperature=temperature,
                         max_tokens=max_tokens,
                         response_format=response_format,
+                        reasoning_effort=reasoning_effort,
                         tools=tools,
                         tool_choice=tool_choice,
                     ),
@@ -1228,6 +1589,7 @@ async def _try_free_model_rotation(
                     actual_provider="openrouter",
                     boosted=False,
                     boost_mode=None,
+                    openrouter_reasoning_effort=reasoning_effort,
                 )
                 if free_model_manager.is_account_exhausted():
                     free_model_manager.clear_account_exhaustion()
diff --git a/backend/shared/boost_logger.py b/backend/shared/boost_logger.py
index 257cb59..13df4ff 100644
--- a/backend/shared/boost_logger.py
+++ b/backend/shared/boost_logger.py
@@ -4,18 +4,32 @@
 main API call log view.
 """
 import asyncio
+import hashlib
 import json
 import logging
 import os
+from collections import deque
 from datetime import datetime
 from typing import Dict, Any, List, Optional
 from pathlib import Path
 
 from backend.shared.config import system_config
+from backend.shared.log_redaction import redact_log_text
 
 logger = logging.getLogger(__name__)
 
 
+def _payload_metadata(value: str, preview_chars: int) -> Dict[str, Any]:
+    """Build log metadata for a payload: preview, character count, and SHA-256 hex digest."""
+    payload = value or ""
+    digest = hashlib.sha256(payload.encode("utf-8", errors="replace")).hexdigest() if payload else ""
+    return {
+        "preview": redact_log_text(payload, preview_chars),
+        "size": len(payload),
+        "sha256": digest,
+    }
+
+
 class BoostLogger:
     """
     Logger for boost API call outputs.
@@ -39,6 +53,7 @@ def __init__(self):
         
         self._initialized = True
         self._ensure_log_file()
+        self._scrub_persisted_full_payloads()
         logger.info("BoostLogger initialized")
     
     def _ensure_log_file(self) -> None:
@@ -52,6 +67,61 @@ def _ensure_log_file(self) -> None:
     def _get_log_path(self) -> Path:
         """Return the instance-scoped boost log path."""
         return Path(system_config.data_dir) / "boost_api_log.txt"
+
+    def _scrub_persisted_full_payloads(self) -> None:
+        """Remove legacy raw prompt/response bodies from the on-disk JSONL log (best-effort)."""
+        log_path = self._get_log_path()
+        if not log_path.exists():
+            return
+
+        changed = False
+        scrubbed_lines: List[str] = []
+        try:
+            with open(log_path, "r", encoding="utf-8") as f:
+                lines = f.readlines()
+
+            for line in lines:
+                stripped = line.strip()
+                if not stripped:
+                    continue
+                try:
+                    entry = json.loads(stripped)
+                except json.JSONDecodeError:
+                    entry = None
+                if not isinstance(entry, dict):
+                    # Unparseable or non-object line: keep it verbatim instead of aborting the scrub.
+                    scrubbed_lines.append(line)
+                    continue
+                original_entry = dict(entry)
+                prompt_full = str(entry.pop("prompt_full", "") or "")
+                response_full = str(entry.pop("response_full", "") or "")
+                prompt_source = prompt_full or str(entry.get("prompt_preview") or "")
+                response_source = response_full or str(entry.get("response_preview") or "")
+
+                if prompt_source:
+                    entry["prompt_preview"] = redact_log_text(prompt_source, 500)
+                    entry["prompt_size"] = int(entry.get("prompt_size") or len(prompt_source))
+                if response_source:
+                    response_meta = _payload_metadata(response_source, 2000)
+                    entry["response_preview"] = response_meta["preview"]
+                    entry["response_size"] = int(entry.get("response_size") or response_meta["size"])
+                    entry.setdefault("response_sha256", response_meta["sha256"])
+
+                entry["has_full_prompt"] = False
+                entry["has_full_response"] = False
+                entry["response_redacted"] = True
+                if entry.get("error"):
+                    entry["error"] = redact_log_text(entry["error"], 1000)
+                if prompt_full or response_full or entry != original_entry:
+                    changed = True
+                scrubbed_lines.append(json.dumps(entry) + "\n")
+
+            if changed:
+                with open(log_path, "w", encoding="utf-8") as f:
+                    f.writelines(scrubbed_lines)
+                logger.info("Scrubbed legacy full payloads from boost API log")
+        except Exception as e:
+            logger.warning(f"Failed to scrub legacy boost API log payloads: {e}")
     
     async def log_boost_call(
         self,
@@ -83,20 +153,27 @@ async def log_boost_call(
         """
         async with self._lock:
             try:
+                response_meta = _payload_metadata(response_content, 2000)
+                store_full_payloads = bool(system_config.api_log_store_full_payloads)
                 log_entry = {
                     "timestamp": datetime.now().isoformat(),
                     "task_id": task_id,
                     "role_id": role_id,
                     "model": model,
                     "boost_mode": boost_mode,
-                    "prompt_preview": prompt_preview[:500] if prompt_preview else "",
-                    "response_preview": response_content[:2000] if response_content else "",
-                    "response_full": response_content,
+                    "prompt_preview": redact_log_text(prompt_preview, 500) if prompt_preview else "",
+                    "response_preview": response_meta["preview"],
+                    "response_size": response_meta["size"],
+                    "response_sha256": response_meta["sha256"],
+                    "response_redacted": not store_full_payloads,
+                    "has_full_response": store_full_payloads and bool(response_content),
                     "tokens_used": tokens_used,
                     "duration_ms": duration_ms,
                     "success": success,
-                    "error": error
+                    "error": redact_log_text(error, 1000)
                 }
+                if store_full_payloads:
+                    log_entry["response_full"] = response_content
                 
                 # Append to log file
                 with open(self._get_log_path(), "a", encoding="utf-8") as f:
@@ -126,7 +203,7 @@ async def _trim_log_if_needed(self) -> None:
         except Exception as e:
             logger.error(f"Failed to trim boost log: {e}")
     
-    async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
+    async def get_logs(self, limit: int = 100, include_full: bool = True) -> List[Dict[str, Any]]:
         """
         Get recent boost API call logs.
         
@@ -143,7 +220,7 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
                     return []
                 
                 with open(log_path, "r", encoding="utf-8") as f:
-                    lines = f.readlines()
+                    lines = deque(f, maxlen=max(1, limit))
                 
                 logs = []
                 for line in lines:
@@ -151,6 +228,15 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
                     if line:
                         try:
                             log_entry = json.loads(line)
+                            if not include_full or not system_config.api_log_store_full_payloads:
+                                prompt_full = str(log_entry.pop("prompt_full", "") or "")
+                                response_full = str(log_entry.pop("response_full", "") or "")
+                                log_entry["prompt_size"] = len(prompt_full)
+                                log_entry["response_size"] = int(log_entry.get("response_size") or len(response_full))
+                                log_entry["has_full_prompt"] = False
+                                log_entry["has_full_response"] = False
+                                if response_full and not log_entry.get("response_sha256"):
+                                    log_entry["response_sha256"] = hashlib.sha256(response_full.encode("utf-8", errors="replace")).hexdigest()
                             logs.append(log_entry)
                         except json.JSONDecodeError:
                             continue
@@ -163,7 +249,7 @@ async def get_logs(self, limit: int = 100) -> List[Dict[str, Any]]:
                 logger.error(f"Failed to get boost logs: {e}")
                 return []
     
-    async def get_log_entry(self, index: int) -> Optional[Dict[str, Any]]:
+    async def get_log_entry(self, index: int, include_full: bool = True) -> Optional[Dict[str, Any]]:
         """
         Get a specific log entry by index (0 = most recent).
         
@@ -173,15 +259,53 @@ async def get_log_entry(self, index: int) -> Optional[Dict[str, Any]]:
         Returns:
             Log entry dict or None if not found
         """
-        logs = await self.get_logs(limit=index + 1)
+        logs = await self.get_logs(limit=index + 1, include_full=include_full)
         if index < len(logs):
             return logs[index]
         return None
     
-    async def clear_logs(self) -> None:
-        """Clear all boost API logs."""
+    @staticmethod
+    def _entry_workflow(entry: Dict[str, Any]) -> str:
+        """Return the entry's workflow tag, inferring it from role/task ids when the field is absent."""
+        explicit = str(entry.get("workflow") or "").strip().lower()
+        if explicit:
+            return explicit
+        # No explicit tag: a "leanoj_" prefix on either id marks LeanOJ; anything else is "autonomous".
+        identifiers = (str(entry.get("role_id") or ""), str(entry.get("task_id") or ""))
+        if any(identifier.startswith("leanoj_") for identifier in identifiers):
+            return "leanoj"
+        return "autonomous"
+
+    async def clear_logs(self, workflow: Optional[str] = None) -> None:
+        """Clear boost API logs, optionally scoped to one workflow."""
         async with self._lock:
             try:
+                if workflow:
+                    log_path = self._get_log_path()
+                    if not os.path.exists(log_path):
+                        return
+
+                    with open(log_path, "r", encoding="utf-8") as f:
+                        lines = f.readlines()
+
+                    retained_lines: List[str] = []
+                    for line in lines:
+                        stripped = line.strip()
+                        if not stripped:
+                            continue
+                        try:
+                            entry = json.loads(stripped)
+                        except json.JSONDecodeError:
+                            retained_lines.append(line)
+                            continue
+                        if self._entry_workflow(entry) != workflow:
+                            retained_lines.append(line)
+
+                    with open(log_path, "w", encoding="utf-8") as f:
+                        f.writelines(retained_lines)
+                    logger.info("Boost logs cleared for workflow %s", workflow)
+                    return
+
                 with open(self._get_log_path(), "w", encoding="utf-8") as f:
                     f.write("")
                 logger.info("Boost logs cleared")
diff --git a/backend/shared/boost_manager.py b/backend/shared/boost_manager.py
index d26f883..e967b50 100644
--- a/backend/shared/boost_manager.py
+++ b/backend/shared/boost_manager.py
@@ -13,6 +13,8 @@
 - Topic Validator, Redundancy Checker → agg_val (Agg Validator)
 - Brainstorm aggregation submitters/validator → agg_sub1..10, agg_val (via Coordinator)
 - Paper compilation → comp_hc, comp_hp, comp_val, comp_crit (via CompilerCoordinator)
+- LeanOJ path-decision calls use `leanoj_path_*` task IDs for workflow display, but belong to the
+  Final Solver boost category (`leanoj_final`) because that role owns final-readiness decisions.
 
 State is persisted to backend/data/boost_state.json for crash recovery.
 """
@@ -22,7 +24,7 @@
 import os
 from typing import Optional, Set, Callable, Any, Dict, List
 
-from backend.shared.config import system_config
+from backend.shared.config import rag_config, system_config
 from backend.shared.models import BoostConfig
 
 logger = logging.getLogger(__name__)
@@ -48,6 +50,38 @@
     "comp_hp": "High-Param Model",
     "comp_val": "Compiler Validator",
     "comp_crit": "Critique Submitter",
+    # LeanOJ
+    "leanoj_topic": "Proof Solver Topic Generator",
+    "leanoj_topic_val": "Proof Solver Topic Validator",
+    "leanoj_topic_sub1": "Proof Solver Topic Submitter 1",
+    "leanoj_topic_sub2": "Proof Solver Topic Submitter 2",
+    "leanoj_topic_sub3": "Proof Solver Topic Submitter 3",
+    "leanoj_topic_sub4": "Proof Solver Topic Submitter 4",
+    "leanoj_topic_sub5": "Proof Solver Topic Submitter 5",
+    "leanoj_topic_sub6": "Proof Solver Topic Submitter 6",
+    "leanoj_topic_sub7": "Proof Solver Topic Submitter 7",
+    "leanoj_topic_sub8": "Proof Solver Topic Submitter 8",
+    "leanoj_topic_sub9": "Proof Solver Topic Submitter 9",
+    "leanoj_topic_sub10": "Proof Solver Topic Submitter 10",
+    "leanoj_brainstorm_sub1": "Proof Solver Brainstorm Submitter 1",
+    "leanoj_brainstorm_sub2": "Proof Solver Brainstorm Submitter 2",
+    "leanoj_brainstorm_sub3": "Proof Solver Brainstorm Submitter 3",
+    "leanoj_brainstorm_sub4": "Proof Solver Brainstorm Submitter 4",
+    "leanoj_brainstorm_sub5": "Proof Solver Brainstorm Submitter 5",
+    "leanoj_brainstorm_sub6": "Proof Solver Brainstorm Submitter 6",
+    "leanoj_brainstorm_sub7": "Proof Solver Brainstorm Submitter 7",
+    "leanoj_brainstorm_sub8": "Proof Solver Brainstorm Submitter 8",
+    "leanoj_brainstorm_sub9": "Proof Solver Brainstorm Submitter 9",
+    "leanoj_brainstorm_sub10": "Proof Solver Brainstorm Submitter 10",
+    "leanoj_brainstorm_val": "Proof Solver Brainstorm Validator",
+    "leanoj_sufficiency": "Proof Solver Sufficiency Check",
+    "leanoj_path_val": "Proof Solver Path Validator",
+    "leanoj_final": "Proof Solver Final Solver",
+}
+
+CATEGORY_ALIASES = {
+    # Path decisions are absorbed into the dominant Final Solver role.
+    "leanoj_path": "leanoj_final",
 }
 
 
@@ -110,26 +144,36 @@ def _load_state(self) -> None:
                 with open(state_file, 'r', encoding='utf-8') as f:
                     state = json.load(f)
                 
-                # Restore boost config if it was enabled
+                legacy_key_present = bool(state.get('api_key'))
+
+                # Restore boost config if it was enabled. Legacy plaintext
+                # `api_key` values are intentionally ignored and scrubbed below.
                 if state.get('enabled') and state.get('model_id'):
                     self.boost_config = BoostConfig(
                         enabled=True,
-                        openrouter_api_key=state.get('api_key', ''),
+                        openrouter_api_key='',
                         boost_model_id=state.get('model_id'),
                         boost_provider=state.get('provider'),
+                        boost_reasoning_effort=state.get('reasoning_effort', 'auto'),
                         boost_context_window=state.get('context_window', 131072),
                         boost_max_output_tokens=state.get('max_output_tokens', 25000)
                     )
                 
                 # Restore boost modes
                 self.boost_next_count = state.get('boost_next_count', 0)
-                self.boosted_categories = set(state.get('boosted_categories', []))
+                self.boosted_categories = {
+                    self._canonical_category(category)
+                    for category in state.get('boosted_categories', [])
+                }
                 self.boost_always_prefer = state.get('boost_always_prefer', False)
                 self.boosted_task_ids = set(state.get('boosted_task_ids', []))
                 
                 logger.info(f"Loaded boost state: enabled={state.get('enabled')}, model={state.get('model_id')}, "
                            f"next_count={self.boost_next_count}, categories={len(self.boosted_categories)}, "
                            f"always_prefer={self.boost_always_prefer}")
+                if legacy_key_present:
+                    self._save_state()
+                    logger.info("Scrubbed legacy plaintext boost API key from persisted state")
         except Exception as e:
             logger.warning(f"Failed to load boost state: {e}")
     
@@ -144,9 +188,9 @@ def _save_state(self) -> None:
                 'enabled': self.boost_config is not None and self.boost_config.enabled,
                 'model_id': self.boost_config.boost_model_id if self.boost_config else None,
                 'provider': self.boost_config.boost_provider if self.boost_config else None,
+                'reasoning_effort': self.boost_config.boost_reasoning_effort if self.boost_config else 'auto',
                 'context_window': self.boost_config.boost_context_window if self.boost_config else 131072,
                 'max_output_tokens': self.boost_config.boost_max_output_tokens if self.boost_config else 25000,
-                'api_key': self.boost_config.openrouter_api_key if self.boost_config else '',
                 'boost_next_count': self.boost_next_count,
                 'boosted_categories': list(self.boosted_categories),
                 'boost_always_prefer': self.boost_always_prefer,
@@ -181,6 +225,7 @@ async def set_boost_config(self, config: BoostConfig) -> None:
             provider_info = f", provider={config.boost_provider}" if config.boost_provider else " (auto-routing)"
             logger.info(
                 f"Boost enabled: model={config.boost_model_id}{provider_info}, "
+                f"reasoning={config.boost_reasoning_effort}, "
                 f"context={config.boost_context_window}, "
                 f"max_tokens={config.boost_max_output_tokens}"
             )
@@ -191,6 +236,7 @@ async def set_boost_config(self, config: BoostConfig) -> None:
             await self._broadcast("boost_enabled", {
                 "model_id": config.boost_model_id,
                 "provider": config.boost_provider,
+                "reasoning_effort": config.boost_reasoning_effort,
                 "context_window": config.boost_context_window,
                 "max_output_tokens": config.boost_max_output_tokens
             })
@@ -307,6 +353,7 @@ async def toggle_category_boost(self, category: str) -> bool:
         Returns:
             True if category is now boosted, False if unboosted
         """
+        category = self._canonical_category(category)
         async with self._lock:
             if category in self.boosted_categories:
                 self.boosted_categories.remove(category)
@@ -327,6 +374,11 @@ async def toggle_category_boost(self, category: str) -> bool:
             })
             
             return boosted
+
+    @staticmethod
+    def _canonical_category(category: str) -> str:
+        """Return the owning category for an aliased id; ids without an alias pass through unchanged."""
+        return CATEGORY_ALIASES[category] if category in CATEGORY_ALIASES else category
     
     def _extract_role_prefix(self, task_id: str) -> str:
         """
@@ -340,8 +392,8 @@ def _extract_role_prefix(self, task_id: str) -> str:
         # Split on last underscore and take everything before it
         parts = task_id.rsplit('_', 1)
         if len(parts) == 2:
-            return parts[0]
-        return task_id
+            return self._canonical_category(parts[0])
+        return self._canonical_category(task_id)
     
     def should_use_boost(self, task_id: str) -> bool:
         """
@@ -410,6 +462,8 @@ def get_boost_status(self) -> Dict[str, Any]:
             return {
                 "enabled": False,
                 "model_id": None,
+                "has_available_key": bool(rag_config.openrouter_api_key),
+                "needs_key": False,
                 "boosted_task_count": 0,
                 "boost_next_count": 0,
                 "boosted_categories": [],
@@ -417,12 +471,19 @@ def get_boost_status(self) -> Dict[str, Any]:
                 "boosted_tasks": []
             }
         
+        has_available_key = bool(
+            (self.boost_config.openrouter_api_key or "").strip()
+            or (rag_config.openrouter_api_key or "").strip()
+        )
         return {
             "enabled": self.boost_config.enabled,
             "model_id": self.boost_config.boost_model_id,
             "provider": self.boost_config.boost_provider,
+            "reasoning_effort": self.boost_config.boost_reasoning_effort,
             "context_window": self.boost_config.boost_context_window,
             "max_output_tokens": self.boost_config.boost_max_output_tokens,
+            "has_available_key": has_available_key,
+            "needs_key": bool(self.boost_config.enabled and not has_available_key),
             "boosted_task_count": len(self.boosted_task_ids),
             "boosted_tasks": list(self.boosted_task_ids),
             "boost_next_count": self.boost_next_count,
@@ -470,6 +531,26 @@ def get_available_categories(self, mode: str = "all") -> List[Dict[str, str]]:
             {"id": "comp_hp", "label": "High-Param Model", "group": "Compiler"},
             {"id": "comp_crit", "label": "Critique Submitter", "group": "Compiler"},
         ])
+
+        categories.extend([
+            {"id": "leanoj_topic", "label": "Topic Generator", "group": "Proof Solver"},
+            {"id": "leanoj_topic_val", "label": "Topic Validator", "group": "Proof Solver"},
+            {"id": "leanoj_brainstorm_val", "label": "Brainstorm Validator", "group": "Proof Solver"},
+            {"id": "leanoj_sufficiency", "label": "Sufficiency Check", "group": "Proof Solver"},
+            {"id": "leanoj_path_val", "label": "Path Validator", "group": "Proof Solver"},
+            {"id": "leanoj_final", "label": "Final Solver", "group": "Proof Solver"},
+        ])
+        for i in range(1, 11):
+            categories.append({
+                "id": f"leanoj_topic_sub{i}",
+                "label": f"Topic Submitter {i}",
+                "group": "Proof Solver",
+            })
+            categories.append({
+                "id": f"leanoj_brainstorm_sub{i}",
+                "label": f"Brainstorm Submitter {i}",
+                "group": "Proof Solver",
+            })
         
         return categories
     
diff --git a/backend/shared/brainstorm_proof_gate.py b/backend/shared/brainstorm_proof_gate.py
new file mode 100644
index 0000000..1d2a26e
--- /dev/null
+++ b/backend/shared/brainstorm_proof_gate.py
@@ -0,0 +1,341 @@
+"""Shared Lean 4 gate for brainstorm proof candidates."""
+from __future__ import annotations
+
+import logging
+from dataclasses import dataclass
+from typing import Any, Optional
+
+from backend.autonomous.prompts.proof_prompts import LEAN4_COMMON_PITFALLS
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.config import system_config
+from backend.shared.json_parser import parse_json
+from backend.shared.lean4_client import get_lean4_client
+from backend.shared.lean_proof_integrity import validate_full_lean_proof_integrity
+from backend.shared.model_error_utils import is_non_retryable_model_error
+from backend.shared.models import ProofAttemptFeedback
+
+logger = logging.getLogger(__name__)
+
+BRAINSTORM_LEAN_PROOF_MARKER = "[LEAN 4 VERIFIED BRAINSTORM PROOF]"
+
+
+@dataclass
+class BrainstormProofGateResult:
+    """Result of checking a proof candidate before normal brainstorm validation."""
+
+    accepted: bool  # gate verdict for the candidate
+    submission_content: str = ""  # validator-facing text; verify_brainstorm_proof_candidate fills it only on acceptance
+    theorem_statement: str = ""  # natural-language statement the Lean code is meant to prove
+    theorem_name: str = ""  # Lean declaration name, when the submitter supplied one
+    formal_sketch: str = ""  # formalization notes accompanying the proof
+    lean_code: str = ""  # Lean source of the candidate as of the final attempt
+    reasoning: str = ""  # submitter / repair-model explanation
+    lean_feedback: str = ""  # formatted Lean diagnostics; verify_brainstorm_proof_candidate fills it only on acceptance
+    attempts: list[ProofAttemptFeedback] | None = None  # per-attempt records; stays None unless the producer sets it
+    failure_feedback: str = ""  # rejection message; verify_brainstorm_proof_candidate fills it only on failure
+
+
+def is_lean_proof_submission(parsed: dict[str, Any]) -> bool:
+    """Detect the Lean route: an explicit proof-type tag, or Lean code paired with a theorem statement."""
+    declared_kind = str(parsed.get("submission_type") or parsed.get("type") or "").strip().lower()
+    has_code = bool(parsed.get("lean_code"))
+    has_statement = bool(parsed.get("theorem_statement") or parsed.get("theorem_or_lemma"))
+    return declared_kind in ("lean_proof", "proof", "lean4_proof") or (has_code and has_statement)
+
+
+def _summarize_error(error_output: str, limit: int = 1400) -> str:
+    collapsed = " ".join((error_output or "").split())  # squeeze every whitespace run down to one space
+    return f"{collapsed[:limit]}..." if len(collapsed) > limit else collapsed[:limit]
+
+
+def _format_attempts(attempts: list[ProofAttemptFeedback]) -> str:
+    """Render up to the five most recent attempts as a plain-text block for the repair prompt."""
+    if not attempts:
+        return "No prior Lean attempts."
+
+    def _render(record: ProofAttemptFeedback) -> list[str]:
+        # Feedback precedence: error text, then diagnostics, then stderr, then a status placeholder.
+        placeholder = "Lean accepted this attempt with no diagnostics." if record.success else "[none]"
+        verdict = record.error_output or record.diagnostic_output or record.raw_stderr or placeholder
+        return [
+            f"ATTEMPT {record.attempt}:",
+            f"Reasoning: {record.reasoning or '[none]'}",
+            "Lean code:",
+            record.lean_code or "[none]",
+            "Lean / integrity feedback:",
+            verdict,
+            f"Goal states: {record.goal_states or '[none]'}",
+            "---",
+        ]
+
+    rendered: list[str] = []
+    for record in attempts[-5:]:
+        rendered += _render(record)
+    return "\n".join(rendered)
+
+
+def _format_lean_feedback(lean_result: Any) -> str:
+    """Combine Lean diagnostics (or stderr as a fallback) with goal-state output into one message."""
+
+    def _field(name: str) -> str:
+        return str(getattr(lean_result, name, "") or "").strip()
+
+    diagnostics = _field("diagnostic_output") or _field("raw_stderr")
+    goals = _field("goal_states")
+    goal_section = f"Goal state output:\n{goals}" if goals else ""
+    message = "\n\n".join(section for section in (diagnostics, goal_section) if section)
+    return message.strip() or "Lean 4 accepted with no diagnostics."
+
+
+def _build_retry_prompt(
+    *,  # every argument is keyword-only
+    user_prompt: str,
+    source_context: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    prior_attempts: list[ProofAttemptFeedback],
+) -> str:
+    context_excerpt = (source_context or "").strip()  # None-safe: a missing context becomes ""
+    if len(context_excerpt) > 12000:  # keep only the first 12,000 characters and flag the cut
+        context_excerpt = context_excerpt[:12000] + "\n...[context truncated for proof retry]..."
+    return f"""You are repairing a Lean 4 proof candidate for a brainstorm submission.
+
+The previous proof candidate was rejected by Lean 4 or by MOTO's post-Lean integrity gate. Produce a corrected complete Lean 4 proof. Do not use `sorry`, `admit`, or fake `axiom`/`constant`/`opaque` proof devices.
+
+{LEAN4_COMMON_PITFALLS}
+
+USER PROMPT:
+{user_prompt}
+
+INTENDED THEOREM STATEMENT:
+{theorem_statement}
+
+FORMALIZATION NOTES:
+{formal_sketch or "[none]"}
+
+BRAINSTORM CONTEXT EXCERPT:
+{context_excerpt or "[none]"}
+
+PRIOR ATTEMPTS AND FEEDBACK:
+{_format_attempts(prior_attempts)}
+
+Respond with ONLY valid JSON:
+{{
+  "theorem_name": "Lean declaration name, if named",
+  "theorem_statement": "natural-language theorem statement being proved",
+  "formal_sketch": "updated formalization notes",
+  "lean_code": "complete Lean 4 code",
+  "reasoning": "brief explanation of the repair"
+}}
+"""
+
+
+def _build_submission_content(
+    *,
+    theorem_statement: str,
+    formal_sketch: str,
+    lean_code: str,
+    reasoning: str,
+    lean_feedback: str,
+    attempts: list[ProofAttemptFeedback],
+) -> str:
+    """Assemble the validator-facing text for a Lean-accepted proof: marker, notes, verdict, code."""
+    attempt_count = len(attempts)
+    # Optional paragraphs appear only when the submitter supplied the matching field.
+    notes = ["", f"Formalization notes: {formal_sketch}"] if formal_sketch else []
+    rationale = ["", f"Submitter reasoning: {reasoning}"] if reasoning else []
+
+    pieces = [
+        BRAINSTORM_LEAN_PROOF_MARKER,
+        "",
+        "Lean 4 has accepted the following proof before this submission reached the brainstorm validator. The validator should still decide whether it is useful, non-redundant brainstorm progress.",
+        "",
+        f"Theorem statement: {theorem_statement}",
+        *notes,
+        *rationale,
+        "",
+        f"Lean verification: accepted after {attempt_count} attempt{'s' if attempt_count != 1 else ''}.",
+        f"Lean verifier feedback: {lean_feedback}",
+        "",
+        "Lean 4 code:",
+        "```lean",
+        lean_code,
+        "```",
+    ]
+
+    return "\n".join(pieces).strip()
+
+
+async def verify_brainstorm_proof_candidate(
+    *,
+    parsed: dict[str, Any],
+    user_prompt: str,
+    source_context: str,
+    model_id: str,
+    role_id: str,
+    task_id_prefix: str,
+    max_tokens: int,
+    validator_model: Optional[str],
+    validator_context: int,
+    validator_max_tokens: int,
+    validator_role_id: str,
+    allowed_baseline: str = "",
+    max_attempts: int = 5,
+) -> BrainstormProofGateResult:
+    """Lean-check a proof candidate, asking the model to repair it after each failure, for up to max_attempts tries."""
+    theorem_statement = str(parsed.get("theorem_statement") or parsed.get("theorem_or_lemma") or parsed.get("submission") or "").strip()
+    formal_sketch = str(parsed.get("formal_sketch") or parsed.get("proof_sketch") or "").strip()
+    theorem_name = str(parsed.get("theorem_name") or "").strip()
+    lean_code = str(parsed.get("lean_code") or "").strip()
+    reasoning = str(parsed.get("reasoning") or "").strip()
+
+    if not theorem_statement or not lean_code:  # nothing to verify: reject without calling Lean
+        return BrainstormProofGateResult(
+            accepted=False,
+            theorem_statement=theorem_statement,
+            lean_code=lean_code,
+            reasoning=reasoning,
+            failure_feedback=(
+                "Lean proof candidate was malformed: both `theorem_statement` and `lean_code` "
+                "are required. Start the next brainstorm attempt fresh."
+            ),
+            attempts=[],
+        )
+
+    attempts: list[ProofAttemptFeedback] = []
+    current = {
+        "theorem_statement": theorem_statement,
+        "formal_sketch": formal_sketch,
+        "theorem_name": theorem_name,
+        "lean_code": lean_code,
+        "reasoning": reasoning,
+    }
+
+    for attempt_number in range(1, max(1, max_attempts) + 1):  # always performs at least one Lean check
+        theorem_statement = str(current.get("theorem_statement") or theorem_statement).strip()
+        formal_sketch = str(current.get("formal_sketch") or formal_sketch).strip()
+        theorem_name = str(current.get("theorem_name") or theorem_name).strip()
+        lean_code = str(current.get("lean_code") or "").strip()  # no fallback: an empty repair is checked as-is
+        reasoning = str(current.get("reasoning") or reasoning).strip()
+
+        lean_result = await get_lean4_client().check_proof(
+            lean_code,
+            timeout=system_config.lean4_proof_timeout,
+        )
+        feedback = ProofAttemptFeedback(
+            attempt=attempt_number,
+            theorem_id="brainstorm_inline_proof",
+            reasoning=reasoning,
+            lean_code=lean_code,
+            error_output=lean_result.error_output,
+            diagnostic_output=str(getattr(lean_result, "diagnostic_output", "") or ""),
+            goal_states=lean_result.goal_states,
+            raw_stderr=str(getattr(lean_result, "raw_stderr", "") or ""),
+            strategy="full_script",
+            success=lean_result.success,
+        )
+
+        if lean_result.success:  # Lean acceptance alone is not enough; the integrity check must also pass
+            lean_feedback = _format_lean_feedback(lean_result)
+            integrity = await validate_full_lean_proof_integrity(
+                user_prompt=user_prompt,
+                theorem_statement=theorem_statement,
+                formal_sketch=formal_sketch,
+                lean_code=lean_code,
+                source_excerpt=source_context or theorem_statement,
+                allowed_baseline=allowed_baseline,
+                validator_model=validator_model,
+                validator_context=validator_context,
+                validator_max_tokens=validator_max_tokens,
+                task_id=f"{task_id_prefix}_integrity_{attempt_number}",
+                role_id=validator_role_id,
+                require_statement_alignment=True,
+            )
+            if integrity.valid:
+                feedback.success = True
+                feedback.error_output = ""
+                attempts.append(feedback)
+                return BrainstormProofGateResult(
+                    accepted=True,
+                    submission_content=_build_submission_content(
+                        theorem_statement=theorem_statement,
+                        formal_sketch=formal_sketch,
+                        lean_code=lean_code,
+                        reasoning=reasoning,
+                        lean_feedback=lean_feedback,
+                        attempts=attempts,
+                    ),
+                    theorem_statement=theorem_statement,
+                    theorem_name=theorem_name,
+                    formal_sketch=formal_sketch,
+                    lean_code=lean_code,
+                    reasoning=reasoning,
+                    lean_feedback=lean_feedback,
+                    attempts=attempts,
+                )
+
+            feedback.success = False  # integrity rejection is recorded like a Lean failure
+            feedback.error_output = integrity.reason
+
+        attempts.append(feedback)
+        if attempt_number >= max_attempts:  # budget spent: skip the repair call
+            break
+
+        prompt = _build_retry_prompt(
+            user_prompt=user_prompt,
+            source_context=source_context,
+            theorem_statement=theorem_statement,
+            formal_sketch=formal_sketch,
+            prior_attempts=attempts,
+        )
+        try:
+            response = await api_client_manager.generate_completion(
+                task_id=f"{task_id_prefix}_repair_{attempt_number + 1}",
+                role_id=role_id,
+                model=model_id,
+                messages=[{"role": "user", "content": prompt}],
+                temperature=0.0,
+                max_tokens=max_tokens,
+            )
+            if not response or not response.get("choices"):
+                raise ValueError("Proof repair model returned no choices.")
+            message = response["choices"][0].get("message", {})
+            content = message.get("content") or message.get("reasoning") or ""  # use "reasoning" when "content" is empty
+            repaired = parse_json(content)
+            if isinstance(repaired, list):  # a JSON array reply: take its first element
+                repaired = repaired[0] if repaired else {}
+            if not isinstance(repaired, dict):
+                raise ValueError("Proof repair response was not a JSON object.")
+            current = {
+                "theorem_statement": str(repaired.get("theorem_statement") or theorem_statement).strip(),
+                "formal_sketch": str(repaired.get("formal_sketch") or formal_sketch).strip(),
+                "theorem_name": str(repaired.get("theorem_name") or theorem_name).strip(),
+                "lean_code": str(repaired.get("lean_code") or "").strip(),
+                "reasoning": str(repaired.get("reasoning") or "").strip(),
+            }
+        except Exception as exc:
+            if is_non_retryable_model_error(exc):  # non-retryable model errors propagate to the caller
+                raise
+            logger.warning("Brainstorm proof repair attempt setup failed: %s", exc)
+            current = {  # keep the previous candidate so the next iteration re-checks it
+                "theorem_statement": theorem_statement,
+                "formal_sketch": formal_sketch,
+                "theorem_name": theorem_name,
+                "lean_code": lean_code,
+                "reasoning": f"Prior proof repair call failed before Lean verification: {exc}",
+            }
+
+    last_error = attempts[-1].error_output if attempts else "No Lean attempts completed."
+    return BrainstormProofGateResult(
+        accepted=False,
+        theorem_statement=theorem_statement,
+        theorem_name=theorem_name,
+        formal_sketch=formal_sketch,
+        lean_code=lean_code,
+        reasoning=reasoning,
+        attempts=attempts,
+        failure_feedback=(
+            f"Lean proof candidate failed the {len(attempts)}-attempt brainstorm proof gate. "
+            f"Last feedback: {_summarize_error(last_error)}. Start the next brainstorm attempt with a fresh useful question or idea."
+        ),
+    )
diff --git a/backend/shared/build_info.py b/backend/shared/build_info.py
index 94ae74c..bda5d73 100644
--- a/backend/shared/build_info.py
+++ b/backend/shared/build_info.py
@@ -22,7 +22,7 @@
     "version": "0.0.0-dev",
     "build_commit": "dev",
     "update_channel": "main",
-    "api_contract_version": "build5-v1",
+    "api_contract_version": "build5-v12",
 }
 
 _ENV_OVERRIDES = {
diff --git a/backend/shared/config.py b/backend/shared/config.py
index 1f965f5..257eefd 100644
--- a/backend/shared/config.py
+++ b/backend/shared/config.py
@@ -138,7 +138,7 @@ class SystemConfig(BaseSettings):
         validation_alias=AliasChoices("MOTO_INSTANCE_ID", "INSTANCE_ID"),
     )
     backend_host: str = Field(
-        default="0.0.0.0",
+        default="127.0.0.1",
         validation_alias=AliasChoices("MOTO_BACKEND_HOST", "HOST"),
     )
     backend_port: int = Field(
@@ -157,6 +157,30 @@ class SystemConfig(BaseSettings):
         default=None,
         validation_alias=AliasChoices("MOTO_INTERNAL_PROXY_SECRET", "INTERNAL_PROXY_SECRET"),
     )
+    generic_max_request_bytes: int = Field(
+        default=16 * 1024 * 1024,
+        validation_alias=AliasChoices("MOTO_GENERIC_MAX_REQUEST_BYTES", "GENERIC_MAX_REQUEST_BYTES"),
+    )
+    pdf_max_html_bytes: int = Field(
+        default=2 * 1024 * 1024,
+        validation_alias=AliasChoices("MOTO_PDF_MAX_HTML_BYTES", "PDF_MAX_HTML_BYTES"),
+    )
+    pdf_max_outline_bytes: int = Field(
+        default=1 * 1024 * 1024,
+        validation_alias=AliasChoices("MOTO_PDF_MAX_OUTLINE_BYTES", "PDF_MAX_OUTLINE_BYTES"),
+    )
+    pdf_max_metadata_bytes: int = Field(
+        default=64 * 1024,
+        validation_alias=AliasChoices("MOTO_PDF_MAX_METADATA_BYTES", "PDF_MAX_METADATA_BYTES"),
+    )
+    api_log_store_full_payloads: bool = Field(
+        default=False,
+        validation_alias=AliasChoices("MOTO_API_LOG_STORE_FULL_PAYLOADS", "API_LOG_STORE_FULL_PAYLOADS"),
+    )
+    desktop_api_token: Optional[str] = Field(
+        default=None,
+        validation_alias=AliasChoices("MOTO_DESKTOP_API_TOKEN", "DESKTOP_API_TOKEN"),
+    )
     frontend_storage_prefix: Optional[str] = Field(
         default=None,
         validation_alias=AliasChoices("MOTO_FRONTEND_STORAGE_PREFIX", "FRONTEND_STORAGE_PREFIX"),
@@ -169,6 +193,13 @@ class SystemConfig(BaseSettings):
     consecutive_rejection_reset_threshold: int = 15
     queue_overflow_threshold: int = 10
     per_submitter_queue_threshold: int = 4  # Pause an individual submitter when it already has more than this many submissions queued (fairness cap)
+    max_model_concurrency_per_model: int = Field(
+        default=3,
+        validation_alias=AliasChoices(
+            "MOTO_MAX_MODEL_CONCURRENCY_PER_MODEL",
+            "MAX_MODEL_CONCURRENCY_PER_MODEL",
+        ),
+    )
     
     # Compiler settings (Phase 2)
     # NOTE: Compiler contexts are set by user in GUI, these are just default fallbacks
@@ -235,6 +266,10 @@ class SystemConfig(BaseSettings):
         default=600,
         validation_alias=AliasChoices("MOTO_LEAN4_LSP_IDLE_TIMEOUT", "LEAN4_LSP_IDLE_TIMEOUT"),
     )
+    leanoj_auto_resume_enabled: bool = Field(
+        default=False,
+        validation_alias=AliasChoices("MOTO_LEANOJ_AUTO_RESUME_ENABLED", "LEANOJ_AUTO_RESUME_ENABLED"),
+    )
     # Maximum number of theorem candidates whose Lean 4 formalization attempts
     # may run concurrently within a single proof-verification stage. Novelty
     # assessment and proof-database persistence remain serialized after each
@@ -374,6 +409,9 @@ def _join_data_path(*parts: str) -> str:
         if self.internal_proxy_secret is not None:
             self.internal_proxy_secret = self.internal_proxy_secret.strip() or None
 
+        if self.desktop_api_token is not None:
+            self.desktop_api_token = self.desktop_api_token.strip() or None
+
         if self.frontend_storage_prefix is not None:
             self.frontend_storage_prefix = self.frontend_storage_prefix.strip() or None
 
diff --git a/backend/shared/json_parser.py b/backend/shared/json_parser.py
index befbd08..5f8f4c8 100644
--- a/backend/shared/json_parser.py
+++ b/backend/shared/json_parser.py
@@ -10,11 +10,277 @@
 import json
 import logging
 import re
+import hashlib
 from typing import Any
 
 logger = logging.getLogger(__name__)
 
 
+RETRY_CONTEXT_EMPTY_PLACEHOLDER = "[previous output contained no reusable visible answer text]"
+
+
+def _content_diagnostics(value: str) -> str:
+    """Describe content by length and SHA-256 digest so logs never carry raw model output."""
+    digest = hashlib.sha256(value.encode("utf-8", errors="replace")).hexdigest() if value else ""
+    return f"length={len(value or '')}, sha256={digest}"
+
+_PRIVATE_REASONING_OPEN_TAG_PATTERN = re.compile(r"^\s*<(?:think|thought)\b[^>]*>", re.IGNORECASE)  # opening <think>/<thought> tag at the very start
+_FINAL_CHANNEL_PATTERN = re.compile(r"<\|channel\|?>\s*final\b", re.IGNORECASE)  # "<|channel|>final" (second pipe optional)
+_PRIVATE_CHANNEL_PATTERN = re.compile(r"<\|channel\|?>\s*(?:analysis|thought|commentary)\b", re.IGNORECASE)  # non-final channel labels
+_LEGACY_CHANNEL_BOUNDARY_PATTERN = re.compile(r"<channel\|>", re.IGNORECASE)  # "<channel|>" form without the leading pipe
+_KNOWN_CONTROL_TOKEN_NAMES = (  # names used below to recognize a "<|name" token cut off at end of text
+    "channel",
+    "message",
+    "end",
+    "constrain",
+    "start",
+    "return",
+    "call",
+    "recipient",
+)
+_KNOWN_CONTROL_TOKEN_ALTERNATION = "|".join(_KNOWN_CONTROL_TOKEN_NAMES)
+_BROAD_CONTROL_TOKEN_PATTERN = re.compile(r"<\|[A-Za-z0-9_:-]+(?:\|>|>)", re.IGNORECASE)  # any complete "<|name|>" or "<|name>"
+_LEGACY_CONTROL_TOKEN_PATTERN = re.compile(r"<(?:channel|message|end|constrain)\|>", re.IGNORECASE)  # complete "<name|>" forms
+_PARTIAL_CONTROL_TOKEN_PATTERN = re.compile(
+    rf"<\|(?:{_KNOWN_CONTROL_TOKEN_ALTERNATION})[A-Za-z_:-]*$|"  # "<|name..." with no closer before end of text
+    r"<(?:channel|message|end|constrain)\|?$",  # "<name" or "<name|" left dangling at end of text
+    re.IGNORECASE,
+)
+
+
+def _first_likely_visible_boundary(content: str) -> int:
+    """Locate where answer text plausibly begins; -1 means no boundary was found."""
+    # A code fence or an opening brace is the strongest signal, so the
+    # earliest occurrence of either one wins outright.
+    strong_hits = [pos for pos in (content.find("```"), content.find("{")) if pos >= 0]
+    if strong_hits:
+        return min(strong_hits)
+
+    # Otherwise accept a "[" only when the next non-space character could
+    # begin a JSON array element (or close an empty array).
+    for bracket in re.finditer(r"\[", content):
+        tail = content[bracket.end():].lstrip()
+        if tail.startswith(tuple('{["]-0123456789tfn')):
+            return bracket.start()
+
+    return -1
+
+
+def _find_matches_outside_json_strings(pattern: re.Pattern, content: str) -> list[re.Match]:
+    """Collect matches of ``pattern`` whose start lies outside double-quoted spans."""
+    found: list[re.Match] = []
+    pos = 0
+    end = len(content)
+    quoted = False
+    skip_escaped = False
+
+    while pos < end:
+        ch = content[pos]
+
+        if skip_escaped:
+            # The previous character was a backslash inside a string, so this
+            # one is consumed verbatim and cannot toggle the quote state.
+            skip_escaped = False
+            pos += 1
+        elif quoted and ch == "\\":
+            skip_escaped = True
+            pos += 1
+        elif ch == '"':
+            quoted = not quoted
+            pos += 1
+        elif quoted:
+            pos += 1
+        else:
+            hit = pattern.match(content, pos)
+            if hit is None:
+                pos += 1
+            else:
+                found.append(hit)
+                # Always advance by at least one so an empty match cannot
+                # stall the scan.
+                pos = max(hit.end(), pos + 1)
+
+    return found
+
+
+def _has_match_outside_json_strings(pattern: re.Pattern, content: str) -> bool:
+    """Report whether ``pattern`` matches anywhere outside JSON-style quoted strings."""
+    return len(_find_matches_outside_json_strings(pattern, content)) > 0
+
+
+def _strip_control_tokens_outside_json_strings(content: str) -> str:
+    """Return ``content`` with provider control tokens removed, leaving text inside double-quoted strings untouched."""
+    result = []  # characters that survive, joined at the end
+    i = 0
+    in_string = False  # True while the scan is between an opening and closing double quote
+    escape_next = False  # True right after a backslash seen inside a string
+
+    while i < len(content):
+        char = content[i]
+
+        if escape_next:  # escaped character: copy verbatim, it cannot close the string
+            result.append(char)
+            escape_next = False
+            i += 1
+            continue
+
+        if char == "\\" and in_string:
+            result.append(char)
+            escape_next = True
+            i += 1
+            continue
+
+        if char == '"':  # unescaped quote toggles string state and is always kept
+            in_string = not in_string
+            result.append(char)
+            i += 1
+            continue
+
+        if not in_string:
+            if content.startswith("<|", i):  # candidate "<|name|>" / "<|name>" token
+                pipe_close = content.find("|>", i + 2)
+                angle_close = content.find(">", i + 2)
+                token_end = -1  # stays -1 when no closing delimiter exists
+
+                if pipe_close >= 0 and (angle_close < 0 or pipe_close + 1 <= angle_close):  # first ">" is the one in "|>"
+                    token_end = pipe_close + 2
+                    token_body = content[i + 2:pipe_close]
+                elif angle_close >= 0:  # closed by a bare ">"
+                    token_end = angle_close + 1
+                    token_body = content[i + 2:angle_close]
+                else:  # no closer at all: possibly a token truncated at end of text
+                    token_body = content[i + 2:]
+                    if re.fullmatch(r"[A-Za-z0-9_:-]+", token_body):
+                        i = len(content)  # drop the dangling partial token and finish
+                        continue
+
+                if token_end > 0 and re.fullmatch(r"[A-Za-z0-9_:-]+", token_body.strip()):  # body must look like a token name
+                    i = token_end  # skip the whole token without emitting it
+                    continue
+
+            for legacy_token in ("<channel|>", "<message|>", "<end|>", "<constrain|>"):
+                if content[i:i + len(legacy_token)].lower() == legacy_token:  # case-insensitive compare
+                    i += len(legacy_token)
+                    break
+            else:  # no legacy token starts here: keep the character
+                result.append(char)
+                i += 1
+            continue
+
+        result.append(char)  # inside a string: copy through unchanged
+        i += 1
+
+    return "".join(result)
+
+
+def _strip_leading_private_reasoning_blocks(content: str) -> str:
+    """
+    Peel private reasoning blocks off the front of ``content``.
+
+    Only ``<think>``/``<thought>`` blocks that open the text count as
+    transcript scaffolding. The same tags appearing later, inside visible
+    JSON, code, or prose, are kept because they may be real answer content.
+    Returns the stripped remainder, or the empty-output placeholder when an
+    unclosed block is followed by nothing that looks like an answer.
+    """
+    while True:
+        opener = _PRIVATE_REASONING_OPEN_TAG_PATTERN.match(content)
+        tag = re.match(r"\s*<(?P<tag>think|thought)\b", content, re.IGNORECASE) if opener else None
+        if tag is None:
+            # Nothing (more) to peel off the front.
+            return content.strip()
+
+        remainder = content[opener.end():]
+        closer = re.search(rf"</{tag.group('tag')}\s*>", remainder, re.IGNORECASE)
+        if closer is not None:
+            # Well-formed block: drop it and re-check what follows.
+            content = remainder[closer.end():].strip()
+            continue
+
+        # Unclosed block: salvage text from the first likely answer
+        # boundary, or report that no reusable answer text exists.
+        visible_at = _first_likely_visible_boundary(remainder)
+        if visible_at < 0:
+            return RETRY_CONTEXT_EMPTY_PLACEHOLDER
+
+        # The salvaged text may itself begin with another private block.
+        content = remainder[visible_at:].strip()
+
+
+def sanitize_model_output_for_retry_context(raw: str, max_chars: int = 2000) -> str:
+    """
+    Sanitize raw model output before replaying it as retry context.
+
+    Preserves visible failed-output excerpts for conversational retries while
+    stripping private reasoning/channel/control tokens. Output longer than a
+    positive ``max_chars`` is cut and tagged; empty results become a placeholder.
+    """
+    if raw is None:
+        return RETRY_CONTEXT_EMPTY_PLACEHOLDER
+
+    content = str(raw).replace("\r\n", "\n").replace("\r", "\n").strip()  # normalize CRLF/CR newlines to LF
+    if not content:
+        return RETRY_CONTEXT_EMPTY_PLACEHOLDER
+
+    original_content = content  # kept only to log whether sanitizing changed anything
+    private_marker_seen = bool(
+        _has_match_outside_json_strings(_PRIVATE_CHANNEL_PATTERN, content)
+        or _has_match_outside_json_strings(_FINAL_CHANNEL_PATTERN, content)
+        or _has_match_outside_json_strings(_LEGACY_CHANNEL_BOUNDARY_PATTERN, content)
+        or _has_match_outside_json_strings(_BROAD_CONTROL_TOKEN_PATTERN, content)
+        or _has_match_outside_json_strings(_LEGACY_CONTROL_TOKEN_PATTERN, content)
+        or _has_match_outside_json_strings(_PARTIAL_CONTROL_TOKEN_PATTERN, content)
+    )
+
+    # If a Harmony-style final channel is present, only the final-channel payload
+    # is reusable answer text. Earlier analysis/thought channels are private.
+    final_matches = _find_matches_outside_json_strings(_FINAL_CHANNEL_PATTERN, content)
+    if final_matches:
+        content = content[final_matches[-1].end():]  # keep only what follows the last final-channel marker
+    elif _has_match_outside_json_strings(_PRIVATE_CHANNEL_PATTERN, content):
+        legacy_boundaries = _find_matches_outside_json_strings(_LEGACY_CHANNEL_BOUNDARY_PATTERN, content)
+        if legacy_boundaries:
+            content = content[legacy_boundaries[-1].end():]  # text after the last "<channel|>" boundary
+        else:
+            boundary = _first_likely_visible_boundary(content)
+            if boundary >= 0:
+                content = content[boundary:]
+            else:
+                return RETRY_CONTEXT_EMPTY_PLACEHOLDER  # private channel only, nothing answer-like found
+
+    content = _strip_leading_private_reasoning_blocks(content)
+    if content == RETRY_CONTEXT_EMPTY_PLACEHOLDER:
+        return content
+
+    # Remove complete and partial provider/private control tokens. Channel labels
+    # directly following token shapes are not user-visible answer content.
+    content = _strip_control_tokens_outside_json_strings(content)
+    content = re.sub(r"(?im)^\s*(analysis|thought|commentary|final)\s*$", "", content)  # blank out lines holding only a channel label
+    content = content.strip()
+
+    if private_marker_seen:
+        boundary = _first_likely_visible_boundary(content)
+        if boundary > 0:  # > 0: only trim when there is a prefix in front of the boundary
+            content = content[boundary:].strip()
+
+    content = re.sub(r"\n{3,}", "\n\n", content).strip()  # collapse runs of three or more newlines
+    if not content:
+        logger.debug("Retry-context sanitizer removed private-only model output")
+        return RETRY_CONTEXT_EMPTY_PLACEHOLDER
+
+    if max_chars and max_chars > 0 and len(content) > max_chars:  # falsy or non-positive max_chars disables truncation
+        content = content[:max_chars].rstrip() + "\n[...sanitized output truncated for retry...]"
+
+    if content != original_content:
+        logger.debug(
+            "Sanitized retry context output (%d -> %d chars)",
+            len(original_content),
+            len(content),
+        )
+
+    return content or RETRY_CONTEXT_EMPTY_PLACEHOLDER
+
+
 def sanitize_json_response(raw_content: str) -> str:
     """
     Sanitize JSON response to handle LaTeX expressions and invalid escape sequences.
@@ -68,7 +334,7 @@ def sanitize_json_response(raw_content: str) -> str:
     
     if len(content) < original_len:
         logger.debug(f"Stripped <think>...</think> reasoning tokens ({original_len} -> {len(content)} chars)")
-        logger.debug(f"Content after think removal (first 300 chars): {repr(content[:300])}")
+        logger.debug("Content after think removal redacted (%s)", _content_diagnostics(content))
     
     # Extra safety: Remove any remaining thinking-related tags
     content = re.sub(r'</think\s*>', '', content, flags=re.IGNORECASE).strip()
@@ -122,8 +388,9 @@ def sanitize_json_response(raw_content: str) -> str:
         original_content = content
         content = re.sub(control_token_pattern, '', content).strip()
         logger.debug(
-            f"Stripped control tokens: "
-            f"'{original_content[:150]}...' -> '{content[:150]}...'"
+            "Stripped control tokens: before=(%s), after=(%s)",
+            _content_diagnostics(original_content),
+            _content_diagnostics(content),
         )
     
     # Additional cleanup: Remove any remaining angle bracket artifacts
@@ -146,14 +413,14 @@ def sanitize_json_response(raw_content: str) -> str:
     # If no JSON start found, raise explicit error
     if json_start < 0:
         logger.warning(f"No JSON start character found in content (length={len(content)})")
-        logger.warning(f"Content preview: {repr(content[:200])}...")
+        logger.warning("Content preview redacted (%s)", _content_diagnostics(content))
         
         # NEW: Don't continue - this is pure reasoning text with no JSON
         # Raise explicit error for retry mechanism
         raise ValueError(
             f"No JSON found in response - only conversational reasoning text "
             f"({len(content)} chars). Model likely hit max_tokens before writing JSON. "
-            f"Content starts with: {repr(content[:200])}"
+            "Raw content preview is withheld from retry prompts; use logs for diagnostics."
         )
     else:
         # Strip everything before the JSON start (handles reasoning models that output
@@ -163,7 +430,7 @@ def sanitize_json_response(raw_content: str) -> str:
             content = content[json_start:]
             json_start = 0  # Reset to 0 since we stripped the prefix
             logger.debug(f"Stripped {len(stripped_prefix)} chars of non-JSON prefix")
-            logger.debug(f"Stripped prefix preview: {repr(stripped_prefix[:200])}...")
+            logger.debug("Stripped prefix preview redacted (%s)", _content_diagnostics(stripped_prefix))
     
     if json_start >= 0:
         try:
@@ -220,7 +487,7 @@ def sanitize_json_response(raw_content: str) -> str:
                         f"JSON response truncated at max_tokens: {brace_count} unclosed braces, "
                         f"in_string={in_string}, response length {len(content)} chars. "
                         f"Model needs to generate more concise output that fits within token limits. "
-                        f"{last_complete_context}"
+                        "Raw content preview is withheld from retry prompts; use logs for diagnostics."
                     )
             
             elif start_char == '[':
@@ -277,7 +544,7 @@ def sanitize_json_response(raw_content: str) -> str:
     # Safety check: ensure content is not empty after preprocessing
     if not content or not content.strip():
         logger.error(f"Sanitization resulted in empty content! Original length: {len(raw_content)}")
-        logger.error(f"Original content preview: {raw_content[:500]}...")
+        logger.error("Original content preview redacted (%s)", _content_diagnostics(raw_content))
         # Return original content and let the caller handle the error
         return raw_content.strip()
     
@@ -683,7 +950,7 @@ def parse_json(response_content: str) -> dict:
     # Check for anomalously short response
     if len(response_content.strip()) < 10:
         logger.error(f"parse_json: Response too short ({len(response_content)} chars)")
-        logger.error(f"Short response content: {repr(response_content)}")
+        logger.error("Short response content redacted (%s)", _content_diagnostics(response_content))
         raise ValueError(f"Response too short ({len(response_content)} chars)")
     
     # Sanitize and parse
@@ -718,7 +985,7 @@ def parse_json(response_content: str) -> dict:
         stripped = sanitized_content.rstrip()
         if stripped and stripped[-1] not in '}]':
             is_likely_truncated = True
-            truncation_hints.append(f"JSON doesn't end with }} or ] (ends with: {repr(stripped[-20:])})")
+            truncation_hints.append("JSON doesn't end with } or ]")
         
         # Count unclosed braces/brackets (rough check)
         open_braces = sanitized_content.count('{') - sanitized_content.count('}')
@@ -737,23 +1004,14 @@ def parse_json(response_content: str) -> dict:
             logger.error(f"🚨 LIKELY TRUNCATED LLM OUTPUT: {', '.join(truncation_hints)}")
             logger.error("This usually means the LLM hit max_tokens limit before completing the JSON response")
         
-        logger.error(f"Original response length: {len(response_content)} chars")
-        logger.error(f"Original response (first 500 chars): {repr(response_content[:500])}")
-        logger.error(f"Original response (last 200 chars): {repr(response_content[-200:])}")
-        logger.error(f"Sanitized content length: {len(sanitized_content)} chars")
-        logger.error(f"Sanitized content (first 500 chars): {repr(sanitized_content[:500])}")
-        logger.error(f"Sanitized content (last 200 chars): {repr(sanitized_content[-200:])}")
+        logger.error("Original response content redacted (%s)", _content_diagnostics(response_content))
+        logger.error("Sanitized content redacted (%s)", _content_diagnostics(sanitized_content))
         logger.error(f"Error position: line {e.lineno}, column {e.colno}, char {e.pos}")
-        if e.pos is not None and e.pos < len(sanitized_content):
-            # Show context around error position
-            start = max(0, e.pos - 50)
-            end = min(len(sanitized_content), e.pos + 50)
-            logger.error(f"Error context: ...{repr(sanitized_content[start:end])}...")
         raise
     except Exception as e:
         # Catch any other parsing errors
         logger.error(f"parse_json: Unexpected error during parsing - {type(e).__name__}: {e}")
-        logger.error(f"Response content: {repr(response_content[:1000])}")
+        logger.error("Response content redacted (%s)", _content_diagnostics(response_content))
         raise
     
     # Handle array responses - extract first element
diff --git a/backend/shared/lean4_client.py b/backend/shared/lean4_client.py
index 310d4b3..e8d0fcf 100644
--- a/backend/shared/lean4_client.py
+++ b/backend/shared/lean4_client.py
@@ -52,6 +52,7 @@ class Lean4Result:
     """Result of one Lean 4 proof check."""
     success: bool
     error_output: str = ""
+    diagnostic_output: str = ""
     goal_states: str = ""
     raw_stderr: str = ""
     tactic_error_slice: str = ""
@@ -370,7 +371,7 @@ async def _run_lean_file_once(
     ) -> tuple[int, str, str]:
         temp_path = self.workspace_dir / temp_filename
         try:
-            temp_path.write_text(prepared_code, encoding="utf-8")
+            await asyncio.to_thread(temp_path.write_text, prepared_code, encoding="utf-8")
             return await self._run_process(
                 [self.lake_path, "env", self.lean_path or self._resolve_executable("lean"), temp_filename],
                 cwd=self.workspace_dir,
@@ -379,7 +380,7 @@ async def _run_lean_file_once(
         finally:
             try:
                 if temp_path.exists():
-                    temp_path.unlink()
+                    await asyncio.to_thread(temp_path.unlink)
             except OSError:
                 logger.debug("Could not remove temporary Lean file %s", temp_path)
 
@@ -478,7 +479,7 @@ async def _repair_workspace_after_infrastructure_error(self, output: str) -> boo
         async with self._workspace_lock:
             self._workspace_unhealthy_error = ""
             self._workspace_ready = False
-            self._wipe_lake_directory()
+            await asyncio.to_thread(self._wipe_lake_directory)
             repaired = await self._ensure_workspace_locked()
             if not repaired:
                 self._mark_workspace_unhealthy(output)
@@ -940,7 +941,7 @@ def _extract_tactic_error_slice(
             ).strip()
         return error_slice, failing_tactic_index
 
-    async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
+    async def check_proof(self, lean_code: str, timeout: int = 120, *, allow_placeholders: bool = False) -> Lean4Result:
         """Write a temp Lean file, run Lean 4, and return structured feedback."""
         if not system_config.lean4_enabled:
             return Lean4Result(success=False, error_output="Lean 4 is disabled in system configuration.")
@@ -951,9 +952,10 @@ async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
 
         # Fast pre-check: reject placeholder proofs before invoking Lean so
         # the model learns the rejection reason even when Lean would have
-        # compiled the file with only a warning.
+        # compiled the file with only a warning. LeanOJ can opt out when it
+        # intentionally wants to harvest a compiling incomplete scaffold.
         placeholder = _detect_forbidden_placeholder(prepared_code)
-        if placeholder:
+        if placeholder and not allow_placeholders:
             return Lean4Result(
                 success=False,
                 error_output=_format_placeholder_rejection(placeholder, from_lean_diagnostic=False),
@@ -1002,16 +1004,13 @@ async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
         has_error_diagnostic = "error:" in lowered
         has_sorry_warning = _output_contains_sorry_warning(combined_output)
         lean_exited_cleanly = returncode == 0
-        positive_pass = (
-            lean_exited_cleanly
-            and not has_error_diagnostic
-            and not has_sorry_warning
-        )
+        positive_pass = lean_exited_cleanly and not has_error_diagnostic and (allow_placeholders or not has_sorry_warning)
 
         if positive_pass:
             return Lean4Result(
                 success=True,
                 error_output="",
+                diagnostic_output=combined_output,
                 goal_states=goal_states,
                 raw_stderr=stderr.strip(),
             )
@@ -1173,6 +1172,7 @@ async def _run_tactic_script_once(
             return Lean4Result(
                 success=True,
                 error_output="",
+                diagnostic_output=combined_output,
                 goal_states=goal_states,
                 raw_stderr=stderr.strip(),
                 tactic_error_slice="",
@@ -1586,6 +1586,7 @@ def _result_from_diagnostics(
             return Lean4Result(
                 success=True,
                 error_output="",
+                diagnostic_output=combined_output,
                 goal_states=goal_states,
                 raw_stderr=raw_stderr,
             )
@@ -1649,7 +1650,7 @@ async def _check_via_lsp(
         self._open_document_versions[uri] = version
 
         try:
-            temp_path.write_text(prepared_code, encoding="utf-8")
+            await asyncio.to_thread(temp_path.write_text, prepared_code, encoding="utf-8")
             await self._send_notification(
                 "textDocument/didOpen",
                 {
@@ -1697,9 +1698,9 @@ async def _check_via_lsp(
             self._open_document_versions.pop(uri, None)
             with suppress(OSError):
                 if temp_path.exists():
-                    temp_path.unlink()
+                    await asyncio.to_thread(temp_path.unlink)
 
-    async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
+    async def check_proof(self, lean_code: str, timeout: int = 120, *, allow_placeholders: bool = False) -> Lean4Result:
         """Check a proof through the persistent Lean LSP when healthy, otherwise fall back."""
         if not system_config.lean4_enabled:
             return Lean4Result(success=False, error_output="Lean 4 is disabled in system configuration.")
@@ -1709,6 +1710,12 @@ async def check_proof(self, lean_code: str, timeout: int = 120) -> Lean4Result:
             return Lean4Result(success=False, error_output="No Lean 4 code was provided.")
 
         placeholder = _detect_forbidden_placeholder(prepared_code)
+        if placeholder and allow_placeholders:
+            return await self._subprocess_fallback.check_proof(
+                lean_code,
+                timeout=timeout,
+                allow_placeholders=True,
+            )
         if placeholder:
             return Lean4Result(
                 success=False,
diff --git a/backend/shared/lean_proof_integrity.py b/backend/shared/lean_proof_integrity.py
new file mode 100644
index 0000000..ee81e74
--- /dev/null
+++ b/backend/shared/lean_proof_integrity.py
@@ -0,0 +1,233 @@
+"""Shared integrity checks for Lean 4 proof outputs."""
+from __future__ import annotations
+
+import logging
+import re
+from dataclasses import dataclass, field
+from typing import Optional
+
+from backend.autonomous.prompts.proof_prompts import build_proof_statement_alignment_prompt
+from backend.shared.api_client_manager import api_client_manager
+from backend.shared.json_parser import parse_json
+from backend.shared.model_error_utils import is_non_retryable_model_error
+from backend.shared.utils import count_tokens
+
+logger = logging.getLogger(__name__)
+
+_LEAN_DECL_NAME = r"(?:[A-Za-z_][A-Za-z0-9_'.]*|«[^»]+»)"  # ASCII identifier (dots/primes allowed) or «quoted» name
+
+_DECLARATION_DEVICE_COMMAND_RE = re.compile(
+    r"^\s*(?:@\[[^\]]+\]\s*)*(?:private\s+|protected\s+|noncomputable\s+|unsafe\s+)*"  # optional attributes and modifiers
+    r"(axiom|constant|opaque)\b(?P<body>.*?)"  # group 1: device keyword; "body": lazily captured text after it
+    r"(?=^\s*(?:@\[[^\]]+\]\s*)*(?:private\s+|protected\s+|noncomputable\s+|unsafe\s+)*"  # body stops before the next line-initial
+    r"(?:axiom|constant|opaque|theorem|lemma|def|example|import|namespace|section|end|open|"
+    r"variable|variables|structure|class|inductive|instance|abbrev)\b|\Z)",  # command keyword, or at end of input
+    re.MULTILINE | re.DOTALL,
+)
+_DECLARATION_NAME_RE = re.compile(_LEAN_DECL_NAME)
+_DECLARATION_BINDER_RE = re.compile(rf"\(\s*({_LEAN_DECL_NAME}(?:\s+{_LEAN_DECL_NAME})*)\s*:")  # names before the colon in "(a b :"
+_DECLARATION_LEADING_NAMES_RE = re.compile(rf"^\s*({_LEAN_DECL_NAME}(?:\s+{_LEAN_DECL_NAME})*)\s*(?::|:=|where\b|$)")  # names opening a body
+
+
+@dataclass
+class LeanProofIntegrityResult:
+    """Result of non-Lean integrity checks applied after Lean accepts code."""
+    valid: bool  # False when a check rejected the code or could not be completed
+    reason: str = ""  # human-readable rejection message; empty by default
+    category: str = "ok"  # short tag for the outcome, e.g. "forbidden_declaration_device"
+    introduced_devices: list[str] = field(default_factory=list)  # "kind name" entries absent from the baseline
+
+
+def strip_lean_comments_and_strings(code: str) -> str:
+    """Best-effort single-pass removal of comments and string literals before source scanning."""
+    # One left-to-right alternation: "--" or "/-" inside a string, or "/-" inside a line comment, can no longer hide code.
+    token_re = re.compile(r'"(?:\\.|[^"\\])*"|/-.*?-/|--[^\n]*', re.DOTALL)
+    return token_re.sub(lambda m: ' "" ' if m.group(0).startswith('"') else " ", code or "")
+
+
+def find_declaration_devices(code: str) -> set[tuple[str, str]]:
+    """Return ``(kind, name)`` pairs for axiom/constant/opaque declarations found in Lean source."""
+    devices: set[tuple[str, str]] = set()
+    for match in _DECLARATION_DEVICE_COMMAND_RE.finditer(strip_lean_comments_and_strings(code)):
+        kind = match.group(1)
+        body = match.group("body") or ""
+        # Names bound in parenthesized binders, e.g. ``(a b : Nat)``.
+        names = [n.group(0) for b in _DECLARATION_BINDER_RE.finditer(body) for n in _DECLARATION_NAME_RE.finditer(b.group(1))]
+
+        # Always record the declared name as well: ``axiom foo (x : Nat) : P x`` must be keyed by ``foo``, and a
+        # declaration with no parseable binder (``{α : Type}``, Unicode names) must never be dropped silently.
+        leading_match = _DECLARATION_LEADING_NAMES_RE.match(body)
+        first_token = re.match(r"\s*([^\s:(){}\[\]]+)", body)
+        if leading_match:
+            names.extend(name.group(0) for name in _DECLARATION_NAME_RE.finditer(leading_match.group(1)))
+        elif first_token or not names:
+            names.append(first_token.group(1) if first_token else (" ".join(body.split())[:80] or "<anonymous>"))
+        devices.update((kind, name) for name in names)
+    return devices
+
+
+def find_introduced_declaration_devices(lean_code: str, allowed_baseline: str = "") -> list[str]:
+    """List, as sorted ``"kind name"`` strings, the devices in ``lean_code`` missing from the baseline."""
+    baseline_devices = find_declaration_devices(allowed_baseline)
+    candidate_devices = find_declaration_devices(lean_code)
+    # Set difference keeps only devices the baseline does not already
+    # declare; sorting the (kind, name) tuples keeps the report stable.
+    new_devices = sorted(candidate_devices - baseline_devices)
+    return [f"{kind} {name}" for kind, name in new_devices]
+
+
+def validate_lean_proof_integrity(
+    *,
+    lean_code: str,
+    allowed_baseline: str = "",
+) -> LeanProofIntegrityResult:
+    """Fail Lean-accepted code that adds axiom/constant/opaque devices beyond the baseline."""
+    new_devices = find_introduced_declaration_devices(lean_code=lean_code, allowed_baseline=allowed_baseline)
+    if not new_devices:
+        return LeanProofIntegrityResult(valid=True)
+
+    # Quote at most eight devices in the message; the full list is still returned in ``introduced_devices``.
+    rejection = (
+        "LEAN PROOF INTEGRITY REJECTED: the submitted Lean code introduces new "
+        "axiom/constant/opaque declarations not present in the allowed baseline: "
+        f"{', '.join(new_devices[:8])}. Do not prove results by adding fake assumptions; "
+        "use constructive Lean/Mathlib proof terms or tactics."
+    )
+    return LeanProofIntegrityResult(
+        valid=False,
+        category="forbidden_declaration_device",
+        introduced_devices=new_devices,
+        reason=rejection,
+    )
+
+
+async def validate_lean_statement_alignment(
+    *,
+    user_prompt: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    lean_code: str,
+    source_excerpt: str,
+    validator_model: str,
+    validator_context: int,
+    validator_max_tokens: int,
+    task_id: str,
+    role_id: str,
+) -> LeanProofIntegrityResult:
+    """Ask an LLM validator whether the accepted Lean code proves the intended claim."""
+    def _render_prompt(excerpt: str) -> str:
+        return build_proof_statement_alignment_prompt(
+            user_prompt=user_prompt,
+            theorem_statement=theorem_statement,
+            formal_sketch=formal_sketch,
+            lean_code=lean_code,
+            source_excerpt=excerpt,
+        )
+
+    alignment_prompt = _render_prompt(source_excerpt)
+    input_budget = validator_context - validator_max_tokens
+    excerpt = source_excerpt or ""
+    # Halve the excerpt (never below 1500 chars) until the prompt fits the budget.
+    while count_tokens(alignment_prompt) > input_budget and len(excerpt) > 1500:
+        excerpt = excerpt[: max(len(excerpt) // 2, 1500)]
+        alignment_prompt = _render_prompt(excerpt)
+
+    try:
+        completion = await api_client_manager.generate_completion(
+            task_id=task_id,
+            role_id=role_id,
+            model=validator_model,
+            messages=[{"role": "user", "content": alignment_prompt}],
+            max_tokens=validator_max_tokens,
+            temperature=0.0,
+        )
+        if not (completion and completion.get("choices")):
+            return LeanProofIntegrityResult(
+                valid=False,
+                category="statement_alignment_unavailable",
+                reason="LEAN PROOF INTEGRITY REJECTED: statement-alignment validator returned no response.",
+            )
+        first_message = completion["choices"][0].get("message", {})
+        # Fall back to the "reasoning" field when "content" is empty or missing.
+        verdict_text = first_message.get("content") or first_message.get("reasoning") or ""
+        if not verdict_text:
+            return LeanProofIntegrityResult(
+                valid=False,
+                category="statement_alignment_unavailable",
+                reason="LEAN PROOF INTEGRITY REJECTED: statement-alignment validator returned empty content.",
+            )
+        verdict = parse_json(verdict_text)
+        if isinstance(verdict, list):
+            verdict = verdict[0] if verdict else {}
+        if not isinstance(verdict, dict):
+            verdict = {}
+    except Exception as exc:
+        # Non-retryable model errors propagate; anything else becomes a rejection.
+        if is_non_retryable_model_error(exc):
+            raise
+        logger.warning("Lean statement alignment validation failed: %s", exc)
+        return LeanProofIntegrityResult(
+            valid=False,
+            category="statement_alignment_unavailable",
+            reason=(
+                "LEAN PROOF INTEGRITY REJECTED: statement-alignment validation failed before "
+                f"a usable decision was produced: {type(exc).__name__}: {exc}"
+            ),
+        )
+
+    decision = str(verdict.get("decision") or "").strip().lower()
+    reasoning = str(verdict.get("reasoning") or verdict.get("summary") or "").strip()
+    if decision == "accept":
+        return LeanProofIntegrityResult(valid=True, reason=reasoning, category="statement_alignment")
+    return LeanProofIntegrityResult(
+        valid=False,
+        category="statement_alignment_rejected",
+        reason=(
+            "LEAN PROOF INTEGRITY REJECTED: Lean accepted the code, but the statement-alignment "
+            f"validator rejected it as unrelated or insufficient. {reasoning}"
+        ).strip(),
+    )
+
+
+async def validate_full_lean_proof_integrity(
+    *,
+    user_prompt: str,
+    theorem_statement: str,
+    formal_sketch: str,
+    lean_code: str,
+    source_excerpt: str,
+    allowed_baseline: str,
+    validator_model: Optional[str] = None,
+    validator_context: int = 131072,
+    validator_max_tokens: int = 25000,
+    task_id: str = "proof_integrity_000",
+    role_id: str = "proof_integrity_validator",
+    require_statement_alignment: bool = True,
+) -> LeanProofIntegrityResult:
+    """Chain the structural device check with the optional LLM statement-alignment check."""
+    structural_result = validate_lean_proof_integrity(
+        lean_code=lean_code,
+        allowed_baseline=allowed_baseline,
+    )
+    # A structural failure is final; a structural pass is final too when the
+    # caller opted out of statement alignment.
+    if not (structural_result.valid and require_statement_alignment):
+        return structural_result
+    if not validator_model:
+        return LeanProofIntegrityResult(
+            valid=False,
+            category="statement_alignment_unavailable",
+            reason="LEAN PROOF INTEGRITY REJECTED: no validator model was configured for statement alignment.",
+        )
+    return await validate_lean_statement_alignment(
+        user_prompt=user_prompt,
+        theorem_statement=theorem_statement,
+        formal_sketch=formal_sketch,
+        lean_code=lean_code,
+        source_excerpt=source_excerpt,
+        validator_model=validator_model,
+        validator_context=validator_context,
+        validator_max_tokens=validator_max_tokens,
+        task_id=task_id,
+        role_id=role_id,
+    )
diff --git a/backend/shared/lm_studio_client.py b/backend/shared/lm_studio_client.py
index ebc0e1a..3b0b8fe 100644
--- a/backend/shared/lm_studio_client.py
+++ b/backend/shared/lm_studio_client.py
@@ -15,9 +15,10 @@
 import asyncio
 import time
 import os
+import re
 from pathlib import Path
 from datetime import datetime
-from typing import List, Dict, Any, Optional
+from typing import List, Dict, Any, Optional, Tuple
 from backend.shared.config import rag_config, system_config
 import logging
 
@@ -27,8 +28,23 @@
 Path(system_config.logs_dir).mkdir(parents=True, exist_ok=True)
 
 
+def _sanitize_lm_studio_error_text(value: Any, max_chars: int = 500) -> str:
+    """Return ``str(value or "")`` capped at ``max_chars`` with bearer tokens, API keys and echoed prompts redacted."""
+    text = str(value or "")
+    # Escape-aware JSON string body: a `\"` or a `]` inside a string must not end the redaction early.
+    body = r'(?:[^"\\]|\\[\s\S])*'
+    text = re.sub(r"(Bearer\s+)[A-Za-z0-9._~+\-/=]+", r"\1[redacted]", text, flags=re.IGNORECASE)
+    text = re.sub(r'("api[_-]?key"\s*:\s*)"[^"]*"', r'\1"[redacted]"', text, flags=re.IGNORECASE)
+    text = re.sub(rf'("messages"\s*:\s*)\[(?:(?:"{body}"|[^"\]])*|[\s\S]*?)\]', r'\1[redacted]', text, flags=re.IGNORECASE)
+    text = re.sub(rf'("prompt"\s*:\s*)"(?:{body}|[\s\S]*?)"', r'\1"[redacted]"', text, flags=re.IGNORECASE)
+    return text if len(text) <= max_chars else text[:max_chars] + "...[truncated]"
+
+
 class LMStudioClient:
     """Client for LM Studio API."""
+    ROUTING_METADATA_KEY = "_moto_lm_studio_routing"
+    INSTANCE_REGISTRY_TTL_SECONDS = 5.0
+    _NUMERIC_INSTANCE_SUFFIX_RE = re.compile(r"^(?P<base>.+):(?P<instance>\d+)$")
     
     # Embedding performance settings
     EMBEDDING_BATCH_SIZE = 100  # Process embeddings in batches of 100
@@ -56,11 +72,76 @@ def __init__(self, base_url: str = None):
                 keepalive_expiry=30.0
             )
         )
+        self._loaded_instance_groups: Dict[str, List[str]] = {}
+        self._loaded_instance_cache_at = 0.0
+        self._instance_registry_lock = asyncio.Lock()
+        self._inflight_by_model: Dict[str, int] = {}
+        self._inflight_lock = asyncio.Lock()
+
+    @classmethod
+    def split_numeric_instance_suffix(cls, model: str) -> Tuple[str, Optional[int]]:
+        """Return ``(base, instance)`` for IDs like ``base:2``; ``(stripped_id, None)`` otherwise."""
+        cleaned = (model or "").strip()
+        parsed = cls._NUMERIC_INSTANCE_SUFFIX_RE.match(cleaned)
+        if parsed is None:
+            return cleaned, None
+        return parsed["base"], int(parsed["instance"])
+
+    @classmethod
+    def normalize_instance_base(cls, model: str) -> str:
+        """Strip any numeric `:#` suffix so sibling instances share one grouping key."""
+        # Element 0 of the split is the base; the instance number is not needed here.
+        return cls.split_numeric_instance_suffix(model)[0]
+
+    @classmethod
+    def has_numeric_instance_suffix(cls, model: str) -> bool:
+        """Report whether ``model`` ends in a numeric instance suffix such as `model:2`."""
+        instance_number = cls.split_numeric_instance_suffix(model)[1]
+        return instance_number is not None
+
+    @classmethod
+    def build_instance_groups(cls, loaded_models: List[str]) -> Dict[str, List[str]]:
+        """Bucket loaded model IDs by base name; each bucket is de-duplicated and ordered."""
+
+        def _order(model_id: str) -> Tuple[int, str]:
+            # Unsuffixed IDs rank as instance 0; the ID itself breaks ties.
+            instance = cls.split_numeric_instance_suffix(model_id)[1]
+            return (instance or 0, model_id)
+
+        buckets: Dict[str, List[str]] = {}
+        for raw_id in loaded_models or []:
+            model_id = (raw_id or "").strip()
+            if not model_id:
+                continue
+            base = cls.normalize_instance_base(model_id)
+            buckets.setdefault(base, []).append(model_id)
+
+        # dict.fromkeys drops repeated IDs before each bucket is sorted.
+        return {
+            base: sorted(dict.fromkeys(ids), key=_order)
+            for base, ids in buckets.items()
+        }
+
+    @classmethod
+    def get_sibling_instances_from_loaded(cls, model: str, loaded_models: List[str]) -> List[str]:
+        """Return the loaded IDs sharing ``model``'s base, or ``[]`` when it has no real siblings."""
+        family = cls.build_instance_groups(loaded_models).get(cls.normalize_instance_base(model), [])
+        # A family needs at least two members, one of them carrying a numeric
+        # `:#` suffix, before it counts as a set of sibling instances.
+        has_suffixed_member = any(map(cls.has_numeric_instance_suffix, family))
+        if len(family) >= 2 and has_suffixed_member:
+            return family
+        return []
+
+    @classmethod
+    def count_sibling_instances_from_loaded(cls, model: str, loaded_models: List[str]) -> int:
+        """Return the length of ``get_sibling_instances_from_loaded(model, loaded_models)``; 0 means no sibling family."""
+        return len(cls.get_sibling_instances_from_loaded(model, loaded_models))
     
     async def _get_model_semaphore(self, model: str) -> asyncio.Semaphore:
         """
         Get or create semaphore for a specific model.
-        Each model gets its own semaphore (limit=1) to prevent concurrent requests.
+        Each model gets its own semaphore to bound concurrent requests.
         Different models can run in parallel.
         
         Args:
@@ -71,8 +152,9 @@ async def _get_model_semaphore(self, model: str) -> asyncio.Semaphore:
         """
         async with self._semaphore_lock:
             if model not in self._model_semaphores:
-                self._model_semaphores[model] = asyncio.Semaphore(1)
-                logger.debug(f"Created semaphore for model: {model}")
+                limit = max(1, int(system_config.max_model_concurrency_per_model or 1))
+                self._model_semaphores[model] = asyncio.Semaphore(limit)
+                logger.debug(f"Created semaphore for model: {model} (limit={limit})")
             return self._model_semaphores[model]
     
     async def list_models(self) -> List[Dict[str, Any]]:
@@ -151,6 +233,142 @@ async def get_loaded_models(self) -> List[str]:
         except Exception as e:
             logger.error(f"Failed to get loaded models: {e}")
             return []
+
+    async def get_loaded_instance_groups(self, force_refresh: bool = False) -> Dict[str, List[str]]:
+        """Return a copy of the cached base->instances map, refreshed when stale or ``force_refresh`` is set."""
+        started_at = time.monotonic()
+        async with self._instance_registry_lock:
+            cache_age = started_at - self._loaded_instance_cache_at
+            if (
+                not force_refresh
+                and self._loaded_instance_cache_at > 0
+                and cache_age < self.INSTANCE_REGISTRY_TTL_SECONDS
+            ):
+                return {base: [*models] for base, models in self._loaded_instance_groups.items()}
+
+            try:
+                loaded_models = await self.get_loaded_models()
+            except Exception as exc:
+                logger.debug(f"LM Studio instance registry refresh failed: {exc}")
+                loaded_models = []
+
+            self._loaded_instance_groups = self.build_instance_groups(loaded_models)
+            self._loaded_instance_cache_at = time.monotonic()
+            return {base: [*models] for base, models in self._loaded_instance_groups.items()}
+
+    async def count_loaded_sibling_instances(self, model: str, loaded_models: Optional[List[str]] = None) -> int:
+        """Count same-base siblings of ``model`` from ``loaded_models`` or, if omitted, the cached registry."""
+        if loaded_models is not None:
+            return self.count_sibling_instances_from_loaded(model, loaded_models)
+        registry = await self.get_loaded_instance_groups()
+        family = registry.get(self.normalize_instance_base(model), [])
+        # Same rule as get_sibling_instances_from_loaded: two or more members,
+        # at least one with a numeric `:#` suffix; otherwise report zero.
+        if len(family) >= 2 and any(map(self.has_numeric_instance_suffix, family)):
+            return len(family)
+        return 0
+
+    @classmethod
+    def extract_routing_metadata(cls, response: Optional[Dict[str, Any]]) -> Dict[str, Any]:
+        """Return a shallow copy of the routing metadata stored on ``response``, or ``{}``."""
+        if isinstance(response, dict):
+            routing = response.get(cls.ROUTING_METADATA_KEY)
+            if isinstance(routing, dict):
+                return routing.copy()
+        # Non-dict responses and missing/malformed metadata both yield an empty dict.
+        return {}
+
+    def _attach_routing_metadata(
+        self,
+        response: Dict[str, Any],
+        *,
+        requested_model: str,
+        actual_model: str,
+        sibling_instances: Optional[List[str]] = None,
+    ) -> Dict[str, Any]:
+        """Record which instance served the request on ``response`` (mutated in place) and return it."""
+        if isinstance(response, dict):
+            routing = {
+                "requested_model": requested_model,
+                "actual_model": actual_model,
+                "base_model": self.normalize_instance_base(requested_model),
+                "shared_instance": actual_model != requested_model,
+                "sibling_instances": list(sibling_instances or []),
+            }
+            response[self.ROUTING_METADATA_KEY] = routing
+        # Non-dict responses are handed back untouched.
+        return response
+
+    async def _select_completion_model(self, requested_model: str) -> Tuple[str, List[str]]:
+        """
+        Pick the same-base LM Studio instance that should serve a completion.
+
+        Returns ``(selected_model, siblings)`` and counts the selection as in
+        flight. When the registry shows no sibling family for the requested
+        base, the requested ID is the only candidate and ``siblings`` is empty.
+        """
+        registry = await self.get_loaded_instance_groups()
+        requested_base = self.normalize_instance_base(requested_model)
+        siblings = registry.get(requested_base, [])
+        is_family = len(siblings) >= 2 and any(map(self.has_numeric_instance_suffix, siblings))
+        if not is_family:
+            siblings = []
+
+        # With a loaded family, dispatch only to its concrete IDs (this covers an
+        # unsuffixed config when only `base:1`, `base:2` are loaded); otherwise
+        # the requested ID is the sole candidate.
+        candidates = [
+            candidate
+            for candidate in dict.fromkeys(siblings or [requested_model])
+            if self.normalize_instance_base(candidate) == requested_base
+        ] or [requested_model]
+
+        def _instance_number(candidate: str) -> int:
+            # Unsuffixed IDs sort as instance 0.
+            return self.split_numeric_instance_suffix(candidate)[1] or 0
+
+        # The choice and its in-flight increment happen under one lock
+        # acquisition, so the counter read while choosing is the one updated.
+        async with self._inflight_lock:
+            inflight = self._inflight_by_model
+            idle = [
+                candidate for candidate in candidates if inflight.get(candidate, 0) <= 0
+            ]
+            if idle:
+                # Prefer the requested ID when idle, then the lowest instance number.
+                selected_model = min(
+                    idle,
+                    key=lambda candidate: (
+                        candidate != requested_model,
+                        _instance_number(candidate),
+                        candidate,
+                    ),
+                )
+            elif requested_model in candidates:
+                # Everything is busy: queue on the ID the caller asked for.
+                selected_model = requested_model
+            else:
+                # Everything is busy and the requested ID is not among the loaded
+                # candidates: queue on the least-loaded concrete instance.
+                selected_model = min(
+                    candidates,
+                    key=lambda candidate: (
+                        inflight.get(candidate, 0),
+                        _instance_number(candidate),
+                        candidate,
+                    ),
+                )
+            inflight[selected_model] = inflight.get(selected_model, 0) + 1
+            return selected_model, siblings
+
+    async def _release_completion_model(self, actual_model: str) -> None:
+        """Undo one in-flight mark for ``actual_model``, dropping its entry once none remain."""
+        async with self._inflight_lock:
+            remaining = self._inflight_by_model.get(actual_model, 0) - 1
+            if remaining > 0:
+                self._inflight_by_model[actual_model] = remaining
+            else:
+                self._inflight_by_model.pop(actual_model, None)
     
     async def generate_completion(
         self,
@@ -171,22 +389,39 @@ async def generate_completion(
             tools: Optional OpenAI-compatible tool schemas (LM Studio 0.3+).
             tool_choice: Optional tool-choice directive.
         """
+        requested_model = model
         # Get model-specific semaphore (allows different models to run in parallel)
         if skip_semaphore:
             # Direct execution without semaphore
-            return await self._execute_completion_request(
+            response = await self._execute_completion_request(
                 model, messages, temperature, max_tokens, response_format,
                 tools=tools, tool_choice=tool_choice,
             )
+            return self._attach_routing_metadata(
+                response,
+                requested_model=requested_model,
+                actual_model=model,
+                sibling_instances=[],
+            )
         
-        model_semaphore = await self._get_model_semaphore(model)
+        actual_model, sibling_instances = await self._select_completion_model(requested_model)
+        model_semaphore = await self._get_model_semaphore(actual_model)
         
-        # ACQUIRE THIS MODEL'S SEMAPHORE to prevent concurrent requests to same model
-        async with model_semaphore:
-            return await self._execute_completion_request(
-                model, messages, temperature, max_tokens, response_format,
-                tools=tools, tool_choice=tool_choice,
-            )
+        # Bound same-model parallelism so multi-submitter phases can overlap without unbounded fanout.
+        try:
+            async with model_semaphore:
+                response = await self._execute_completion_request(
+                    actual_model, messages, temperature, max_tokens, response_format,
+                    tools=tools, tool_choice=tool_choice,
+                )
+                return self._attach_routing_metadata(
+                    response,
+                    requested_model=requested_model,
+                    actual_model=actual_model,
+                    sibling_instances=sibling_instances,
+                )
+        finally:
+            await self._release_completion_model(actual_model)
     
     async def _execute_completion_request(
         self,
@@ -247,7 +482,8 @@ async def _execute_completion_request(
                 
             except httpx.HTTPStatusError as e:
                 if e.response.status_code == 400:
-                    error_detail = e.response.text if hasattr(e.response, 'text') else str(e)
+                    raw_error_detail = e.response.text if hasattr(e.response, 'text') else str(e)
+                    error_detail = _sanitize_lm_studio_error_text(raw_error_detail)
                     logger.error(
                         f"LM Studio 400 Bad Request (attempt {attempt + 1}/{max_retries + 1}): "
                         f"model={model}, approx_tokens={approx_tokens}, "
@@ -444,7 +680,7 @@ async def test_connection(self) -> bool:
             logger.error(f"Failed to connect to LM Studio: {e}")
             return False
     
-    async def check_availability(self) -> Dict[str, Any]:
+    async def check_availability(self, include_cli_models: bool = False) -> Dict[str, Any]:
         """
         Check if LM Studio server is reachable and has models loaded.
         
@@ -472,13 +708,9 @@ async def check_availability(self) -> Dict[str, Any]:
             # Server is reachable
             result["available"] = True
 
-            # Extract models from the /v1/models response as a reliable fallback.
-            # The `lms ps` CLI is preferred (it returns instance IDs), but the CLI
-            # may be missing from PATH or slow/timing out during startup while
-            # nomic is still loading. In either case we must NOT downgrade a
-            # successful /v1/models response to "no models" — that produces a
-            # phantom "LM Studio Offline" state even though embedding calls
-            # are succeeding.
+            # Extract models from the /v1/models response. Routine availability
+            # checks use HTTP only; the `lms ps` CLI can hang or crash under load
+            # on Windows, so reserve it for explicit diagnostics.
             http_models: List[str] = []
             try:
                 data = response.json()
@@ -490,7 +722,7 @@ async def check_availability(self) -> Dict[str, Any]:
             except Exception as parse_err:
                 logger.debug(f"Could not parse /v1/models response body: {parse_err}")
 
-            cli_models = await self.get_loaded_models()
+            cli_models = await self.get_loaded_models() if include_cli_models else []
 
             if cli_models:
                 models = cli_models
@@ -557,7 +789,6 @@ async def test_model_compatibility(self, model_name: str) -> tuple[bool, str, di
                 "completion_tokens": completion_tokens,
                 "prompt_tokens": prompt_tokens,
                 "content_length": len(content),
-                "content_preview": content[:100] if content else "(empty)"
             }
             
             # Check 1: Empty or whitespace-only response
@@ -581,11 +812,15 @@ async def test_model_compatibility(self, model_name: str) -> tuple[bool, str, di
                 
                 sanitized_content = sanitize_json_response(content)
                 parsed_json = json.loads(sanitized_content)
-                logger.info(f"Model '{model_name}' produced valid JSON: {parsed_json}")
+                logger.info(
+                    "Model '%s' produced valid JSON with keys: %s",
+                    model_name,
+                    sorted(parsed_json.keys()) if isinstance(parsed_json, dict) else type(parsed_json).__name__,
+                )
             except json.JSONDecodeError as json_err:
                 error = f"Model '{model_name}' FAILED to produce valid JSON: {json_err}"
                 logger.error(f"Compatibility test FAILED: {error}")
-                logger.error(f"Response content: {content}")
+                logger.error("Response content redacted (length=%d)", len(content or ""))
                 logger.error(f"Details: {details}")
                 return (False, error, details)
             
diff --git a/backend/shared/log_redaction.py b/backend/shared/log_redaction.py
new file mode 100644
index 0000000..c5a24bc
--- /dev/null
+++ b/backend/shared/log_redaction.py
@@ -0,0 +1,29 @@
+"""
+Small helpers for removing obvious secrets from locally persisted log previews.
+"""
+from __future__ import annotations
+
+import re
+from typing import Any
+
+
+_SECRET_PATTERNS = (
+    re.compile(r"(Bearer\s+)[A-Za-z0-9._~+/=-]+", re.IGNORECASE),
+    re.compile(r'("(?:api[_-]?key|appid|authorization|password|token|secret)"\s*:\s*)"[^"]*"', re.IGNORECASE),
+    re.compile(r"((?:api[_-]?key|appid|authorization|password|token|secret)\s*[=:]\s*)[^\s,&}\]]+", re.IGNORECASE),
+    re.compile(r"\bsk-or-v1-[A-Za-z0-9._~+/=-]+", re.IGNORECASE),
+)
+
+
+def redact_log_text(value: Any, max_chars: int | None = None) -> str:
+    """Mask common credential shapes in ``str(value or "")``, optionally capping the length."""
+
+    def _mask(match: re.Match) -> str:
+        # Keep the captured label/prefix (when the pattern has one); hide the rest.
+        return f"{match.group(1) if match.lastindex else ''}[redacted]"
+
+    text = str(value or "")
+    for pattern in _SECRET_PATTERNS:
+        text = pattern.sub(_mask, text)
+    needs_cap = max_chars is not None and 0 <= max_chars < len(text)
+    return text[:max_chars] + "...[truncated]" if needs_cap else text
diff --git a/backend/shared/model_error_utils.py b/backend/shared/model_error_utils.py
new file mode 100644
index 0000000..d6455b9
--- /dev/null
+++ b/backend/shared/model_error_utils.py
@@ -0,0 +1,39 @@
+"""Helpers for distinguishing model availability failures from ordinary output errors."""
+from __future__ import annotations
+
+from backend.shared.openrouter_client import (
+    CreditExhaustionError,
+    FreeModelExhaustedError,
+    OpenRouterPrivacyPolicyError,
+)
+
+
+_NON_RETRYABLE_MODEL_ERROR_MARKERS = (
+    "account free credits exhausted",
+    "all free model options exhausted",
+    "and no fallback configured",
+    "and no lm studio fallback",
+    "boost requested but no openrouter api key",
+    "free credits exhausted",
+    "no api key is set",
+    "no fallback configured",
+    "no lm studio fallback",
+    "no openrouter api key is available",
+    "openrouter credits exhausted",
+    "openrouter privacy settings are blocking",
+)
+
+
+def is_non_retryable_model_error(exc: Exception) -> bool:
+    """Return True for credit/privacy/missing-fallback failures that should stop the workflow."""
+    fatal_types = (
+        CreditExhaustionError,
+        FreeModelExhaustedError,
+        OpenRouterPrivacyPolicyError,
+    )
+    if isinstance(exc, fatal_types):
+        return True
+    # Any other exception type is classified by marker phrases found in its
+    # lower-cased message.
+    lowered = str(exc).lower()
+    return any(marker in lowered for marker in _NON_RETRYABLE_MODEL_ERROR_MARKERS)
diff --git a/backend/shared/models.py b/backend/shared/models.py
index 2532b4e..dee2328 100644
--- a/backend/shared/models.py
+++ b/backend/shared/models.py
@@ -5,7 +5,12 @@
 from datetime import datetime
 from typing import List, Dict, Optional, Any, Literal
 
-from pydantic import BaseModel, Field
+from pydantic import BaseModel, ConfigDict, Field
+
+DEFAULT_CONTEXT_WINDOW = 131072
+DEFAULT_MAX_OUTPUT_TOKENS = 25000
+DEFAULT_OPENROUTER_REASONING_EFFORT = "auto"
+OpenRouterReasoningEffort = Literal["auto", "xhigh", "high", "medium", "low", "minimal", "none"]
 
 
 class DocumentChunk(BaseModel):
@@ -105,9 +110,11 @@ class ModelConfig(BaseModel):
     model_id: str
     openrouter_model_id: Optional[str] = None  # For OpenRouter (different naming)
     openrouter_provider: Optional[str] = None  # Specific OpenRouter provider (e.g., "Anthropic")
+    openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     lm_studio_fallback_id: Optional[str] = None  # Fallback LM Studio model if OpenRouter fails
-    context_window: int = 131072
-    max_output_tokens: int = 25000
+    context_window: int = DEFAULT_CONTEXT_WINDOW
+    max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    supercharge_enabled: bool = False
 
 
 class BoostConfig(BaseModel):
@@ -116,8 +123,9 @@ class BoostConfig(BaseModel):
     openrouter_api_key: str = ""
     boost_model_id: str = ""  # OpenRouter model to use for boost
     boost_provider: Optional[str] = None  # Specific provider, or None to let OpenRouter choose
-    boost_context_window: int = 131072
-    boost_max_output_tokens: int = 25000
+    boost_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
+    boost_context_window: int = DEFAULT_CONTEXT_WINDOW
+    boost_max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
 
 
 class FreeModelSettings(BaseModel):
@@ -144,9 +152,11 @@ class SubmitterConfig(BaseModel):
     provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     model_id: str  # LM Studio model OR OpenRouter model based on provider
     openrouter_provider: Optional[str] = None  # Specific OpenRouter provider (e.g., "Anthropic")
+    openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     lm_studio_fallback_id: Optional[str] = None  # Fallback LM Studio model if OpenRouter fails
-    context_window: int = 131072
-    max_output_tokens: int = 25000
+    context_window: int = DEFAULT_CONTEXT_WINDOW
+    max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    supercharge_enabled: bool = False
 
 
 class AggregatorStartRequest(BaseModel):
@@ -157,9 +167,11 @@ class AggregatorStartRequest(BaseModel):
     validator_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     validator_model: str  # LM Studio model OR OpenRouter model based on provider
     validator_openrouter_provider: Optional[str] = None  # Specific OpenRouter provider
+    validator_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     validator_lm_studio_fallback: Optional[str] = None  # Fallback if OpenRouter fails
-    validator_context_size: int = 131072
-    validator_max_output_tokens: int = 25000
+    validator_context_size: int = DEFAULT_CONTEXT_WINDOW
+    validator_max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    validator_supercharge_enabled: bool = False
     uploaded_files: List[str] = Field(default_factory=list)
 
 
@@ -280,30 +292,38 @@ class CompilerStartRequest(BaseModel):
     validator_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     validator_model: str
     validator_openrouter_provider: Optional[str] = None
+    validator_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     validator_lm_studio_fallback: Optional[str] = None
-    validator_context_size: int = 131072
-    validator_max_output_tokens: int = 25000
+    validator_context_size: int = DEFAULT_CONTEXT_WINDOW
+    validator_max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    validator_supercharge_enabled: bool = False
     # High-context submitter config
     high_context_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     high_context_model: str
     high_context_openrouter_provider: Optional[str] = None
+    high_context_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     high_context_lm_studio_fallback: Optional[str] = None
-    high_context_context_size: int = 131072
-    high_context_max_output_tokens: int = 25000
+    high_context_context_size: int = DEFAULT_CONTEXT_WINDOW
+    high_context_max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    high_context_supercharge_enabled: bool = False
     # High-param submitter config
     high_param_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     high_param_model: str
     high_param_openrouter_provider: Optional[str] = None
+    high_param_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     high_param_lm_studio_fallback: Optional[str] = None
-    high_param_context_size: int = 131072
-    high_param_max_output_tokens: int = 25000
+    high_param_context_size: int = DEFAULT_CONTEXT_WINDOW
+    high_param_max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    high_param_supercharge_enabled: bool = False
     # Critique submitter config
     critique_submitter_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     critique_submitter_model: str
     critique_submitter_openrouter_provider: Optional[str] = None
+    critique_submitter_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     critique_submitter_lm_studio_fallback: Optional[str] = None
-    critique_submitter_context_window: int = 131072
-    critique_submitter_max_tokens: int = 25000
+    critique_submitter_context_window: int = DEFAULT_CONTEXT_WINDOW
+    critique_submitter_max_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    critique_submitter_supercharge_enabled: bool = False
 
 
 # ============================================================================
@@ -331,7 +351,7 @@ class PaperMetadata(BaseModel):
     word_count: int = 0
     source_brainstorm_ids: List[str] = Field(default_factory=list)
     referenced_papers: List[str] = Field(default_factory=list)
-    status: Literal["in_progress", "complete", "archived"] = "complete"
+    status: Literal["in_progress", "complete", "archived", "pruned"] = "complete"
     created_at: datetime = Field(default_factory=datetime.now)
     # Per-paper model tracking: model_id -> API call count
     model_usage: Optional[Dict[str, int]] = None
@@ -339,6 +359,10 @@ class PaperMetadata(BaseModel):
     generation_date: Optional[datetime] = None
     # Wolfram Alpha verification count (tracked separately from LLM API calls)
     wolfram_calls: Optional[int] = None
+    # Pruned papers are preserved for users but excluded from all model context.
+    pruned_at: Optional[datetime] = None
+    pruned_reason: Optional[str] = None
+    pruned_by: Optional[Literal["system", "user", "legacy"]] = None
 
 
 class TopicSelectionSubmission(BaseModel):
@@ -422,6 +446,7 @@ class AutonomousResearchState(BaseModel):
     total_brainstorms_completed: int = 0
     total_papers_completed: int = 0
     total_papers_archived: int = 0
+    total_papers_pruned: int = 0
     total_submissions_accepted: int = 0
     total_submissions_rejected: int = 0
     topic_selection_rejections: int = 0
@@ -438,30 +463,38 @@ class AutonomousResearchStartRequest(BaseModel):
     validator_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     validator_model: str
     validator_openrouter_provider: Optional[str] = None
+    validator_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     validator_lm_studio_fallback: Optional[str] = None
-    validator_context_window: int = 131072
-    validator_max_tokens: int = 25000
+    validator_context_window: int = DEFAULT_CONTEXT_WINDOW
+    validator_max_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    validator_supercharge_enabled: bool = False
     # Compiler high-context settings (separate from aggregator submitters)
     high_context_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     high_context_model: str = ""  # Empty string allowed, will use submitter model as fallback
     high_context_openrouter_provider: Optional[str] = None
+    high_context_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     high_context_lm_studio_fallback: Optional[str] = None
-    high_context_context_window: int = 131072
-    high_context_max_tokens: int = 25000
+    high_context_context_window: int = DEFAULT_CONTEXT_WINDOW
+    high_context_max_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    high_context_supercharge_enabled: bool = False
     # Compiler high-param settings
     high_param_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     high_param_model: str = ""  # Empty string allowed, will use submitter model as fallback
     high_param_openrouter_provider: Optional[str] = None
+    high_param_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     high_param_lm_studio_fallback: Optional[str] = None
-    high_param_context_window: int = 131072
-    high_param_max_tokens: int = 25000
+    high_param_context_window: int = DEFAULT_CONTEXT_WINDOW
+    high_param_max_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    high_param_supercharge_enabled: bool = False
     # Critique submitter settings
     critique_submitter_provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     critique_submitter_model: str = ""  # For critique generation and rewrite decisions (uses high_context if empty)
     critique_submitter_openrouter_provider: Optional[str] = None
+    critique_submitter_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     critique_submitter_lm_studio_fallback: Optional[str] = None
-    critique_submitter_context_window: int = 131072
-    critique_submitter_max_tokens: int = 25000
+    critique_submitter_context_window: int = DEFAULT_CONTEXT_WINDOW
+    critique_submitter_max_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    critique_submitter_supercharge_enabled: bool = False
     # Tier 3 Final Answer settings
     tier3_enabled: bool = False  # Default OFF — system stops at Tier 2 paper library
 
@@ -520,9 +553,11 @@ class ProofRoleConfigSnapshot(BaseModel):
     provider: Literal["lm_studio", "openrouter"] = "lm_studio"
     model_id: str = ""
     openrouter_provider: Optional[str] = None
+    openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
     lm_studio_fallback_id: Optional[str] = None
-    context_window: int = 131072
-    max_output_tokens: int = 25000
+    context_window: int = DEFAULT_CONTEXT_WINDOW
+    max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS
+    supercharge_enabled: bool = False
 
 
 class ProofRuntimeConfigSnapshot(BaseModel):
@@ -555,7 +590,9 @@ class ProofAttemptFeedback(BaseModel):
     reasoning: str = ""
     lean_code: str = ""
     error_output: str = ""
+    diagnostic_output: str = ""
     goal_states: str = ""
+    raw_stderr: str = ""
     strategy: Literal["full_script", "tactic_script"] = "full_script"
     tactic_trace: List[str] = Field(default_factory=list)
     success: bool = False
@@ -568,7 +605,7 @@ class ProofRecord(BaseModel):
     theorem_statement: str
     theorem_name: str = ""
     formal_sketch: str = ""
-    source_type: Literal["brainstorm", "paper"]
+    source_type: Literal["brainstorm", "paper", "leanoj_subproof", "leanoj_final"]
     source_id: str
     source_title: str = ""
     solver: str = "Lean 4"
@@ -610,19 +647,143 @@ class ProofCheckRequest(BaseModel):
     """Request body for manually triggering a proof check."""
     source_type: Literal["brainstorm", "paper"]
     source_id: str
+    proof_runtime_config: Optional[Dict[str, Any]] = None
 
 
 class ProofSettingsUpdateRequest(BaseModel):
     """Request body for updating runtime Lean 4 proof settings."""
+    model_config = ConfigDict(extra="forbid")
+
     enabled: bool
     timeout: int = Field(default=120, ge=10, le=3600)
     lean4_lsp_enabled: Optional[bool] = None
     lean4_lsp_idle_timeout: Optional[int] = Field(default=None, ge=60, le=7200)
     smt_enabled: Optional[bool] = None
-    z3_path: Optional[str] = None
     smt_timeout: Optional[int] = Field(default=None, ge=1, le=600)
 
 
+# ============================================================================
+# LEANOJ PROOF SOLVER MODELS
+# ============================================================================
+
+
+class LeanOJRoleConfig(BaseModel):
+    """Model/runtime configuration for one LeanOJ proof-solver role."""
+    provider: Literal["lm_studio", "openrouter"] = "lm_studio"  # only these two backend names validate
+    model_id: str = ""  # NOTE(review): blank is accepted by this model; confirm callers reject an empty id
+    openrouter_provider: Optional[str] = None  # None by default; presumably only meaningful for "openrouter" - confirm
+    openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
+    lm_studio_fallback_id: Optional[str] = None
+    context_window: int = DEFAULT_CONTEXT_WINDOW  # plain int: no lower/upper bound is enforced here
+    max_output_tokens: int = DEFAULT_MAX_OUTPUT_TOKENS  # plain int: no lower/upper bound is enforced here
+    supercharge_enabled: bool = False  # off unless the request opts in
+
+
+class LeanOJStartRequest(BaseModel):
+    """Request to start the LeanOJ proof-solver mode (role configs without a default are required)."""
+    user_prompt: str
+    lean_template: str
+    topic_generator: LeanOJRoleConfig
+    topic_validator: LeanOJRoleConfig
+    brainstorm_submitters: List[LeanOJRoleConfig] = Field(..., min_length=1, max_length=10)  # required: a list default is not validated, so it bypassed min_length=1
+    brainstorm_validator: LeanOJRoleConfig
+    path_decider: LeanOJRoleConfig = Field(default_factory=LeanOJRoleConfig)  # optional; falls back to an all-default role config
+    final_solver: LeanOJRoleConfig
+    max_initial_brainstorm_accepts: int = Field(default=30, ge=1, le=200)
+    max_recursive_brainstorm_accepts: int = Field(default=10, ge=1, le=100)
+    final_attempts_per_cycle: int = Field(default=30, ge=30, le=200)  # NOTE(review): floor equals the default (siblings use ge=1) - confirm intended
+
+
+class LeanOJAttemptRecord(BaseModel):
+    """One Lean 4 attempt made by the LeanOJ solver."""
+    attempt: int  # required; NOTE(review): presumably a running attempt counter - confirm the base (0 or 1) with the writer
+    target: Literal["subproof", "final"]  # required; only these two values validate
+    request: str = ""
+    lean_code: str = ""
+    success: bool = False  # records default to "not successful" until set otherwise
+    error_output: str = ""
+    reasoning: str = ""
+    created_at: datetime = Field(default_factory=datetime.now)  # naive local time taken when the record is instantiated
+
+
+class LeanOJSubproofRecord(BaseModel):
+    """Verified or exhausted subproof produced during one LeanOJ run."""
+    subproof_id: str  # required
+    request: str  # required
+    role: str = ""
+    theorem_or_lemma: str = ""
+    verified: bool = False  # defaults to unverified
+    lean_code: str = ""
+    lean_feedback: str = ""
+    attempts_used: int = 0
+    error_summary: str = ""
+    proof_id: str = ""  # NOTE(review): presumably links to a stored ProofRecord when non-empty - confirm
+    novel: bool = False
+    novelty_tier: str = "not_novel"  # free-form str; this model does not restrict the tier names
+    novelty_reasoning: str = ""
+    created_at: datetime = Field(default_factory=datetime.now)  # naive local time taken when the record is instantiated
+
+
+class LeanOJState(BaseModel):
+    """Current state snapshot for LeanOJ proof-solver mode."""
+    is_running: bool = False
+    phase: Literal[
+        "idle",
+        "initial_topic_candidates",
+        "initial_brainstorm",
+        "path_decision",
+        "recursive_brainstorm",
+        "proof_storm",
+        "final_proof_loop",
+        "verified",
+        "stopped",
+        "error",
+    ] = "idle"  # validated against the names listed above
+    last_active_phase: str = ""  # plain str: not validated against the phase Literal
+    active_brainstorm_phase: str = ""  # plain str: not validated against the phase Literal
+    active_brainstorm_start_count: int = 0
+    session_id: str = ""
+    selected_topic: str = ""
+    current_path_decision: str = ""
+    accepted_brainstorm_count: int = 0
+    rejected_brainstorm_count: int = 0
+    brainstorm_acceptance_events: int = 0
+    active_brainstorm_last_sufficiency_check_count: int = 0
+    active_brainstorm_last_prune_review_count: int = 0
+    brainstorm_prune_reviews_performed: int = 0
+    brainstorm_prune_operations_applied: int = 0
+    recursive_cycle_count: int = 0
+    verified_subproofs: List[LeanOJSubproofRecord] = Field(default_factory=list)  # factory gives each state its own list
+    failed_subproofs: List[LeanOJSubproofRecord] = Field(default_factory=list)  # factory gives each state its own list
+    final_attempt_count: int = 0
+    final_solution: str = ""
+    final_proof_id: str = ""
+    final_novel: bool = False
+    final_novelty_tier: str = "not_novel"  # free-form str; no enumerated tier set is enforced here
+    final_novelty_reasoning: str = ""
+    master_proof_initialized: bool = False
+    master_proof_version: int = 0
+    master_proof_hash: str = ""
+    master_proof_line_count: int = 0
+    master_proof_char_count: int = 0
+    master_proof_last_edit_summary: str = ""
+    master_proof_last_stuck_reason: str = ""
+    master_proof_old_attempt_before_redo_version: int = 0
+    master_proof_old_attempt_before_redo_hash: str = ""
+    master_proof_old_attempt_before_redo_line_count: int = 0
+    master_proof_old_attempt_before_redo_char_count: int = 0
+    master_proof_old_attempt_before_redo_summary: str = ""
+    master_proof_old_attempt_before_redo_validator_justification: str = ""
+    master_proof_old_attempt_before_redo_apparent_issue: str = ""
+    master_proof_last_shortening_approval_justification: str = ""
+    master_proof_last_shortening_apparent_issue: str = ""
+    last_error: str = ""
+    skip_brainstorm_requested: bool = False
+    force_brainstorm_requested: bool = False
+    user_forced_final_cycle: bool = False
+    updated_at: datetime = Field(default_factory=datetime.now)  # naive local time set at instantiation; nothing in this model refreshes it on mutation
+
+
 # ============================================================================
 # TIER 3: FINAL ANSWER MODELS (Part 3 - Final Answer Generation)
 # ============================================================================
@@ -829,4 +990,6 @@ class CritiqueRequest(BaseModel):
     validator_context_window: Optional[int] = None
     validator_max_tokens: Optional[int] = None
     validator_provider: Optional[str] = None  # "lm_studio" or "openrouter"
-    validator_openrouter_provider: Optional[str] = None  # Specific provider like "Anthropic"
\ No newline at end of file
+    validator_openrouter_provider: Optional[str] = None  # Specific provider like "Anthropic"
+    validator_openrouter_reasoning_effort: OpenRouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT
+    validator_supercharge_enabled: bool = False
\ No newline at end of file
diff --git a/backend/shared/openrouter_client.py b/backend/shared/openrouter_client.py
index 60c4bdf..d034b11 100644
--- a/backend/shared/openrouter_client.py
+++ b/backend/shared/openrouter_client.py
@@ -8,12 +8,38 @@
 import asyncio
 import json
 import logging
+import re
 import time
 from typing import List, Dict, Any, Optional
 
+from backend.shared.config import system_config
+
 logger = logging.getLogger(__name__)
 
 
+_PROVIDER_SECRET_PATTERNS = (
+    re.compile(r"Bearer\s+[A-Za-z0-9._~+/=-]+", re.IGNORECASE),  # bearer tokens
+    re.compile(r'("(?:api[_-]?key|appid|authorization|token|secret)"\s*:\s*)"[^"]*"', re.IGNORECASE),  # quoted JSON fields
+    re.compile(r"((?:api[_-]?key|appid|authorization|token|secret)\s*[=:]\s*)[^\s,&}]+", re.IGNORECASE),  # key=value / key: value
+)
+
+
+def sanitize_provider_error_text(value: Any, max_chars: int = 500) -> str:
+    """Return ``value`` as text with secrets and echoed prompts redacted, cut to ``max_chars`` plus a truncation marker."""
+    text = str(value or "")
+    for pattern in _PROVIDER_SECRET_PATTERNS:
+        text = pattern.sub(lambda match: f"{match.group(1) if match.lastindex else 'Bearer '}[redacted]", text)
+
+    # Provider error pages occasionally echo request JSON. Redact greedily through the LAST "]" and honour
+    # escaped quotes: content often contains "]" or \" itself, and a lazy match would leak the remainder.
+    text = re.sub(r'("messages"\s*:\s*)\[[\s\S]*\]', r'\1[redacted]', text, flags=re.IGNORECASE)
+    text = re.sub(r'("prompt"\s*:\s*)"(?:\\[\s\S]|[^"\\])*"', r'\1"[redacted]"', text, flags=re.IGNORECASE)
+
+    if len(text) > max_chars:
+        return text[:max_chars] + "...[truncated]"
+    return text
+
+
 class OpenRouterClient:
     """Client for OpenRouter API."""
     
@@ -21,6 +47,9 @@ class OpenRouterClient:
     MAX_RETRIES = 3
     RETRY_DELAY = 2.0  # seconds
     RATE_LIMIT_COOLDOWN = 3600.0  # 1 hour in seconds
+    AUTO_IGNORED_PROVIDERS = ("Venice",)
+    HIGHEST_REASONING_EFFORT = "xhigh"
+    REASONING_EFFORT_LEVELS = {"xhigh", "high", "medium", "low", "minimal", "none"}
     
     # Per-model semaphores for rate limiting
     _model_semaphores: Dict[str, asyncio.Semaphore] = {}
@@ -50,7 +79,7 @@ def __init__(self, api_key: str):
     async def _get_model_semaphore(self, model: str) -> asyncio.Semaphore:
         """
         Get or create semaphore for a specific model.
-        Each model gets its own semaphore (limit=1) to prevent concurrent requests.
+        Each model gets its own semaphore to bound concurrent requests.
         
         Args:
             model: Model name/identifier
@@ -60,8 +89,9 @@ async def _get_model_semaphore(self, model: str) -> asyncio.Semaphore:
         """
         async with self._semaphore_lock:
             if model not in self._model_semaphores:
-                self._model_semaphores[model] = asyncio.Semaphore(1)
-                logger.debug(f"Created semaphore for OpenRouter model: {model}")
+                limit = max(1, int(system_config.max_model_concurrency_per_model or 1))
+                self._model_semaphores[model] = asyncio.Semaphore(limit)
+                logger.debug(f"Created semaphore for OpenRouter model: {model} (limit={limit})")
             return self._model_semaphores[model]
     
     def _is_free_model(self, model: str) -> bool:
@@ -329,6 +359,7 @@ async def generate_completion(
         max_tokens: Optional[int] = None,
         response_format: Optional[Dict[str, str]] = None,
         provider: Optional[str] = None,
+        reasoning_effort: Optional[str] = None,
         tools: Optional[List[Dict[str, Any]]] = None,
         tool_choice: Optional[Any] = None,
     ) -> Dict[str, Any]:
@@ -342,6 +373,7 @@ async def generate_completion(
             max_tokens: Maximum tokens to generate
             response_format: Optional response format constraints
             provider: Optional specific provider to use (None lets OpenRouter choose)
+            reasoning_effort: Optional OpenRouter reasoning effort (auto/xhigh/high/medium/low/minimal/none).
             tools: Optional OpenAI-compatible tool schemas the model may call.
             tool_choice: Optional tool-choice directive (e.g. "auto", "none",
                 or ``{"type": "function", "function": {"name": "..."}}``).
@@ -355,7 +387,7 @@ async def generate_completion(
         """
         model_semaphore = await self._get_model_semaphore(model)
         
-        # ACQUIRE THIS MODEL'S SEMAPHORE to prevent concurrent requests
+        # Bound same-model parallelism so multi-submitter phases can overlap without unbounded fanout.
         async with model_semaphore:
             return await self._execute_completion_request(
                 model,
@@ -364,6 +396,7 @@ async def generate_completion(
                 max_tokens,
                 response_format,
                 provider,
+                reasoning_effort,
                 tools=tools,
                 tool_choice=tool_choice,
             )
@@ -392,6 +425,31 @@ def _is_reasoning_model_without_temperature(self, model: str) -> bool:
         ]
         
         return any(pattern in model_lower for pattern in reasoning_model_patterns)
+
+    def _build_reasoning_config(self, reasoning_effort: Optional[str]) -> Optional[Dict[str, str]]:
+        """
+        Translate an effort setting into OpenRouter's normalized ``reasoning`` payload.
+
+        ``None`` or blank input yields ``None``. ``auto`` deliberately means
+        maximum reasoning for this app; unknown values are logged and are
+        also treated as maximum.
+        """
+        normalized = "" if reasoning_effort is None else str(reasoning_effort).strip().lower()
+        if not normalized:
+            return None
+
+        # Aliases collapse onto canonical levels before the membership check below.
+        aliases = {
+            **dict.fromkeys(("auto", "max", "maximum", "highest"), self.HIGHEST_REASONING_EFFORT),
+            **dict.fromkeys(("off", "disabled", "disable"), "none"),
+        }
+        normalized = aliases.get(normalized, normalized)
+
+        if normalized not in self.REASONING_EFFORT_LEVELS:
+            logger.warning("Unknown OpenRouter reasoning effort '%s'; defaulting to max", reasoning_effort)
+            normalized = self.HIGHEST_REASONING_EFFORT
+
+        return {"effort": normalized}
     
     async def _execute_completion_request(
         self,
@@ -401,6 +459,7 @@ async def _execute_completion_request(
         max_tokens: Optional[int],
         response_format: Optional[Dict[str, str]],
         provider: Optional[str] = None,
+        reasoning_effort: Optional[str] = None,
         tools: Optional[List[Dict[str, Any]]] = None,
         tool_choice: Optional[Any] = None,
     ) -> Dict[str, Any]:
@@ -433,15 +492,17 @@ async def _execute_completion_request(
         else:
             logger.debug(f"Skipping temperature parameter for reasoning model: {model}")
         
-        # Set max_tokens if provided
-        if max_tokens is None:
-            max_tokens = 25000  # Default for reasoning models
-            logger.debug(f"Auto-limiting max_tokens to {max_tokens}")
-        
-        payload["max_tokens"] = max_tokens
+        if max_tokens is not None:
+            payload["max_tokens"] = max_tokens
+        else:
+            logger.debug("No max_tokens supplied; letting OpenRouter/model defaults apply")
         
         if response_format:
             payload["response_format"] = response_format
+
+        reasoning_config = self._build_reasoning_config(reasoning_effort)
+        if reasoning_config:
+            payload["reasoning"] = reasoning_config
         
         # OpenAI-compatible tool calling: pass tools + tool_choice straight
         # through to OpenRouter. Providers that do not support tools tend to
@@ -454,8 +515,16 @@ async def _execute_completion_request(
         
         # Add provider routing if specified
         if provider:
-            payload["provider"] = {"order": [provider]}
+            payload["provider"] = {
+                "order": [provider],
+                "allow_fallbacks": False,
+            }
             logger.debug(f"Using specific provider: {provider}")
+        elif self.AUTO_IGNORED_PROVIDERS:
+            payload["provider"] = {
+                "ignore": list(self.AUTO_IGNORED_PROVIDERS),
+            }
+            logger.debug(f"Ignoring weak OpenRouter auto-routing providers: {self.AUTO_IGNORED_PROVIDERS}")
         
         # NOTE: Stop sequences were removed because they caused premature truncation
         # with certain models (e.g., Grok 4.1). Models will now generate until max_tokens
@@ -472,7 +541,7 @@ async def _execute_completion_request(
                 
                 # Check for credit exhaustion (402 Payment Required)
                 if response.status_code == 402:
-                    error_text = response.text
+                    error_text = sanitize_provider_error_text(response.text)
                     logger.error(
                         f"OpenRouter credit exhaustion detected (402): {error_text}"
                     )
@@ -496,7 +565,7 @@ async def _execute_completion_request(
                         body_text = response.text or ""
                     except Exception:
                         body_text = ""
-                    body_preview = body_text[:500]
+                    body_preview = sanitize_provider_error_text(body_text)
                     content_type = response.headers.get("content-type", "") if hasattr(response, "headers") else ""
                     logger.error(
                         f"OpenRouter returned non-JSON body (status={response.status_code}, "
@@ -529,7 +598,7 @@ async def _execute_completion_request(
                 raise
                 
             except httpx.HTTPStatusError as e:
-                error_detail = e.response.text if hasattr(e.response, 'text') else str(e)
+                error_detail = sanitize_provider_error_text(e.response.text if hasattr(e.response, 'text') else str(e))
                 
                 # Check for rate limit (429 Too Many Requests)
                 if e.response.status_code == 429:
@@ -667,7 +736,7 @@ async def get_embeddings(self, texts: List[str], model: str = None) -> List[List
             
             # Check for credit exhaustion (402 Payment Required)
             if response.status_code == 402:
-                error_text = response.text
+                error_text = sanitize_provider_error_text(response.text)
                 logger.error(f"OpenRouter credit exhaustion for embeddings (402): {error_text}")
                 raise CreditExhaustionError("OpenRouter credits exhausted for embeddings")
             
@@ -680,7 +749,7 @@ async def get_embeddings(self, texts: List[str], model: str = None) -> List[List
                     body_text = response.text or ""
                 except Exception:
                     body_text = ""
-                body_preview = body_text[:500]
+                body_preview = sanitize_provider_error_text(body_text)
                 content_type = response.headers.get("content-type", "") if hasattr(response, "headers") else ""
                 logger.error(
                     f"OpenRouter embeddings returned non-JSON body (status={response.status_code}, "
@@ -712,7 +781,7 @@ async def get_embeddings(self, texts: List[str], model: str = None) -> List[List
             raise
         
         except httpx.HTTPStatusError as e:
-            error_detail = e.response.text if hasattr(e.response, 'text') else str(e)
+            error_detail = sanitize_provider_error_text(e.response.text if hasattr(e.response, 'text') else str(e))
             
             # Check for rate limit (429 Too Many Requests)
             if e.response.status_code == 429:
diff --git a/backend/shared/smt_client.py b/backend/shared/smt_client.py
index e056829..1429c89 100644
--- a/backend/shared/smt_client.py
+++ b/backend/shared/smt_client.py
@@ -18,6 +18,8 @@
 class SmtClient:
     """Thin async wrapper around an external Z3 binary."""
 
+    _ALLOWED_EXECUTABLE_NAMES = {"z3", "z3.exe"}
+
     def __init__(self, z3_path: str, timeout: int) -> None:
         self.z3_path = str(z3_path or "").strip()
         self.timeout = max(int(timeout or 0), 1)
@@ -25,14 +27,15 @@ def __init__(self, z3_path: str, timeout: int) -> None:
     def _resolve_executable(self) -> str:
         if self.z3_path:
             candidate = Path(self.z3_path).resolve()
-            if candidate.exists():
+            if candidate.exists() and candidate.name.lower() in self._ALLOWED_EXECUTABLE_NAMES:
                 return str(candidate)
+            raise RuntimeError("Configured Z3 path must point to a z3 executable.")
 
         for name in ("z3", "z3.exe"):
             resolved = shutil.which(name)
             if resolved:
                 return resolved
-        return self.z3_path or "z3"
+        return "z3"
 
     async def _run_process(
         self,
diff --git a/backend/shared/wolfram_alpha_client.py b/backend/shared/wolfram_alpha_client.py
index 5acabde..982710e 100644
--- a/backend/shared/wolfram_alpha_client.py
+++ b/backend/shared/wolfram_alpha_client.py
@@ -48,12 +48,12 @@ async def query(self, question: str) -> Optional[str]:
                 "i": question
             }
             
-            logger.info(f"Querying Wolfram Alpha: {question[:100]}")
+            logger.info("Querying Wolfram Alpha (query_len=%d)", len(question or ""))
             response = await self.client.get(self.BASE_URL, params=params)
             
             if response.status_code == 200:
                 result = response.text.strip()
-                logger.info(f"Wolfram Alpha success: {result[:200]}")
+                logger.info("Wolfram Alpha success (result_len=%d)", len(result))
                 return result
             elif response.status_code == 401:
                 logger.warning("Wolfram Alpha: Invalid API key (401)")
@@ -62,14 +62,14 @@ async def query(self, question: str) -> Optional[str]:
                 logger.warning("Wolfram Alpha: API key forbidden or rate limited (403)")
                 return None
             elif response.status_code == 501:
-                logger.warning(f"Wolfram Alpha: Could not interpret query (501): {question}")
+                logger.warning("Wolfram Alpha: Could not interpret query (501; query_len=%d)", len(question or ""))
                 return None
             else:
                 logger.warning(f"Wolfram Alpha query failed: status {response.status_code}")
                 return None
                 
         except httpx.TimeoutException:
-            logger.warning(f"Wolfram Alpha query timeout after 30s: {question[:100]}")
+            logger.warning("Wolfram Alpha query timeout after 30s (query_len=%d)", len(question or ""))
             return None
         except Exception as e:
             logger.error(f"Wolfram Alpha API error: {e}", exc_info=True)
diff --git a/backend/shared/workflow_start_guard.py b/backend/shared/workflow_start_guard.py
new file mode 100644
index 0000000..1b11437
--- /dev/null
+++ b/backend/shared/workflow_start_guard.py
@@ -0,0 +1,23 @@
+"""
+Process-wide guard for mutually exclusive top-level workflow starts.
+"""
+from __future__ import annotations
+
+import asyncio
+from contextlib import asynccontextmanager
+from typing import AsyncIterator
+
+
+class WorkflowStartGuard:
+    """Serialize conflict checks and startup side effects across top-level modes."""
+
+    def __init__(self) -> None:
+        self._lock = asyncio.Lock()  # NOTE(review): before Python 3.10 a Lock binds to the loop current at construction - confirm runtime version
+
+    @asynccontextmanager
+    async def reserve(self) -> AsyncIterator[None]:
+        async with self._lock:  # held for the caller's whole ``async with`` body; released on exit, including on error
+            yield
+
+
+workflow_start_guard = WorkflowStartGuard()
diff --git a/frontend/index.html b/frontend/index.html
index 5b7a03d..096b2b6 100644
--- a/frontend/index.html
+++ b/frontend/index.html
@@ -3,7 +3,7 @@
   <head>
     <meta charset="UTF-8" />
     <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-    <title>ASI Aggregator System</title>
+    <title>MOTO Autonomous ASI</title>
   </head>
   <body>
     <div id="root"></div>
diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index 389caa3..2bee959 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.7",
+  "version": "1.0.8",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "asi-aggregator-frontend",
-      "version": "1.0.7",
+      "version": "1.0.8",
       "license": "MIT",
       "dependencies": {
         "dompurify": "^3.2.4",
diff --git a/frontend/package.json b/frontend/package.json
index 90b3c08..6f9e4e4 100644
--- a/frontend/package.json
+++ b/frontend/package.json
@@ -1,6 +1,6 @@
 {
   "name": "asi-aggregator-frontend",
-  "version": "1.0.7",
+  "version": "1.0.8",
   "description": "Frontend UI for MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "author": "Intrafere LLC",
   "license": "MIT",
diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx
index 56a16aa..ff19b56 100644
--- a/frontend/src/App.jsx
+++ b/frontend/src/App.jsx
@@ -19,6 +19,15 @@ import {
   MathematicalProofs,
   ProofLibrary
 } from './components/autonomous';
+import {
+  LeanOJBrainstorms,
+  LeanOJInterface,
+  LeanOJLogs,
+  LeanOJMasterProof,
+  LeanOJMathematicalProofs,
+  LeanOJProofLibrary,
+  LeanOJSettings,
+} from './components/leanoj';
 import WorkflowPanel from './components/WorkflowPanel';
 import BoostControlModal from './components/BoostControlModal';
 import StartupProviderSetupModal from './components/StartupProviderSetupModal';
@@ -31,7 +40,7 @@ import HungConnectionNotificationStack from './components/HungConnectionNotifica
 import UpdateNotificationBanner from './components/UpdateNotificationBanner';
 import PaperCritiqueModal from './components/PaperCritiqueModal';
 import { websocket } from './services/websocket';
-import { api, autonomousAPI, openRouterAPI } from './services/api';
+import { api, autonomousAPI, leanojAPI, openRouterAPI } from './services/api';
 import {
   LM_STUDIO_STARTUP_CHOICE,
   RECOMMENDED_PROFILE_KEY,
@@ -42,14 +51,27 @@ import {
   settingsToAutonomousConfig,
   persistAutonomousSettings,
 } from './utils/autonomousProfiles';
+import {
+  getStoredLeanOJSettings,
+  persistLeanOJSettings,
+} from './utils/leanojProfiles';
+import {
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+} from './utils/openRouterSelection';
 
 const APP_MODE_STORAGE_KEY = 'appMode';
 const AUTONOMOUS_TAB_STORAGE_KEY = 'autonomousActiveTab';
 const MANUAL_TAB_STORAGE_KEY = 'manualActiveTab';
+const LEANOJ_TAB_STORAGE_KEY = 'leanojActiveTab';
 const COMPLETED_WORKS_SUB_TAB_STORAGE_KEY = 'completedWorksSubTab';
 const LEGACY_SINGLE_PAPER_WRITER_STORAGE_KEY = 'singlePaperWriterExpanded';
+const DEVELOPER_MODE_STORAGE_KEY = 'developerModeSettingsEnabled';
 const EMBEDDING_MODEL_HINTS = ['embed', 'embedding', 'nomic', 'bge', 'e5', 'gte'];
 const AUTONOMOUS_ROLE_PREFIXES = ['validator', 'high_context', 'high_param', 'critique_submitter'];
+const HIGH_SCORE_CRITIQUE_THRESHOLD = 6.25;
+const SEEN_HIGH_SCORE_CRITIQUES_STORAGE_KEY = 'seenHighScoreCritiqueNotifications';
+const MAX_SEEN_HIGH_SCORE_CRITIQUES = 500;
 const DEFAULT_CAPABILITIES = Object.freeze({
   genericMode: false,
   lmStudioEnabled: true,
@@ -60,6 +82,60 @@ const DEFAULT_CAPABILITIES = Object.freeze({
   apiContractVersion: '',
 });
 
+function readDeveloperModeEnabled() { // Reads the persisted developer-mode flag from localStorage.
+  return localStorage.getItem(DEVELOPER_MODE_STORAGE_KEY) === 'true'; // only the exact string 'true' enables it
+}
+
+// Builds the dedupe key "<paperId>:<rating to one decimal>" for a high-score critique popup.
+// Returns null when paperId is falsy or averageRating does not coerce to a finite number.
+function getHighScoreCritiqueNotificationKey(paperId, averageRating) {
+  const numericRating = Number(averageRating);
+  const isUsable = Boolean(paperId) && Number.isFinite(numericRating);
+  return isUsable ? `${paperId}:${numericRating.toFixed(1)}` : null;
+}
+
+// Loads the persisted set of already-seen high-score critique keys from localStorage.
+// Non-array payloads and non-string entries are dropped; a read/parse error is logged and yields an empty Set.
+function readSeenHighScoreCritiques() {
+  if (typeof window === 'undefined') return new Set();
+  try {
+    const stored = window.localStorage.getItem(SEEN_HIGH_SCORE_CRITIQUES_STORAGE_KEY);
+    const parsed = stored ? JSON.parse(stored) : [];
+    const keys = Array.isArray(parsed) ? parsed.filter(entry => typeof entry === 'string') : [];
+    return new Set(keys);
+  } catch (error) {
+    console.warn('Could not read seen high-score critique notifications:', error);
+    return new Set();
+  }
+}
+
+// Saves the seen high-score critique keys to localStorage, keeping only the last
+// MAX_SEEN_HIGH_SCORE_CRITIQUES entries in iteration order. Write failures are logged and ignored.
+function persistSeenHighScoreCritiques(seenSet) {
+  if (typeof window === 'undefined') return;
+  try {
+    const recentKeys = Array.from(seenSet).slice(-MAX_SEEN_HIGH_SCORE_CRITIQUES);
+    const payload = JSON.stringify(recentKeys);
+    window.localStorage.setItem(SEEN_HIGH_SCORE_CRITIQUES_STORAGE_KEY, payload);
+  } catch (error) {
+    console.warn('Could not save seen high-score critique notifications:', error);
+  }
+}
+
+// Returns fresh default configs for aggregator submitters 1-3 (LM Studio provider, no model
+// selected, default context/output limits, supercharge off). New objects are built on every call.
+const createDefaultAggregatorSubmitterConfigs = () => Array.from({ length: 3 }, (_, index) => ({
+  submitterId: index + 1,
+  provider: 'lm_studio',
+  modelId: '',
+  openrouterProvider: null,
+  openrouterReasoningEffort: 'auto',
+  lmStudioFallbackId: null,
+  contextWindow: DEFAULT_CONTEXT_WINDOW,
+  maxOutputTokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  superchargeEnabled: false,
+}));
+
 function normalizeLoadedLmStudioModelId(modelId = '') {
   return String(modelId).replace(/:\d+$/, '');
 }
@@ -106,6 +182,7 @@ function normalizeRuntimeModelConfig(config = {}, lmStudioEnabled) {
     provider: normalizeRuntimeProvider(config.provider, lmStudioEnabled),
     modelId: shouldResetLmState ? '' : (config.modelId || ''),
     openrouterProvider: shouldResetLmState ? null : (config.openrouterProvider || null),
+    openrouterReasoningEffort: config.openrouterReasoningEffort || 'auto',
     lmStudioFallbackId: lmStudioEnabled ? (config.lmStudioFallbackId || null) : null,
   };
 }
@@ -124,6 +201,7 @@ function normalizeAggregatorConfigForCapabilities(config, lmStudioEnabled) {
     validatorOpenrouterProvider: shouldResetValidator
       ? null
       : (config.validatorOpenrouterProvider || null),
+    validatorOpenrouterReasoningEffort: config.validatorOpenrouterReasoningEffort || 'auto',
     validatorLmStudioFallback: lmStudioEnabled ? (config.validatorLmStudioFallback || null) : null,
   };
 }
@@ -149,6 +227,7 @@ function normalizeAutonomousConfigForCapabilities(config, lmStudioEnabled) {
     nextConfig[openRouterProviderKey] = shouldResetRole
       ? null
       : (nextConfig[openRouterProviderKey] || null);
+    nextConfig[`${rolePrefix}_openrouter_reasoning_effort`] = nextConfig[`${rolePrefix}_openrouter_reasoning_effort`] || 'auto';
     nextConfig[fallbackKey] = lmStudioEnabled ? (nextConfig[fallbackKey] || null) : null;
   });
 
@@ -158,7 +237,10 @@ function normalizeAutonomousConfigForCapabilities(config, lmStudioEnabled) {
 function App() {
   const [appMode, setAppMode] = useState(() => {
     const savedMode = localStorage.getItem(APP_MODE_STORAGE_KEY);
-    if (savedMode === 'autonomous' || savedMode === 'manual') {
+    if (savedMode === 'leanoj' && !readDeveloperModeEnabled()) {
+      return 'autonomous';
+    }
+    if (savedMode === 'autonomous' || savedMode === 'manual' || savedMode === 'leanoj') {
       return savedMode;
     }
 
@@ -181,6 +263,9 @@ function App() {
     return saved || 'auto-interface';
   });
   const [manualActiveTab, setManualActiveTab] = useState('aggregator-interface');
+  const [leanojActiveTab, setLeanojActiveTab] = useState(() => {
+    return localStorage.getItem(LEANOJ_TAB_STORAGE_KEY) || 'leanoj-interface';
+  });
   const [completedWorksSubTab, setCompletedWorksSubTab] = useState(() => {
     const savedSubTab = localStorage.getItem(COMPLETED_WORKS_SUB_TAB_STORAGE_KEY);
     if (savedSubTab) return savedSubTab;
@@ -189,7 +274,11 @@ function App() {
     if (savedTab === 'auto-final-answer-library') return 'stage3-history';
     return 'stage2-history';
   });
-  const activeTab = appMode === 'manual' ? manualActiveTab : autonomousActiveTab;
+  const activeTab = appMode === 'manual'
+    ? manualActiveTab
+    : appMode === 'leanoj'
+      ? leanojActiveTab
+      : autonomousActiveTab;
   const shimmerAccentsEnabled = (() => {
     const saved = localStorage.getItem('banner_shimmer_enabled');
     return saved !== null ? JSON.parse(saved) : true;
@@ -233,6 +322,9 @@ function App() {
     const savedState = localStorage.getItem('workflow_panel_collapsed');
     return savedState !== 'false';
   });
+  const [developerModeEnabled, setDeveloperModeEnabled] = useState(() => {
+    return readDeveloperModeEnabled();
+  });
 
   // Update notice banner state (dismissible per session, re-appears on restart)
   const [updateNotice, setUpdateNotice] = useState(null);
@@ -254,9 +346,90 @@ function App() {
     localStorage.setItem(MANUAL_TAB_STORAGE_KEY, manualActiveTab);
   }, [manualActiveTab]);
 
+  useEffect(() => {
+    localStorage.setItem(LEANOJ_TAB_STORAGE_KEY, leanojActiveTab);
+  }, [leanojActiveTab]);
+
   useEffect(() => {
     localStorage.setItem(COMPLETED_WORKS_SUB_TAB_STORAGE_KEY, completedWorksSubTab);
   }, [completedWorksSubTab]);
+
+  useEffect(() => { // When developer mode is off, 'leanoj' app mode is not allowed: fall back to 'autonomous'.
+    if (!developerModeEnabled && appMode === 'leanoj') {
+      setAppMode('autonomous');
+    }
+  }, [developerModeEnabled, appMode]);
+
+  useEffect(() => { // Hidden developer-mode toggle: holding Shift+Z+X together flips developerModeEnabled.
+    const pressedCodes = new Set();
+    let shortcutChordActive = false;
+    // Flip developer mode and persist the new value to localStorage as 'true' / 'false'.
+    const toggleDeveloperMode = () => {
+      setDeveloperModeEnabled((currentValue) => {
+        const nextValue = !currentValue;
+        localStorage.setItem(DEVELOPER_MODE_STORAGE_KEY, String(nextValue));
+        return nextValue;
+      });
+    };
+    // Map a key event to 'Shift', 'KeyZ' or 'KeyX' (matched by event.code or event.key); null for any other key.
+    const getShortcutCode = (event) => {
+      if (event.code?.startsWith('Shift') || event.key === 'Shift') {
+        return 'Shift';
+      }
+      if (event.code === 'KeyZ' || event.key?.toLowerCase() === 'z') {
+        return 'KeyZ';
+      }
+      if (event.code === 'KeyX' || event.key?.toLowerCase() === 'x') {
+        return 'KeyX';
+      }
+      return null;
+    };
+    // True while Shift, Z and X are all tracked as held down.
+    const hasDeveloperShortcutChord = () => (
+      pressedCodes.has('Shift') &&
+      pressedCodes.has('KeyZ') &&
+      pressedCodes.has('KeyX')
+    );
+    // Track the pressed key; toggle once when the chord completes (shortcutChordActive blocks repeat toggles).
+    const handleKeyDown = (event) => {
+      const shortcutCode = getShortcutCode(event);
+      if (!shortcutCode) {
+        return;
+      }
+
+      pressedCodes.add(shortcutCode);
+      if (hasDeveloperShortcutChord() && !shortcutChordActive) {
+        shortcutChordActive = true;
+        event.preventDefault();
+        toggleDeveloperMode();
+      }
+    };
+    // Forget the released key; once the chord is no longer fully held, allow it to fire again.
+    const handleKeyUp = (event) => {
+      const shortcutCode = getShortcutCode(event);
+      if (shortcutCode) {
+        pressedCodes.delete(shortcutCode);
+      }
+      if (!hasDeveloperShortcutChord()) {
+        shortcutChordActive = false;
+      }
+    };
+    // Reset all tracking on window blur; presumably guards against keyup events missed while unfocused.
+    const clearPressedCodes = () => {
+      pressedCodes.clear();
+      shortcutChordActive = false;
+    };
+    // keydown/keyup listeners are registered with useCapture = true; blur uses the default.
+    window.addEventListener('keydown', handleKeyDown, true);
+    window.addEventListener('keyup', handleKeyUp, true);
+    window.addEventListener('blur', clearPressedCodes);
+    // Cleanup removes the same three listeners with matching capture flags.
+    return () => {
+      window.removeEventListener('keydown', handleKeyDown, true);
+      window.removeEventListener('keyup', handleKeyUp, true);
+      window.removeEventListener('blur', clearPressedCodes);
+    };
+  }, []);
   
   // Initialize config from localStorage or use defaults
   // CRITICAL: Read from 'aggregator_settings' (used by AggregatorSettings component)
@@ -268,17 +441,15 @@ function App() {
         const settings = JSON.parse(settingsConfig);
         return {
           userPrompt: settings.userPrompt || '',
-          submitterConfigs: settings.submitterConfigs || [
-            { submitterId: 1, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-            { submitterId: 2, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-            { submitterId: 3, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 }
-          ],
+          submitterConfigs: settings.submitterConfigs || createDefaultAggregatorSubmitterConfigs(),
           validatorModel: settings.validatorModel || '',
           validatorProvider: settings.validatorProvider || 'lm_studio',
           validatorOpenrouterProvider: settings.validatorOpenrouterProvider || null,
+          validatorOpenrouterReasoningEffort: settings.validatorOpenrouterReasoningEffort || 'auto',
           validatorLmStudioFallback: settings.validatorLmStudioFallback || null,
-          validatorContextSize: settings.validatorContextSize || 131072,
-          validatorMaxOutput: settings.validatorMaxOutput || 25000,
+          validatorContextSize: settings.validatorContextSize || DEFAULT_CONTEXT_WINDOW,
+          validatorMaxOutput: settings.validatorMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS,
+          validatorSuperchargeEnabled: Boolean(settings.validatorSuperchargeEnabled),
           uploadedFiles: [],
         };
       } catch (e) {
@@ -293,17 +464,15 @@ function App() {
         const parsed = JSON.parse(savedConfig);
         return {
           userPrompt: parsed.userPrompt || '',
-          submitterConfigs: parsed.submitterConfigs || [
-            { submitterId: 1, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-            { submitterId: 2, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-            { submitterId: 3, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 }
-          ],
+          submitterConfigs: parsed.submitterConfigs || createDefaultAggregatorSubmitterConfigs(),
           validatorModel: parsed.validatorModel || '',
           validatorProvider: parsed.validatorProvider || 'lm_studio',
           validatorOpenrouterProvider: parsed.validatorOpenrouterProvider || null,
+          validatorOpenrouterReasoningEffort: parsed.validatorOpenrouterReasoningEffort || 'auto',
           validatorLmStudioFallback: parsed.validatorLmStudioFallback || null,
-          validatorContextSize: parsed.validatorContextSize || 131072,
-          validatorMaxOutput: parsed.validatorMaxOutput || 25000,
+          validatorContextSize: parsed.validatorContextSize || DEFAULT_CONTEXT_WINDOW,
+          validatorMaxOutput: parsed.validatorMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS,
+          validatorSuperchargeEnabled: Boolean(parsed.validatorSuperchargeEnabled),
           uploadedFiles: [],
         };
       } catch (e) {
@@ -312,17 +481,15 @@ function App() {
     }
     return {
       userPrompt: '',
-      submitterConfigs: [
-        { submitterId: 1, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-        { submitterId: 2, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 },
-        { submitterId: 3, provider: 'lm_studio', modelId: '', openrouterProvider: null, lmStudioFallbackId: null, contextWindow: 131072, maxOutputTokens: 25000 }
-      ],
+      submitterConfigs: createDefaultAggregatorSubmitterConfigs(),
       validatorModel: '',
       validatorProvider: 'lm_studio',
       validatorOpenrouterProvider: null,
+      validatorOpenrouterReasoningEffort: 'auto',
       validatorLmStudioFallback: null,
-      validatorContextSize: 131072,
-      validatorMaxOutput: 25000,
+      validatorContextSize: DEFAULT_CONTEXT_WINDOW,
+      validatorMaxOutput: DEFAULT_MAX_OUTPUT_TOKENS,
+      validatorSuperchargeEnabled: false,
       uploadedFiles: [],
     };
   });
@@ -336,14 +503,16 @@ function App() {
       validatorModel: config.validatorModel,
       validatorProvider: config.validatorProvider,
       validatorOpenrouterProvider: config.validatorOpenrouterProvider,
+      validatorOpenrouterReasoningEffort: config.validatorOpenrouterReasoningEffort,
       validatorLmStudioFallback: config.validatorLmStudioFallback,
       validatorContextSize: config.validatorContextSize,
       validatorMaxOutput: config.validatorMaxOutput,
+      validatorSuperchargeEnabled: config.validatorSuperchargeEnabled,
     };
     // Save to both old and new keys
     localStorage.setItem('aggregatorConfig', JSON.stringify(configToSave));
     localStorage.setItem('aggregator_settings', JSON.stringify(configToSave));
-  }, [config.userPrompt, config.submitterConfigs, config.validatorModel, config.validatorProvider, config.validatorOpenrouterProvider, config.validatorLmStudioFallback, config.validatorContextSize, config.validatorMaxOutput]);
+  }, [config.userPrompt, config.submitterConfigs, config.validatorModel, config.validatorProvider, config.validatorOpenrouterProvider, config.validatorOpenrouterReasoningEffort, config.validatorLmStudioFallback, config.validatorContextSize, config.validatorMaxOutput, config.validatorSuperchargeEnabled]);
 
   // Autonomous mode state
   const [autonomousRunning, setAutonomousRunning] = useState(false);
@@ -353,6 +522,13 @@ function App() {
   const [brainstorms, setBrainstorms] = useState([]);
   const [papers, setPapers] = useState([]);
   const [autonomousStats, setAutonomousStats] = useState(null);
+
+  // LeanOJ mode state
+  const [leanojRunning, setLeanojRunning] = useState(false);
+  const [leanojStatus, setLeanojStatus] = useState(null);
+  const [leanojActivity, setLeanojActivity] = useState([]);
+  const [leanojSettings, setLeanojSettings] = useState(() => getStoredLeanOJSettings());
+  const [leanojProofRefreshToken, setLeanojProofRefreshToken] = useState(0);
   
   // Disclaimer modal state (shows on every app load)
   const [showDisclaimer, setShowDisclaimer] = useState(true);
@@ -386,6 +562,12 @@ function App() {
   const autonomousRunningRef = useRef(autonomousRunning);
   const autonomousTierRef = useRef(autonomousStatus?.current_tier || null);
   const openRouterKeyJustSavedRef = useRef(false);
+  const seenHighScoreCritiquesRef = useRef(null); // Set of notification keys loaded from localStorage
+  const shownHighScoreCritiquesRef = useRef(null); // Set of keys already queued as popups; starts as a copy of the seen set
+  if (seenHighScoreCritiquesRef.current === null) { // lazy init: runs only while the ref is still null
+    seenHighScoreCritiquesRef.current = readSeenHighScoreCritiques();
+    shownHighScoreCritiquesRef.current = new Set(seenHighScoreCritiquesRef.current);
+  }
 
   useEffect(() => {
     autonomousRunningRef.current = autonomousRunning;
@@ -395,6 +577,20 @@ function App() {
     autonomousTierRef.current = autonomousStatus?.current_tier || null;
   }, [autonomousStatus]);
 
+  // Marks a high-score critique notification key as seen and persists the updated
+  // seen set. Does nothing for an empty key or a key that is already recorded.
+  const markHighScoreCritiqueSeen = useCallback((seenKey) => {
+    const seenKeys = seenHighScoreCritiquesRef.current;
+    const alreadyHandled = !seenKey || seenKeys.has(seenKey);
+    if (alreadyHandled) {
+      return;
+    }
+
+    // Mutate the ref-held Set in place, then write it through to storage.
+    seenKeys.add(seenKey);
+    persistSeenHighScoreCritiques(seenKeys);
+  }, []);
+
   // Autonomous config with localStorage persistence
   // CRITICAL: Read from 'autonomous_research_settings' (used by AutonomousResearchSettings component)
   const [autonomousConfig, setAutonomousConfig] = useState(() => {
@@ -416,29 +612,37 @@ function App() {
         validator_lm_studio_fallback: autonomousConfig.validator_lm_studio_fallback,
         validator_context_window: autonomousConfig.validator_context_window,
         validator_max_tokens: autonomousConfig.validator_max_tokens,
+        validator_supercharge_enabled: autonomousConfig.validator_supercharge_enabled,
         high_context_provider: autonomousConfig.high_context_provider,
         high_context_model: autonomousConfig.high_context_model,
         high_context_openrouter_provider: autonomousConfig.high_context_openrouter_provider,
         high_context_lm_studio_fallback: autonomousConfig.high_context_lm_studio_fallback,
         high_context_context_window: autonomousConfig.high_context_context_window,
         high_context_max_tokens: autonomousConfig.high_context_max_tokens,
+        high_context_supercharge_enabled: autonomousConfig.high_context_supercharge_enabled,
         high_param_provider: autonomousConfig.high_param_provider,
         high_param_model: autonomousConfig.high_param_model,
         high_param_openrouter_provider: autonomousConfig.high_param_openrouter_provider,
         high_param_lm_studio_fallback: autonomousConfig.high_param_lm_studio_fallback,
         high_param_context_window: autonomousConfig.high_param_context_window,
         high_param_max_tokens: autonomousConfig.high_param_max_tokens,
+        high_param_supercharge_enabled: autonomousConfig.high_param_supercharge_enabled,
         critique_submitter_provider: autonomousConfig.critique_submitter_provider,
         critique_submitter_model: autonomousConfig.critique_submitter_model,
         critique_submitter_openrouter_provider: autonomousConfig.critique_submitter_openrouter_provider,
         critique_submitter_lm_studio_fallback: autonomousConfig.critique_submitter_lm_studio_fallback,
         critique_submitter_context_window: autonomousConfig.critique_submitter_context_window,
         critique_submitter_max_tokens: autonomousConfig.critique_submitter_max_tokens,
+        critique_submitter_supercharge_enabled: autonomousConfig.critique_submitter_supercharge_enabled,
       },
       tier3Enabled: autonomousConfig.tier3_enabled ?? existingSettings.tier3Enabled ?? false,
     });
   }, [autonomousConfig]);
 
+  useEffect(() => {
+    persistLeanOJSettings(leanojSettings);
+  }, [leanojSettings]);
+
   const syncProviderAvailability = useCallback(async () => {
     let nextCapabilities = DEFAULT_CAPABILITIES;
     try {
@@ -665,6 +869,7 @@ function App() {
         if (status.is_running) {
           console.log('Autonomous research detected as running, syncing state...');
           setAutonomousRunning(true);
+          setAnyWorkflowRunning(true);
         }
       } catch (error) {
         console.error('Failed to check initial autonomous status:', error);
@@ -674,6 +879,69 @@ function App() {
     checkInitialStatus();
   }, []);
 
+  // Recover high-score critique popups from persisted paper metadata. WebSocket
+  // events are best-effort, so a sleeping/closed browser can miss the live event.
+  useEffect(() => {
+    if (!papers || papers.length === 0) {
+      return;
+    }
+    // Collect one notification per paper whose critique_avg is a finite number at or above the threshold.
+    const recoveredNotifications = [];
+    for (const paper of papers) {
+      const averageRating = Number(paper.critique_avg);
+      if (!Number.isFinite(averageRating) || averageRating < HIGH_SCORE_CRITIQUE_THRESHOLD) {
+        continue;
+      }
+      // Skip papers without a usable key or whose key is already in the shown set.
+      const seenKey = getHighScoreCritiqueNotificationKey(paper.paper_id, averageRating);
+      if (!seenKey || shownHighScoreCritiquesRef.current.has(seenKey)) {
+        continue;
+      }
+      // Record the key as shown right away so later runs of this effect do not queue it again.
+      shownHighScoreCritiquesRef.current.add(seenKey);
+      recoveredNotifications.push({
+        id: `critique_recovered_${seenKey}_${Date.now()}`,
+        paper_id: paper.paper_id,
+        paper_title: paper.title || paper.paper_title || paper.paper_id,
+        average_rating: averageRating,
+        timestamp: paper.created_at || new Date().toISOString(),
+        seenKey,
+        recovered: true,
+      });
+    }
+    // Nothing to recover: leave the notification stack untouched.
+    if (recoveredNotifications.length === 0) {
+      return;
+    }
+    // Append to the stack, dropping entries whose seenKey is already present in it.
+    setCritiqueNotifications(prev => {
+      const existingSeenKeys = new Set(prev.map(notification => notification.seenKey).filter(Boolean));
+      const newNotifications = recoveredNotifications.filter(notification => !existingSeenKeys.has(notification.seenKey));
+      if (newNotifications.length === 0) {
+        return prev;
+      }
+      // Keep at most the last three entries; earlier ones are dropped from the front.
+      const newStack = [...prev, ...newNotifications];
+      return newStack.length > 3 ? newStack.slice(-3) : newStack;
+    });
+  }, [papers]);
+
+  // Runs once after mount: fetch the Proof Solver status and mirror a running workflow into state.
+  useEffect(() => {
+    (async () => {
+      try {
+        const initialStatus = await leanojAPI.getStatus();
+        setLeanojStatus(initialStatus);
+        if (initialStatus.is_running) {
+          setLeanojRunning(true);
+          setAnyWorkflowRunning(true);
+        }
+      } catch (error) {
+        console.error('Failed to check initial Proof Solver status:', error);
+      }
+    })();
+  }, []);
+
   // WebSocket connection
   useEffect(() => {
     // Connect to WebSocket
@@ -719,6 +987,33 @@ function App() {
       if (!cleaned) return '';
       return cleaned.length > maxLen ? `${cleaned.slice(0, maxLen)}...` : cleaned;
     };
+    const proofName = (data = {}) => (data.proof_label ? `Proof ${data.proof_label}` : 'Proof'); // "Proof <label>" when a label is present, else "Proof"
+    const proofTarget = (data = {}) => data.theorem_statement || data.theorem_id || ''; // statement preferred, then id, else ''
+    const proofLeanResponse = (data = {}) => { // Lean 4 result line: server text if present, else a verified / not-verified summary
+      const { lean_response: serverText, proof_verified: verified } = data;
+      if (serverText) return serverText;
+      if (verified === true) return 'Lean 4 response: proof verified.';
+      const failure = formatReason(data.error_summary || data.error_output || data.reason || '', 960);
+      return failure ? `Lean 4 response: ${failure} - proof not verified.` : 'Lean 4 response: proof not verified.';
+    };
+    // True when a proof event comes from the LeanOJ workflow, judged by its source_type,
+    // its source_id prefix, or its trigger prefix (missing fields are treated as empty strings).
+    const isLeanOJProofEvent = (data = {}) => {
+      const asText = (value) => String(value || '');
+      const sourceType = asText(data.source_type);
+      return ['leanoj_final', 'leanoj_subproof'].includes(sourceType)
+        || asText(data.source_id).startsWith('leanoj_')
+        || asText(data.trigger).startsWith('leanoj');
+    };
+    // Activity text for proof_check_complete; data.message (via formatReason, limit 220) is appended when non-empty.
+    const formatProofCheckCompleteMessage = (data = {}) => {
+      const verifiedCount = data.verified_count ?? 0;
+      const total = data.total_candidates;
+      const summary = total !== undefined && total !== null
+        ? `Proof check complete: ${verifiedCount}/${total} candidates verified, ${data.novel_count ?? 0} novel`
+        : `Proof check complete: ${verifiedCount} verified`;
+      const extra = formatReason(data.message, 220);
+      return extra ? `${summary} - ${extra}` : summary;
+    };
     
     // Topic exploration events (pre-brainstorm candidate collection)
     unsubscribers.push(websocket.on('topic_exploration_started', (data) => {
@@ -908,7 +1203,7 @@ function App() {
       addActivity({
         event: 'critique_phase_started',
         timestamp: getTimestamp(data),
-        message: `Critique phase started (Paper v${data.paper_version || '?'}, target: ${data.target_critiques || 5} critiques)`,
+        message: `Critique phase started (Paper v${data.paper_version || '?'}, target: ${data.target_critiques || 3} attempts)`,
         data
       });
     }));
@@ -925,20 +1220,11 @@ function App() {
       }
     }));
     
-    unsubscribers.push(websocket.on('body_rewrite_started', (data) => {
+    unsubscribers.push(websocket.on('self_review_appended', (data) => {
       addActivity({
-        event: 'body_rewrite_started',
+        event: 'self_review_appended',
         timestamp: getTimestamp(data),
-        message: `REWRITE PHASE: Total rewrite started for Paper v${data.version || '?'}${data.title_changed ? ' (Title updated)' : ''}`,
-        data
-      });
-    }));
-    
-    unsubscribers.push(websocket.on('partial_revision_complete', (data) => {
-      addActivity({
-        event: 'partial_revision_complete',
-        timestamp: getTimestamp(data),
-        message: `PARTIAL REVISION: Applied ${data.edits_applied || 0} targeted edits (Paper v${data.version || '?'})${data.title_changed ? ' (Title updated)' : ''}`,
+        message: `AI self-review appended (${data.critique_count || 0} accepted critique${data.critique_count === 1 ? '' : 's'})`,
         data
       });
     }));
@@ -947,7 +1233,7 @@ function App() {
       addActivity({
         event: 'critique_phase_ended',
         timestamp: getTimestamp(data),
-        message: `Critique phase complete (${data.decision || 'unknown'})`,
+        message: `Critique phase complete (self-review appended: ${data.self_review_appended ? 'yes' : 'no'})`,
         data
       });
     }));
@@ -1006,96 +1292,70 @@ function App() {
     }));
 
     unsubscribers.push(websocket.on('proof_check_started', (data) => {
-      const prefix = data.trigger === 'manual'
-        ? 'Manual proof check started'
-        : data.trigger === 'retry'
-          ? 'Paper-stage proof retry started'
-          : 'Proof check started';
-      addActivity({
-        event: 'proof_check_started',
-        timestamp: getTimestamp(data),
-        message: `${prefix} for ${data.source_type} ${data.source_id}`,
-        data
-      });
+      setProofRefreshToken((prev) => prev + 1);
     }));
 
     unsubscribers.push(websocket.on('proof_retry_scheduled', (data) => {
-      addActivity({
-        event: 'proof_retry_scheduled',
-        timestamp: getTimestamp(data),
-        message: `Scheduled ${data.count || 0} proof retry candidate(s) for paper ${data.source_id}`,
-        data
-      });
+      setProofRefreshToken((prev) => prev + 1);
     }));
 
     unsubscribers.push(websocket.on('proof_retry_started', (data) => {
-      addActivity({
-        event: 'proof_retry_started',
-        timestamp: getTimestamp(data),
-        message: `Retrying ${data.count || 0} failed proof candidate(s) against paper ${data.source_id}`,
-        data
-      });
+      setProofRefreshToken((prev) => prev + 1);
     }));
 
     unsubscribers.push(websocket.on('proof_check_no_candidates', (data) => {
-      addActivity({
-        event: 'proof_check_no_candidates',
-        timestamp: getTimestamp(data),
-        message: `No formal proof candidates found in ${data.source_type} ${data.source_id}`,
-        data
-      });
+      setProofRefreshToken((prev) => prev + 1);
     }));
 
     unsubscribers.push(websocket.on('proof_check_candidates_found', (data) => {
-      addActivity({
-        event: 'proof_check_candidates_found',
-        timestamp: getTimestamp(data),
-        message: `Proof check found ${data.count || 0} theorem candidate(s)`,
-        data
-      });
+      setProofRefreshToken((prev) => prev + 1);
     }));
 
     unsubscribers.push(websocket.on('proof_attempt_started', (data) => {
       addActivity({
         event: 'proof_attempt_started',
         timestamp: getTimestamp(data),
-        message: `Proof attempt ${data.attempt || 1} started: ${data.theorem_statement || data.theorem_id}`,
+        message: `${proofName(data)}, Attempt ${data.attempt || 1} started: ${proofTarget(data)}`,
         data
       });
     }));
 
-    unsubscribers.push(websocket.on('smt_check_started', (data) => {
+    unsubscribers.push(websocket.on('smt_check_error', (data) => {
       addActivity({
-        event: 'smt_check_started',
+        event: 'smt_check_error',
         timestamp: getTimestamp(data),
-        message: `SMT check started: ${data.theorem_statement || data.theorem_id}`,
+        message: `${proofName(data)} SMT error: ${formatReason(data.error_summary, 960) || proofTarget(data)}`,
         data
       });
     }));
 
-    unsubscribers.push(websocket.on('smt_check_complete', (data) => {
+    unsubscribers.push(websocket.on('proof_attempt_failed', (data) => {
       addActivity({
-        event: 'smt_check_complete',
+        event: 'proof_attempt_failed',
         timestamp: getTimestamp(data),
-        message: `SMT check complete (${data.result || 'unknown'}): ${data.theorem_statement || data.theorem_id}`,
+        message: `${proofName(data)}, Attempt ${data.attempt || '?'} final: ${proofLeanResponse(data)}`,
         data
       });
     }));
 
-    unsubscribers.push(websocket.on('proof_attempt_failed', (data) => {
+    unsubscribers.push(websocket.on('proof_verified', (data) => {
+      setProofRefreshToken((prev) => prev + 1);
+    }));
+
+    unsubscribers.push(websocket.on('proof_lean_accepted', (data) => {
       addActivity({
-        event: 'proof_attempt_failed',
+        event: 'proof_lean_accepted',
         timestamp: getTimestamp(data),
-        message: `Proof attempt ${data.attempt || '?'} failed: ${formatReason(data.error_summary, 960) || data.theorem_statement || data.theorem_id}`,
+        message: `${proofName(data)}, Attempt ${data.attempt || '?'} final: ${proofLeanResponse(data)}`,
         data
       });
     }));
 
-    unsubscribers.push(websocket.on('proof_verified', (data) => {
+    unsubscribers.push(websocket.on('proof_integrity_rejected', (data) => {
       addActivity({
-        event: 'proof_verified',
+        event: 'proof_integrity_rejected',
         timestamp: getTimestamp(data),
-        message: `Lean 4 verified: ${data.theorem_statement || data.theorem_id}`,
+        message: `${proofName(data)} error: integrity rejected - ${formatReason(data.reason, 960) || proofTarget(data)}`,
         data
       });
     }));
@@ -1104,7 +1364,7 @@ function App() {
       addActivity({
         event: 'proof_attempts_exhausted',
         timestamp: getTimestamp(data),
-        message: `Proof attempts exhausted: ${data.theorem_statement || data.theorem_id}`,
+        message: `${proofName(data)} terminated: proof attempts exhausted for ${proofTarget(data)}`,
         data
       });
     }));
@@ -1126,41 +1386,28 @@ function App() {
         ];
         return next.length > 3 ? next.slice(-3) : next;
       });
-      addActivity({
-        event: 'novel_proof_discovered',
-        timestamp: getTimestamp(data),
-        message: `Novel proof discovered: ${data.theorem_statement}`,
-        data
-      });
     }));
 
     unsubscribers.push(websocket.on('known_proof_verified', (data) => {
       setProofRefreshToken((prev) => prev + 1);
-      addActivity({
-        event: 'known_proof_verified',
-        timestamp: getTimestamp(data),
-        message: `Verified known proof recorded for ${data.source_type} ${data.source_id}`,
-        data
-      });
     }));
 
     unsubscribers.push(websocket.on('proof_dependency_added', (data) => {
       setLatestProofDependencyEvent(data);
       setProofRefreshToken((prev) => prev + 1);
-      addActivity({
-        event: 'proof_dependency_added',
-        timestamp: getTimestamp(data),
-        message: `Dependency graph updated for ${data.theorem_name || data.proof_id}`,
-        data
-      });
     }));
 
     unsubscribers.push(websocket.on('proof_check_complete', (data) => {
+      if (isLeanOJProofEvent(data)) return;
+      if (data.source_type === 'compiler_rigor' && !isAutonomousTier2Active()) return;
+
       setProofRefreshToken((prev) => prev + 1);
+      const message = formatProofCheckCompleteMessage(data);
+
       addActivity({
         event: 'proof_check_complete',
         timestamp: getTimestamp(data),
-        message: `Proof check complete: ${data.verified_count || 0} verified, ${data.novel_count || 0} novel`,
+        message,
         data
       });
     }));
@@ -1168,6 +1415,7 @@ function App() {
     unsubscribers.push(websocket.on('auto_research_started', () => {
       setAutonomousActivity([]);
       setAutonomousRunning(true);
+      setAnyWorkflowRunning(true);
       setAutonomousStopping(false);
     }));
     
@@ -1175,6 +1423,7 @@ function App() {
       // Handle resume after crash/restart - sync running state
       console.log('Autonomous research resumed:', data);
       setAutonomousRunning(true);
+      setAnyWorkflowRunning(true);
       setAutonomousStopping(false);
       if (data?.tier) {
         autonomousTierRef.current = data.tier;
@@ -1585,6 +1834,14 @@ function App() {
       
       // Add to notification stack (max 3, FIFO)
       setCritiqueNotifications(prev => {
+        const seenKey = getHighScoreCritiqueNotificationKey(data.paper_id, data.average_rating);
+        if (seenKey && (seenHighScoreCritiquesRef.current.has(seenKey) || prev.some(notification => notification.seenKey === seenKey))) {
+          return prev;
+        }
+        if (seenKey) {
+          shownHighScoreCritiquesRef.current.add(seenKey);
+        }
+
         const newNotification = {
           id: `critique_${data.paper_id}_${Date.now()}`,
           paper_id: data.paper_id,
@@ -1593,7 +1850,8 @@ function App() {
           novelty_rating: data.novelty_rating,
           correctness_rating: data.correctness_rating,
           impact_rating: data.impact_rating,
-          timestamp: data.timestamp
+          timestamp: data.timestamp,
+          seenKey
         };
         
         // Add to stack, keep max 3 (remove oldest if full)
@@ -1618,6 +1876,233 @@ function App() {
     };
   }, []);
 
+  useEffect(() => {
+    const MAX_LEANOJ_ACTIVITY_EVENTS = 500;
+    const getTimestamp = (data = {}) => data?._serverTimestamp || data?.timestamp || new Date().toISOString();
+    // Decides whether a completed model call is logged; calls matching any rule below are left out.
+    const shouldTrackLeanOJModelCall = (data = {}) => {
+      const task = String(data.task_id || '');
+      const role = String(data.role_id || '');
+      const text = String(data.result_summary || data.message || '').toLowerCase();
+      // Suppressed by task id.
+      if (['leanoj_sufficiency', 'leanoj_path', 'leanoj_path_val'].includes(task)) return false;
+      // Suppressed by the leading label of the (lower-cased) summary text.
+      if (text.startsWith('sufficiency result:') || text.startsWith('path result:')) return false;
+      // Path-validator accept/reject verdicts are suppressed as well.
+      if (role === 'leanoj_path_validator') {
+        const isVerdict = ['decision: accept', 'decision: reject'].some((prefix) => text.startsWith(prefix));
+        if (isVerdict) return false;
+      }
+      return true;
+    };
+    // Appends one entry to the Proof Solver activity log, keeping only the newest MAX_LEANOJ_ACTIVITY_EVENTS.
+    const addLeanOJActivity = (event, data = {}, message = '') => {
+      setLeanojActivity((previous) => {
+        // First non-empty candidate wins; the literal is the last-resort label.
+        const text = message || data.message || data.reasoning || data.decision || data.phase || 'Proof Solver update';
+        const entry = { event, timestamp: getTimestamp(data), message: text, data };
+        const combined = previous.concat([entry]);
+        // A negative slice start keeps the tail of the list.
+        return combined.slice(-MAX_LEANOJ_ACTIVITY_EVENTS);
+      });
+    };
+    const summarizeLeanOJText = (text = '', limit = 220) => { // collapse whitespace runs, then cap at `limit` characters
+      const flattened = String(text || '').split(/\s+/).join(' ').trim();
+      return flattened.length <= limit ? flattened : flattened.slice(0, limit) + '...';
+    };
+    const formatModelName = (modelId = '') => { // short display name: last '/'-separated segment, capped at 32 chars
+      const id = String(modelId || '').trim();
+      if (id === '') return '';
+      const tail = id.slice(id.lastIndexOf('/') + 1) || id; // a trailing '/' leaves nothing, so fall back to the full id
+      return tail.length <= 32 ? tail : tail.slice(0, 32) + '...';
+    };
+    const formatLeanOJRole = (roleId = '') => { // e.g. "leanoj_path_validator" -> "Path Validator"
+      const words = String(roleId || '').replace(/^leanoj_/, '').split('_').join(' ').trim();
+      return words === '' ? 'Proof Solver Model' : words.replace(/\b\w/g, (letter) => letter.toUpperCase());
+    };
+    const formatLeanOJDuration = (durationMs) => { // milliseconds -> "12.3s" or "1.5m"; '' when missing or non-numeric
+      const seconds = durationMs == null ? NaN : Number(durationMs) / 1000;
+      if (Number.isNaN(seconds)) return '';
+      return seconds < 60 ? `${seconds.toFixed(1)}s` : `${(seconds / 60).toFixed(1)}m`;
+    };
+    const formatLeanOJCallResult = (data = {}) => { // one-line activity message for a completed model call
+      const elapsed = formatLeanOJDuration(data.duration_ms);
+      const outcome = summarizeLeanOJText(data.result_summary || data.message || '', 220);
+      const pieces = [`${formatLeanOJRole(data.role_id)} [${formatModelName(data.model) || 'model'}]: ✓ RESULT`];
+      if (Number(data.attempt || 1) > 1) pieces.push(`, attempt ${data.attempt}`); // shown from the second attempt onwards
+      if (elapsed) pieces.push(`, ${elapsed}`);
+      if (outcome) pieces.push(` - ${outcome}`);
+      return pieces.join('');
+    };
+    // Builds the activity line for an accepted (accepted = true) or rejected brainstorm submission.
+    const formatLeanOJBrainstormMessage = (data = {}, accepted = true) => {
+      const who = data.submitter_id ?? data.submitter ?? '?';
+      const model = formatModelName(data.submitter_model || data.model) || 'N/A';
+      const count = accepted ? data.total_acceptances : data.total_rejections;
+      const submissionText = data.submission_preview || data.submission;
+      // Rejections prefer the validator's explanation and only then fall back to the submission text.
+      const detailSource = accepted
+        ? submissionText
+        : (data.rejection_reason || data.validator_summary || data.validator_reasoning || submissionText);
+      const detail = summarizeLeanOJText(detailSource, 160);
+      let line = `Brainstorm Submitter ${who} [${model}]: `;
+      line += accepted ? '✓ ACCEPTED' : '✗ REJECTED';
+      if (count !== undefined) line += ` (total: ${count})`;
+      if (detail) line += ` - ${detail}`;
+      return line;
+    };
+    const leanOJProofName = (data = {}) => { // display label for the proof an event refers to
+      const sourceType = data.source_type;
+      const target = (data.attempt || {}).target;
+      if (data.proof_label) return `Proof ${data.proof_label}`;
+      if (sourceType === 'leanoj_final' || target === 'final') return 'Final proof';
+      return (sourceType === 'leanoj_subproof' || data.subproof_id || data.subproof || target === 'subproof') ? 'Proof fragment' : 'Proof';
+    };
+    // Picks the first available description of what is being proved; '' when the event carries none.
+    const leanOJProofTarget = (data = {}) => {
+      const fragment = data.subproof || {};
+      const attemptInfo = data.attempt || {};
+      // Listed from most to least preferred; the first truthy entry is used.
+      const candidates = [
+        data.theorem_statement, data.theorem_id,
+        fragment.theorem_or_lemma, fragment.request, attemptInfo.request, data.subproof_id,
+      ];
+      return candidates.find(Boolean) || '';
+    };
+    // Summarises Lean's verdict for an attempt: an explicit response wins, then success, then the error text.
+    const leanOJLeanResponse = (data = {}) => {
+      if (data.lean_response) return data.lean_response;
+      const attemptInfo = data.attempt || {};
+      const verified = data.proof_verified === true || attemptInfo.success === true;
+      if (verified) return 'Lean 4 response: proof verified.';
+      const rawError = attemptInfo.error_output || data.error_summary || data.error_output || data.reason || data.message || '';
+      const failure = summarizeLeanOJText(rawError, 960);
+      return failure === '' ? 'Lean 4 response: proof not verified.' : `Lean 4 response: ${failure} - proof not verified.`;
+    };
+    const leanOJAttemptStartedMessage = (data = {}) => { // "<proof name>, Attempt N started[: <target>]"; N defaults to 1
+      const attemptNumber = (typeof data.attempt === 'object' ? data.attempt?.attempt : data.attempt) || 1; // `attempt` may be a number or a record; never print the record as "[object Object]"
+      const target = leanOJProofTarget(data);
+      return `${leanOJProofName(data)}, Attempt ${attemptNumber} started${target ? `: ${target}` : ''}`;
+    };
+    const leanOJAttemptFinalMessage = (data = {}) => { // "<proof name>, Attempt N final: <Lean response>"; N defaults to '?'
+      const attemptNumber = (typeof data.attempt === 'object' ? data.attempt?.attempt : data.attempt) || '?'; // `attempt` may be a number or a record; never print the record as "[object Object]"
+      return `${leanOJProofName(data)}, Attempt ${attemptNumber} final: ${leanOJLeanResponse(data)}`;
+    };
+    // True when a shared proof event is attributed to the Proof Solver by its source type, source id or trigger.
+    const isLeanOJProofEvent = (data = {}) => {
+      const asText = (value) => String(value || '');
+      const kind = asText(data.source_type);
+      if (kind === 'leanoj_final' || kind === 'leanoj_subproof') return true;
+      if (asText(data.source_id).startsWith('leanoj_')) return true;
+      // Any trigger beginning with "leanoj" also counts.
+      return asText(data.trigger).startsWith('leanoj');
+    };
+    const addLeanOJSharedProofActivity = (event, data = {}, messageFactory) => { // shared proof events: only Proof Solver ones are logged
+      const fromProofSolver = isLeanOJProofEvent(data);
+      if (fromProofSolver) setLeanojProofRefreshToken((token) => token + 1);
+      if (fromProofSolver) addLeanOJActivity(event, data, messageFactory(data));
+    };
+
+    const handlers = [ // [websocket event name, handler] pairs; subscribed and unsubscribed by the forEach loops that follow
+      ['leanoj_started', (data) => {
+        setLeanojRunning(true); setAnyWorkflowRunning(true); // keep the global workflow flag in step, as auto_research_started does
+        addLeanOJActivity('leanoj_started', data, 'Proof Solver started');
+      }],
+      ['leanoj_stopped', (data) => {
+        setLeanojRunning(false);
+        setAnyWorkflowRunning(false);
+        addLeanOJActivity('leanoj_stopped', data, 'Proof Solver stopped');
+        leanojAPI.getStatus().then(setLeanojStatus).catch(console.error);
+      }],
+      ['leanoj_status_updated', (data) => setLeanojStatus(data)],
+      ['leanoj_phase_changed', (data) => addLeanOJActivity('leanoj_phase_changed', data, `Proof Solver phase: ${data.phase || 'unknown'}`)],
+      ['leanoj_model_call_completed', (data) => {
+        if (shouldTrackLeanOJModelCall(data)) {
+          addLeanOJActivity('leanoj_model_call_completed', data, formatLeanOJCallResult(data));
+        }
+      }],
+      ['leanoj_model_call_failed', (data) => addLeanOJActivity('leanoj_model_call_failed', data, `${formatLeanOJRole(data.role_id)} call failed${data.retryable ? '; retrying' : ''}: ${summarizeLeanOJText(data.message, 160)}`)],
+      ['leanoj_role_json_retrying', (data) => addLeanOJActivity('leanoj_role_json_retrying', data, `Proof Solver role ${data.role_id || 'model'} returned invalid JSON; retrying attempt ${data.attempt || '?'}`)],
+      ['leanoj_skip_brainstorm_requested', (data) => addLeanOJActivity('leanoj_skip_brainstorm_requested', data, 'Skip brainstorm requested')],
+      ['leanoj_brainstorm_skip_deferred', (data) => addLeanOJActivity('leanoj_brainstorm_skip_deferred', data, 'Brainstorm skip queued after topic setup')],
+      ['leanoj_brainstorm_skipped', (data) => addLeanOJActivity('leanoj_brainstorm_skipped', data, 'Brainstorm skipped; proceeding directly to proof solving')],
+      ['leanoj_force_brainstorm_requested', (data) => addLeanOJActivity('leanoj_force_brainstorm_requested', data, 'Force recursive brainstorm requested')],
+      ['leanoj_brainstorm_forced', (data) => addLeanOJActivity('leanoj_brainstorm_forced', data, 'Returning to recursive brainstorm with the current proof preserved')],
+      ['leanoj_topic_submitters_started', (data) => addLeanOJActivity('leanoj_topic_submitters_started', data, `Topic submitters started (${data.submitter_count || 0} parallel submitters)`)],
+      ['leanoj_topic_generation_started', (data) => addLeanOJActivity('leanoj_topic_generation_started', data, `Submitter ${data.submitter_id ?? data.submitter ?? '?'} generating topic ${data.topic_index || '?'}/${data.target_topics || 5}`)],
+      ['leanoj_topic_empty', (data) => addLeanOJActivity('leanoj_topic_empty', data, `Topic submitter ${data.submitter_id ?? data.submitter ?? '?'} returned empty output on attempt ${data.attempt || '?'}`)],
+      ['leanoj_topic_candidate_queued', (data) => addLeanOJActivity('leanoj_topic_candidate_queued', data, `Submitter ${data.submitter_id ?? data.submitter ?? '?'} queued topic for validation: ${summarizeLeanOJText(data.topic_preview, 140)}`)],
+      ['leanoj_topic_batch_validation_started', (data) => addLeanOJActivity('leanoj_topic_batch_validation_started', data, `Topic validator reviewing batch of ${data.batch_size || 0} topic(s)`)],
+      ['leanoj_topic_validated', (data) => addLeanOJActivity('leanoj_topic_validated', data, `Topic accepted: ${summarizeLeanOJText(data.topic, 140)}`)],
+      ['leanoj_topic_rejected', (data) => addLeanOJActivity('leanoj_topic_rejected', data, `Topic rejected: ${summarizeLeanOJText(data.topic, 140)}`)],
+      ['leanoj_recursive_brainstorm_started', (data) => addLeanOJActivity('leanoj_recursive_brainstorm_started', data, `Recursive brainstorm cycle ${data.cycle || '?'} ${data.resumed ? 'resumed' : 'started'}; targeting the current proof attempt`)],
+      ['leanoj_topic_submitter_failed', (data) => addLeanOJActivity('leanoj_topic_submitter_failed', data, `Topic submitter ${data.submitter_id ?? data.submitter ?? '?'} failed: ${summarizeLeanOJText(data.message, 160)}`)], // same id lookup as the sibling topic events, so submitter 0 is not shown as '?'
+      ['leanoj_recursive_brainstorm_completed', (data) => addLeanOJActivity('leanoj_recursive_brainstorm_completed', data, `Recursive brainstorm cycle ${data.cycle || '?'} completed with ${data.accepted_delta || 0} new accepted ideas`)],
+      ['leanoj_initial_topic_selected', (data) => addLeanOJActivity('leanoj_initial_topic_selected', data, `Initial topic: ${summarizeLeanOJText(data.topic, 140)}`)],
+      ['leanoj_brainstorm_submitters_started', (data) => addLeanOJActivity('leanoj_brainstorm_submitters_started', data, `Brainstorm submitters started for ${data.phase || 'brainstorm'} (${data.submitter_count || 0} parallel submitters)`)],
+      ['leanoj_brainstorm_submission_queued', (data) => addLeanOJActivity('leanoj_brainstorm_submission_queued', data, `Submitter ${data.submitter_id ?? data.submitter ?? '?'} queued brainstorm idea for validation: ${summarizeLeanOJText(data.submission_preview, 140)}`)],
+      ['leanoj_brainstorm_submitter_failed', (data) => addLeanOJActivity('leanoj_brainstorm_submitter_failed', data, `Brainstorm submitter ${data.submitter_id ?? data.submitter ?? '?'} failed: ${summarizeLeanOJText(data.message, 160)}`)], // same id lookup as the sibling brainstorm events
+      ['leanoj_brainstorm_batch_validation_started', (data) => addLeanOJActivity('leanoj_brainstorm_batch_validation_started', data, `Brainstorm validator reviewing batch of ${data.batch_size || 0} submission(s)`)],
+      ['leanoj_brainstorm_accepted', (data) => addLeanOJActivity('leanoj_brainstorm_accepted', data, formatLeanOJBrainstormMessage(data, true))],
+      ['leanoj_brainstorm_rejected', (data) => addLeanOJActivity('leanoj_brainstorm_rejected', data, formatLeanOJBrainstormMessage(data, false))],
+      ['leanoj_brainstorm_phase_limit_reached', (data) => addLeanOJActivity('leanoj_brainstorm_phase_limit_reached', data, `Brainstorm phase limit reached for ${data.phase || 'brainstorm'} (${data.accepted_delta || 0}/${data.max_accepts || '?'})`)],
+      ['leanoj_brainstorm_prune_review_complete', (data) => addLeanOJActivity('leanoj_brainstorm_prune_review_complete', data, 'Brainstorm prune review complete: no removal needed')],
+      ['leanoj_brainstorm_prune_rejected', (data) => addLeanOJActivity('leanoj_brainstorm_prune_rejected', data, `Brainstorm prune rejected: ${summarizeLeanOJText(data.reasoning || data.reason, 140)}`)],
+      ['leanoj_brainstorm_prune_applied', (data) => addLeanOJActivity('leanoj_brainstorm_prune_applied', data, `Brainstorm prune applied: ${summarizeLeanOJText(data.reasoning || data.reason, 140)}`)],
+      ['leanoj_brainstorm_prune_apply_failed', (data) => addLeanOJActivity('leanoj_brainstorm_prune_apply_failed', data, 'Brainstorm prune apply failed')],
+      ['leanoj_brainstorm_prune_error', (data) => addLeanOJActivity('leanoj_brainstorm_prune_error', data, data.message || 'Brainstorm prune review error')],
+      ['leanoj_brainstorm_proof_failed', (data) => addLeanOJActivity('leanoj_brainstorm_proof_failed', data, `Brainstorm proof failed Lean gate: ${summarizeLeanOJText(data.feedback?.error_summary, 180)}`)],
+      ['leanoj_brainstorm_proof_registration_failed', (data) => addLeanOJActivity('leanoj_brainstorm_proof_registration_failed', data, `Brainstorm proof registration failed: ${summarizeLeanOJText(data.error, 180)}`)],
+      ['leanoj_brainstorm_proof_verified', (data) => {
+        setLeanojProofRefreshToken((prev) => prev + 1);
+        addLeanOJActivity('leanoj_brainstorm_proof_verified', data, `Brainstorm proof verified and accepted: ${leanOJProofTarget(data)}`);
+      }],
+      ['leanoj_path_decided', (data) => addLeanOJActivity('leanoj_path_decided', data, `Path decision: ${data.decision || ''}`)],
+      ['leanoj_partial_proof_saved', (data) => addLeanOJActivity('leanoj_partial_proof_saved', data, `Partial proof saved: ${data.partial_proof?.request || data.partial_proof?.target || ''}`)],
+      ['leanoj_master_proof_initialized', (data) => addLeanOJActivity('leanoj_master_proof_initialized', data, 'Proof Solver master proof initialized')],
+      ['leanoj_master_proof_edit_started', (data) => addLeanOJActivity('leanoj_master_proof_edit_started', data, `Master proof edit started for final attempt ${data.next_verification_attempt || '?'}`)],
+      ['leanoj_master_proof_edit_validation_started', (data) => addLeanOJActivity('leanoj_master_proof_edit_validation_started', data, `Master proof shortening validation started (${data.line_delta_removed || 0} line(s), ${data.char_delta_removed || 0} char(s) removed)`)],
+      ['leanoj_master_proof_edit_applied', (data) => addLeanOJActivity('leanoj_master_proof_edit_applied', data, `Master proof edit accepted (version ${data.master_proof_version || '?'})`)],
+      ['leanoj_master_proof_edit_rejected', (data) => addLeanOJActivity('leanoj_master_proof_edit_rejected', data, `Master proof edit rejected: ${summarizeLeanOJText(data.validator_feedback || data.error_summary || data.message, 180)}`)],
+      ['leanoj_master_proof_stuck', (data) => addLeanOJActivity('leanoj_master_proof_stuck', data, data.continuing_final_cycle ? `Master proof stuck; continuing final cycle (${data.attempts_in_cycle || '?'} / ${data.max_attempts || '?'})` : `Master proof stuck; path requested: ${data.requested_path || 'unknown'}`)],
+      ['leanoj_master_proof_progress_watchdog', (data) => addLeanOJActivity('leanoj_master_proof_progress_watchdog', data, data.continuing_final_cycle ? `Master proof watchdog fired; continuing final cycle (${data.attempts_in_cycle || '?'} / ${data.max_attempts || '?'})` : `Master proof watchdog returned to ${data.requested_path || 'path planning'}`)],
+      ['leanoj_final_attempt_started', (data) => addLeanOJActivity('leanoj_final_attempt_started', data, leanOJAttemptStartedMessage(data))],
+      ['leanoj_final_attempt_failed', (data) => addLeanOJActivity('leanoj_final_attempt_failed', data, leanOJAttemptFinalMessage(data))],
+      ['leanoj_final_attempt_cycle_exhausted', (data) => addLeanOJActivity('leanoj_final_attempt_cycle_exhausted', data, data.message || 'Final attempt cycle exhausted; returning to path planning')],
+      ['leanoj_final_verified', (data) => {
+        setLeanojRunning(false);
+        setAnyWorkflowRunning(false);
+        setLeanojProofRefreshToken((prev) => prev + 1);
+        addLeanOJActivity('leanoj_final_verified', data, `${leanOJProofName(data)} verified and accepted: ${leanOJProofTarget(data) || 'final Proof Solver submission'}`);
+        leanojAPI.getStatus().then(setLeanojStatus).catch(console.error);
+      }],
+      ['proof_check_started', (data) => addLeanOJSharedProofActivity('proof_check_started', data, (eventData) => `Proof check started for ${eventData.source_type} ${eventData.source_id}`)],
+      ['proof_check_no_candidates', (data) => addLeanOJSharedProofActivity('proof_check_no_candidates', data, (eventData) => `No formal theorem candidates found in ${eventData.source_type} ${eventData.source_id}`)],
+      ['proof_check_candidates_found', (data) => addLeanOJSharedProofActivity('proof_check_candidates_found', data, (eventData) => `Proof candidates found: ${eventData.count || 0}`)],
+      ['proof_attempt_started', (data) => addLeanOJSharedProofActivity('proof_attempt_started', data, leanOJAttemptStartedMessage)],
+      ['proof_attempt_failed', (data) => addLeanOJSharedProofActivity('proof_attempt_failed', data, leanOJAttemptFinalMessage)],
+      ['proof_lean_accepted', (data) => addLeanOJSharedProofActivity('proof_lean_accepted', data, leanOJAttemptFinalMessage)],
+      ['proof_integrity_rejected', (data) => addLeanOJSharedProofActivity('proof_integrity_rejected', data, (eventData) => `${leanOJProofName(eventData)} error: integrity rejected - ${summarizeLeanOJText(eventData.reason || leanOJProofTarget(eventData), 960)}`)],
+      ['proof_verified', (data) => addLeanOJSharedProofActivity('proof_verified', data, (eventData) => `${leanOJProofName(eventData)} verified and accepted: ${leanOJProofTarget(eventData)}`)],
+      ['proof_attempts_exhausted', (data) => addLeanOJSharedProofActivity('proof_attempts_exhausted', data, (eventData) => `${leanOJProofName(eventData)} terminated: proof attempts exhausted for ${leanOJProofTarget(eventData)}`)],
+      ['novel_proof_discovered', (data) => addLeanOJSharedProofActivity('novel_proof_discovered', data, (eventData) => `${leanOJProofName(eventData)} novel proof discovered: ${eventData.theorem_statement || leanOJProofTarget(eventData)}`)],
+      ['known_proof_verified', (data) => addLeanOJSharedProofActivity('known_proof_verified', data, (eventData) => `${leanOJProofName(eventData)} known proof verified for ${eventData.source_type} ${eventData.source_id}`)],
+      ['proof_dependency_added', (data) => addLeanOJSharedProofActivity('proof_dependency_added', data, () => 'Proof Solver proof dependency added')],
+      ['proof_check_complete', (data) => addLeanOJSharedProofActivity('proof_check_complete', data, (eventData) => `Proof check complete: ${eventData.verified_count || 0} verified, ${eventData.novel_count || 0} novel`)],
+      ['leanoj_error', (data) => addLeanOJActivity('leanoj_error', data, data.message || 'Proof Solver error')],
+      ['leanoj_cleared', (data) => {
+        setLeanojRunning(false);
+        setAnyWorkflowRunning(false);
+        setLeanojActivity([]);
+        setLeanojStatus(data);
+        setLeanojProofRefreshToken((prev) => prev + 1);
+      }],
+    ];
+
+    handlers.forEach(([event, handler]) => websocket.on(event, handler));
+    return () => handlers.forEach(([event, handler]) => websocket.off(event, handler));
+  }, []);
+
   // Poll for autonomous data while running
   useEffect(() => {
     if (!autonomousRunning) return;
@@ -1642,6 +2127,24 @@ function App() {
     
     return () => clearInterval(interval);
   }, [autonomousRunning]);
+
+  useEffect(() => { // Poll the Proof Solver status every 3 seconds while it is flagged as running
+    if (!leanojRunning) return undefined;
+
+    const pollStatus = async () => {
+      try {
+        const latest = await leanojAPI.getStatus();
+        setLeanojStatus(latest);
+        // Reported as no longer running: clear the local flag, which also ends this polling
+        if (!latest.is_running) setLeanojRunning(false);
+      } catch (error) {
+        console.error('Failed to poll Proof Solver status:', error);
+      }
+    };
+    const timerId = setInterval(pollStatus, 3000);
+
+    return () => clearInterval(timerId);
+  }, [leanojRunning]);
   
   // Clean up expired rate limits every minute
   useEffect(() => {
@@ -1667,6 +2170,7 @@ function App() {
   const handleAutonomousStart = async (researchPrompt) => {
     try {
       const lmStudioEnabled = capabilities.lmStudioEnabled;
+      const superchargeAllowed = developerModeEnabled;
 
       // Convert frontend camelCase to backend snake_case for submitter_configs (includes OpenRouter fields)
       const submitterConfigs = autonomousConfig.submitter_configs?.map(cfg => ({
@@ -1674,9 +2178,11 @@ function App() {
         provider: normalizeRuntimeProvider(cfg.provider, lmStudioEnabled),
         model_id: cfg.modelId,
         openrouter_provider: cfg.openrouterProvider || null,
+        openrouter_reasoning_effort: cfg.openrouterReasoningEffort || 'auto',
         lm_studio_fallback_id: lmStudioEnabled ? (cfg.lmStudioFallbackId || null) : null,
         context_window: cfg.contextWindow,
-        max_output_tokens: cfg.maxOutputTokens
+        max_output_tokens: cfg.maxOutputTokens,
+        supercharge_enabled: superchargeAllowed && Boolean(cfg.superchargeEnabled || cfg.supercharge_enabled)
       })) || [];
 
       await autonomousAPI.start({
@@ -1689,11 +2195,13 @@ function App() {
         ),
         validator_model: autonomousConfig.validator_model,
         validator_openrouter_provider: autonomousConfig.validator_openrouter_provider,
+        validator_openrouter_reasoning_effort: autonomousConfig.validator_openrouter_reasoning_effort || 'auto',
         validator_lm_studio_fallback: lmStudioEnabled
           ? autonomousConfig.validator_lm_studio_fallback
           : null,
         validator_context_window: autonomousConfig.validator_context_window,
         validator_max_tokens: autonomousConfig.validator_max_tokens,
+        validator_supercharge_enabled: superchargeAllowed && Boolean(autonomousConfig.validator_supercharge_enabled),
         // High-context submitter config with OpenRouter support
         high_context_provider: normalizeRuntimeProvider(
           autonomousConfig.high_context_provider,
@@ -1701,11 +2209,13 @@ function App() {
         ),
         high_context_model: autonomousConfig.high_context_model,
         high_context_openrouter_provider: autonomousConfig.high_context_openrouter_provider,
+        high_context_openrouter_reasoning_effort: autonomousConfig.high_context_openrouter_reasoning_effort || 'auto',
         high_context_lm_studio_fallback: lmStudioEnabled
           ? autonomousConfig.high_context_lm_studio_fallback
           : null,
         high_context_context_window: autonomousConfig.high_context_context_window,
         high_context_max_tokens: autonomousConfig.high_context_max_tokens,
+        high_context_supercharge_enabled: superchargeAllowed && Boolean(autonomousConfig.high_context_supercharge_enabled),
         // High-param submitter config with OpenRouter support
         high_param_provider: normalizeRuntimeProvider(
           autonomousConfig.high_param_provider,
@@ -1713,11 +2223,13 @@ function App() {
         ),
         high_param_model: autonomousConfig.high_param_model,
         high_param_openrouter_provider: autonomousConfig.high_param_openrouter_provider,
+        high_param_openrouter_reasoning_effort: autonomousConfig.high_param_openrouter_reasoning_effort || 'auto',
         high_param_lm_studio_fallback: lmStudioEnabled
           ? autonomousConfig.high_param_lm_studio_fallback
           : null,
         high_param_context_window: autonomousConfig.high_param_context_window,
         high_param_max_tokens: autonomousConfig.high_param_max_tokens,
+        high_param_supercharge_enabled: superchargeAllowed && Boolean(autonomousConfig.high_param_supercharge_enabled),
         // Critique submitter config with OpenRouter support
         critique_submitter_provider: normalizeRuntimeProvider(
           autonomousConfig.critique_submitter_provider,
@@ -1725,16 +2237,19 @@ function App() {
         ),
         critique_submitter_model: autonomousConfig.critique_submitter_model,
         critique_submitter_openrouter_provider: autonomousConfig.critique_submitter_openrouter_provider,
+        critique_submitter_openrouter_reasoning_effort: autonomousConfig.critique_submitter_openrouter_reasoning_effort || 'auto',
         critique_submitter_lm_studio_fallback: lmStudioEnabled
           ? autonomousConfig.critique_submitter_lm_studio_fallback
           : null,
         critique_submitter_context_window: autonomousConfig.critique_submitter_context_window,
         critique_submitter_max_tokens: autonomousConfig.critique_submitter_max_tokens,
+        critique_submitter_supercharge_enabled: superchargeAllowed && Boolean(autonomousConfig.critique_submitter_supercharge_enabled),
         tier3_enabled: autonomousConfig.tier3_enabled ?? false
       });
       setAutonomousRunning(true);
       setAutonomousStopping(false);
       setAutonomousActivity([]);
+      setAnyWorkflowRunning(true);
     } catch (error) {
       alert(`Failed to start autonomous research: ${error.details || error.message}`);
     }
@@ -1785,6 +2300,94 @@ function App() {
     }
   };
 
+  // Adapts one Proof Solver role config to the current capabilities (LM Studio availability, developer mode).
+  const normalizeLeanOJRoleForCapabilities = (roleConfig = {}) => {
+    const lmAvailable = capabilities.lmStudioEnabled;
+    // Without LM Studio, a role whose provider is not 'openrouter' has its model selection cleared.
+    const dropSelection = !(lmAvailable || roleConfig.provider === 'openrouter');
+    const normalized = { ...roleConfig, provider: normalizeRuntimeProvider(roleConfig.provider, lmAvailable) };
+    normalized.model_id = dropSelection ? '' : (roleConfig.model_id || '');
+    normalized.openrouter_provider = dropSelection ? null : (roleConfig.openrouter_provider || null);
+    normalized.lm_studio_fallback_id = (lmAvailable && roleConfig.lm_studio_fallback_id) || null;
+    // Supercharge is only passed through when developer mode is enabled.
+    normalized.supercharge_enabled = developerModeEnabled && Boolean(roleConfig.supercharge_enabled);
+    return normalized;
+  };
+
+  const normalizeLeanOJRequestForCapabilities = (request) => { // normalizes every role config in a start request; path_decider falls back to final_solver
+    const fix = normalizeLeanOJRoleForCapabilities;
+    const submitters = (request.brainstorm_submitters || []).map((role) => fix(role));
+    return {
+      ...request, topic_generator: fix(request.topic_generator), topic_validator: fix(request.topic_validator),
+      brainstorm_submitters: submitters, brainstorm_validator: fix(request.brainstorm_validator),
+      path_decider: fix(request.path_decider || request.final_solver), final_solver: fix(request.final_solver),
+    };
+  };
+
+  // Starts the Proof Solver with a capability-normalized request; alerts only when the start call itself fails.
+  const handleLeanOJStart = async (request) => {
+    try {
+      await leanojAPI.start(normalizeLeanOJRequestForCapabilities(request));
+      setLeanojRunning(true);
+      setAnyWorkflowRunning(true); // set right after a successful start so a failed status refresh cannot skip it
+      setLeanojActivity([]);
+      setLeanojProofRefreshToken((prev) => prev + 1);
+      await leanojAPI.getStatus().then(setLeanojStatus).catch(console.error); // best-effort: a refresh error is not a start failure
+    } catch (error) {
+      alert(`Failed to start Proof Solver: ${error.details || error.message}`);
+    }
+  };
+
+  // Stops the Proof Solver and clears the running flags; alerts only when the stop call itself fails.
+  const handleLeanOJStop = async () => {
+    try {
+      await leanojAPI.stop();
+      setLeanojRunning(false);
+      setAnyWorkflowRunning(false);
+      await leanojAPI.getStatus().then(setLeanojStatus).catch(console.error); // best-effort: a refresh error is not a stop failure
+    } catch (error) {
+      alert(`Failed to stop Proof Solver: ${error.message}`);
+    }
+  };
+
+  // Clears saved Proof Solver progress after the user confirms the prompt.
+  const handleLeanOJClear = async () => {
+    if (!window.confirm('Clear all saved Proof Solver progress?')) return;
+    try {
+      const cleared = await leanojAPI.clear();
+      // Reset local Proof Solver state; the status falls back to null when the response has none.
+      setLeanojRunning(false);
+      setAnyWorkflowRunning(false);
+      setLeanojActivity([]);
+      setLeanojStatus(cleared.status || null);
+      setLeanojProofRefreshToken((token) => token + 1);
+    } catch (error) {
+      alert(`Failed to clear Proof Solver progress: ${error.message}`);
+    }
+  };
+
+  // Requests a brainstorm skip and adopts the status from the response, if it carries one.
+  const handleLeanOJSkipBrainstorm = async () => {
+    try {
+      const response = await leanojAPI.skipBrainstorm();
+      const nextStatus = response.status;
+      if (nextStatus) setLeanojStatus(nextStatus);
+    } catch (error) {
+      alert(`Failed to skip Proof Solver brainstorming: ${error.message}`);
+    }
+  };
+
+  // Requests a forced recursive brainstorm and adopts the status from the response, if it carries one.
+  const handleLeanOJForceBrainstorm = async () => {
+    try {
+      const response = await leanojAPI.forceBrainstorm();
+      const nextStatus = response.status;
+      if (nextStatus) setLeanojStatus(nextStatus);
+    } catch (error) {
+      alert(`Failed to force Proof Solver recursive brainstorming: ${error.message}`);
+    }
+  };
+
   const refreshBrainstorms = async () => {
     try {
       const data = await autonomousAPI.getBrainstorms();
@@ -1796,8 +2399,12 @@ function App() {
 
   const refreshPapers = async () => {
     try {
-      const data = await autonomousAPI.getPapers();
+      const [data, stats] = await Promise.all([
+        autonomousAPI.getPapers(),
+        autonomousAPI.getStats(),
+      ]);
       setPapers(data.papers || []);
+      setAutonomousStats(stats);
     } catch (error) {
       console.error('Failed to refresh papers:', error);
     }
@@ -1816,10 +2423,13 @@ function App() {
   
   // Critique notification handlers
   const handleDismissNotification = (notificationId) => {
+    const notification = critiqueNotifications.find(item => item.id === notificationId);
+    markHighScoreCritiqueSeen(notification?.seenKey);
     setCritiqueNotifications(prev => prev.filter(n => n.id !== notificationId));
   };
   
-  const handleClickNotification = (paperId, paperTitle) => {
+  const handleClickNotification = (paperId, paperTitle, seenKey) => {
+    markHighScoreCritiqueSeen(seenKey);
     setSelectedCritiquePaper({ paper_id: paperId, paper_title: paperTitle });
     setShowCritiqueModal(true);
   };
@@ -1856,6 +2466,13 @@ function App() {
     }
   };
 
+  // Selecting a Proof Solver tab also switches the app into 'leanoj' mode when it is not already there.
+  const handleLeanOJTabSelect = (tabId) => {
+    setLeanojActiveTab(tabId);
+    const alreadyInLeanojMode = appMode === 'leanoj';
+    if (!alreadyInLeanojMode) setAppMode('leanoj');
+  };
+
   // Credit exhaustion notification handler
   const handleDismissCreditNotification = (notificationId) => {
     setCreditExhaustionNotifications(prev => prev.filter(n => n.id !== notificationId));
@@ -2029,6 +2646,19 @@ function App() {
     { id: 'compiler-live-paper', label: 'Live Paper', subtext: 'Part 2 Live Results', subtextClass: 'green', group: 'compiler' },
   ];
 
+  const leanojMainTabs = [
+    { id: 'leanoj-interface', label: 'Proof Solver', group: 'leanoj-main' },
+    { id: 'leanoj-brainstorms', label: 'Brainstorms', group: 'leanoj-main' },
+    { id: 'leanoj-master-proof', label: 'Master Proof Draft', group: 'leanoj-main' },
+    { id: 'leanoj-proofs', label: 'Mathematical Proofs', group: 'leanoj-main' },
+  ];
+
+  const leanojSettingsTabs = [
+    { id: 'leanoj-completed-proof-works', label: 'Your Completed Proof Works Library', group: 'leanoj-settings' },
+    { id: 'leanoj-logs', label: 'API Call Logs', group: 'leanoj-settings' },
+    { id: 'leanoj-settings', label: 'Proof Solver Model Profiles & Settings', group: 'leanoj-settings' },
+  ];
+
   useEffect(() => {
     if (!autonomousConfig.tier3_enabled && autonomousActiveTab === 'auto-final-answer') {
       setAutonomousActiveTab('auto-interface');
@@ -2050,13 +2680,14 @@ function App() {
   useEffect(() => {
     const checkWorkflowStatus = async () => {
       try {
-        const [aggStatus, compStatus, autoStatus] = await Promise.all([
+        const [aggStatus, compStatus, autoStatus, leanojCurrentStatus] = await Promise.all([
           api.get('/api/aggregator/status').catch(() => ({ is_running: false })),
           api.get('/api/compiler/status').catch(() => ({ is_running: false })),
-          autonomousAPI.getStatus().catch(() => ({ is_running: false }))
+          autonomousAPI.getStatus().catch(() => ({ is_running: false })),
+          leanojAPI.getStatus().catch(() => ({ is_running: false }))
         ]);
         
-        const running = aggStatus.is_running || compStatus.is_running || autoStatus.is_running;
+        const running = aggStatus.is_running || compStatus.is_running || autoStatus.is_running || leanojCurrentStatus.is_running;
         setAnyWorkflowRunning(running);
       } catch (error) {
         console.error('Failed to check workflow status:', error);
@@ -2079,6 +2710,12 @@ function App() {
           </h1>
           <p className="banner-company">By Intrafere Research Group</p>
           <p className="banner-variant">A Prototype Artificial Superintelligence - Novelty Seeking Autonomous S.T.E.M. Researcher For Automated Theorem Generation</p>
+          <p
+            className={`banner-mode-subtitle ${appMode === 'manual' || appMode === 'leanoj' ? '' : 'banner-mode-subtitle--hidden'}`}
+            aria-hidden={appMode !== 'manual' && appMode !== 'leanoj'}
+          >
+            {appMode === 'manual' ? 'MANUAL S.T.E.M. WRITER' : 'Proof Solver Mode'}
+          </p>
         </div>
       </div>
 
@@ -2107,6 +2744,9 @@ function App() {
           >
             <option value="autonomous">Autonomous S.T.E.M. ASI</option>
             <option value="manual">Advanced Manual S.T.E.M. ASI</option>
+            {developerModeEnabled && (
+              <option value="leanoj">LeanOJ Proof Solver</option>
+            )}
           </select>
         </div>
         <div className="boost-control-row">
@@ -2178,9 +2818,17 @@ function App() {
             Hosted Web Mode
           </span>
         )}
+        {developerModeEnabled && (
+          <span
+            className="header-status-chip header-status-chip--ready"
+            title="Developer mode settings are enabled. Raw JSON editors are available in settings pages."
+          >
+            Developer Mode
+          </span>
+        )}
       </div>
       
-      <div className={`tabs ${appMode === 'manual' ? 'tabs-manual' : ''} ${shimmerAccentsEnabled ? 'tabs-shimmer-enabled' : ''}`}>
+      <div className={`tabs ${appMode === 'manual' ? 'tabs-manual' : ''} ${appMode === 'leanoj' ? 'tabs-leanoj' : ''} ${shimmerAccentsEnabled ? 'tabs-shimmer-enabled' : ''}`}>
         {appMode === 'autonomous' ? (
           <>
             {mainTabs.map((tab, index) => {
@@ -2227,6 +2875,32 @@ function App() {
               );
             })}
           </>
+        ) : appMode === 'leanoj' ? (
+          <>
+            {leanojMainTabs.map((tab) => (
+              <React.Fragment key={tab.id}>
+                <button
+                  className={`tab ${activeTab === tab.id ? 'active' : ''} tab-${tab.group}`}
+                  onClick={() => handleLeanOJTabSelect(tab.id)}
+                >
+                  {tab.label}
+                </button>
+              </React.Fragment>
+            ))}
+
+            <div className="tab-group-spacer-large"></div>
+
+            {leanojSettingsTabs.map((tab) => (
+              <React.Fragment key={tab.id}>
+                <button
+                  className={`tab ${activeTab === tab.id ? 'active' : ''} tab-${tab.group}`}
+                  onClick={() => handleLeanOJTabSelect(tab.id)}
+                >
+                  {tab.label}
+                </button>
+              </React.Fragment>
+            ))}
+          </>
         ) : (
           <>
             {manualTabs.map((tab, index) => {
@@ -2309,10 +2983,11 @@ function App() {
             <PaperLibrary
               papers={papers}
               onRefresh={refreshPapers}
-              archivedCount={autonomousStats?.paper_counts?.archived || 0}
+              archivedCount={autonomousStats?.paper_counts?.pruned || autonomousStats?.paper_counts?.archived || 0}
               api={{ 
                 getAutonomousPaper: autonomousAPI.getAutonomousPaper,
-                deletePaper: autonomousAPI.deletePaper
+                deletePaper: autonomousAPI.deletePaper,
+                deleteAllPrunedPapers: autonomousAPI.deleteAllPrunedPapers
               }}
             />
           )}
@@ -2382,6 +3057,49 @@ function App() {
               events={autonomousActivity}
             />
           )}
+
+          {activeTab === 'leanoj-interface' && (
+            <LeanOJInterface
+              isRunning={leanojRunning}
+              anyWorkflowRunning={anyWorkflowRunning}
+              status={leanojStatus}
+              activity={leanojActivity}
+              settings={leanojSettings}
+              onSettingsChange={setLeanojSettings}
+              onStart={handleLeanOJStart}
+              onStop={handleLeanOJStop}
+              onClear={handleLeanOJClear}
+              onSkipBrainstorm={handleLeanOJSkipBrainstorm}
+              onForceBrainstorm={handleLeanOJForceBrainstorm}
+            />
+          )}
+          {activeTab === 'leanoj-brainstorms' && (
+            <LeanOJBrainstorms status={leanojStatus} />
+          )}
+          {activeTab === 'leanoj-proofs' && (
+            <LeanOJMathematicalProofs
+              api={leanojAPI}
+              status={leanojStatus}
+              refreshToken={leanojProofRefreshToken}
+            />
+          )}
+          {activeTab === 'leanoj-master-proof' && (
+            <LeanOJMasterProof
+              api={leanojAPI}
+              status={leanojStatus}
+              refreshToken={leanojProofRefreshToken}
+            />
+          )}
+          {activeTab === 'leanoj-completed-proof-works' && (
+            <LeanOJProofLibrary
+              api={leanojAPI}
+              refreshToken={leanojProofRefreshToken}
+            />
+          )}
+          {activeTab === 'leanoj-logs' && (
+            <LeanOJLogs />
+          )}
+          {/* Full-width settings screens with model sidebars are rendered outside the padded tab container. */}
           
           {activeTab === 'aggregator-interface' && (
             <AggregatorInterface
@@ -2389,15 +3107,11 @@ function App() {
               setConfig={setConfig}
               capabilities={capabilities}
               anyWorkflowRunning={anyWorkflowRunning}
+              onWorkflowRunningChange={setAnyWorkflowRunning}
+              developerModeEnabled={developerModeEnabled}
             />
           )}
-          {activeTab === 'aggregator-settings' && (
-            <AggregatorSettings
-              config={config}
-              setConfig={setConfig}
-              capabilities={capabilities}
-            />
-          )}
+          {/* Full-width settings screens with model sidebars are rendered outside the padded tab container. */}
           {activeTab === 'aggregator-logs' && <AggregatorLogs />}
           {activeTab === 'aggregator-results' && <LiveResults />}
           
@@ -2406,11 +3120,11 @@ function App() {
               activeTab={activeTab}
               capabilities={capabilities}
               anyWorkflowRunning={anyWorkflowRunning}
+              onWorkflowRunningChange={setAnyWorkflowRunning}
+              developerModeEnabled={developerModeEnabled}
             />
           )}
-          {activeTab === 'compiler-settings' && (
-            <CompilerSettings capabilities={capabilities} />
-          )}
+          {/* Full-width settings screens with model sidebars are rendered outside the padded tab container. */}
           {activeTab === 'compiler-logs' && <CompilerLogs />}
           {activeTab === 'compiler-live-paper' && <LivePaper />}
         </div>
@@ -2424,6 +3138,33 @@ function App() {
           models={models}
           capabilities={capabilities}
           isRunning={autonomousRunning}
+          developerModeEnabled={developerModeEnabled}
+        />
+      )}
+
+      {activeTab === 'leanoj-settings' && (
+        <LeanOJSettings
+          settings={leanojSettings}
+          onSettingsChange={setLeanojSettings}
+          capabilities={capabilities}
+          isRunning={leanojRunning}
+          developerModeEnabled={developerModeEnabled}
+        />
+      )}
+
+      {activeTab === 'aggregator-settings' && (
+        <AggregatorSettings
+          config={config}
+          setConfig={setConfig}
+          capabilities={capabilities}
+          developerModeEnabled={developerModeEnabled}
+        />
+      )}
+
+      {activeTab === 'compiler-settings' && (
+        <CompilerSettings
+          capabilities={capabilities}
+          developerModeEnabled={developerModeEnabled}
         />
       )}
       
@@ -2509,6 +3250,7 @@ function App() {
         isOpen={showBoostModal}
         onClose={() => setShowBoostModal(false)}
         capabilities={capabilities}
+        developerModeEnabled={developerModeEnabled}
       />
       
       {/* OpenRouter API Key Modal */}
@@ -2566,6 +3308,7 @@ function App() {
           paperTitle={selectedCritiquePaper.paper_title}
           onGenerateCritique={handleGenerateCritique}
           onGetCritiques={handleGetCritiques}
+          developerModeEnabled={developerModeEnabled}
         />
       )}
       
@@ -2585,7 +3328,6 @@ function App() {
               rel="noopener noreferrer"
               className="footer-link footer-link-github"
             >
-              <span className="footer-icon">ℹ️</span>
               How MOTO's Superintelligence Works
             </a>
             <a
@@ -2594,7 +3336,7 @@ function App() {
               rel="noopener noreferrer"
               className="footer-link footer-link-purchase"
             >
-              Purchase a Custom ASI Program
+              Purchase Custom Industrial-Grade ASI Programs
             </a>
             <a
               href="https://github.com/"
@@ -2602,8 +3344,7 @@ function App() {
               rel="noopener noreferrer"
               className="footer-link footer-link-github"
             >
-              <span className="footer-icon">⭐</span>
-              Visit MOTO's GitHub (Star Us for More ASI Programs)
+              Intrafere GitHub
             </a>
           </div>
         </div>
diff --git a/frontend/src/components/ApiCallLogs.jsx b/frontend/src/components/ApiCallLogs.jsx
new file mode 100644
index 0000000..1b4bffd
--- /dev/null
+++ b/frontend/src/components/ApiCallLogs.jsx
@@ -0,0 +1,412 @@
+import React, { useCallback, useEffect, useRef, useState } from 'react';
+import './autonomous/AutonomousResearch.css';
+
+const EMPTY_API_STATS = Object.freeze({ // Zeroed stats shown when a response has no `stats` or after logs are cleared; freeze is shallow, so the nested by_* maps stay mutable.
+  total_calls: 0,
+  successful_calls: 0,
+  failed_calls: 0,
+  success_rate: 0,
+  boosted_calls: 0,
+  by_phase: {},
+  by_model: {},
+  by_provider: {},
+  by_source: {},
+  by_boost_mode: {},
+});
+
+function formatDuration(ms) { // Format a millisecond duration as "123ms" (rounds below 1000) or "1.2s"; returns '-' when the value is missing or not a finite number.
+  const value = ms === null || ms === undefined || ms === '' ? NaN : Number(ms); // Number(null) and Number('') are 0, so treat them as missing explicitly
+  if (!Number.isFinite(value)) return '-'; // avoids rendering "NaNs" for non-numeric input
+  return Math.round(value) < 1000 ? `${Math.round(value)}ms` : `${(value / 1000).toFixed(1)}s`; // compare the rounded value so 999.6 shows "1.0s", not "1000ms"
+}
+
+function formatTimestamp(timestamp) { // Localized date/time string for display; '-' when missing, the raw value when it cannot be parsed.
+  if (timestamp === null || timestamp === undefined) return '-'; // new Date(null) would otherwise render the 1970 epoch
+  const parsed = new Date(timestamp);
+  // toLocaleString() does not throw for an unparseable date; it returns "Invalid Date", so validity is tested explicitly.
+  if (Number.isNaN(parsed.getTime())) return String(timestamp);
+  return parsed.toLocaleString();
+}
+
+function getPhaseLabel(phase) { // Display label for a workflow phase id; unrecognized ids are shown verbatim, falsy ones as 'Unknown'.
+  const labels = new Map([
+    ['topic_selection', 'Topic'],
+    ['brainstorm', 'Brainstorm'],
+    ['paper_compilation', 'Paper'],
+    ['tier3', 'Tier 3'],
+    ['boost', 'Boost'],
+    ['initial_topic_candidates', 'Initial Topics'],
+    ['initial_brainstorm', 'Initial Brainstorm'],
+    ['recursive_brainstorm', 'Recursive Brainstorm'],
+    ['proof_storm', 'Legacy Proof Storm'],
+    ['path_decision', 'Path Decision'],
+    ['final_proof_loop', 'Final Proof Loop'],
+  ]);
+  return labels.has(phase) ? labels.get(phase) : phase || 'Unknown';
+}
+
+function getSourceLabel(source) {
+  // Display label for the `source` field of an API log entry.
+  if (source === 'api+boost') return 'Boosted';
+  if (source === 'boost') return 'Boost Only';
+  // Every other value, including a missing one, is labelled as a standard call.
+  return 'Standard';
+}
+
+function getBoostModeLabel(mode) {
+  // Display label for a boost mode id.
+  if (mode === 'next_count') return 'Next X';
+  if (mode === 'category') return 'Category';
+  if (mode === 'task_id') return 'Task ID';
+  // Unrecognized ids are shown verbatim; a falsy id becomes 'Unknown'.
+  return mode || 'Unknown';
+}
+
+function getProviderLabel(provider) {
+  // Abbreviated badge text for a provider id.
+  if (provider === 'openrouter') return 'OR';
+  if (provider === 'lm_studio') return 'LMS';
+  // Unrecognized ids are shown verbatim; a falsy id becomes 'UNK'.
+  return provider || 'UNK';
+}
+
+// ApiCallLogs: polls `api.getApiLogs` (optionally scoped by `workflow`), shows aggregate stats, and lists each
+// call as an expandable row; the detailed record for a row is fetched lazily through `api.getApiLogDetail`.
+// Props: api (getApiLogs, clearApiLogs, optional getApiLogDetail), workflow, title, emptyHint, style.
+export default function ApiCallLogs({
+  api,
+  workflow = null,
+  title = 'API Call Logs',
+  emptyHint = 'Run a workflow and make API calls to see the combined logs here.',
+  style,
+}) {
+  const [apiLogs, setApiLogs] = useState([]);
+  const [apiStats, setApiStats] = useState(null);
+  const [apiLogsLoading, setApiLogsLoading] = useState(true);
+  const [expandedApiLogKey, setExpandedApiLogKey] = useState(null); // key of the open row (not its index, which shifts on refresh)
+  const [apiAutoRefresh, setApiAutoRefresh] = useState(true);
+  const [apiLogDetails, setApiLogDetails] = useState({}); // log_key -> detailed log record
+  const abortControllerRef = useRef(null); // controller of the newest in-flight list request
+
+  const fetchApiLogs = useCallback(async () => {
+    if (abortControllerRef.current) {
+      abortControllerRef.current.abort(); // supersede any request still in flight
+    }
+
+    const controller = new AbortController();
+    abortControllerRef.current = controller;
+
+    try {
+      const response = await api.getApiLogs(100, { signal: controller.signal, workflow });
+      if (abortControllerRef.current !== controller) {
+        return; // a newer request, a clear, or an unmount replaced this one; drop the stale result
+      }
+
+      if (response.success) {
+        const logs = response.logs || [];
+        setApiLogs(logs);
+        setApiLogDetails((prev) => { // keep cached details only for logs that are still listed
+          const visibleKeys = new Set(logs.map((log) => log.log_key).filter(Boolean));
+          return Object.fromEntries(
+            Object.entries(prev).filter(([key]) => visibleKeys.has(key))
+          );
+        });
+        setApiStats(response.stats || EMPTY_API_STATS);
+      }
+    } catch (error) {
+      if (abortControllerRef.current !== controller) {
+        return;
+      }
+
+      if (error.name !== 'AbortError') {
+        console.error('Failed to fetch API logs:', error);
+      }
+    } finally {
+      if (abortControllerRef.current === controller) {
+        setApiLogsLoading(false);
+      }
+    }
+  }, [api, workflow]);
+
+  const fetchApiLogDetail = useCallback(async (log) => {
+    const logKey = log?.log_key;
+    if (!logKey || typeof api.getApiLogDetail !== 'function') {
+      return log; // no key or no detail endpoint: the summary record is all there is
+    }
+
+    if (apiLogDetails[logKey]) {
+      return apiLogDetails[logKey]; // already cached
+    }
+
+    try {
+      const response = await api.getApiLogDetail(logKey, { workflow });
+      const detailedLog = response.log || log;
+      setApiLogDetails((prev) => ({
+        ...prev,
+        [logKey]: detailedLog,
+      }));
+      return detailedLog;
+    } catch (error) {
+      console.error('Failed to fetch API log detail:', error);
+      return log;
+    }
+  }, [api, apiLogDetails, workflow]);
+
+  useEffect(() => {
+    fetchApiLogs();
+
+    let interval;
+    if (apiAutoRefresh) {
+      interval = setInterval(fetchApiLogs, 5000);
+    }
+
+    return () => {
+      if (interval) clearInterval(interval);
+      if (abortControllerRef.current) {
+        abortControllerRef.current.abort();
+        abortControllerRef.current = null;
+      }
+    };
+  }, [fetchApiLogs, apiAutoRefresh]);
+
+  const handleClearApiLogs = async () => {
+    if (!window.confirm('Are you sure you want to clear these API logs?')) {
+      return;
+    }
+
+    try {
+      if (abortControllerRef.current) {
+        abortControllerRef.current.abort();
+        abortControllerRef.current = null; // makes any in-flight fetch ignore its result
+      }
+
+      await api.clearApiLogs({ workflow });
+      setApiLogs([]);
+      setApiLogDetails({});
+      setApiStats(EMPTY_API_STATS);
+      setExpandedApiLogKey(null);
+      setApiLogsLoading(false);
+    } catch (error) {
+      console.error('Failed to clear API logs:', error);
+    }
+  };
+
+  const copyToClipboard = async (text) => {
+    try {
+      await navigator.clipboard.writeText(text);
+    } catch (error) {
+      console.error('Failed to copy to clipboard:', error);
+    }
+  };
+
+  const handleToggleApiLog = (log, entryKey) => {
+    const nextKey = expandedApiLogKey === entryKey ? null : entryKey; // clicking the open row collapses it
+    setExpandedApiLogKey(nextKey);
+    if (nextKey !== null) {
+      fetchApiLogDetail(log);
+    }
+  };
+
+  const handleCopyLogText = async (log, fullField, previewField) => {
+    const detailedLog = await fetchApiLogDetail(log);
+    copyToClipboard(detailedLog?.[fullField] || log?.[previewField] || ''); // prefer full text, fall back to the preview
+  };
+
+  return (
+    <div className="api-logs-section" style={style}>
+      <div className="api-logs-header">
+        <h3>{title}</h3>
+        <div className="api-logs-actions">
+          <label className="auto-refresh-toggle">
+            <input
+              type="checkbox"
+              checked={apiAutoRefresh}
+              onChange={(e) => setApiAutoRefresh(e.target.checked)}
+            />
+            Auto-refresh
+          </label>
+          <button onClick={fetchApiLogs} className="refresh-btn" title="Refresh now">
+            Refresh
+          </button>
+          <button
+            onClick={handleClearApiLogs}
+            className="clear-btn"
+            disabled={apiLogs.length === 0}
+          >
+            Clear Logs
+          </button>
+        </div>
+      </div>
+
+      {apiStats && (
+        <div className="api-stats">
+          <div className="stat-card">
+            <span className="stat-value">{apiStats.total_calls}</span>
+            <span className="stat-label">Total API Calls</span>
+          </div>
+          <div className="stat-card success">
+            <span className="stat-value">{apiStats.successful_calls}</span>
+            <span className="stat-label">Successful</span>
+          </div>
+          <div className="stat-card error">
+            <span className="stat-value">{apiStats.failed_calls}</span>
+            <span className="stat-label">Failed</span>
+          </div>
+          <div className="stat-card">
+            <span className="stat-value">{((apiStats.success_rate || 0) * 100).toFixed(1)}%</span>
+            <span className="stat-label">Success Rate</span>
+          </div>
+          <div className="stat-card">
+            <span className="stat-value">{apiStats.boosted_calls || 0}</span>
+            <span className="stat-label">Boosted Calls</span>
+          </div>
+        </div>
+      )}
+
+      {apiStats && apiStats.by_phase && Object.keys(apiStats.by_phase).length > 0 && (
+        <div className="phase-stats">
+          <span className="phase-stats-label">By Phase:</span>
+          {Object.entries(apiStats.by_phase).map(([phase, count]) => (
+            <span key={phase} className="phase-stat-badge">
+              {getPhaseLabel(phase)}: {count}
+            </span>
+          ))}
+        </div>
+      )}
+
+      {apiStats && apiStats.by_source && Object.keys(apiStats.by_source).length > 0 && (
+        <div className="phase-stats">
+          <span className="phase-stats-label">By Source:</span>
+          {Object.entries(apiStats.by_source).map(([source, count]) => (
+            <span key={source} className="phase-stat-badge">
+              {getSourceLabel(source)}: {count}
+            </span>
+          ))}
+        </div>
+      )}
+
+      {apiStats && apiStats.by_boost_mode && Object.keys(apiStats.by_boost_mode).length > 0 && (
+        <div className="phase-stats">
+          <span className="phase-stats-label">Boost Modes:</span>
+          {Object.entries(apiStats.by_boost_mode).map(([mode, count]) => (
+            <span key={mode} className="phase-stat-badge">
+              {getBoostModeLabel(mode)}: {count}
+            </span>
+          ))}
+        </div>
+      )}
+
+      <div className="api-logs-list">
+        {apiLogsLoading ? (
+          <div className="logs-loading">Loading API logs...</div>
+        ) : apiLogs.length === 0 ? (
+          <div className="logs-empty">
+            <p>No API calls logged yet.</p>
+            <p className="logs-empty-hint">{emptyHint}</p>
+          </div>
+        ) : (
+          apiLogs.map((log, index) => {
+            const detailedLog = log.log_key ? (apiLogDetails[log.log_key] || log) : log;
+            const entryKey = log.log_key || `${log.timestamp || 'log'}-${log.task_id || index}`;
+            const isExpanded = expandedApiLogKey === entryKey; // keyed so a refresh cannot move the open panel to another log
+            return (
+            <div
+              key={entryKey}
+              className={`api-log-entry ${log.success ? 'success' : 'error'} ${isExpanded ? 'expanded' : ''}`}
+            >
+              <div className="log-summary"
+                onClick={() => handleToggleApiLog(log, entryKey)}
+              >
+                <div className="log-status">{log.success ? '✓' : '✗'}</div>
+                <div className="log-info">
+                  <div className="log-task">
+                    <span className="log-task-id">{log.task_id}</span>
+                    <span className="log-phase-badge">{getPhaseLabel(log.phase)}</span>
+                    <span className={`log-source-badge ${log.boosted ? 'boosted' : 'standard'}`}>
+                      {getSourceLabel(log.source)}
+                    </span>
+                    {log.boost_mode && (
+                      <span className="log-boost-mode-badge">{getBoostModeLabel(log.boost_mode)}</span>
+                    )}
+                  </div>
+                  <div className="log-meta">
+                    <span className="log-model">{log.model}</span>
+                    <span className="log-provider-badge">{getProviderLabel(log.provider)}</span>
+                    <span className="log-duration">{formatDuration(log.duration_ms)}</span>
+                    {log.tokens_used > 0 && (
+                      <span className="log-tokens">{log.tokens_used} tokens</span>
+                    )}
+                  </div>
+                </div>
+                <div className="log-timestamp">{formatTimestamp(log.timestamp)}</div>
+                <div className="log-expand-icon">{isExpanded ? '▼' : '▶'}</div>
+              </div>
+
+              {isExpanded && (
+                <div className="log-details">
+                  <div className="log-detail-section">
+                    <h4>Role</h4>
+                    <pre>{log.role_id}</pre>
+                  </div>
+
+                  <div className="log-detail-section">
+                    <h4>Source</h4>
+                    <pre>{getSourceLabel(log.source)}{log.boost_mode ? ` (${getBoostModeLabel(log.boost_mode)})` : ''}</pre>
+                  </div>
+
+                  {log.error && (
+                    <div className="log-detail-section error">
+                      <h4>Error</h4>
+                      <pre>{log.error}</pre>
+                    </div>
+                  )}
+
+                  <div className="log-detail-section">
+                    <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center' }}>
+                      <h4>Sent Prompt</h4>
+                      <button
+                        onClick={(e) => {
+                          e.stopPropagation();
+                          handleCopyLogText(log, 'prompt_full', 'prompt_preview');
+                        }}
+                        className="copy-btn"
+                        title={detailedLog.has_full_prompt ? 'Copy full prompt to clipboard' : 'Copy prompt preview to clipboard'}
+                      >
+                        {detailedLog.has_full_prompt ? 'Copy Full' : 'Copy Preview'}
+                      </button>
+                    </div>
+                    {detailedLog.prompt_redacted && (
+                      <div className="settings-hint">Full prompt redacted; preview and size/hash metadata are retained.</div>
+                    )}
+                    <pre className="log-preview">{detailedLog.prompt_preview || log.prompt_preview || '(empty)'}</pre>
+                  </div>
+
+                  <div className="log-detail-section">
+                    <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center' }}>
+                      <h4>Received Response</h4>
+                      <button
+                        onClick={(e) => {
+                          e.stopPropagation();
+                          handleCopyLogText(log, 'response_full', 'response_preview');
+                        }}
+                        className="copy-btn"
+                        title={detailedLog.has_full_response ? 'Copy full response to clipboard' : 'Copy response preview to clipboard'}
+                      >
+                        {detailedLog.has_full_response ? 'Copy Full' : 'Copy Preview'}
+                      </button>
+                    </div>
+                    {detailedLog.response_redacted && (
+                      <div className="settings-hint">Full response redacted; preview and size/hash metadata are retained.</div>
+                    )}
+                    <pre className="log-response">{detailedLog.response_preview || log.response_preview || '(empty)'}</pre>
+                  </div>
+                </div>
+              )}
+            </div>
+            );
+          })
+        )}
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/BoostControlModal.jsx b/frontend/src/components/BoostControlModal.jsx
index 7aafed3..7364d6d 100644
--- a/frontend/src/components/BoostControlModal.jsx
+++ b/frontend/src/components/BoostControlModal.jsx
@@ -2,19 +2,31 @@ import React, { useState, useEffect, useRef } from 'react';
 import { boostAPI, openRouterAPI } from '../services/api';
 import {
   computeOpenRouterAutoSettings,
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+  DEFAULT_OPENROUTER_REASONING_EFFORT,
   findOpenRouterModel,
   getProviderNames,
+  getReasoningSupportInfo,
+  normalizeOpenRouterReasoningEffort,
+  OPENROUTER_REASONING_EFFORT_OPTIONS,
 } from '../utils/openRouterSelection';
 import './BoostControlModal.css';
 
 const BOOST_SETTINGS_STORAGE_KEY = 'boost_modal_settings';
 
-export default function BoostControlModal({ isOpen, onClose, capabilities }) {
+export default function BoostControlModal({
+  isOpen,
+  onClose,
+  capabilities,
+  developerModeEnabled = false,
+}) {
   const [apiKey, setApiKey] = useState('');
   const [boostModel, setBoostModel] = useState('');
   const [selectedProvider, setSelectedProvider] = useState('');
-  const [contextWindow, setContextWindow] = useState(131072);
-  const [maxOutputTokens, setMaxOutputTokens] = useState(25000);
+  const [reasoningEffort, setReasoningEffort] = useState(DEFAULT_OPENROUTER_REASONING_EFFORT);
+  const [contextWindow, setContextWindow] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [maxOutputTokens, setMaxOutputTokens] = useState(DEFAULT_MAX_OUTPUT_TOKENS);
   const [models, setModels] = useState([]);
   const [providerData, setProviderData] = useState(null);
   const [loading, setLoading] = useState(false);
@@ -31,6 +43,7 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
 
   const hasAvailableKey = Boolean(apiKey.trim() || hasGlobalKey);
   const providers = getProviderNames(providerData);
+  const reasoningInfo = getReasoningSupportInfo(providerData, selectedProvider || null);
   const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
   
   // Load saved settings from localStorage on mount
@@ -41,6 +54,7 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
         const settings = JSON.parse(saved);
         if (settings.boostModel) setBoostModel(settings.boostModel);
         if (settings.selectedProvider) setSelectedProvider(settings.selectedProvider);
+        if (settings.reasoningEffort) setReasoningEffort(normalizeOpenRouterReasoningEffort(settings.reasoningEffort));
         if (settings.contextWindow) setContextWindow(settings.contextWindow);
         if (settings.maxOutputTokens) setMaxOutputTokens(settings.maxOutputTokens);
         if (settings.freeOnly !== undefined) setFreeOnly(settings.freeOnly);
@@ -53,11 +67,12 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
   // Save settings to localStorage whenever they change
   useEffect(() => {
     // Only save if we have meaningful values (not initial empty state)
-    if (boostModel || selectedProvider || contextWindow !== 131072 || maxOutputTokens !== 25000 || freeOnly) {
+    if (boostModel || selectedProvider || reasoningEffort !== DEFAULT_OPENROUTER_REASONING_EFFORT || contextWindow !== DEFAULT_CONTEXT_WINDOW || maxOutputTokens !== DEFAULT_MAX_OUTPUT_TOKENS || freeOnly) {
       try {
         const settings = {
           boostModel,
           selectedProvider,
+          reasoningEffort,
           contextWindow,
           maxOutputTokens,
           freeOnly
@@ -67,7 +82,7 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
         console.error('Failed to save boost settings to localStorage:', e);
       }
     }
-  }, [boostModel, selectedProvider, contextWindow, maxOutputTokens, freeOnly]);
+  }, [boostModel, selectedProvider, reasoningEffort, contextWindow, maxOutputTokens, freeOnly]);
 
   const fetchProviders = async (modelId, keyOverride = undefined) => {
     if (!modelId) {
@@ -128,6 +143,7 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
           // Boost is enabled - use backend values (they're authoritative)
           setBoostModel(response.status.model_id);
           setSelectedProvider(response.status.provider || '');
+          setReasoningEffort(normalizeOpenRouterReasoningEffort(response.status.reasoning_effort));
           setContextWindow(response.status.context_window);
           setMaxOutputTokens(response.status.max_output_tokens);
           if (response.status.model_id) {
@@ -139,6 +155,7 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
             const settings = {
               boostModel: response.status.model_id,
               selectedProvider: response.status.provider || '',
+              reasoningEffort: normalizeOpenRouterReasoningEffort(response.status.reasoning_effort),
               contextWindow: response.status.context_window,
               maxOutputTokens: response.status.max_output_tokens,
               freeOnly
@@ -161,6 +178,7 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
   const handleModelChange = async (modelId) => {
     setBoostModel(modelId);
     setSelectedProvider(''); // Reset provider when model changes
+    setReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
     if (modelId) {
       const autoSettings = await getAutoSettingsForModel(modelId, null);
       if (autoSettings) {
@@ -300,6 +318,7 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
         openrouter_api_key: trimmedApiKey,
         boost_model_id: boostModel,
         boost_provider: selectedProvider || null,
+        boost_reasoning_effort: reasoningEffort,
         boost_context_window: contextWindow,
         boost_max_output_tokens: maxOutputTokens
       };
@@ -504,6 +523,26 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
             </div>
           )}
 
+          {boostModel && (
+            <div className="boost-form-group">
+              <label>Reasoning Effort</label>
+              <select
+                value={normalizeOpenRouterReasoningEffort(reasoningEffort)}
+                onChange={(e) => setReasoningEffort(e.target.value)}
+                disabled={loading}
+              >
+                {OPENROUTER_REASONING_EFFORT_OPTIONS.map(option => (
+                  <option key={option.value} value={option.value}>{option.label}</option>
+                ))}
+              </select>
+              <small>
+                {reasoningInfo.hasEndpointMetadata && !reasoningInfo.supportsReasoning
+                  ? 'This selected provider does not advertise reasoning support; OpenRouter may ignore the setting.'
+                  : 'Auto sends OpenRouter max reasoning effort by default.'}
+              </small>
+            </div>
+          )}
+
           <div className="form-row">
             <div className="boost-form-group">
               <label>Context Window</label>
@@ -559,6 +598,9 @@ export default function BoostControlModal({ isOpen, onClose, capabilities }) {
             <ul>
               <li>Click tasks in the MOTO Workflow panel to toggle boost</li>
               <li>Boosted tasks use your selected OpenRouter model and optional host provider</li>
+              {developerModeEnabled && (
+                <li>Supercharge is enabled per role in each settings panel; when Boost also applies, all 5 Supercharge calls use this Boost model</li>
+              )}
               <li>
                 {lmStudioEnabled
                   ? 'If boost credits or provider capacity fail, the task falls back to its primary model path for that call'
diff --git a/frontend/src/components/CritiqueNotificationStack.jsx b/frontend/src/components/CritiqueNotificationStack.jsx
index b37a9fc..5b5f15f 100644
--- a/frontend/src/components/CritiqueNotificationStack.jsx
+++ b/frontend/src/components/CritiqueNotificationStack.jsx
@@ -41,12 +41,12 @@ function getRatingColor(rating) {
  * - Max 3 notifications (FIFO queue)
  * - Click to open critique modal
  * - X button to dismiss
- * - Persists across screens (not localStorage)
+ * - Seen notification keys are tracked by the parent to avoid replay loops
  * 
  * Props:
- * - notifications: Array of notification objects { id, paper_id, paper_title, average_rating, timestamp }
+ * - notifications: Array of notification objects { id, paper_id, paper_title, average_rating, timestamp, seenKey }
  * - onDismiss: (id) => void - callback when notification is dismissed
- * - onClickNotification: (paper_id, paper_title) => void - callback when notification is clicked
+ * - onClickNotification: (paper_id, paper_title, seenKey) => void - callback when notification is clicked
  */
 export default function CritiqueNotificationStack({ notifications, onDismiss, onClickNotification, panelCollapsed }) {
   if (!notifications || notifications.length === 0) {
@@ -98,7 +98,7 @@ function CritiqueNotification({ notification, index, onDismiss, onClickNotificat
   };
 
   const handleClick = () => {
-    onClickNotification(notification.paper_id, notification.paper_title);
+    onClickNotification(notification.paper_id, notification.paper_title, notification.seenKey);
   };
 
   return (
diff --git a/frontend/src/components/HelpTooltip.jsx b/frontend/src/components/HelpTooltip.jsx
index 7a0eac1..d84d253 100644
--- a/frontend/src/components/HelpTooltip.jsx
+++ b/frontend/src/components/HelpTooltip.jsx
@@ -10,6 +10,7 @@ export default function HelpTooltip({
   popupStyle,
   buttonContent = '?',
   useFixedPosition = false,
+  fixedPlacement = 'above-right',
 }) {
   const [isOpen, setIsOpen] = useState(false);
   const [fixedPopupStyle, setFixedPopupStyle] = useState(null);
@@ -31,11 +32,22 @@ export default function HelpTooltip({
     const viewportPadding = 16;
 
     let left = buttonRect.right + gap;
-    if (left + popupRect.width > window.innerWidth - viewportPadding) {
+    let top = buttonRect.top - popupRect.height - gap;
+
+    if (fixedPlacement === 'side-right') {
+      if (left + popupRect.width > window.innerWidth - viewportPadding) {
+        left = buttonRect.left - popupRect.width - gap;
+      }
+      left = Math.max(viewportPadding, left);
+      top = buttonRect.top + (buttonRect.height - popupRect.height) / 2;
+    } else if (left + popupRect.width > window.innerWidth - viewportPadding) {
       left = Math.max(viewportPadding, window.innerWidth - popupRect.width - viewportPadding);
     }
 
-    const top = Math.max(viewportPadding, buttonRect.top - popupRect.height - gap);
+    top = Math.min(
+      Math.max(viewportPadding, top),
+      Math.max(viewportPadding, window.innerHeight - popupRect.height - viewportPadding)
+    );
 
     setFixedPopupStyle({
       position: 'fixed',
@@ -45,7 +57,7 @@ export default function HelpTooltip({
       bottom: 'auto',
       zIndex: 100000,
     });
-  }, [useFixedPosition]);
+  }, [fixedPlacement, useFixedPosition]);
 
   const showTooltip = () => {
     setIsOpen(true);
diff --git a/frontend/src/components/HighlightedModelsSidebar.jsx b/frontend/src/components/HighlightedModelsSidebar.jsx
new file mode 100644
index 0000000..7b2a459
--- /dev/null
+++ b/frontend/src/components/HighlightedModelsSidebar.jsx
@@ -0,0 +1,210 @@
+import React, { useState } from 'react';
+import HelpTooltip from './HelpTooltip';
+import ProofStrengthBadge from './ProofStrengthBadge';
+import './settings-common.css';
+import './autonomous/AutonomousResearch.css';
+
+/**
+ * Small "OS" tag with tooltip text explaining that the model is open source.
+ * The anchor span has tabIndex 0 so it can receive keyboard focus.
+ */
+const OsTag = () => (
+  <span className="os-tag-tooltip-anchor" tabIndex={0}>
+    <span className="os-tag">OS</span>
+    <span className="os-tag-tooltip">
+      Open source — weights available on Hugging Face for local use with LM Studio.
+    </span>
+  </span>
+);
+
+/**
+ * Static sidebar listing highlighted models: a "Leaderboard" podium with
+ * gold, silver and bronze entries, followed by a flat list of further models.
+ * Every entry is hard-coded in the markup; the component takes no props.
+ */
+export default function HighlightedModelsSidebar() {
+  // Whether the "King of the Hill" tooltip beside the gold entry is rendered.
+  const [showKothTooltip, setShowKothTooltip] = useState(false);
+
+  return (
+    <div className="settings-left-sidebar">
+      <div className="known-models-sidebar">
+        <h3 className="flex-row-center">
+          <span>Highlighted Models</span>
+          <HelpTooltip
+            label="Learn about highlighted models"
+            popupClassName="help-tooltip-popup--fixed"
+            useFixedPosition
+            fixedPlacement="side-right"
+          >
+            The models and hosts listed here are not affiliated with MOTO or Intrafere LLC. This chart reflects developer-tested configurations intended to help guide model selection. All statements regarding pricing, performance, roles, rankings, or capabilities are speculative and based on individual testing experience. Intrafere LLC and the MOTO development team make no guarantees about the accuracy of this chart. MOTO is compatible with the majority of models, including many not listed here.
+          </HelpTooltip>
+        </h3>
+        <p className="hint-text hint-text--dim" style={{ marginLeft: '20px', marginBottom: '0.45rem' }}>
+          Note: Most models over 20 billion parameters are compatible with MOTO.
+        </p>
+        <div className="models-list">
+          <div className="models-podium">
+            <div className="models-podium-label">Leaderboard</div>
+            <div className="model-item model-item--ranked model-item--gold model-item--os">
+              <OsTag />
+              <div className="flex-row-center">
+                <div className="model-item-name">Kimi K2.6</div>
+                <div
+                  className="help-tooltip-anchor"
+                  style={{ zIndex: 100 }}
+                  aria-label="Learn about the King of the Hill ranking"
+                  onMouseEnter={() => setShowKothTooltip(true)}
+                  onMouseLeave={() => setShowKothTooltip(false)}
+                  onFocus={() => setShowKothTooltip(true)}
+                  onBlur={() => setShowKothTooltip(false)}
+                  tabIndex={0}
+                >
+                  <div className="ranking-badge ranking-badge--gold">👑 KING OF THE HILL</div>
+                  {showKothTooltip && (
+                    <div
+                      className="help-tooltip-popup"
+                      style={{ top: 'auto', bottom: 'calc(100% + 10px)', left: 'calc(100% + 10px)', right: 'auto' }}
+                    >
+                      This model was chosen by the Intrafere developers as the best overall performer in the MOTO harness, optimized for cost, speed, and knowledge.
+                    </div>
+                  )}
+                </div>
+              </div>
+              <div className="model-item-badge">Highly knowledgeable and balanced cost</div>
+            </div>
+
+            <div className="model-item model-item--ranked model-item--silver">
+              <div className="flex-row-center">
+                <div className="model-item-name">Gemini 3.1 Flash Light</div>
+                <div className="ranking-badge ranking-badge--silver">🥈 SILVER</div>
+              </div>
+              <div className="model-item-badge">Highly Knowledgeable, Fast</div>
+            </div>
+
+            <div className="model-item model-item--ranked model-item--bronze model-item--os">
+              <OsTag />
+              <div className="flex-row-center">
+                <div className="model-item-name">GPT OSS 120B</div>
+                <div className="ranking-badge ranking-badge--bronze">🥉 BRONZE</div>
+              </div>
+              <div className="model-item-badge">Balanced knowledge and speed at low cost</div>
+            </div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">Arcee AI's Trinity Large</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">Amazon Nova Pro/Premier</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item">
+            <ProofStrengthBadge variant="leaderboard" className="ps-badge-anchor--model-only" />
+            <div className="model-item-name">Claude Opus/Sonnet/Haiku</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">DeepSeek</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">Gemini Flash</div>
+            <div className="model-item-badge">Fast validator</div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">Gemini Pro</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">Google's Gemma</div>
+            <div className="model-item-badge">Balanced knowledge and speed</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">GLM</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">GLM Turbo</div>
+            <div className="model-item-badge">Fast validator</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">OpenAI's GPT OSS</div>
+            <div className="model-item-badge">Balanced knowledge and speed</div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">Grok</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item">
+            <ProofStrengthBadge variant="leaderboard" className="ps-badge-anchor--model-only" />
+            <div className="model-item-name">ChatGPT</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">Inception's Mercury</div>
+            <div className="model-item-badge">Rapid knowledge</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">Nemotron Super</div>
+            <div className="model-item-badge">Balanced knowledge and speed</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">Nous Hermes</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">Perplexity's Sonar</div>
+            <div className="model-item-badge">Native internet search capability</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">Microsoft's Phi</div>
+            <div className="model-item-badge">Balanced knowledge and speed</div>
+          </div>
+
+          <div className="model-item">
+            <div className="model-item-name">MiniMax</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">Qwen Coder</div>
+            <div className="model-item-badge">Computer science</div>
+          </div>
+
+          <div className="model-item model-item--os">
+            <OsTag />
+            <div className="model-item-name">Qwen</div>
+            <div className="model-item-badge">Highly knowledgeable</div>
+          </div>
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/LiveActivityFeed.jsx b/frontend/src/components/LiveActivityFeed.jsx
new file mode 100644
index 0000000..9404293
--- /dev/null
+++ b/frontend/src/components/LiveActivityFeed.jsx
@@ -0,0 +1,93 @@
+import React, { useEffect, useRef } from 'react';
+import { getActivityClass, getActivityIcon } from '../utils/activityStyles';
+import './autonomous/AutonomousResearch.css';
+
+/**
+ * Format an activity timestamp for display.
+ *
+ * Values that `Date` can parse are rendered with `toLocaleTimeString()`;
+ * anything else is returned unchanged, and falsy input yields ''.
+ */
+const formatActivityTime = (timestamp) => {
+  if (!timestamp) return '';
+
+  const parsed = new Date(timestamp);
+  if (!Number.isNaN(parsed.getTime())) {
+    return parsed.toLocaleTimeString();
+  }
+
+  return timestamp;
+};
+
+/**
+ * Scrollable activity feed with a header row.
+ *
+ * Props:
+ * - title: heading text
+ * - items: array of activity entries
+ * - emptyMessage: text shown when there is nothing to render
+ * - maxItems: when truthy, only the last `maxItems` entries are rendered
+ * - getEventName / getMessage / getTimestamp: accessors applied to one entry
+ * - getIcon / getClassName: called with (eventName, item)
+ * - headerAction: optional node rendered after the heading
+ */
+export default function LiveActivityFeed({
+  title = 'Live Activity',
+  items = [],
+  emptyMessage = 'No activity yet.',
+  maxItems,
+  getEventName = (item) => item?.event || item?.type || '',
+  getMessage = (item) => item?.message || item?.data?.message || '',
+  getTimestamp = (item) => item?.timestamp || item?.fullTimestamp || '',
+  getIcon = getActivityIcon,
+  getClassName = getActivityClass,
+  headerAction = null,
+}) {
+  const feedRef = useRef(null);
+  const prevLengthRef = useRef(0);
+  // Default parameters only cover undefined, so tolerate null/non-array input.
+  const allItems = Array.isArray(items) ? items : [];
+  const visibleItems = maxItems ? allItems.slice(-maxItems) : allItems;
+  const totalCount = allItems.length;
+
+  useEffect(() => {
+    // Track the full item count rather than the rendered count: once
+    // `maxItems` caps the rendered window its length stops growing, and the
+    // feed would no longer scroll to follow new entries.
+    if (totalCount > prevLengthRef.current && feedRef.current) {
+      feedRef.current.scrollTop = feedRef.current.scrollHeight;
+    }
+    prevLengthRef.current = totalCount;
+  }, [totalCount]);
+
+  return (
+    <div className="activity-section">
+      <div className="activity-section-header">
+        <h3>{title}</h3>
+        {headerAction}
+      </div>
+      <div className="activity-feed" ref={feedRef}>
+        {visibleItems.length === 0 ? (
+          <div className="activity-empty">{emptyMessage}</div>
+        ) : (
+          visibleItems.map((item, index) => {
+            const eventName = getEventName(item);
+            const timestamp = getTimestamp(item);
+            const message = getMessage(item) || eventName;
+
+            return (
+              <div
+                key={`${eventName}-${timestamp}-${index}`}
+                className={`activity-item ${getClassName(eventName, item)}`}
+              >
+                <span className="activity-icon">{getIcon(eventName, item)}</span>
+                <span className="activity-time">{formatActivityTime(timestamp)}</span>
+                <span className="activity-message">{message}</span>
+              </div>
+            );
+          })
+        )}
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/PaperCritiqueModal.jsx b/frontend/src/components/PaperCritiqueModal.jsx
index a0386f7..ee5326a 100644
--- a/frontend/src/components/PaperCritiqueModal.jsx
+++ b/frontend/src/components/PaperCritiqueModal.jsx
@@ -59,7 +59,7 @@ function getRatingBgColor(rating) {
 const AUTONOMOUS_SETTINGS_STORAGE_KEY = 'autonomous_research_settings';
 const COMPILER_SETTINGS_STORAGE_KEY = 'compiler_settings';
 
-function readStoredValidatorConfig(paperType) {
+function readStoredValidatorConfig(paperType, developerModeEnabled = false) {
   try {
     if (paperType === 'compiler_paper') {
       const raw = localStorage.getItem(COMPILER_SETTINGS_STORAGE_KEY);
@@ -79,6 +79,8 @@ function readStoredValidatorConfig(paperType) {
         validator_max_tokens: config.validatorMaxOutput,
         validator_provider: config.validatorProvider,
         validator_openrouter_provider: config.validatorOpenrouterProvider,
+        validator_openrouter_reasoning_effort: config.validatorOpenrouterReasoningEffort || 'auto',
+        validator_supercharge_enabled: developerModeEnabled && Boolean(config.validatorSuperchargeEnabled),
       };
     }
 
@@ -102,6 +104,8 @@ function readStoredValidatorConfig(paperType) {
       validator_max_tokens: localConfig.validator_max_tokens,
       validator_provider: localConfig.validator_provider,
       validator_openrouter_provider: localConfig.validator_openrouter_provider,
+      validator_openrouter_reasoning_effort: localConfig.validator_openrouter_reasoning_effort || 'auto',
+      validator_supercharge_enabled: developerModeEnabled && Boolean(localConfig.validator_supercharge_enabled),
     };
   } catch (error) {
     console.warn('Could not read validator config from localStorage:', error);
@@ -129,6 +133,7 @@ export default function PaperCritiqueModal({
   paperTitle,
   onGenerateCritique,
   onGetCritiques,
+  developerModeEnabled = false,
 }) {
   const [loading, setLoading] = useState(false);
   const [generating, setGenerating] = useState(false);
@@ -177,7 +182,7 @@ export default function PaperCritiqueModal({
         : 'autonomous_critique_custom_prompt';
       const customPrompt = localStorage.getItem(storageKey);
 
-      const validatorConfig = readStoredValidatorConfig(paperType);
+      const validatorConfig = readStoredValidatorConfig(paperType, developerModeEnabled);
       const result = await onGenerateCritique(customPrompt, validatorConfig);
       
       // Reload critiques to get the updated list
diff --git a/frontend/src/components/ProofStrengthBadge.jsx b/frontend/src/components/ProofStrengthBadge.jsx
new file mode 100644
index 0000000..e7402ec
--- /dev/null
+++ b/frontend/src/components/ProofStrengthBadge.jsx
@@ -0,0 +1,27 @@
+import React from 'react';
+import './settings-common.css';
+
+const LEADERBOARD_TOOLTIP = 'This company\'s state-of-the-art model has been seen in MOTO testing to solve complex mathematical proofs and perform well in Submitter 1 (Main Submitter), High-Context Submitter, and High-Parameter Submitter, the three primary proof-creation roles.';
+
+const ROLE_TOOLTIP = 'These are the three roles that submit proofs: Submitter 1 (Main Submitter), High-Context Submitter, and High-Parameter Submitter. For the best chance of creating novel proofs, use models comparable to those marked PS in the Highlighted Models list.';
+
+/**
+ * "PS" badge with an attached tooltip span.
+ *
+ * `variant="leaderboard"` picks the leaderboard tooltip text and modifier
+ * class; every other value uses the role text and modifier class.
+ * `className` is appended to the anchor's class list.
+ */
+export default function ProofStrengthBadge({ variant = 'role', className = '' }) {
+  const isLeaderboard = variant === 'leaderboard';
+  const tooltipText = isLeaderboard ? LEADERBOARD_TOOLTIP : ROLE_TOOLTIP;
+  const modifier = isLeaderboard ? 'ps-badge-anchor--leaderboard' : 'ps-badge-anchor--role';
+  const anchorClasses = ('ps-badge-anchor ' + modifier + ' ' + className).trim();
+
+  return (
+    <span className={anchorClasses} tabIndex={0}>
+      <span className="ps-badge">PS</span>
+      <span className="ps-badge-tooltip">{tooltipText}</span>
+    </span>
+  );
+}
diff --git a/frontend/src/components/RawSettingsEditor.jsx b/frontend/src/components/RawSettingsEditor.jsx
new file mode 100644
index 0000000..111d14e
--- /dev/null
+++ b/frontend/src/components/RawSettingsEditor.jsx
@@ -0,0 +1,55 @@
+import React from 'react';
+
+/**
+ * Textarea-based editor for the raw settings JSON with a save button.
+ *
+ * Props:
+ * - value: current text of the editor
+ * - onChange: called with the new text on every edit
+ * - onSave: click handler for the save button
+ * - message: status text; shown with the success style when it starts with
+ *   "Saved", otherwise with the error style
+ * - disabled: disables both the textarea and the button
+ */
+export default function RawSettingsEditor({
+  value,
+  onChange,
+  onSave,
+  message,
+  disabled = false,
+}) {
+  // Optional chaining alone only guards null/undefined; a non-string message
+  // (e.g. a number) has no startsWith and would throw during render.
+  const isSuccess = typeof message === 'string' && message.startsWith('Saved');
+
+  return (
+    <div className="settings-group">
+      <h4>Raw Settings JSON</h4>
+      <p className="settings-info">
+        Edit the full settings payload directly. Save only valid JSON.
+      </p>
+      <textarea
+        className="textarea-dark-mono"
+        aria-label="Raw settings JSON"
+        value={value}
+        onChange={(event) => onChange(event.target.value)}
+        disabled={disabled}
+        spellCheck={false}
+        style={{ minHeight: '440px' }}
+      />
+      <div className="actions-row">
+        <span className={isSuccess ? 'status-success-text' : 'error-text'}>
+          {message}
+        </span>
+        <button
+          type="button"
+          className="btn-success-sm"
+          onClick={onSave}
+          disabled={disabled}
+        >
+          Save Raw Settings
+        </button>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/WorkflowPanel.css b/frontend/src/components/WorkflowPanel.css
index a47c3e0..767b4e8 100644
--- a/frontend/src/components/WorkflowPanel.css
+++ b/frontend/src/components/WorkflowPanel.css
@@ -257,6 +257,14 @@
   border-bottom: 1px solid var(--border-subtle);
 }
 
+.token-stats-heading {
+  font-size: 0.75rem;
+  color: var(--text-muted);
+  text-transform: uppercase;
+  letter-spacing: 0.5px;
+  margin-bottom: 0.6rem;
+}
+
 .research-timer {
   display: flex;
   justify-content: space-between;
@@ -373,6 +381,7 @@
 
 .model-tokens {
   display: flex;
+  flex-wrap: wrap;
   gap: 0.75rem;
   font-family: 'Courier New', Courier, monospace;
   font-size: 0.7rem;
diff --git a/frontend/src/components/WorkflowPanel.jsx b/frontend/src/components/WorkflowPanel.jsx
index 4b45212..100b7ce 100644
--- a/frontend/src/components/WorkflowPanel.jsx
+++ b/frontend/src/components/WorkflowPanel.jsx
@@ -319,7 +319,7 @@ export default function WorkflowPanel({ isRunning }) {
                 <div className={`boost-section ${boostNextCount > 0 || boostAlwaysPrefer ? 'boost-mode-inactive' : ''}`}>
                   <label className="boost-label">Boost by Category:</label>
                   <div className="boost-categories">
-                    {['Aggregator', 'Compiler', 'Autonomous'].map(group => {
+                    {['Aggregator', 'Compiler', 'Autonomous', 'Proof Solver'].map(group => {
                       const groupCats = availableCategories.filter(cat => cat.group === group);
                       if (!groupCats.length) return null;
                       return (
@@ -349,6 +349,8 @@ export default function WorkflowPanel({ isRunning }) {
 
           {/* RESEARCH TIMER & TOKEN STATS */}
           <div className="token-stats-section">
+            <div className="token-stats-heading">Token Usage</div>
+
             <div className="research-timer">
               <span className="timer-label">Elapsed</span>
               <span className="timer-value">{formatTime(localElapsed)}</span>
@@ -356,15 +358,15 @@ export default function WorkflowPanel({ isRunning }) {
 
             <div className="token-totals">
               <div className="token-row">
-                <span className="token-label">Input</span>
+                <span className="token-label">Input tokens</span>
                 <span className="token-value">{formatNumber(tokenStats.total_input)}</span>
               </div>
               <div className="token-row">
-                <span className="token-label">Output</span>
+                <span className="token-label">Output tokens</span>
                 <span className="token-value">{formatNumber(tokenStats.total_output)}</span>
               </div>
               <div className="token-row token-total-row">
-                <span className="token-label">Total</span>
+                <span className="token-label">Total tokens</span>
                 <span className="token-value">{formatNumber(tokenStats.total_input + tokenStats.total_output)}</span>
               </div>
             </div>
@@ -375,7 +377,7 @@ export default function WorkflowPanel({ isRunning }) {
                   className="per-model-toggle"
                   onClick={() => setShowPerModel(prev => !prev)}
                 >
-                  {showPerModel ? '▾' : '▸'} Per Model ({Object.keys(tokenStats.by_model).length})
+                  {showPerModel ? '▾' : '▸'} Per-model tokens ({Object.keys(tokenStats.by_model).length})
                 </button>
                 {showPerModel && (
                   <div className="per-model-list">
@@ -385,8 +387,8 @@ export default function WorkflowPanel({ isRunning }) {
                         <div key={modelId} className="model-row">
                           <div className="model-name" title={modelId}>{modelId}</div>
                           <div className="model-tokens">
-                            <span className="model-in">In: {formatNumber(usage.input)}</span>
-                            <span className="model-out">Out: {formatNumber(usage.output)}</span>
+                            <span className="model-in">Input tokens: {formatNumber(usage.input)}</span>
+                            <span className="model-out">Output tokens: {formatNumber(usage.output)}</span>
                           </div>
                         </div>
                       ))}
diff --git a/frontend/src/components/aggregator/AggregatorInterface.jsx b/frontend/src/components/aggregator/AggregatorInterface.jsx
index 7be6406..9a71a8e 100644
--- a/frontend/src/components/aggregator/AggregatorInterface.jsx
+++ b/frontend/src/components/aggregator/AggregatorInterface.jsx
@@ -1,5 +1,6 @@
 import React, { useState, useEffect } from 'react';
 import { api } from '../../services/api';
+import { DEFAULT_MAX_OUTPUT_TOKENS } from '../../utils/openRouterSelection';
 import TextFileUploader from '../TextFileUploader';
 import '../settings-common.css';
 
@@ -8,6 +9,8 @@ export default function AggregatorInterface({
   setConfig,
   capabilities,
   anyWorkflowRunning = false,
+  onWorkflowRunningChange = null,
+  developerModeEnabled = false,
 }) {
   const [isRunning, setIsRunning] = useState(false);
   const [status, setStatus] = useState(null);
@@ -25,6 +28,9 @@ export default function AggregatorInterface({
       const data = await api.getStatus();
       setStatus(data);
       setIsRunning(data.is_running);
+      if (data.is_running) {
+        onWorkflowRunningChange?.(true);
+      }
     } catch (error) {
       console.error('Failed to fetch status:', error);
     }
@@ -89,9 +95,11 @@ export default function AggregatorInterface({
         provider: lmStudioEnabled ? (s.provider || 'lm_studio') : 'openrouter',
         model_id: s.modelId,
         openrouter_provider: s.openrouterProvider || null,
+        openrouter_reasoning_effort: s.openrouterReasoningEffort || 'auto',
         lm_studio_fallback_id: lmStudioEnabled ? (s.lmStudioFallbackId || null) : null,
         context_window: s.contextWindow,
-        max_output_tokens: s.maxOutputTokens
+        max_output_tokens: s.maxOutputTokens,
+        supercharge_enabled: developerModeEnabled && Boolean(s.superchargeEnabled)
       }));
 
       await api.startAggregator({
@@ -101,12 +109,15 @@ export default function AggregatorInterface({
         validator_provider: lmStudioEnabled ? (config.validatorProvider || 'lm_studio') : 'openrouter',
         validator_model: config.validatorModel,
         validator_openrouter_provider: config.validatorOpenrouterProvider || null,
+        validator_openrouter_reasoning_effort: config.validatorOpenrouterReasoningEffort || 'auto',
         validator_lm_studio_fallback: lmStudioEnabled ? (config.validatorLmStudioFallback || null) : null,
         validator_context_size: config.validatorContextSize,
-        validator_max_output_tokens: config.validatorMaxOutput || 25000,
+        validator_max_output_tokens: config.validatorMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS,
+        validator_supercharge_enabled: developerModeEnabled && Boolean(config.validatorSuperchargeEnabled),
         uploaded_files: config.uploadedFiles,
       });
       setIsRunning(true);
+      onWorkflowRunningChange?.(true);
     } catch (error) {
       console.error('Failed to start aggregator:', error);
       alert(`Failed to start aggregator: ${error.details || error.message}`);
@@ -117,6 +128,7 @@ export default function AggregatorInterface({
     try {
       await api.stopAggregator();
       setIsRunning(false);
+      onWorkflowRunningChange?.(false);
     } catch (error) {
       console.error('Failed to stop aggregator:', error);
       alert('Failed to stop aggregator');
@@ -124,7 +136,7 @@ export default function AggregatorInterface({
   };
 
   return (
-    <div>
+    <div className={`workflow-main-interface aggregator-interface ${isRunning ? 'workflow-main-interface--running' : ''}`}>
       <h1>Aggregator Interface</h1>
       
       <div className="metric-card">
diff --git a/frontend/src/components/aggregator/AggregatorSettings.jsx b/frontend/src/components/aggregator/AggregatorSettings.jsx
index a90b700..6768875 100644
--- a/frontend/src/components/aggregator/AggregatorSettings.jsx
+++ b/frontend/src/components/aggregator/AggregatorSettings.jsx
@@ -2,11 +2,21 @@ import React, { useState, useEffect } from 'react';
 import { api, openRouterAPI } from '../../services/api';
 import {
   computeOpenRouterAutoSettings,
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+  DEFAULT_OPENROUTER_REASONING_EFFORT,
   findOpenRouterModel,
   getProviderNames,
+  getReasoningSupportInfo,
   hasEndpointMetadata,
+  normalizeOpenRouterReasoningEffort,
+  OPENROUTER_REASONING_EFFORT_OPTIONS,
 } from '../../utils/openRouterSelection';
 import HelpTooltip from '../HelpTooltip';
+import HighlightedModelsSidebar from '../HighlightedModelsSidebar';
+import ProofStrengthBadge from '../ProofStrengthBadge';
+import RawSettingsEditor from '../RawSettingsEditor';
+import '../autonomous/AutonomousResearch.css';
 import '../settings-common.css';
 
 const DEFAULT_SUBMITTER_CONFIG = {
@@ -14,12 +24,28 @@ const DEFAULT_SUBMITTER_CONFIG = {
   provider: 'lm_studio',
   modelId: '',
   openrouterProvider: null,
+  openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
   lmStudioFallbackId: null,
-  contextWindow: 131072,
-  maxOutputTokens: 25000
+  contextWindow: DEFAULT_CONTEXT_WINDOW,
+  maxOutputTokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  superchargeEnabled: false
 };
 
-export default function AggregatorSettings({ config, setConfig, capabilities }) {
+// Confirmation text shown before switching from the raw JSON view back to the GUI.
+const RAW_VIEW_EXIT_WARNING = 'Switching back to the GUI view will restore your last GUI settings/profile and discard raw-only changes. Continue?';
+// Body text of the help tooltip attached to each Supercharge checkbox.
+const SUPERCHARGE_TOOLTIP = 'Supercharge makes this role generate 4 full answer attempts, then run a 5th same-model call to choose or synthesize the best final answer. It uses 5x the API calls, so it is about 5x slower and 5x more costly, but can produce more intelligent answers.';
+
+// Serializes a settings object as 2-space-indented JSON for the raw editor.
+const formatRawSettings = (value) => JSON.stringify(value, null, 2);
+
+// developerModeEnabled gates the raw JSON editor and the Supercharge toggles.
+export default function AggregatorSettings({
+  config,
+  setConfig,
+  capabilities,
+  developerModeEnabled = false,
+}) {
   const [lmStudioModels, setLmStudioModels] = useState([]);
   const [openRouterModels, setOpenRouterModels] = useState([]);
   const [modelProviders, setModelProviders] = useState({}); // { modelId: { providers: [], endpoints: [] } }
@@ -35,12 +57,14 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       { ...DEFAULT_SUBMITTER_CONFIG, submitterId: 3 }
     ]
   );
-  const [validatorMaxOutput, setValidatorMaxOutput] = useState(config.validatorMaxOutput || 25000);
+  const [validatorMaxOutput, setValidatorMaxOutput] = useState(config.validatorMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS);
   
   // Validator OpenRouter state
   const [validatorProvider, setValidatorProvider] = useState(config.validatorProvider || 'lm_studio');
   const [validatorOpenrouterProvider, setValidatorOpenrouterProvider] = useState(config.validatorOpenrouterProvider || null);
+  const [validatorOpenrouterReasoningEffort, setValidatorOpenrouterReasoningEffort] = useState(normalizeOpenRouterReasoningEffort(config.validatorOpenrouterReasoningEffort));
   const [validatorLmStudioFallback, setValidatorLmStudioFallback] = useState(config.validatorLmStudioFallback || null);
+  const [validatorSuperchargeEnabled, setValidatorSuperchargeEnabled] = useState(Boolean(config.validatorSuperchargeEnabled));
   
   // OpenRouter API key status
   const [hasOpenRouterKey, setHasOpenRouterKey] = useState(false);
@@ -49,8 +73,22 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
   const [freeModelLooping, setFreeModelLooping] = useState(true);
   const [freeModelAutoSelector, setFreeModelAutoSelector] = useState(true);
   const [isLoaded, setIsLoaded] = useState(false);
+  // Raw JSON editor state: visibility flag, editor text, status message, and
+  // the GUI settings snapshot taken when the editor is opened.
+  const [editRawSettings, setEditRawSettings] = useState(false);
+  const [rawSettingsText, setRawSettingsText] = useState('');
+  const [rawSettingsMessage, setRawSettingsMessage] = useState('');
+  const [guiSettingsBeforeRaw, setGuiSettingsBeforeRaw] = useState(null);
   const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
 
+  // Close the raw editor and clear its message once developer mode is off.
+  useEffect(() => {
+    if (!developerModeEnabled && editRawSettings) {
+      setEditRawSettings(false);
+      setRawSettingsMessage('');
+    }
+  }, [developerModeEnabled, editRawSettings]);
+
   // Load settings from localStorage on mount
   useEffect(() => {
     const loadSettings = async () => {
@@ -60,10 +95,17 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
           const settings = JSON.parse(savedSettings);
           // Restore all state variables
           if (settings.numSubmitters) setNumSubmitters(settings.numSubmitters);
-          if (settings.submitterConfigs) setSubmitterConfigs(settings.submitterConfigs);
+          if (settings.submitterConfigs) {
+            setSubmitterConfigs(settings.submitterConfigs.map((item) => ({
+              ...item,
+              openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(item.openrouterReasoningEffort),
+            })));
+          }
           if (settings.validatorProvider) setValidatorProvider(settings.validatorProvider);
           if (settings.validatorOpenrouterProvider) setValidatorOpenrouterProvider(settings.validatorOpenrouterProvider);
+          if (settings.validatorOpenrouterReasoningEffort) setValidatorOpenrouterReasoningEffort(normalizeOpenRouterReasoningEffort(settings.validatorOpenrouterReasoningEffort));
           if (settings.validatorLmStudioFallback) setValidatorLmStudioFallback(settings.validatorLmStudioFallback);
+          if (settings.validatorSuperchargeEnabled !== undefined) setValidatorSuperchargeEnabled(settings.validatorSuperchargeEnabled);
           if (settings.validatorMaxOutput) setValidatorMaxOutput(settings.validatorMaxOutput);
           if (settings.freeOnly !== undefined) setFreeOnly(settings.freeOnly);
           if (settings.freeModelLooping !== undefined) setFreeModelLooping(settings.freeModelLooping);
@@ -104,7 +146,9 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       submitterConfigs,
       validatorProvider,
       validatorOpenrouterProvider,
+      validatorOpenrouterReasoningEffort,
       validatorLmStudioFallback,
+      validatorSuperchargeEnabled,
       validatorMaxOutput,
       freeOnly,
       freeModelLooping,
@@ -112,7 +156,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       modelProviders
     };
     localStorage.setItem('aggregator_settings', JSON.stringify(settings));
-  }, [isLoaded, numSubmitters, submitterConfigs, validatorProvider, validatorOpenrouterProvider, validatorLmStudioFallback, validatorMaxOutput, freeOnly, freeModelLooping, freeModelAutoSelector, modelProviders]);
+  }, [isLoaded, numSubmitters, submitterConfigs, validatorProvider, validatorOpenrouterProvider, validatorOpenrouterReasoningEffort, validatorLmStudioFallback, validatorSuperchargeEnabled, validatorMaxOutput, freeOnly, freeModelLooping, freeModelAutoSelector, modelProviders]);
 
   useEffect(() => {
     if (lmStudioEnabled) {
@@ -136,6 +180,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
         provider: 'openrouter',
         modelId: keepOpenRouterState ? (submitterConfig.modelId || '') : '',
         openrouterProvider: keepOpenRouterState ? (submitterConfig.openrouterProvider || null) : null,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(submitterConfig.openrouterReasoningEffort),
         lmStudioFallbackId: null,
       };
     });
@@ -163,6 +208,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
         validatorOpenrouterProvider: keepValidatorOpenRouterState
           ? (prev.validatorOpenrouterProvider || null)
           : null,
+        validatorOpenrouterReasoningEffort: normalizeOpenRouterReasoningEffort(prev.validatorOpenrouterReasoningEffort),
         validatorLmStudioFallback: null,
       };
       return JSON.stringify(next) === JSON.stringify(prev) ? prev : next;
@@ -257,7 +303,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
   const handleSubmitterModelChange = async (submitterId, modelId) => {
     const baseConfigs = submitterConfigs.map(c =>
       c.submitterId === submitterId
-        ? { ...c, modelId, openrouterProvider: null }
+        ? { ...c, modelId, openrouterProvider: null, openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT }
         : c
     );
     setSubmitterConfigs(baseConfigs);
@@ -323,8 +369,10 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       ...prev,
       validatorModel: modelId,
       validatorOpenrouterProvider: null,
+      validatorOpenrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
     }));
     setValidatorOpenrouterProvider(null);
+    setValidatorOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
 
     if (validatorProvider !== 'openrouter' || !modelId) {
       return;
@@ -342,6 +390,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       ...prev,
       validatorModel: modelId,
       validatorOpenrouterProvider: null,
+      validatorOpenrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
       ...(autoSettings.contextWindowKnown ? { validatorContextSize: autoSettings.contextWindow } : {}),
       ...(autoSettings.outputCapKnown ? { validatorMaxOutput: autoSettings.maxOutputTokens } : {}),
     }));
@@ -368,7 +417,6 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
     }
     setConfig(prev => ({
       ...prev,
-      validatorOpenrouterProvider: providerName,
       ...(autoSettings.contextWindowKnown ? { validatorContextSize: autoSettings.contextWindow } : {}),
       ...(autoSettings.outputCapKnown ? { validatorMaxOutput: autoSettings.maxOutputTokens } : {}),
     }));
@@ -376,7 +424,8 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
 
   // Handle number of submitters change - expand/contract configs
   const handleNumSubmittersChange = (newNum) => {
-    const num = parseInt(newNum);
+    const parsed = parseInt(newNum, 10);
+    const num = Number.isFinite(parsed) ? Math.min(10, Math.max(1, parsed)) : 1;
     setNumSubmitters(num);
     
     const newConfigs = [];
@@ -393,9 +442,11 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
           provider: template.provider,
           modelId: template.modelId,
           openrouterProvider: template.openrouterProvider,
+          openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(template.openrouterReasoningEffort),
           lmStudioFallbackId: template.lmStudioFallbackId,
           contextWindow: template.contextWindow,
-          maxOutputTokens: template.maxOutputTokens
+          maxOutputTokens: template.maxOutputTokens,
+          superchargeEnabled: Boolean(template.superchargeEnabled)
         });
       }
     }
@@ -443,9 +494,9 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
     // Handle NaN for numeric fields - use defaults
     let safeValue = value;
     if (field === 'contextWindow' && isNaN(value)) {
-      safeValue = 131072;
+      safeValue = DEFAULT_CONTEXT_WINDOW;
     } else if (field === 'maxOutputTokens' && isNaN(value)) {
-      safeValue = 25000;
+      safeValue = DEFAULT_MAX_OUTPUT_TOKENS;
     }
     
     const newConfigs = submitterConfigs.map(c => {
@@ -457,6 +508,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       if (field === 'provider') {
         updated.modelId = '';
         updated.openrouterProvider = null;
+        updated.openrouterReasoningEffort = DEFAULT_OPENROUTER_REASONING_EFFORT;
         updated.lmStudioFallbackId = null;
       }
 
@@ -476,9 +528,11 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       provider: source.provider,
       modelId: source.modelId,
       openrouterProvider: source.openrouterProvider,
+      openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(source.openrouterReasoningEffort),
       lmStudioFallbackId: source.lmStudioFallbackId,
       contextWindow: source.contextWindow,
-      maxOutputTokens: source.maxOutputTokens
+      maxOutputTokens: source.maxOutputTokens,
+      superchargeEnabled: Boolean(source.superchargeEnabled)
     }));
     setSubmitterConfigs(newConfigs);
     setConfig(prev => ({ ...prev, submitterConfigs: newConfigs }));
@@ -490,6 +544,7 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
     setValidatorProvider(provider);
     if (provider === 'lm_studio') {
       setValidatorOpenrouterProvider(null);
+      setValidatorOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
       setValidatorLmStudioFallback(null);
     }
     setConfig(prev => ({
@@ -497,19 +552,163 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
       validatorProvider: provider,
       validatorModel: '',
       validatorOpenrouterProvider: null,
+      validatorOpenrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
       validatorLmStudioFallback: null
     }));
   };
 
+  // Collects every GUI-managed aggregator setting into the plain object that
+  // the raw JSON editor displays and that applyAggregatorRawSettings accepts.
+  const getAggregatorRawSettings = () => ({
+    userPrompt: config.userPrompt || '',
+    numSubmitters,
+    submitterConfigs,
+    validatorModel: config.validatorModel || '',
+    validatorProvider,
+    validatorOpenrouterProvider,
+    validatorOpenrouterReasoningEffort,
+    validatorLmStudioFallback,
+    validatorSuperchargeEnabled,
+    validatorContextSize: config.validatorContextSize || DEFAULT_CONTEXT_WINDOW,
+    validatorMaxOutput,
+    freeOnly,
+    freeModelLooping,
+    freeModelAutoSelector,
+    modelProviders,
+  });
+
+  // Applies a raw settings object to component state and the shared config.
+  // Malformed input is normalized rather than stored: submitter entries that
+  // are not objects are dropped, the list is capped at the GUI limit of 10,
+  // and sizes that are not positive numbers fall back to the defaults.
+  // Pass { updateRawText: false } to leave the raw editor text untouched.
+  const applyAggregatorRawSettings = (rawSettings, { updateRawText = true } = {}) => {
+    const toPositiveNumber = (value, fallback) => {
+      const numeric = Number(value);
+      return Number.isFinite(numeric) && numeric > 0 ? numeric : fallback;
+    };
+    const rawSubmitters = Array.isArray(rawSettings.submitterConfigs)
+      ? rawSettings.submitterConfigs
+          .filter((item) => item !== null && typeof item === 'object' && !Array.isArray(item))
+          .slice(0, 10)
+      : [];
+    const nextSubmitters = rawSubmitters.length > 0
+      ? rawSubmitters.map((item) => ({
+          ...item,
+          openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(item.openrouterReasoningEffort),
+        }))
+      : submitterConfigs;
+    // One card renders per submitterConfigs entry, so the count follows the
+    // list instead of a numSubmitters value that may be stale or out of range.
+    const nextNumSubmitters = nextSubmitters.length || 3;
+    const nextValidatorProvider = rawSettings.validatorProvider || 'lm_studio';
+    const nextValidatorOpenrouterProvider = rawSettings.validatorOpenrouterProvider || null;
+    const nextValidatorOpenrouterReasoningEffort = normalizeOpenRouterReasoningEffort(rawSettings.validatorOpenrouterReasoningEffort);
+    const nextValidatorLmStudioFallback = rawSettings.validatorLmStudioFallback || null;
+    const nextValidatorSuperchargeEnabled = Boolean(rawSettings.validatorSuperchargeEnabled);
+    const nextValidatorContextSize = toPositiveNumber(rawSettings.validatorContextSize, DEFAULT_CONTEXT_WINDOW);
+    const nextValidatorMaxOutput = toPositiveNumber(rawSettings.validatorMaxOutput, DEFAULT_MAX_OUTPUT_TOKENS);
+    const nextModelProviders = rawSettings.modelProviders || {};
+    const nextFreeOnly = rawSettings.freeOnly ?? false;
+    const nextFreeModelLooping = rawSettings.freeModelLooping ?? true;
+    const nextFreeModelAutoSelector = rawSettings.freeModelAutoSelector ?? true;
+
+    setNumSubmitters(nextNumSubmitters);
+    setSubmitterConfigs(nextSubmitters);
+    setValidatorProvider(nextValidatorProvider);
+    setValidatorOpenrouterProvider(nextValidatorOpenrouterProvider);
+    setValidatorOpenrouterReasoningEffort(nextValidatorOpenrouterReasoningEffort);
+    setValidatorLmStudioFallback(nextValidatorLmStudioFallback);
+    setValidatorSuperchargeEnabled(nextValidatorSuperchargeEnabled);
+    setValidatorMaxOutput(nextValidatorMaxOutput);
+    setFreeOnly(nextFreeOnly);
+    setFreeModelLooping(nextFreeModelLooping);
+    setFreeModelAutoSelector(nextFreeModelAutoSelector);
+    setModelProviders(nextModelProviders);
+
+    const configPatch = {
+      userPrompt: rawSettings.userPrompt || '',
+      submitterConfigs: nextSubmitters,
+      validatorModel: rawSettings.validatorModel || '',
+      validatorProvider: nextValidatorProvider,
+      validatorOpenrouterProvider: nextValidatorOpenrouterProvider,
+      validatorOpenrouterReasoningEffort: nextValidatorOpenrouterReasoningEffort,
+      validatorLmStudioFallback: nextValidatorLmStudioFallback,
+      validatorSuperchargeEnabled: nextValidatorSuperchargeEnabled,
+      validatorContextSize: nextValidatorContextSize,
+      validatorMaxOutput: nextValidatorMaxOutput,
+    };
+    // Functional update so the patch merges into the latest config rather than
+    // the snapshot captured when this render ran.
+    setConfig(prev => ({ ...prev, ...configPatch }));
+
+    if (updateRawText) {
+      // Echo back only the raw keys plus normalized values; unrelated config
+      // fields are deliberately kept out of the editor.
+      setRawSettingsText(formatRawSettings({
+        ...rawSettings,
+        ...configPatch,
+        numSubmitters: nextNumSubmitters,
+        freeOnly: nextFreeOnly,
+        freeModelLooping: nextFreeModelLooping,
+        freeModelAutoSelector: nextFreeModelAutoSelector,
+        modelProviders: nextModelProviders,
+      }));
+    }
+  };
+
+  // Toggles the raw JSON editor. Entering it snapshots the current GUI
+  // settings; leaving it (after confirmation) restores that snapshot.
+  const handleRawEditToggle = (checked) => {
+    if (checked) {
+      const currentSettings = getAggregatorRawSettings();
+      setGuiSettingsBeforeRaw(currentSettings);
+      setRawSettingsText(formatRawSettings(currentSettings));
+      setRawSettingsMessage('');
+      setEditRawSettings(true);
+      return;
+    }
+
+    if (!confirm(RAW_VIEW_EXIT_WARNING)) {
+      return;
+    }
+
+    if (guiSettingsBeforeRaw) {
+      applyAggregatorRawSettings(guiSettingsBeforeRaw, { updateRawText: false });
+    }
+    setRawSettingsMessage('');
+    setEditRawSettings(false);
+  };
+
+  // Parses the raw editor text and applies it. Syntax errors and non-object
+  // payloads are reported separately and leave the current settings untouched.
+  const saveRawSettings = () => {
+    let parsed;
+    try {
+      parsed = JSON.parse(rawSettingsText);
+    } catch (error) {
+      setRawSettingsMessage(`Invalid JSON: ${error.message}`);
+      return;
+    }
+    if (parsed === null || typeof parsed !== 'object' || Array.isArray(parsed)) {
+      setRawSettingsMessage('Invalid settings: expected a JSON object at the top level.');
+      return;
+    }
+    applyAggregatorRawSettings(parsed);
+    setRawSettingsMessage('Saved raw settings.');
+  };
+
   // Model selector component for either provider
   const ModelSelector = ({ 
     provider, 
     modelId, 
     openrouterProvider: orProvider, 
+    openrouterReasoningEffort,
     lmStudioFallbackId, 
     onModelChange, 
     onProviderChange, 
     onOpenrouterProviderChange, 
+    onOpenrouterReasoningEffortChange,
     onFallbackChange,
     label = 'Model'
   }) => {
@@ -518,12 +685,15 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
     const providers = modelId && effectiveProvider === 'openrouter'
       ? getProviderNames(modelProviders[modelId])
       : [];
+    const reasoningInfo = effectiveProvider === 'openrouter'
+      ? getReasoningSupportInfo(modelProviders[modelId], orProvider || null)
+      : { hasEndpointMetadata: false, supportsReasoning: false };
     
     return (
       <>
         {/* Provider Toggle */}
-        <div className="form-group form-group--compact">
-          <label className="label--sm">Provider</label>
+        <div className="settings-row">
+          <label>Provider</label>
           {lmStudioEnabled ? (
             <div className="provider-toggle-group">
               <button
@@ -537,26 +707,25 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                 type="button"
                 onClick={() => hasOpenRouterKey && onProviderChange('openrouter')}
                 disabled={!hasOpenRouterKey}
-                className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
+                className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or-orange' : ''}`}
                 title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
               >
                 OpenRouter
               </button>
             </div>
           ) : (
-            <small className="hint-text hint-text--dim">
+            <small className="settings-hint">
               OpenRouter is required in this deployment.
             </small>
           )}
         </div>
 
         {/* Model Selection */}
-        <div className="form-group form-group--compact">
-          <label className="label--sm">{label}</label>
+        <div className="settings-row">
+          <label>{label}</label>
           <select
             value={modelId || ''}
             onChange={(e) => onModelChange(e.target.value)}
-            className="select--sm"
           >
             <option value="">Select model...</option>
             {models.map(model => {
@@ -577,12 +746,11 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
 
         {/* OpenRouter Provider Selection (only for OpenRouter) */}
         {effectiveProvider === 'openrouter' && modelId && (
-          <div className="form-group form-group--compact">
-            <label className="label--sm">Host Provider (optional)</label>
+          <div className="settings-row">
+            <label>Host Provider (optional)</label>
             <select
               value={orProvider || ''}
               onChange={(e) => onOpenrouterProviderChange(e.target.value || null)}
-              className="select--sm"
             >
               <option value="">Auto (let OpenRouter choose)</option>
               {providers.map(p => (
@@ -592,23 +760,41 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
           </div>
         )}
 
+        {effectiveProvider === 'openrouter' && modelId && (
+          <div className="settings-row">
+            <label>Reasoning Effort</label>
+            <select
+              value={normalizeOpenRouterReasoningEffort(openrouterReasoningEffort)}
+              onChange={(e) => onOpenrouterReasoningEffortChange(e.target.value)}
+            >
+              {OPENROUTER_REASONING_EFFORT_OPTIONS.map(option => (
+                <option key={option.value} value={option.value}>{option.label}</option>
+              ))}
+            </select>
+            <small className="settings-hint">
+              {reasoningInfo.hasEndpointMetadata && !reasoningInfo.supportsReasoning
+                ? 'This selected host does not advertise reasoning support; OpenRouter may ignore the setting.'
+                : 'Auto sends OpenRouter max reasoning effort by default.'}
+            </small>
+          </div>
+        )}
+
         {/* LM Studio Fallback (only for OpenRouter) */}
         {effectiveProvider === 'openrouter' && lmStudioEnabled && (
-          <div className="form-group form-group--compact">
-            <label className="label--sm label--muted">
+          <div className="settings-row">
+            <label className="label--muted">
               LM Studio Fallback (optional)
             </label>
             <select
               value={lmStudioFallbackId || ''}
               onChange={(e) => onFallbackChange(e.target.value || null)}
-              className="select--sm"
             >
               <option value="">No fallback</option>
               {lmStudioModels.map(model => (
                 <option key={model.id} value={model.id}>{model.id}</option>
               ))}
             </select>
-            <small className="hint-text hint-text--dim" style={{ marginTop: '0.25rem' }}>
+            <small className="settings-hint" style={{ marginTop: '0.25rem' }}>
               Used if OpenRouter credits run out
             </small>
           </div>
@@ -618,15 +804,17 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
   };
 
   return (
-    <div>
-      <div className="settings-header-row">
-        <h1>Aggregator Settings</h1>
-        {saveMessage && (
-          <div className="save-message">
-            {saveMessage}
+    <div className="autonomous-settings-layout">
+      <HighlightedModelsSidebar />
+      <div className="autonomous-settings">
+          <div className="settings-header-row">
+            <h2>Aggregator Settings</h2>
+            {saveMessage && (
+              <div className="save-message">
+                {saveMessage}
+              </div>
+            )}
           </div>
-        )}
-      </div>
 
       {/* OpenRouter Status Banner */}
       {!hasOpenRouterKey && (
@@ -650,70 +838,113 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
         </div>
       ) : (
         <>
-          {/* Number of Submitters Slider */}
-          <div className="form-group settings-panel settings-panel--blue">
-            <label className="label--lg">
-              Number of Aggregator Submitters: {numSubmitters}
-            </label>
-            <input
-              type="range"
-              min="1"
-              max="10"
-              value={numSubmitters}
-              onChange={(e) => handleNumSubmittersChange(e.target.value)}
-              className="range-slider"
-            />
-            <div className="range-labels">
-              <span>1</span>
-              <span>5</span>
-              <span>10</span>
-            </div>
-            <small className="hint-text">
-              Multiple submitters run in parallel exploring different avenues. Each can use a different model.
-            </small>
+          <div className="model-refresh-controls">
+            {lmStudioEnabled && (
+              <button onClick={fetchModels} className="secondary">
+                Refresh LM Studio Models
+              </button>
+            )}
+            {hasOpenRouterKey && (
+              <>
+                <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary" disabled={loadingOpenRouter}>
+                  {loadingOpenRouter ? 'Loading...' : 'Refresh OpenRouter Models'}
+                </button>
+                <label className="settings-checkbox-label model-refresh-controls__toggle">
+                  <input
+                    type="checkbox"
+                    checked={freeOnly}
+                    onChange={(e) => setFreeOnly(e.target.checked)}
+                  />
+                  Free models only
+                </label>
+              </>
+            )}
+            {developerModeEnabled ? (
+              <label className="settings-checkbox-label model-refresh-controls__toggle">
+                <input
+                  type="checkbox"
+                  checked={editRawSettings}
+                  onChange={(e) => handleRawEditToggle(e.target.checked)}
+                />
+                Edit Raw
+              </label>
+            ) : (
+              <span className="settings-developer-mode-hint">
+                Developer mode: press Shift + Z + X to toggle raw JSON settings.
+              </span>
+            )}
           </div>
 
-          {/* Per-Submitter Configuration Cards */}
-          <div className="mb-2">
-            <h3 className="section-heading--bordered">
-              Submitter Configurations
-            </h3>
+          {editRawSettings ? (
+            <RawSettingsEditor
+              value={rawSettingsText}
+              onChange={setRawSettingsText}
+              onSave={saveRawSettings}
+              message={rawSettingsMessage}
+            />
+          ) : (
+            <>
+          <div className="settings-group">
+            <h4>Brainstorm Submitters (Tier 1 Aggregation)</h4>
+            <p className="settings-info">
+              Configure multiple parallel submitters for brainstorm exploration. Each submitter can use a different model or provider.
+            </p>
+
+            <div className="settings-row">
+              <label title="Number of parallel brainstorm submitters (1-10)">
+                Number of Submitters
+              </label>
+              <input
+                type="number"
+                min={1}
+                max={10}
+                step={1}
+                value={numSubmitters}
+                onChange={(e) => handleNumSubmittersChange(e.target.value)}
+              />
+              {numSubmitters > 1 && (
+                <button
+                  type="button"
+                  className="copy-btn"
+                  onClick={() => applyToAll(1)}
+                  title="Copy Main Submitter settings to all others"
+                >
+                  Copy Main to All
+                </button>
+              )}
+            </div>
             
             {submitterConfigs.map((cfg, idx) => (
+              (() => {
+                const effectiveProvider = lmStudioEnabled ? cfg.provider : 'openrouter';
+                return (
               <div 
                 key={cfg.submitterId}
-                className={`role-config-card${cfg.provider === 'openrouter' ? ' role-config-card--openrouter role-config-card--highlight' : (cfg.submitterId === 1 ? ' role-config-card--main role-config-card--highlight' : '')}`}
+                className={`submitter-config-section${effectiveProvider === 'openrouter' ? ' role-config-card--openrouter-orange' : (idx === 0 ? ' role-config-card--main' : '')}`}
               >
-                <div className="card-header-row">
-                  <h4 style={{ margin: 0 }} className={cfg.provider === 'openrouter' ? 'card-title--purple' : (cfg.submitterId === 1 ? 'card-title--green' : '')}>
-                    Submitter {cfg.submitterId} 
-                    {cfg.submitterId === 1 && <span className="provider-badge-inline"> (Main Submitter)</span>}
-                    {cfg.provider === 'openrouter' && <span className="provider-badge-inline" style={{ color: '#18cc17' }}> [OpenRouter]</span>}
-                  </h4>
-                  {cfg.submitterId === 1 && numSubmitters > 1 && (
-                    <button 
-                      onClick={() => applyToAll(1)}
-                      className="btn-apply-all"
-                    >
-                      Apply to All
-                    </button>
-                  )}
-                </div>
+                <h5 className={effectiveProvider === 'openrouter' ? 'card-title--orange' : (idx === 0 ? 'card-title--green' : '')}>
+                  <span className="role-title-with-badges">
+                    <span>{idx === 0 ? 'Submitter 1 (Main Submitter)' : `Submitter ${idx + 1}`}</span>
+                    {idx === 0 && <ProofStrengthBadge />}
+                  </span>
+                  {effectiveProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
+                </h5>
 
-                <div className={`config-grid ${cfg.provider === 'openrouter' ? 'config-grid--2col' : 'config-grid--3col'}`}>
                   <ModelSelector
                     provider={cfg.provider}
                     modelId={cfg.modelId}
                     openrouterProvider={cfg.openrouterProvider}
+                    openrouterReasoningEffort={cfg.openrouterReasoningEffort}
                     lmStudioFallbackId={cfg.lmStudioFallbackId}
                     onProviderChange={(p) => updateSubmitterConfig(cfg.submitterId, 'provider', p)}
                     onModelChange={(m) => handleSubmitterModelChange(cfg.submitterId, m)}
                     onOpenrouterProviderChange={(p) => handleSubmitterOpenRouterProviderChange(cfg.submitterId, p)}
+                    onOpenrouterReasoningEffortChange={(effort) => updateSubmitterConfig(cfg.submitterId, 'openrouterReasoningEffort', effort)}
                     onFallbackChange={(f) => updateSubmitterConfig(cfg.submitterId, 'lmStudioFallbackId', f)}
                   />
 
-                  <div className="form-group form-group--compact">
-                    <label className="label--sm">Context Window</label>
+                  <div className="settings-row">
+                    <label>Context Window</label>
                     <input
                       type="number"
                       value={cfg.contextWindow}
@@ -721,12 +952,11 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                       min="4096"
                       max="50000000"
                       step="1024"
-                      className="input--sm"
                     />
                   </div>
 
-                  <div className="form-group form-group--compact">
-                    <label className="label--sm">Max Output Tokens</label>
+                  <div className="settings-row">
+                    <label>Max Output Tokens</label>
                     <input
                       type="number"
                       value={cfg.maxOutputTokens}
@@ -734,109 +964,147 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                       min="1000"
                       max="50000000"
                       step="1000"
-                      className="input--sm"
                     />
                   </div>
-                </div>
+
+                  {developerModeEnabled && (
+                    <div className="settings-row settings-row--inline-checkbox">
+                      <label className="settings-checkbox-label settings-checkbox-label--supercharge">
+                        <input
+                          type="checkbox"
+                          checked={Boolean(cfg.superchargeEnabled)}
+                          onChange={(e) => updateSubmitterConfig(cfg.submitterId, 'superchargeEnabled', e.target.checked)}
+                        />
+                        <HelpTooltip
+                          label="Learn about Supercharge"
+                          buttonContent="Supercharge"
+                          buttonClassName="help-tooltip-btn--text"
+                          popupClassName="help-tooltip-popup--fixed"
+                          useFixedPosition
+                        >
+                          {SUPERCHARGE_TOOLTIP}
+                        </HelpTooltip>
+                      </label>
+                    </div>
+                  )}
               </div>
+                );
+              })()
             ))}
           </div>
 
           {/* Validator Configuration (Single) */}
-          <div className={`role-config-card${validatorProvider === 'openrouter' ? ' role-config-card--openrouter role-config-card--highlight' : ' settings-panel--validator'}`}>
-            <h3 className={validatorProvider === 'openrouter' ? 'card-title--purple' : ''} style={{ marginBottom: '1rem', color: validatorProvider === 'openrouter' ? undefined : '#ff6b6b' }}>
-              Validator Configuration (Single)
-              {validatorProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
-            </h3>
-            <small className="hint-text" style={{ marginBottom: '1rem' }}>
+          <div className="settings-group">
+            <h4>Validator (Single Instance)</h4>
+            <p className="settings-info">
               Only one validator is allowed to maintain a single Markov chain evolution of the database.
-            </small>
+            </p>
+
+            <div
+              className={`submitter-config-section${validatorProvider === 'openrouter' ? ' role-config-card--openrouter-orange' : ''}`}
+              style={{ borderColor: validatorProvider === 'openrouter' ? undefined : '#ff6b6b' }}
+            >
+              <h5 className={validatorProvider === 'openrouter' ? 'card-title--orange' : ''} style={validatorProvider === 'openrouter' ? undefined : { color: '#ff6b6b' }}>
+                Validator
+                {validatorProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
+              </h5>
 
-            <div className={`config-grid ${validatorProvider === 'openrouter' ? 'config-grid--2col' : 'config-grid--1col'}`}>
               <ModelSelector
                 provider={validatorProvider}
                 modelId={config.validatorModel}
                 openrouterProvider={validatorOpenrouterProvider}
+                openrouterReasoningEffort={validatorOpenrouterReasoningEffort}
                 lmStudioFallbackId={validatorLmStudioFallback}
                 onProviderChange={updateValidatorProvider}
                 onModelChange={handleValidatorModelChange}
                 onOpenrouterProviderChange={handleValidatorOpenRouterProviderChange}
+                onOpenrouterReasoningEffortChange={(effort) => {
+                  const normalized = normalizeOpenRouterReasoningEffort(effort);
+                  setValidatorOpenrouterReasoningEffort(normalized);
+                  setConfig({ ...config, validatorOpenrouterReasoningEffort: normalized });
+                }}
                 onFallbackChange={(f) => {
                   setValidatorLmStudioFallback(f);
                   setConfig({ ...config, validatorLmStudioFallback: f });
                 }}
                 label="Validator Model"
               />
-            </div>
 
-            <div className="form-group" style={{ marginTop: '1rem' }}>
-              <label>Validator Context Window Size (tokens)</label>
-              <input
-                type="number"
-                value={config.validatorContextSize}
-                onChange={(e) => {
-                  const parsed = parseInt(e.target.value);
-                  setConfig({ ...config, validatorContextSize: isNaN(parsed) ? 131072 : parsed });
-                }}
-                min="4096"
-                max="50000000"
-                step="1024"
-              />
-              <small className="hint-text">
-                {validatorProvider === 'lm_studio' && lmStudioEnabled
-                  ? 'Must match the context length you set in LM Studio for this model.'
-                  : 'Set based on the OpenRouter model\'s context window.'
-                }
-              </small>
-            </div>
+              <div className="settings-row">
+                <label>Context Window</label>
+                <input
+                  type="number"
+                  value={config.validatorContextSize}
+                  onChange={(e) => {
+                    const parsed = parseInt(e.target.value);
+                    setConfig({ ...config, validatorContextSize: isNaN(parsed) ? DEFAULT_CONTEXT_WINDOW : parsed });
+                  }}
+                  min="4096"
+                  max="50000000"
+                  step="1024"
+                />
+              </div>
 
-            <div className="form-group">
-              <label>
-                Validator Max Output Tokens{' '}
-                <HelpTooltip
-                  label="Learn about validator max output tokens"
-                  anchorClassName="help-tooltip-anchor--inline"
-                  buttonContent="?"
-                >
-                  Default: 25000
-                </HelpTooltip>
-              </label>
-              <input
-                type="number"
-                value={validatorMaxOutput}
-                onChange={(e) => {
-                  const parsed = parseInt(e.target.value);
-                  const value = isNaN(parsed) ? 25000 : parsed;
-                  setValidatorMaxOutput(value);
-                  setConfig({ ...config, validatorMaxOutput: value });
-                }}
-                min="1000"
-                max="50000000"
-                step="1000"
-              />
+              <div className="settings-row">
+                <label>
+                  Max Output Tokens{' '}
+                  <HelpTooltip
+                    label="Learn about validator max output tokens"
+                    anchorClassName="help-tooltip-anchor--inline"
+                    buttonContent="?"
+                  >
+                    LM Studio default: {DEFAULT_MAX_OUTPUT_TOKENS}. OpenRouter selections auto-fill from provider metadata when available.
+                  </HelpTooltip>
+                </label>
+                <input
+                  type="number"
+                  value={validatorMaxOutput}
+                  onChange={(e) => {
+                    const parsed = parseInt(e.target.value);
+                    const value = isNaN(parsed) ? DEFAULT_MAX_OUTPUT_TOKENS : parsed;
+                    setValidatorMaxOutput(value);
+                    setConfig({ ...config, validatorMaxOutput: value });
+                  }}
+                  min="1000"
+                  max="50000000"
+                  step="1000"
+                />
+              </div>
+
+              {developerModeEnabled && (
+                <div className="settings-row settings-row--inline-checkbox">
+                  <label className="settings-checkbox-label settings-checkbox-label--supercharge">
+                    <input
+                      type="checkbox"
+                      checked={validatorSuperchargeEnabled}
+                      onChange={(e) => {
+                        setValidatorSuperchargeEnabled(e.target.checked);
+                        setConfig({ ...config, validatorSuperchargeEnabled: e.target.checked });
+                      }}
+                    />
+                    <HelpTooltip
+                      label="Learn about Supercharge"
+                      buttonContent="Supercharge"
+                      buttonClassName="help-tooltip-btn--text"
+                      popupClassName="help-tooltip-popup--fixed"
+                      useFixedPosition
+                    >
+                      {SUPERCHARGE_TOOLTIP}
+                    </HelpTooltip>
+                  </label>
+                </div>
+              )}
             </div>
           </div>
 
-          {lmStudioEnabled && (
-            <button onClick={fetchModels} className="secondary mr-05">
-              Refresh LM Studio Models
-            </button>
-          )}
           {hasOpenRouterKey && (
-            <>
-              <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary mr-05" disabled={loadingOpenRouter}>
-                {loadingOpenRouter ? 'Loading...' : 'Refresh OpenRouter Models'}
-              </button>
-              <label className="settings-checkbox-label" style={{ marginLeft: '1rem' }}>
-                <input
-                  type="checkbox"
-                  checked={freeOnly}
-                  onChange={(e) => setFreeOnly(e.target.checked)}
-                />
-                Show only free models
-              </label>
+            <div className="settings-group">
+              <h4>OpenRouter Fallback</h4>
+              <p className="settings-info">
+                Fallback behavior for OpenRouter free-model rate limits.
+              </p>
               <div className="checkbox-group-col">
-                <label className="settings-checkbox-label">
+                <label className="settings-checkbox-label settings-checkbox-label--stacked">
                   <input
                     type="checkbox"
                     checked={freeModelLooping}
@@ -845,15 +1113,22 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                       openRouterAPI.setFreeModelSettings(e.target.checked, freeModelAutoSelector).catch(() => {});
                     }}
                   />
-                  Enable Free Model Looping
-                  <HelpTooltip
-                    label="Learn about free model looping"
-                    anchorClassName="help-tooltip-anchor--inline"
-                  >
-                    When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.
-                  </HelpTooltip>
+                  <span className="settings-option-copy">
+                    <span className="settings-option-title">
+                      Enable Free Model Looping
+                      <HelpTooltip
+                        label="Learn about free model looping"
+                        anchorClassName="help-tooltip-anchor--inline"
+                      >
+                        When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.
+                      </HelpTooltip>
+                    </span>
+                    <span className="settings-option-description">
+                      Automatically rotate to the next selected free model when one hits a rate limit.
+                    </span>
+                  </span>
                 </label>
-                <label className="settings-checkbox-label">
+                <label className="settings-checkbox-label settings-checkbox-label--stacked">
                   <input
                     type="checkbox"
                     checked={freeModelAutoSelector}
@@ -862,15 +1137,24 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
                       openRouterAPI.setFreeModelSettings(freeModelLooping, e.target.checked).catch(() => {});
                     }}
                   />
-                  Use OpenRouter Free Models Auto-Selector as Backup
-                  <HelpTooltip
-                    label="Learn about the free models auto-selector backup"
-                    anchorClassName="help-tooltip-anchor--inline"
-                  >
-                    When all selected free models are rate-limited, use OpenRouter&apos;s Free Models Router (`openrouter/free`) as a last resort backup. Works independently of Free Model Looping.
-                  </HelpTooltip>
+                  <span className="settings-option-copy">
+                    <span className="settings-option-title">
+                      Use OpenRouter Free Models Auto-Selector as Backup
+                      <HelpTooltip
+                        label="Learn about the free models auto-selector backup"
+                        anchorClassName="help-tooltip-anchor--inline"
+                      >
+                        When all selected free models are rate-limited, use OpenRouter&apos;s Free Models Router (`openrouter/free`) as a last resort backup. Works independently of Free Model Looping.
+                      </HelpTooltip>
+                    </span>
+                    <span className="settings-option-description">
+                      Falls back to OpenRouter&apos;s free router when every selected free model is temporarily exhausted.
+                    </span>
+                  </span>
                 </label>
               </div>
+            </div>
+          )}
             </>
           )}
         </>
@@ -889,7 +1173,8 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
               host: s.provider === 'openrouter' ? (s.openrouterProvider || 'Auto') : 'N/A',
               fallback: s.provider === 'openrouter' ? (s.lmStudioFallbackId?.split('/').pop() || 'None') : 'N/A',
               context: s.contextWindow,
-              maxOutput: s.maxOutputTokens
+              maxOutput: s.maxOutputTokens,
+              supercharge: Boolean(s.superchargeEnabled)
             })),
             validator: {
               provider: validatorProvider,
@@ -897,12 +1182,14 @@ export default function AggregatorSettings({ config, setConfig, capabilities })
               host: validatorProvider === 'openrouter' ? (validatorOpenrouterProvider || 'Auto') : 'N/A',
               fallback: validatorProvider === 'openrouter' ? (validatorLmStudioFallback?.split('/').pop() || 'None') : 'N/A',
               context: config.validatorContextSize,
-              maxOutput: validatorMaxOutput
+              maxOutput: validatorMaxOutput,
+              supercharge: validatorSuperchargeEnabled
             },
             uploadedFiles: config.uploadedFiles?.length || 0
           }, null, 2)}
         </pre>
       </div>
+      </div>
     </div>
   );
 }
diff --git a/frontend/src/components/autonomous/AutonomousResearch.css b/frontend/src/components/autonomous/AutonomousResearch.css
index c9ad866..652f6da 100644
--- a/frontend/src/components/autonomous/AutonomousResearch.css
+++ b/frontend/src/components/autonomous/AutonomousResearch.css
@@ -185,6 +185,29 @@
   gap: 0.5rem;
 }
 
+.leanoj-header {
+  align-items: flex-start;
+  gap: 1.5rem;
+}
+
+.leanoj-header-copy {
+  flex: 1 1 420px;
+  min-width: 0;
+  max-width: 560px;
+}
+
+.leanoj-proof-solver-intro {
+  max-width: 480px;
+  margin: 0.5rem 0 0 0;
+  line-height: 1.45;
+}
+
+.leanoj-header .autonomous-controls {
+  flex-shrink: 0;
+  flex-wrap: wrap;
+  justify-content: flex-end;
+}
+
 /* Buttons */
 .btn-start {
   background: linear-gradient(135deg, #2ecc71, #27ae60);
@@ -507,6 +530,18 @@
   font-size: 1rem;
 }
 
+.activity-section-header {
+  display: flex;
+  justify-content: space-between;
+  align-items: center;
+  gap: 1rem;
+  margin-bottom: 0.75rem;
+}
+
+.activity-section-header h3 {
+  margin: 0;
+}
+
 .activity-feed {
   flex: 1;
   background: var(--bg-secondary, #1e1e1e);
@@ -582,6 +617,104 @@
   border: 1px solid rgba(30, 255, 28, 0.3);
 }
 
+.code-block {
+  background: var(--bg-secondary, #1e1e1e);
+  border: 1px solid var(--border-color, #333);
+  border-radius: 8px;
+  color: var(--text-primary, #e0e0e0);
+  font-family: 'Fira Code', 'Courier New', monospace;
+  font-size: 0.85rem;
+  line-height: 1.5;
+  max-height: 420px;
+  overflow: auto;
+  padding: 1rem;
+  white-space: pre-wrap;
+}
+
+.leanoj-brainstorms__metrics {
+  grid-template-columns: repeat(auto-fit, minmax(150px, 1fr));
+  margin-bottom: 0.5rem;
+}
+
+.leanoj-brainstorms .brainstorm-list-header {
+  align-items: flex-start;
+}
+
+.leanoj-brainstorms .settings-hint {
+  margin: 0.25rem 0 0 0;
+  max-width: 920px;
+}
+
+.leanoj-brainstorms .brainstorm-card {
+  cursor: default;
+}
+
+.leanoj-brainstorms .brainstorm-card-clickable {
+  cursor: pointer;
+}
+
+.leanoj-brainstorms .brainstorm-submissions-container {
+  cursor: default;
+}
+
+.leanoj-brainstorms__ideas {
+  display: flex;
+  flex-direction: column;
+  gap: 0.5rem;
+}
+
+.leanoj-brainstorms__idea-header {
+  cursor: default;
+}
+
+.leanoj-brainstorms__idea-header:hover {
+  background: transparent;
+}
+
+.leanoj-brainstorms__idea-header .brainstorm-status {
+  flex-shrink: 0;
+  white-space: nowrap;
+}
+
+.leanoj-brainstorms__idea-card .submission-content pre {
+  color: var(--text-primary, #e0e0e0);
+}
+
+.leanoj-brainstorms__reasoning {
+  border-top: 1px solid var(--border-color, #333);
+  display: flex;
+  flex-direction: column;
+  gap: 0.35rem;
+  margin-top: 0.85rem;
+  padding-top: 0.85rem;
+}
+
+.leanoj-brainstorms__reasoning strong {
+  color: var(--text-secondary, #888);
+  font-size: 0.8rem;
+  text-transform: uppercase;
+  letter-spacing: 0.5px;
+}
+
+.leanoj-brainstorms__reasoning span {
+  color: var(--text-primary, #e0e0e0);
+  line-height: 1.45;
+}
+
+.leanoj-log-card {
+  margin-top: 0.75rem;
+  padding: 1rem;
+}
+
+.leanoj-log-card h4 {
+  margin: 0 0 0.5rem 0;
+  color: var(--text-primary, #e0e0e0);
+}
+
+.leanoj-log-card p {
+  margin: 0.5rem 0;
+}
+
 /* Brainstorm List */
 .brainstorm-list {
   display: flex;
@@ -727,6 +860,12 @@
   margin-bottom: 0.5rem;
 }
 
+.paper-library-pruned-actions {
+  display: flex;
+  justify-content: center;
+  margin: 0.5rem 0 1rem;
+}
+
 .paper-grid {
   display: grid;
   grid-template-columns: repeat(auto-fill, minmax(300px, 1fr));
@@ -883,6 +1022,35 @@
   min-height: 100vh;
 }
 
+.settings-with-model-sidebar {
+  display: flex;
+  gap: 0;
+  width: 100%;
+  min-height: 100vh;
+}
+
+.settings-with-model-sidebar__main {
+  flex: 1;
+  min-width: 0;
+  padding: 1.5rem;
+  overflow-y: auto;
+  width: 100%;
+  max-width: calc(100vw - 322px - 3rem);
+  box-sizing: border-box;
+  position: relative;
+  z-index: 10;
+}
+
+.app.workflow-panel-expanded .settings-with-model-sidebar__main {
+  max-width: calc(100vw - 322px - 3rem - 320px);
+  padding-right: 1.5rem;
+}
+
+.app.workflow-panel-collapsed .settings-with-model-sidebar__main {
+  max-width: calc(100vw - 322px - 3rem - 50px);
+  padding-right: 1.5rem;
+}
+
 .settings-left-sidebar {
   width: 322px;
   background: linear-gradient(180deg, rgba(15, 19, 16, 0.98) 0%, rgba(20, 29, 22, 0.96) 100%);
@@ -949,6 +1117,7 @@
 }
 
 .known-models-sidebar .model-item {
+  position: relative;
   background: linear-gradient(180deg, rgba(32, 36, 33, 0.96) 0%, rgba(24, 28, 25, 0.98) 100%);
   border: 1px solid var(--leaderboard-accent-border);
   border-radius: 6px;
@@ -959,6 +1128,7 @@
 }
 
 .known-models-sidebar .model-item:hover {
+  z-index: 5;
   background: linear-gradient(180deg, var(--leaderboard-accent-hover) 0%, rgba(76, 175, 80, 0.08) 100%);
   border-color: rgba(125, 223, 147, 0.66);
   box-shadow:
@@ -967,6 +1137,11 @@
   transform: translateX(4px);
 }
 
+.known-models-sidebar .model-item--os:hover,
+.known-models-sidebar .model-item--os:focus-within {
+  z-index: 50;
+}
+
 .model-item-name {
   color: var(--text-primary, #e0e0e0);
   font-weight: 600;
@@ -1068,7 +1243,8 @@
   white-space: normal;
 }
 
-.os-tag-tooltip-anchor:hover .os-tag-tooltip {
+.os-tag-tooltip-anchor:hover .os-tag-tooltip,
+.os-tag-tooltip-anchor:focus .os-tag-tooltip {
   display: block;
 }
 
@@ -1852,13 +2028,17 @@
 }
 
 .btn-force-paper {
-  padding: 10px 20px;
+  position: relative;
+  align-self: flex-start;
+  padding: 0.45rem 0.85rem;
   background: linear-gradient(135deg, #e74c3c 0%, #c0392b 100%);
   color: white;
   border: none;
   border-radius: 6px;
   cursor: pointer;
-  font-weight: 500;
+  font-weight: 600;
+  font-size: 0.85rem;
+  line-height: 1.2;
   transition: all 0.3s ease;
 }
 
@@ -2657,22 +2837,58 @@
 
 /* Force Paper Text Hierarchy */
 .force-paper-text {
-  display: flex;
-  flex-direction: column;
-  gap: 0.25rem;
+  display: inline-flex;
+  align-items: center;
 }
 
 .force-paper-action {
   display: block;
   font-weight: 700;
-  font-size: 1rem;
 }
 
 .force-paper-hint {
-  display: block;
+  position: absolute;
+  left: 0;
+  bottom: calc(100% + 10px);
+  width: min(430px, calc(100vw - 3rem));
+  padding: 0.75rem 0.85rem;
+  background: linear-gradient(180deg, rgba(28, 18, 18, 0.98), rgba(15, 10, 10, 0.99));
+  border: 1px solid rgba(231, 76, 60, 0.42);
+  border-radius: 6px;
+  box-shadow: 0 12px 28px rgba(0, 0, 0, 0.36);
+  color: #fff;
   font-weight: 400;
-  font-size: 0.75rem;
-  opacity: 0.85;
+  font-size: 0.78rem;
+  line-height: 1.45;
+  text-align: left;
+  white-space: normal;
+  opacity: 0;
+  visibility: hidden;
+  pointer-events: none;
+  z-index: 20;
+  transition:
+    opacity 0.16s ease,
+    visibility 0s linear 0.16s;
+}
+
+.force-paper-hint::after {
+  content: '';
+  position: absolute;
+  left: 18px;
+  bottom: -7px;
+  width: 12px;
+  height: 12px;
+  background: rgba(15, 10, 10, 0.99);
+  border-right: 1px solid rgba(231, 76, 60, 0.42);
+  border-bottom: 1px solid rgba(231, 76, 60, 0.42);
+  transform: rotate(45deg);
+}
+
+.btn-force-paper:hover:not(:disabled) .force-paper-hint,
+.btn-force-paper:focus-visible:not(:disabled) .force-paper-hint {
+  opacity: 1;
+  visibility: visible;
+  transition-delay: 0.75s, 0.75s;
 }
 
 /* ============================================================ */
@@ -2680,7 +2896,8 @@
 /* ============================================================ */
 
 @media (max-width: 768px) {
-  .autonomous-settings-layout {
+  .autonomous-settings-layout,
+  .settings-with-model-sidebar {
     flex-direction: column;
   }
   
@@ -2691,14 +2908,16 @@
     max-height: 300px;
   }
   
-  .autonomous-settings {
+  .autonomous-settings,
+  .settings-with-model-sidebar__main {
     padding: 1rem;
+    max-width: 100%;
   }
   
   .stats-section {
     grid-template-columns: repeat(2, 1fr);
   }
-  
+
   .paper-grid {
     grid-template-columns: 1fr;
   }
diff --git a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
index 69ae366..13d19ae 100644
--- a/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchInterface.jsx
@@ -7,6 +7,7 @@ import './AutonomousResearch.css';
 import LivePaperProgress from './LivePaperProgress';
 import LiveTier3Progress from './LiveTier3Progress';
 import TextFileUploader from '../TextFileUploader';
+import { getActivityClass as getSharedActivityClass, getActivityIcon as getSharedActivityIcon } from '../../utils/activityStyles';
 
 const AutonomousResearchInterface = ({
   isRunning,
@@ -254,9 +255,7 @@ const AutonomousResearchInterface = ({
         return '◎';
       case 'critique_progress':
         return '⊟';
-      case 'body_rewrite_started':
-        return '▬';
-      case 'partial_revision_complete':
+      case 'self_review_appended':
         return '◈';
       case 'critique_phase_ended':
         return '✓';
@@ -329,6 +328,10 @@ const AutonomousResearchInterface = ({
         return 'Z';
       case 'proof_attempt_started':
         return '>';
+      case 'proof_lean_accepted':
+        return '>';
+      case 'proof_integrity_rejected':
+        return '⚠';
       case 'proof_attempt_failed':
       case 'proof_attempts_exhausted':
         return '⚠';
@@ -355,7 +358,7 @@ const AutonomousResearchInterface = ({
         event === 'compiler_acceptance' ||
         event === 'outline_locked' ||
         event === 'paper_completed' || 
-        event === 'partial_revision_complete' ||
+        event === 'self_review_appended' ||
         event === 'topic_exploration_complete' ||
         event === 'paper_title_exploration_complete' ||
         event === 'tier3_chapter_complete' ||
@@ -363,6 +366,7 @@ const AutonomousResearchInterface = ({
         event === 'tier3_long_form_complete' ||
         event === 'reference_selection_complete' ||
         event === 'proof_verified' ||
+        event === 'proof_lean_accepted' ||
         event === 'novel_proof_discovered' ||
         event === 'known_proof_verified' ||
         event === 'proof_check_complete' ||
@@ -376,7 +380,8 @@ const AutonomousResearchInterface = ({
         event === 'compiler_rejection' ||
         event === 'tier3_rejection' ||
         event === 'proof_attempt_failed' ||
-        event === 'proof_attempts_exhausted'
+        event === 'proof_attempts_exhausted' ||
+        event === 'proof_integrity_rejected'
     ) {
       return 'activity-reject';
     }
@@ -413,7 +418,7 @@ const AutonomousResearchInterface = ({
   };
 
   return (
-    <div className="autonomous-interface">
+    <div className={`autonomous-interface workflow-main-interface ${isRunning || isStopping ? 'workflow-main-interface--running' : ''}`}>
       {/* Header */}
       <div className="autonomous-header">
         <h2>Autonomous Research</h2>
@@ -550,8 +555,10 @@ const AutonomousResearchInterface = ({
                     ? (isForcing ? 'Forcing...' : 'Confirm Force Paper Writing') 
                     : (
                       <span className="force-paper-text">
-                        <span className="force-paper-action">Skip AI Autonomy and Force Paper Writing</span>
-                        <span className="force-paper-hint">(We recommend at minimum 5 ACCEPTED submissions - it is normal for a very low % acceptance rate as the validator is only seeking novel solutions - higher parameter models may help submission acceptance rate, however optimizing for both speed (rapid submissions) and knowledge can also work well. The validator provides feedback on rejections to avoid rejection-loops. Harder problems may require hundreds or more of rejections before a single submission acceptance - the first submission acceptance often takes the longest. View brainstorms in the brainstorm tab.)</span>
+                        <span className="force-paper-action">Skip AI Autonomy</span>
+                        <span className="force-paper-hint" role="tooltip">
+                          We recommend a minimum of 5 ACCEPTED submissions. A very low acceptance rate is normal because the validator is seeking novel solutions. Higher parameter models may improve acceptance, though optimizing for both speed and knowledge can also work well. Validator feedback on rejections helps avoid rejection loops. Harder problems may require hundreds of rejections or more before a single acceptance, and the first acceptance often takes the longest. View brainstorms in the brainstorm tab.
+                        </span>
                       </span>
                     )}
                 </button>
@@ -731,15 +738,15 @@ const AutonomousResearchInterface = ({
         <div className="activity-feed" ref={activityFeedRef}>
           {activity.length === 0 ? (
             <div className="activity-empty">
-              No activity yet. Wait about 20 to 30 minutes. If you have not yet, press the start button under your prompt entry to begin research.
+              No activity yet. Wait about 20 to 30 minutes. If you have not done so yet, press the start button above your prompt entry to begin research.
             </div>
           ) : (
             activity.map((item, index) => (
               <div 
                 key={index} 
-                className={`activity-item ${getActivityClass(item.event)}`}
+                className={`activity-item ${getSharedActivityClass(item.event)}`}
               >
-                <span className="activity-icon">{getActivityIcon(item.event)}</span>
+                <span className="activity-icon">{getSharedActivityIcon(item.event)}</span>
                 <span className="activity-time">
                   {new Date(item.timestamp).toLocaleTimeString()}
                 </span>
diff --git a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
index b7a1aff..bdcfd57 100644
--- a/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchLogs.jsx
@@ -3,35 +3,15 @@
  * Shows submission accept/reject statistics broken down by each submitter role.
  * Includes API call logging with full request/response details.
  */
-import React, { useRef, useEffect, useMemo, useState, useCallback } from 'react';
+import React, { useRef, useEffect, useMemo, useState } from 'react';
 import { autonomousAPI } from '../../services/api';
+import ApiCallLogs from '../ApiCallLogs';
 import './AutonomousResearch.css';
 
-const EMPTY_API_STATS = Object.freeze({
-  total_calls: 0,
-  successful_calls: 0,
-  failed_calls: 0,
-  success_rate: 0,
-  boosted_calls: 0,
-  by_phase: {},
-  by_model: {},
-  by_provider: {},
-  by_source: {},
-  by_boost_mode: {},
-});
-
 const AutonomousResearchLogs = ({ stats, events }) => {
   const eventsContainerRef = useRef(null);
   const prevEventsLengthRef = useRef(0);
   const [expandedSubmitters, setExpandedSubmitters] = useState({});
-  
-  // API Logs state
-  const [apiLogs, setApiLogs] = useState([]);
-  const [apiStats, setApiStats] = useState(null);
-  const [apiLogsLoading, setApiLogsLoading] = useState(true);
-  const [expandedApiLogIdx, setExpandedApiLogIdx] = useState(null);
-  const [apiAutoRefresh, setApiAutoRefresh] = useState(true);
-  const abortControllerRef = useRef(null);
 
   // Auto-scroll event log only when new events are added (not on mount/tab switch)
   useEffect(() => {
@@ -42,153 +22,6 @@ const AutonomousResearchLogs = ({ stats, events }) => {
     prevEventsLengthRef.current = currentLength;
   }, [events]);
 
-  // Fetch API logs
-  const fetchApiLogs = useCallback(async () => {
-    // Abort previous request if still pending
-    if (abortControllerRef.current) {
-      abortControllerRef.current.abort();
-    }
-    
-    // Create new abort controller for this request
-    const controller = new AbortController();
-    abortControllerRef.current = controller;
-    
-    try {
-      const response = await autonomousAPI.getApiLogs(100, { signal: controller.signal });
-      if (abortControllerRef.current !== controller) {
-        return;
-      }
-
-      if (response.success) {
-        setApiLogs(response.logs || []);
-        setApiStats(response.stats || EMPTY_API_STATS);
-      }
-    } catch (error) {
-      if (abortControllerRef.current !== controller) {
-        return;
-      }
-
-      // Don't log abort errors as they're expected on cleanup
-      if (error.name !== 'AbortError') {
-        console.error('Failed to fetch autonomous API logs:', error);
-      }
-    } finally {
-      if (abortControllerRef.current === controller) {
-        setApiLogsLoading(false);
-      }
-    }
-  }, []);
-
-  // Initial fetch and auto-refresh for API logs
-  useEffect(() => {
-    fetchApiLogs();
-
-    let interval;
-    if (apiAutoRefresh) {
-      // Set interval to refresh every 5 seconds (skip first call since we already called above)
-      interval = setInterval(fetchApiLogs, 5000);
-    }
-
-    return () => {
-      if (interval) clearInterval(interval);
-      // Cancel any pending requests on unmount
-      if (abortControllerRef.current) {
-        abortControllerRef.current.abort();
-        abortControllerRef.current = null;
-      }
-    };
-  }, [fetchApiLogs, apiAutoRefresh]);
-
-  // Handle clear API logs
-  const handleClearApiLogs = async () => {
-    if (!window.confirm('Are you sure you want to clear all API logs?')) {
-      return;
-    }
-
-    try {
-      if (abortControllerRef.current) {
-        abortControllerRef.current.abort();
-        abortControllerRef.current = null;
-      }
-
-      await autonomousAPI.clearApiLogs();
-      setApiLogs([]);
-      setApiStats(EMPTY_API_STATS);
-      setExpandedApiLogIdx(null);
-      setApiLogsLoading(false);
-    } catch (error) {
-      console.error('Failed to clear API logs:', error);
-    }
-  };
-
-  // Toggle API log expansion
-  const toggleApiLogExpand = (index) => {
-    setExpandedApiLogIdx(expandedApiLogIdx === index ? null : index);
-  };
-
-  // Copy to clipboard
-  const copyToClipboard = async (text) => {
-    try {
-      await navigator.clipboard.writeText(text);
-    } catch (error) {
-      console.error('Failed to copy to clipboard:', error);
-    }
-  };
-
-  // Format duration
-  const formatDuration = (ms) => {
-    if (ms === null || ms === undefined) return '-';
-    if (ms < 1000) return `${Math.round(ms)}ms`;
-    return `${(ms / 1000).toFixed(1)}s`;
-  };
-
-  // Format timestamp
-  const formatTimestamp = (timestamp) => {
-    try {
-      const date = new Date(timestamp);
-      return date.toLocaleString();
-    } catch {
-      return timestamp;
-    }
-  };
-
-  // Get phase label
-  const getPhaseLabel = (phase) => {
-    switch (phase) {
-      case 'topic_selection': return 'Topic';
-      case 'brainstorm': return 'Brainstorm';
-      case 'paper_compilation': return 'Paper';
-      case 'tier3': return 'Tier 3';
-      case 'boost': return 'Boost';
-      default: return phase || 'Unknown';
-    }
-  };
-
-  const getSourceLabel = (source) => {
-    switch (source) {
-      case 'api+boost': return 'Boosted';
-      case 'boost': return 'Boost Only';
-      default: return 'Standard';
-    }
-  };
-
-  const getBoostModeLabel = (mode) => {
-    switch (mode) {
-      case 'next_count': return 'Next X';
-      case 'category': return 'Category';
-      case 'task_id': return 'Task ID';
-      default: return mode || 'Unknown';
-    }
-  };
-
-  const getProviderLabel = (provider) => {
-    switch (provider) {
-      case 'openrouter': return 'OR';
-      case 'lm_studio': return 'LMS';
-      default: return provider || 'UNK';
-    }
-  };
-
   // Calculate per-submitter statistics from individual events
   // These come from the aggregator's direct 'submission_accepted'/'submission_rejected' events
   const submitterStats = useMemo(() => {
@@ -247,6 +80,14 @@ const AutonomousResearchLogs = ({ stats, events }) => {
 
   const formatEventMessage = (event) => {
     const data = event.data || {};
+    const proofName = data.proof_label ? `Proof ${data.proof_label}` : 'Proof';
+    const proofTarget = data.theorem_statement || data.theorem_id || '';
+    const proofLeanResponse = () => {
+      if (data.lean_response) return data.lean_response;
+      if (data.proof_verified === true) return 'Lean 4 response: proof verified.';
+      const error = data.error_summary || data.error_output || data.reason || '';
+      return error ? `Lean 4 response: ${error} - proof not verified.` : 'Lean 4 response: proof not verified.';
+    };
     
     switch (event.event) {
       case 'auto_research_started':
@@ -319,17 +160,21 @@ const AutonomousResearchLogs = ({ stats, events }) => {
       case 'proof_check_candidates_found':
         return `Proof candidates found: ${data.count || 0}`;
       case 'proof_attempt_started':
-        return `Proof attempt ${data.attempt || 1}: ${data.theorem_statement || data.theorem_id}`;
+        return `${proofName}, Attempt ${data.attempt || 1} started: ${proofTarget}`;
       case 'proof_attempt_failed':
-        return `Proof attempt ${data.attempt || '?'} failed: ${data.error_summary || data.theorem_statement || data.theorem_id}`;
+        return `${proofName}, Attempt ${data.attempt || '?'} final: ${proofLeanResponse()}`;
+      case 'proof_lean_accepted':
+        return `${proofName}, Attempt ${data.attempt || '?'} final: ${proofLeanResponse()}`;
+      case 'proof_integrity_rejected':
+        return `${proofName} error: integrity rejected - ${data.reason || proofTarget}`;
       case 'proof_verified':
-        return `Lean 4 verified: ${data.theorem_statement || data.theorem_id}`;
+        return `${proofName} verified and accepted: ${proofTarget}`;
       case 'proof_attempts_exhausted':
-        return `Proof attempts exhausted: ${data.theorem_statement || data.theorem_id}`;
+        return `${proofName} terminated: proof attempts exhausted for ${proofTarget}`;
       case 'novel_proof_discovered':
-        return `Novel proof discovered: ${data.theorem_statement}`;
+        return `${proofName} novel proof discovered: ${data.theorem_statement}`;
       case 'known_proof_verified':
-        return `Known proof verified for ${data.source_type} ${data.source_id}`;
+        return `${proofName} known proof verified for ${data.source_type} ${data.source_id}`;
       case 'proof_check_complete':
         return `Proof check complete: ${data.verified_count || 0} verified, ${data.novel_count || 0} novel`;
       default:
@@ -339,10 +184,16 @@ const AutonomousResearchLogs = ({ stats, events }) => {
 
   const getEventClass = (event) => {
     const eventName = event.event || '';
-    if (eventName === 'proof_attempt_failed' || eventName === 'proof_attempts_exhausted') {
+    if (
+      eventName === 'proof_attempt_failed' ||
+      eventName === 'proof_attempts_exhausted' ||
+      eventName === 'proof_integrity_rejected' ||
+      eventName === 'smt_check_error'
+    ) {
       return 'log-reject';
     }
     if (
+      eventName === 'proof_lean_accepted' ||
       eventName === 'proof_verified' ||
       eventName === 'novel_proof_discovered' ||
       eventName === 'known_proof_verified' ||
@@ -400,8 +251,8 @@ const AutonomousResearchLogs = ({ stats, events }) => {
         </div>
         
         <div className="metric-card">
-          <span className="metric-value">{stats?.total_papers_archived || 0}</span>
-          <span className="metric-label">Archived</span>
+          <span className="metric-value">{stats?.total_papers_pruned || stats?.total_papers_archived || 0}</span>
+          <span className="metric-label">Pruned</span>
         </div>
         
         <div className="metric-card">
@@ -525,201 +376,11 @@ const AutonomousResearchLogs = ({ stats, events }) => {
         )}
       </div>
 
-      {/* API Call Logs Section */}
-      <div className="api-logs-section" style={{ marginTop: '30px' }}>
-        <div className="api-logs-header">
-          <h3>API Call Logs</h3>
-          <div className="api-logs-actions">
-            <label className="auto-refresh-toggle">
-              <input
-                type="checkbox"
-                checked={apiAutoRefresh}
-                onChange={(e) => setApiAutoRefresh(e.target.checked)}
-              />
-              Auto-refresh
-            </label>
-            <button onClick={fetchApiLogs} className="refresh-btn" title="Refresh now">
-              Refresh
-            </button>
-            <button 
-              onClick={handleClearApiLogs} 
-              className="clear-btn"
-              disabled={apiLogs.length === 0}
-            >
-              Clear Logs
-            </button>
-          </div>
-        </div>
-
-        {/* API Stats Summary */}
-        {apiStats && (
-          <div className="api-stats">
-            <div className="stat-card">
-              <span className="stat-value">{apiStats.total_calls}</span>
-              <span className="stat-label">Total API Calls</span>
-            </div>
-            <div className="stat-card success">
-              <span className="stat-value">{apiStats.successful_calls}</span>
-              <span className="stat-label">Successful</span>
-            </div>
-            <div className="stat-card error">
-              <span className="stat-value">{apiStats.failed_calls}</span>
-              <span className="stat-label">Failed</span>
-            </div>
-            <div className="stat-card">
-              <span className="stat-value">
-                {(apiStats.success_rate * 100).toFixed(1)}%
-              </span>
-              <span className="stat-label">Success Rate</span>
-            </div>
-            <div className="stat-card">
-              <span className="stat-value">{apiStats.boosted_calls || 0}</span>
-              <span className="stat-label">Boosted Calls</span>
-            </div>
-          </div>
-        )}
-
-        {/* Stats by Phase */}
-        {apiStats && apiStats.by_phase && Object.keys(apiStats.by_phase).length > 0 && (
-          <div className="phase-stats">
-            <span className="phase-stats-label">By Phase:</span>
-            {Object.entries(apiStats.by_phase).map(([phase, count]) => (
-              <span key={phase} className="phase-stat-badge">
-                {getPhaseLabel(phase)}: {count}
-              </span>
-            ))}
-          </div>
-        )}
-
-        {apiStats && apiStats.by_source && Object.keys(apiStats.by_source).length > 0 && (
-          <div className="phase-stats">
-            <span className="phase-stats-label">By Source:</span>
-            {Object.entries(apiStats.by_source).map(([source, count]) => (
-              <span key={source} className="phase-stat-badge">
-                {getSourceLabel(source)}: {count}
-              </span>
-            ))}
-          </div>
-        )}
-
-        {apiStats && apiStats.by_boost_mode && Object.keys(apiStats.by_boost_mode).length > 0 && (
-          <div className="phase-stats">
-            <span className="phase-stats-label">Boost Modes:</span>
-            {Object.entries(apiStats.by_boost_mode).map(([mode, count]) => (
-              <span key={mode} className="phase-stat-badge">
-                {getBoostModeLabel(mode)}: {count}
-              </span>
-            ))}
-          </div>
-        )}
-
-        {/* API Logs List */}
-        <div className="api-logs-list">
-          {apiLogsLoading ? (
-            <div className="logs-loading">Loading API logs...</div>
-          ) : apiLogs.length === 0 ? (
-            <div className="logs-empty">
-              <p>No API calls logged yet.</p>
-              <p className="logs-empty-hint">
-                Run a workflow and make API calls to see the combined logs here.
-              </p>
-            </div>
-          ) : (
-            apiLogs.map((log, index) => (
-              <div 
-                key={index} 
-                className={`api-log-entry ${log.success ? 'success' : 'error'} ${expandedApiLogIdx === index ? 'expanded' : ''}`}
-              >
-                <div 
-                  className="log-summary"
-                  onClick={() => toggleApiLogExpand(index)}
-                >
-                  <div className="log-status">
-                    {log.success ? '✓' : '✗'}
-                  </div>
-                  <div className="log-info">
-                    <div className="log-task">
-                      <span className="log-task-id">{log.task_id}</span>
-                      <span className="log-phase-badge">{getPhaseLabel(log.phase)}</span>
-                      <span className={`log-source-badge ${log.boosted ? 'boosted' : 'standard'}`}>
-                        {getSourceLabel(log.source)}
-                      </span>
-                      {log.boost_mode && (
-                        <span className="log-boost-mode-badge">{getBoostModeLabel(log.boost_mode)}</span>
-                      )}
-                    </div>
-                    <div className="log-meta">
-                      <span className="log-model">{log.model}</span>
-                      <span className="log-provider-badge">{getProviderLabel(log.provider)}</span>
-                      <span className="log-duration">{formatDuration(log.duration_ms)}</span>
-                      {log.tokens_used && (
-                        <span className="log-tokens">{log.tokens_used} tokens</span>
-                      )}
-                    </div>
-                  </div>
-                  <div className="log-timestamp">{formatTimestamp(log.timestamp)}</div>
-                  <div className="log-expand-icon">{expandedApiLogIdx === index ? '▼' : '▶'}</div>
-                </div>
-
-                {expandedApiLogIdx === index && (
-                  <div className="log-details">
-                    <div className="log-detail-section">
-                      <h4>Role</h4>
-                      <pre>{log.role_id}</pre>
-                    </div>
-
-                    <div className="log-detail-section">
-                      <h4>Source</h4>
-                      <pre>{getSourceLabel(log.source)}{log.boost_mode ? ` (${getBoostModeLabel(log.boost_mode)})` : ''}</pre>
-                    </div>
-
-                    {log.error && (
-                      <div className="log-detail-section error">
-                        <h4>Error</h4>
-                        <pre>{log.error}</pre>
-                      </div>
-                    )}
-
-                    <div className="log-detail-section">
-                      <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center' }}>
-                        <h4>Sent Prompt</h4>
-                        <button 
-                          onClick={(e) => {
-                            e.stopPropagation();
-                            copyToClipboard(log.prompt_full || log.prompt_preview || '');
-                          }}
-                          className="copy-btn"
-                          title="Copy full prompt to clipboard"
-                        >
-                          Copy Full
-                        </button>
-                      </div>
-                      <pre className="log-preview">{log.prompt_preview || '(empty)'}</pre>
-                    </div>
-
-                    <div className="log-detail-section">
-                      <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center' }}>
-                        <h4>Received Response</h4>
-                        <button 
-                          onClick={(e) => {
-                            e.stopPropagation();
-                            copyToClipboard(log.response_full || log.response_preview || '');
-                          }}
-                          className="copy-btn"
-                          title="Copy full response to clipboard"
-                        >
-                          Copy Full
-                        </button>
-                      </div>
-                      <pre className="log-response">{log.response_full || log.response_preview || '(empty)'}</pre>
-                    </div>
-                  </div>
-                )}
-              </div>
-            ))
-          )}
-        </div>
-      </div>
+      <ApiCallLogs
+        api={autonomousAPI}
+        workflow="autonomous"
+        style={{ marginTop: '30px' }}
+      />
 
       {/* Event Log */}
       <h4 style={{ marginTop: '20px' }}>Event Log</h4>
diff --git a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
index f75c92f..476722a 100644
--- a/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
+++ b/frontend/src/components/autonomous/AutonomousResearchSettings.jsx
@@ -8,9 +8,15 @@ import React, { useState, useEffect } from 'react';
 import { openRouterAPI, api, autonomousAPI } from '../../services/api';
 import {
   computeOpenRouterAutoSettings,
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+  DEFAULT_OPENROUTER_REASONING_EFFORT,
   findOpenRouterModel,
   getProviderNames,
+  getReasoningSupportInfo,
   hasEndpointMetadata,
+  normalizeOpenRouterReasoningEffort,
+  OPENROUTER_REASONING_EFFORT_OPTIONS,
 } from '../../utils/openRouterSelection';
 import {
   AUTONOMOUS_SETTINGS_STORAGE_KEY,
@@ -19,8 +25,13 @@ import {
   RECOMMENDED_PROFILES,
   applyAutonomousProfileSelection,
   getStoredAutonomousSettings,
+  persistAutonomousSettings,
+  settingsToAutonomousConfig,
 } from '../../utils/autonomousProfiles';
 import HelpTooltip from '../HelpTooltip';
+import HighlightedModelsSidebar from '../HighlightedModelsSidebar';
+import ProofStrengthBadge from '../ProofStrengthBadge';
+import RawSettingsEditor from '../RawSettingsEditor';
 import './AutonomousResearch.css';
 import '../settings-common.css';
 
@@ -29,29 +40,28 @@ const DEFAULT_SUBMITTER_CONFIG = {
   provider: 'lm_studio',
   modelId: '',
   openrouterProvider: null,
+  openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
   lmStudioFallbackId: null,
-  contextWindow: 131072,
-  maxOutputTokens: 25000
+  contextWindow: DEFAULT_CONTEXT_WINDOW,
+  maxOutputTokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  superchargeEnabled: false
 };
 
-const OsTag = () => (
-  <span className="os-tag-tooltip-anchor">
-    <span className="os-tag">OS</span>
-    <span className="os-tag-tooltip">
-      Open source — weights available on Hugging Face for local use with LM Studio.
-    </span>
-  </span>
-);
+const RAW_VIEW_EXIT_WARNING = 'Switching back to the GUI view will restore your last GUI settings/profile and discard raw-only changes. Continue?';
+const formatRawSettings = (value) => JSON.stringify(value, null, 2); // Serialize settings as JSON with 2-space indentation.
+const SUPERCHARGE_TOOLTIP = 'Supercharge makes this role generate 4 full answer attempts, then run a 5th same-model call to choose or synthesize the best final answer. It uses 5x the API calls, so it is about 5x slower and 5x more costly, but can produce more intelligent answers.';
 
 // ModelSelector component - extracted outside to prevent recreation on every render
 const ModelSelector = ({
   provider,
   modelId,
   openrouterProv,
+  openrouterReasoningEffort,
   fallback,
   onProviderChange,
   onModelChange,
   onOpenrouterProviderChange,
+  onOpenrouterReasoningEffortChange,
   onFallbackChange,
   lmStudioModels,
   openRouterModels,
@@ -65,6 +75,9 @@ const ModelSelector = ({
   const providers = modelId && effectiveProvider === 'openrouter'
     ? getProviderNames(modelProviders[modelId])
     : [];
+  const reasoningInfo = effectiveProvider === 'openrouter'
+    ? getReasoningSupportInfo(modelProviders[modelId], openrouterProv || null)
+    : { hasEndpointMetadata: false, supportsReasoning: false };
 
   return (
     <>
@@ -139,6 +152,26 @@ const ModelSelector = ({
         </div>
       )}
 
+      {effectiveProvider === 'openrouter' && modelId && (
+        <div className="settings-row">
+          <label>Reasoning Effort</label>
+          <select
+            value={normalizeOpenRouterReasoningEffort(openrouterReasoningEffort)}
+            onChange={(e) => onOpenrouterReasoningEffortChange(e.target.value)}
+            disabled={isRunning}
+          >
+            {OPENROUTER_REASONING_EFFORT_OPTIONS.map(option => (
+              <option key={option.value} value={option.value}>{option.label}</option>
+            ))}
+          </select>
+          <small className="settings-hint">
+            {reasoningInfo.hasEndpointMetadata && !reasoningInfo.supportsReasoning
+              ? 'This selected host does not advertise reasoning support; OpenRouter may ignore the setting.'
+              : 'Auto sends OpenRouter max reasoning effort by default.'}
+          </small>
+        </div>
+      )}
+
       {/* LM Studio Fallback (if OpenRouter) */}
       {effectiveProvider === 'openrouter' && lmStudioEnabled && (
         <div className="settings-row">
@@ -178,21 +211,28 @@ const RoleConfig = ({
   modelProviders,
   hasOpenRouterKey,
   lmStudioEnabled,
+  developerModeEnabled = false,
+  showProofStrengthBadge = false,
 }) => {
   const storedProvider = localConfig[`${rolePrefix}_provider`] || 'lm_studio';
   const provider = lmStudioEnabled ? storedProvider : 'openrouter';
   const modelId = localConfig[`${rolePrefix}_model`] || '';
   const openrouterProv = localConfig[`${rolePrefix}_openrouter_provider`];
+  const openrouterReasoningEffort = localConfig[`${rolePrefix}_openrouter_reasoning_effort`];
   const fallback = localConfig[`${rolePrefix}_lm_studio_fallback`];
-  const contextWindow = localConfig[`${rolePrefix}_context_window`] || 131072;
-  const maxTokens = localConfig[`${rolePrefix}_max_tokens`] || 25000;
+  const contextWindow = localConfig[`${rolePrefix}_context_window`] || DEFAULT_CONTEXT_WINDOW;
+  const maxTokens = localConfig[`${rolePrefix}_max_tokens`] || DEFAULT_MAX_OUTPUT_TOKENS;
+  const superchargeEnabled = Boolean(localConfig[`${rolePrefix}_supercharge_enabled`]);
 
   return (
     <div className={`submitter-config-section${provider === 'openrouter' ? ' role-config-card--openrouter-orange' : ''}`} style={{
       borderColor: provider === 'openrouter' ? undefined : borderColor
     }}>
       <h5 className={provider === 'openrouter' ? 'card-title--orange' : ''} style={provider !== 'openrouter' ? { color: borderColor } : undefined}>
-        {title}
+        <span className="role-title-with-badges">
+          <span>{title}</span>
+          {showProofStrengthBadge && <ProofStrengthBadge />}
+        </span>
         {provider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
       </h5>
       {hint && <p className="settings-hint">{hint}</p>}
@@ -201,10 +241,12 @@ const RoleConfig = ({
         provider={provider}
         modelId={modelId}
         openrouterProv={openrouterProv}
+        openrouterReasoningEffort={openrouterReasoningEffort}
         fallback={fallback}
         onProviderChange={(p) => handleProviderChange(rolePrefix, p)}
         onModelChange={(m) => handleModelChange(rolePrefix, m)}
         onOpenrouterProviderChange={(p) => handleOpenRouterProviderChange(rolePrefix, p)}
+        onOpenrouterReasoningEffortChange={(effort) => handleChange(`${rolePrefix}_openrouter_reasoning_effort`, normalizeOpenRouterReasoningEffort(effort))}
         onFallbackChange={(f) => handleChange(`${rolePrefix}_lm_studio_fallback`, f)}
         lmStudioModels={lmStudioModels}
         openRouterModels={openRouterModels}
@@ -241,11 +283,40 @@ const RoleConfig = ({
           step={1000}
         />
       </div>
+
+      {developerModeEnabled && (
+        <div className="settings-row settings-row--inline-checkbox">
+          <label className="settings-checkbox-label settings-checkbox-label--supercharge">
+            <input
+              type="checkbox"
+              checked={superchargeEnabled}
+              onChange={(e) => handleChange(`${rolePrefix}_supercharge_enabled`, e.target.checked)}
+              disabled={isRunning}
+            />
+            <HelpTooltip
+              label="Learn about Supercharge"
+              buttonContent="Supercharge"
+              buttonClassName="help-tooltip-btn--text"
+              popupClassName="help-tooltip-popup--fixed"
+              useFixedPosition
+            >
+              {SUPERCHARGE_TOOLTIP}
+            </HelpTooltip>
+          </label>
+        </div>
+      )}
     </div>
   );
 };
 
-const AutonomousResearchSettings = ({ config, onConfigChange, models, capabilities, isRunning }) => {
+const AutonomousResearchSettings = ({
+  config,
+  onConfigChange,
+  models,
+  capabilities,
+  isRunning,
+  developerModeEnabled = false,
+}) => {
   // Models and OpenRouter state
   const [lmStudioModels, setLmStudioModels] = useState(models || []);
   const [openRouterModels, setOpenRouterModels] = useState([]);
@@ -257,14 +328,16 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
   const [freeModelAutoSelector, setFreeModelAutoSelector] = useState(true);
   const [tier3Enabled, setTier3Enabled] = useState(false);
   const [isLoadedFromStorage, setIsLoadedFromStorage] = useState(false);
-  const [showKothTooltip, setShowKothTooltip] = useState(false);
-  const [showTestedModelsTooltip, setShowTestedModelsTooltip] = useState(false);
 
   // Profile management state
   const [userProfiles, setUserProfiles] = useState({});
   const [selectedProfile, setSelectedProfile] = useState('');
   const [showSaveDialog, setShowSaveDialog] = useState(false);
   const [newProfileName, setNewProfileName] = useState('');
+  const [editRawSettings, setEditRawSettings] = useState(false);
+  const [rawSettingsText, setRawSettingsText] = useState('');
+  const [rawSettingsMessage, setRawSettingsMessage] = useState('');
+  const [guiSettingsBeforeRaw, setGuiSettingsBeforeRaw] = useState(null);
 
   // Wolfram Alpha settings (shared with compiler)
   const [wolframEnabled, setWolframEnabled] = useState(false);
@@ -278,7 +351,6 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
   const [proofSettingsLspEnabled, setProofSettingsLspEnabled] = useState(false);
   const [proofSettingsLspIdleTimeout, setProofSettingsLspIdleTimeout] = useState('600');
   const [proofSettingsSmtEnabled, setProofSettingsSmtEnabled] = useState(false);
-  const [proofSettingsZ3Path, setProofSettingsZ3Path] = useState('');
   const [proofSettingsSmtTimeout, setProofSettingsSmtTimeout] = useState('30');
   const [savingProofSettings, setSavingProofSettings] = useState(false);
   const [proofSettingsMessage, setProofSettingsMessage] = useState('');
@@ -293,6 +365,13 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
   const genericMode = Boolean(capabilities?.genericMode);
   const showLean4Settings = Boolean(lmStudioEnabled && proofStatus?.lean4_path && !genericMode);
 
+  useEffect(() => { // Whenever developer mode is off while raw-edit mode is on, leave raw-edit mode and clear its message.
+    if (!developerModeEnabled && editRawSettings) {
+      setEditRawSettings(false);
+      setRawSettingsMessage('');
+    }
+  }, [developerModeEnabled, editRawSettings]);
+
   const handleCollapsibleKeyDown = (event, toggleFn) => {
     if (event.key === 'Enter' || event.key === ' ') {
       event.preventDefault();
@@ -305,7 +384,8 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
     if (cfg?.submitter_configs && Array.isArray(cfg.submitter_configs)) {
       return cfg.submitter_configs.map(c => ({
         ...DEFAULT_SUBMITTER_CONFIG,
-        ...c
+        ...c,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(c.openrouterReasoningEffort || c.openrouter_reasoning_effort),
       }));
     }
     return [
@@ -327,30 +407,38 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
     validator_provider: 'lm_studio',
     validator_model: '',
     validator_openrouter_provider: null,
+    validator_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
     validator_lm_studio_fallback: null,
-    validator_context_window: 131072,
-    validator_max_tokens: 25000,
+    validator_context_window: DEFAULT_CONTEXT_WINDOW,
+    validator_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+    validator_supercharge_enabled: false,
     // High-Context
     high_context_provider: 'lm_studio',
     high_context_model: '',
     high_context_openrouter_provider: null,
+    high_context_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
     high_context_lm_studio_fallback: null,
-    high_context_context_window: 131072,
-    high_context_max_tokens: 25000,
+    high_context_context_window: DEFAULT_CONTEXT_WINDOW,
+    high_context_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+    high_context_supercharge_enabled: false,
     // High-Param
     high_param_provider: 'lm_studio',
     high_param_model: '',
     high_param_openrouter_provider: null,
+    high_param_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
     high_param_lm_studio_fallback: null,
-    high_param_context_window: 131072,
-    high_param_max_tokens: 25000,
+    high_param_context_window: DEFAULT_CONTEXT_WINDOW,
+    high_param_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+    high_param_supercharge_enabled: false,
     // Critique Submitter
     critique_submitter_provider: 'lm_studio',
     critique_submitter_model: '',
     critique_submitter_openrouter_provider: null,
+    critique_submitter_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
     critique_submitter_lm_studio_fallback: null,
-    critique_submitter_context_window: 131072,
-    critique_submitter_max_tokens: 25000,
+    critique_submitter_context_window: DEFAULT_CONTEXT_WINDOW,
+    critique_submitter_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+    critique_submitter_supercharge_enabled: false,
     ...config
   });
 
@@ -371,6 +459,7 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
             normalized_submitter.modelId = normalized.submitters[0].modelId;
             normalized_submitter.provider = normalized.submitters[0].provider || 'openrouter';
             normalized_submitter.openrouterProvider = normalized.submitters[0].openrouterProvider || null;
+            normalized_submitter.openrouterReasoningEffort = normalizeOpenRouterReasoningEffort(normalized.submitters[0].openrouterReasoningEffort);
             normalized_submitter.lmStudioFallbackId = normalized.submitters[0].lmStudioFallbackId || null;
             console.log(`[Profile Normalization] Fixed blank submitter 3: using "${normalized_submitter.modelId}"`);
           }
@@ -488,7 +577,6 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
         setProofSettingsLspEnabled(Boolean(status.lean4_lsp_enabled));
         setProofSettingsLspIdleTimeout(String(status.lean4_lsp_idle_timeout ?? 600));
         setProofSettingsSmtEnabled(Boolean(status.smt_enabled));
-        setProofSettingsZ3Path(status.z3_path || '');
         setProofSettingsSmtTimeout(String(status.smt_timeout ?? 30));
       } catch (err) {
         console.error('Failed to load Lean 4 proof status:', err);
@@ -562,6 +650,7 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
         provider: 'openrouter',
         modelId: keepOpenRouterState ? (submitterConfig.modelId || '') : '',
         openrouterProvider: keepOpenRouterState ? (submitterConfig.openrouterProvider || null) : null,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(submitterConfig.openrouterReasoningEffort),
         lmStudioFallbackId: null,
       };
     });
@@ -571,6 +660,7 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
       const providerKey = `${rolePrefix}_provider`;
       const modelKey = `${rolePrefix}_model`;
       const openRouterProviderKey = `${rolePrefix}_openrouter_provider`;
+      const reasoningEffortKey = `${rolePrefix}_openrouter_reasoning_effort`;
       const fallbackKey = `${rolePrefix}_lm_studio_fallback`;
       const keepOpenRouterState = normalizedLocalConfig[providerKey] === 'openrouter';
 
@@ -579,6 +669,7 @@ const AutonomousResearchSettings = ({ config, onConfigChange, models, capabiliti
       normalizedLocalConfig[openRouterProviderKey] = keepOpenRouterState
         ? (normalizedLocalConfig[openRouterProviderKey] || null)
         : null;
+      normalizedLocalConfig[reasoningEffortKey] = normalizeOpenRouterReasoningEffort(normalizedLocalConfig[reasoningEffortKey]);
       normalizedLocalConfig[fallbackKey] = null;
     });
 
@@ -794,7 +885,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     if (numericFields.includes(field)) {
       const parsed = parseInt(value, 10);
       const isContextField = field.includes('context_window');
-      const finalValue = isNaN(parsed) ? (isContextField ? 131072 : 25000) : parsed;
+      const finalValue = isNaN(parsed) ? (isContextField ? DEFAULT_CONTEXT_WINDOW : DEFAULT_MAX_OUTPUT_TOKENS) : parsed;
       
       const newConfig = { ...localConfig, [field]: finalValue };
       markProfileAsCustom();
@@ -806,7 +897,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   // Handle provider change for a role (keeps existing model settings)
   const handleProviderChange = (rolePrefix, provider) => {
     const updates = {
-      [`${rolePrefix}_provider`]: provider
+      [`${rolePrefix}_provider`]: provider,
+      [`${rolePrefix}_openrouter_reasoning_effort`]: DEFAULT_OPENROUTER_REASONING_EFFORT
       // Keep existing model, openrouter_provider, and lm_studio_fallback - don't reset them
     };
     const newConfig = { ...localConfig, ...updates };
@@ -821,6 +913,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       ...localConfig,
       [`${rolePrefix}_model`]: modelId,
       [`${rolePrefix}_openrouter_provider`]: null,
+      [`${rolePrefix}_openrouter_reasoning_effort`]: DEFAULT_OPENROUTER_REASONING_EFFORT,
     };
     markProfileAsCustom();
     setLocalConfig(newConfig);
@@ -931,6 +1024,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         provider: newValue,
         modelId: '',
         openrouterProvider: null,
+        openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
         lmStudioFallbackId: null
       };
     } else {
@@ -955,6 +1049,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       ...newConfigs[index],
       modelId,
       openrouterProvider: null,
+      openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
     };
 
     markProfileAsCustom();
@@ -1019,7 +1114,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     
     if (numericFields.includes(field)) {
       const parsed = parseInt(value, 10);
-      const finalValue = isNaN(parsed) ? (field === 'contextWindow' ? 131072 : 25000) : parsed;
+      const finalValue = isNaN(parsed) ? (field === 'contextWindow' ? DEFAULT_CONTEXT_WINDOW : DEFAULT_MAX_OUTPUT_TOKENS) : parsed;
       
       const newConfigs = [...submitterConfigs];
       newConfigs[index] = {
@@ -1042,9 +1137,11 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         provider: main.provider,
         modelId: main.modelId,
         openrouterProvider: main.openrouterProvider,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(main.openrouterReasoningEffort),
         lmStudioFallbackId: main.lmStudioFallbackId,
         contextWindow: main.contextWindow,
-        maxOutputTokens: main.maxOutputTokens
+        maxOutputTokens: main.maxOutputTokens,
+        superchargeEnabled: Boolean(main.superchargeEnabled)
       }));
       markProfileAsCustom();
       setSubmitterConfigs(newConfigs);
@@ -1121,7 +1218,6 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         lean4_lsp_enabled: proofSettingsLspEnabled,
         lean4_lsp_idle_timeout: lspIdleTimeout,
         smt_enabled: proofSettingsSmtEnabled,
-        z3_path: proofSettingsZ3Path,
         smt_timeout: smtTimeout,
       });
       setProofStatus(status);
@@ -1130,7 +1226,6 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       setProofSettingsLspEnabled(Boolean(status.lean4_lsp_enabled));
       setProofSettingsLspIdleTimeout(String(status.lean4_lsp_idle_timeout ?? lspIdleTimeout));
       setProofSettingsSmtEnabled(Boolean(status.smt_enabled));
-      setProofSettingsZ3Path(status.z3_path || '');
       setProofSettingsSmtTimeout(String(status.smt_timeout ?? smtTimeout));
       setProofSettingsMessage('Lean 4 / SMT proof settings saved.');
     } catch (err) {
@@ -1186,41 +1281,51 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         modelId: cfg.modelId,
         provider: cfg.provider,
         openrouterProvider: cfg.openrouterProvider,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(cfg.openrouterReasoningEffort),
         lmStudioFallbackId: cfg.lmStudioFallbackId,
         contextWindow: cfg.contextWindow,
-        maxOutputTokens: cfg.maxOutputTokens
+        maxOutputTokens: cfg.maxOutputTokens,
+        superchargeEnabled: Boolean(cfg.superchargeEnabled)
       })),
       validator: {
         modelId: localConfig.validator_model,
         provider: localConfig.validator_provider,
         openrouterProvider: localConfig.validator_openrouter_provider,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(localConfig.validator_openrouter_reasoning_effort),
         lmStudioFallbackId: localConfig.validator_lm_studio_fallback,
         contextWindow: localConfig.validator_context_window,
-        maxOutputTokens: localConfig.validator_max_tokens
+        maxOutputTokens: localConfig.validator_max_tokens,
+        superchargeEnabled: Boolean(localConfig.validator_supercharge_enabled)
       },
       highContext: {
         modelId: localConfig.high_context_model,
         provider: localConfig.high_context_provider,
         openrouterProvider: localConfig.high_context_openrouter_provider,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(localConfig.high_context_openrouter_reasoning_effort),
         lmStudioFallbackId: localConfig.high_context_lm_studio_fallback,
         contextWindow: localConfig.high_context_context_window,
-        maxOutputTokens: localConfig.high_context_max_tokens
+        maxOutputTokens: localConfig.high_context_max_tokens,
+        superchargeEnabled: Boolean(localConfig.high_context_supercharge_enabled)
       },
       highParam: {
         modelId: localConfig.high_param_model,
         provider: localConfig.high_param_provider,
         openrouterProvider: localConfig.high_param_openrouter_provider,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(localConfig.high_param_openrouter_reasoning_effort),
         lmStudioFallbackId: localConfig.high_param_lm_studio_fallback,
         contextWindow: localConfig.high_param_context_window,
-        maxOutputTokens: localConfig.high_param_max_tokens
+        maxOutputTokens: localConfig.high_param_max_tokens,
+        superchargeEnabled: Boolean(localConfig.high_param_supercharge_enabled)
       },
       critique: {
         modelId: localConfig.critique_submitter_model,
         provider: localConfig.critique_submitter_provider,
         openrouterProvider: localConfig.critique_submitter_openrouter_provider,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(localConfig.critique_submitter_openrouter_reasoning_effort),
         lmStudioFallbackId: localConfig.critique_submitter_lm_studio_fallback,
         contextWindow: localConfig.critique_submitter_context_window,
-        maxOutputTokens: localConfig.critique_submitter_max_tokens
+        maxOutputTokens: localConfig.critique_submitter_max_tokens,
+        superchargeEnabled: Boolean(localConfig.critique_submitter_supercharge_enabled)
       }
     };
 
@@ -1260,206 +1365,81 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     }
   };
 
-  return (
-    <div className="autonomous-settings-layout">
-      {/* Left Sidebar - Known Compatible Models */}
-      <div className="settings-left-sidebar">
-        <div className="known-models-sidebar">
-          <h3 className="flex-row-center">
-            <span>Highlighted Models</span>
-            <div className="help-tooltip-anchor">
-              <button
-                type="button"
-                className="help-tooltip-btn"
-                aria-label="Learn about highlighted models"
-                onMouseEnter={() => setShowTestedModelsTooltip(true)}
-                onMouseLeave={() => setShowTestedModelsTooltip(false)}
-                onFocus={() => setShowTestedModelsTooltip(true)}
-                onBlur={() => setShowTestedModelsTooltip(false)}
-              >
-                ?
-              </button>
-              {showTestedModelsTooltip && (
-                /* sidebar-escape: fixed positioning so the tooltip breaks out of the
-                   322px sidebar and renders freely. See index.css for coords. */
-                <div className="help-tooltip-popup help-tooltip-popup--sidebar-escape">
-                  The models and hosts listed here are not affiliated with MOTO or Intrafere LLC. This chart reflects developer-tested configurations intended to help guide model selection. All statements regarding pricing, performance, roles, rankings, or capabilities are speculative and based on individual testing experience. Intrafere LLC and the MOTO development team make no guarantees about the accuracy of this chart. MOTO is compatible with the majority of models, including many not listed here.
-                </div>
-              )}
-            </div>
-          </h3>
-          <p className="hint-text hint-text--dim" style={{ marginLeft: '20px', marginBottom: '0.45rem' }}>
-            Note: Most models over 20 billion parameters are compatible with MOTO.
-          </p>
-          <div className="models-list">
-            {/* Podium - Top 3 */}
-            <div className="models-podium">
-              <div className="models-podium-label">Leaderboard</div>
-              <div className="model-item model-item--ranked model-item--gold model-item--os">
-                <OsTag />
-                <div className="flex-row-center">
-                  <div className="model-item-name">Kimi K2.6</div>
-                  <div
-                    className="help-tooltip-anchor"
-                    style={{ zIndex: 100 }}
-                    aria-label="Learn about the King of the Hill ranking"
-                    onMouseEnter={() => setShowKothTooltip(true)}
-                    onMouseLeave={() => setShowKothTooltip(false)}
-                    onFocus={() => setShowKothTooltip(true)}
-                    onBlur={() => setShowKothTooltip(false)}
-                    tabIndex={0}
-                  >
-                    <div className="ranking-badge ranking-badge--gold">👑 KING OF THE HILL</div>
-                    {showKothTooltip && (
-                      <div
-                        className="help-tooltip-popup"
-                        style={{ top: 'auto', bottom: 'calc(100% + 10px)', left: 'calc(100% + 10px)', right: 'auto' }}
-                      >
-                        This model was chosen by the Intrafere developers as the best overall performer in the MOTO harness, optimized for cost, speed, and knowledge.
-                      </div>
-                    )}
-                  </div>
-                </div>
-                <div className="model-item-badge">Highly knowledgeable and balanced cost</div>
-              </div>
-
-              <div className="model-item model-item--ranked model-item--silver">
-                <div className="flex-row-center">
-                  <div className="model-item-name">Grok 4.1 Fast</div>
-                  <div className="ranking-badge ranking-badge--silver">🥈 SILVER</div>
-                </div>
-                <div className="model-item-badge">Fast validator</div>
-              </div>
+  const getAutonomousRawSettings = () => ({
+    numSubmitters,
+    submitterConfigs: submitterConfigs.slice(0, numSubmitters),
+    localConfig,
+    freeOnly,
+    freeModelLooping,
+    freeModelAutoSelector,
+    tier3Enabled,
+    modelProviders,
+    selectedProfile,
+  });
 
-              <div className="model-item model-item--ranked model-item--bronze model-item--os">
-                <OsTag />
-                <div className="flex-row-center">
-                  <div className="model-item-name">GPT OSS 120B</div>
-                  <div className="ranking-badge ranking-badge--bronze">🥉 BRONZE</div>
-                </div>
-                <div className="model-item-badge">Balanced knowledge and speed at low cost</div>
-              </div>
-            </div>
+  const applyAutonomousRawSettings = (rawSettings, { updateRawText = true } = {}) => {
+    const nextSettings = persistAutonomousSettings({
+      numSubmitters: rawSettings.numSubmitters,
+      submitterConfigs: rawSettings.submitterConfigs,
+      localConfig: rawSettings.localConfig,
+      freeOnly: rawSettings.freeOnly,
+      freeModelLooping: rawSettings.freeModelLooping,
+      freeModelAutoSelector: rawSettings.freeModelAutoSelector,
+      tier3Enabled: rawSettings.tier3Enabled,
+      modelProviders: rawSettings.modelProviders,
+      selectedProfile: rawSettings.selectedProfile,
+    });
 
-            {/* Alphabetical list (rest of models) */}
+    setNumSubmitters(nextSettings.numSubmitters);
+    setSubmitterConfigs(nextSettings.submitterConfigs);
+    setLocalConfig(nextSettings.localConfig);
+    setFreeOnly(nextSettings.freeOnly);
+    setFreeModelLooping(nextSettings.freeModelLooping);
+    setFreeModelAutoSelector(nextSettings.freeModelAutoSelector);
+    setTier3Enabled(nextSettings.tier3Enabled);
+    setModelProviders(nextSettings.modelProviders || {});
+    setSelectedProfile(nextSettings.selectedProfile || '');
+    onConfigChange(settingsToAutonomousConfig(nextSettings));
+
+    if (updateRawText) {
+      setRawSettingsText(formatRawSettings(nextSettings));
+    }
+  };
 
-            <div className="model-item">
-              <div className="model-item-name">Arcee AI's Trinity Large</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">Amazon Nova Pro/Premier</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">Claude Opus/Sonnet</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">DeepSeek</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">Gemini Flash</div>
-              <div className="model-item-badge">Fast validator</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">Gemini Pro</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">Google's Gemma</div>
-              <div className="model-item-badge">Balanced knowledge and speed</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">GLM</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">GLM Turbo</div>
-              <div className="model-item-badge">Fast validator</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">GPT Codex</div>
-              <div className="model-item-badge">Computer science</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">OpenAI's GPT OSS</div>
-              <div className="model-item-badge">Balanced knowledge and speed</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">Grok</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">ChatGPT</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
+  const handleRawEditToggle = (checked) => {
+    if (checked) {
+      const currentSettings = getAutonomousRawSettings();
+      setGuiSettingsBeforeRaw(currentSettings);
+      setRawSettingsText(formatRawSettings(currentSettings));
+      setRawSettingsMessage('');
+      setEditRawSettings(true);
+      return;
+    }
 
-            <div className="model-item">
-              <div className="model-item-name">Inception's Mercury</div>
-              <div className="model-item-badge">Rapid knowledge</div>
-            </div>
+    if (!confirm(RAW_VIEW_EXIT_WARNING)) {
+      return;
+    }
 
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">Nemotron Super</div>
-              <div className="model-item-badge">Balanced knowledge and speed</div>
-            </div>
+    if (guiSettingsBeforeRaw) {
+      applyAutonomousRawSettings(guiSettingsBeforeRaw, { updateRawText: false });
+    }
+    setRawSettingsMessage('');
+    setEditRawSettings(false);
+  };
 
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">Nous Hermes</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item">
-              <div className="model-item-name">Perplexity's Sonar</div>
-              <div className="model-item-badge">Native internet search capability</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">Microsoft's Phi</div>
-              <div className="model-item-badge">Balanced knowledge and speed</div>
-            </div>
+  const saveRawSettings = () => {
+    try {
+      const parsed = JSON.parse(rawSettingsText);
+      applyAutonomousRawSettings(parsed);
+      setRawSettingsMessage('Saved raw settings.');
+    } catch (error) {
+      setRawSettingsMessage(`Invalid JSON: ${error.message}`);
+    }
+  };
 
-            <div className="model-item">
-              <div className="model-item-name">MiniMax</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">Qwen Coder</div>
-              <div className="model-item-badge">Computer science</div>
-            </div>
-            
-            <div className="model-item model-item--os">
-              <OsTag />
-              <div className="model-item-name">Qwen</div>
-              <div className="model-item-badge">Highly knowledgeable</div>
-            </div>
-          </div>
-        </div>
-      </div>
+  return (
+    <div className="autonomous-settings-layout">
+      <HighlightedModelsSidebar />
 
       {/* Main Content Area */}
       <div className="autonomous-settings">
@@ -1471,23 +1451,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         </p>
         
         <div className="settings-row">
-          <label>
-            Select Profile
-            <HelpTooltip
-              label="Learn how profile selection works"
-              anchorClassName="help-tooltip-anchor--inline"
-              buttonClassName="help-tooltip-btn--green"
-              useFixedPosition
-            >
-              <strong>Profile menu guide</strong>
-              <br /><br />
-              <code>-- Custom Settings --</code> means no saved profile is currently loaded, so you are editing the settings manually.
-              <br /><br />
-              <code>Recommended Profiles</code> are preselected example profiles you can load as starting points.
-              <br /><br />
-              <code>My Profiles</code> contains any custom profiles you save from your current settings.
-            </HelpTooltip>
-          </label>
+          <label>Select Profile</label>
           <select
             value={selectedProfile}
             onChange={(e) => {
@@ -1655,8 +1619,36 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             </label>
           </>
         )}
+        {developerModeEnabled ? (
+          <label
+            className="settings-checkbox-label model-refresh-controls__toggle"
+            style={{ cursor: isRunning ? 'not-allowed' : 'pointer' }}
+          >
+            <input
+              type="checkbox"
+              checked={editRawSettings}
+              onChange={(e) => handleRawEditToggle(e.target.checked)}
+              disabled={isRunning}
+            />
+            Edit Raw
+          </label>
+        ) : (
+          <span className="settings-developer-mode-hint">
+            Developer mode: press Shift + Z + X to toggle raw JSON settings.
+          </span>
+        )}
       </div>
 
+      {editRawSettings ? (
+        <RawSettingsEditor
+          value={rawSettingsText}
+          onChange={setRawSettingsText}
+          onSave={saveRawSettings}
+          message={rawSettingsMessage}
+          disabled={isRunning}
+        />
+      ) : (
+        <>
       {/* Brainstorm Submitters Section */}
       <div className="settings-group">
         <h4>Brainstorm Submitters (Tier 1 Aggregation)</h4>
@@ -1700,7 +1692,10 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
             className={`submitter-config-section${effectiveProvider === 'openrouter' ? ' role-config-card--openrouter-orange' : (idx === 0 ? ' role-config-card--main' : '')}`}
           >
             <h5 className={effectiveProvider === 'openrouter' ? 'card-title--orange' : (idx === 0 ? 'card-title--green' : '')}>
-              {idx === 0 ? 'Submitter 1 (Main Submitter)' : `Submitter ${idx + 1}`}
+              <span className="role-title-with-badges">
+                <span>{idx === 0 ? 'Submitter 1 (Main Submitter)' : `Submitter ${idx + 1}`}</span>
+                {idx === 0 && <ProofStrengthBadge />}
+              </span>
               {effectiveProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
             </h5>
             
@@ -1708,10 +1703,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               provider={cfg.provider}
               modelId={cfg.modelId}
               openrouterProv={cfg.openrouterProvider}
+              openrouterReasoningEffort={cfg.openrouterReasoningEffort}
               fallback={cfg.lmStudioFallbackId}
               onProviderChange={(p) => handleSubmitterConfigChange(idx, 'provider', p)}
               onModelChange={(m) => handleSubmitterModelChange(idx, m)}
               onOpenrouterProviderChange={(p) => handleSubmitterOpenRouterProviderChange(idx, p)}
+              onOpenrouterReasoningEffortChange={(effort) => handleSubmitterConfigChange(idx, 'openrouterReasoningEffort', normalizeOpenRouterReasoningEffort(effort))}
               onFallbackChange={(f) => handleSubmitterConfigChange(idx, 'lmStudioFallbackId', f)}
               lmStudioModels={lmStudioModels}
               openRouterModels={openRouterModels}
@@ -1748,6 +1745,28 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 step={1000}
               />
             </div>
+
+            {developerModeEnabled && (
+              <div className="settings-row settings-row--inline-checkbox">
+                <label className="settings-checkbox-label settings-checkbox-label--supercharge">
+                  <input
+                    type="checkbox"
+                    checked={Boolean(cfg.superchargeEnabled)}
+                    onChange={(e) => handleSubmitterConfigChange(idx, 'superchargeEnabled', e.target.checked)}
+                    disabled={isRunning}
+                  />
+                  <HelpTooltip
+                    label="Learn about Supercharge"
+                    buttonContent="Supercharge"
+                    buttonClassName="help-tooltip-btn--text"
+                    popupClassName="help-tooltip-popup--fixed"
+                    useFixedPosition
+                  >
+                    {SUPERCHARGE_TOOLTIP}
+                  </HelpTooltip>
+                </label>
+              </div>
+            )}
           </div>
             );
           })()
@@ -1777,6 +1796,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
           lmStudioEnabled={lmStudioEnabled}
+          developerModeEnabled={developerModeEnabled}
         />
       </div>
 
@@ -1804,6 +1824,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
           lmStudioEnabled={lmStudioEnabled}
+          developerModeEnabled={developerModeEnabled}
+          showProofStrengthBadge
         />
 
         <RoleConfig
@@ -1823,11 +1845,13 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
           lmStudioEnabled={lmStudioEnabled}
+          developerModeEnabled={developerModeEnabled}
+          showProofStrengthBadge
         />
 
         <RoleConfig
           title="Critique Submitter"
-          hint="Handles post-body peer review feedback and rewrite decisions."
+          hint="Handles post-body peer review feedback for the AI self-review section."
           rolePrefix="critique_submitter"
           borderColor="#e74c3c"
           localConfig={localConfig}
@@ -1842,6 +1866,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           modelProviders={modelProviders}
           hasOpenRouterKey={hasOpenRouterKey}
           lmStudioEnabled={lmStudioEnabled}
+          developerModeEnabled={developerModeEnabled}
         />
       </div>
 
@@ -2020,13 +2045,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
                   <div className="settings-row">
                     <label>Z3 Binary Path</label>
-                    <input
-                      type="text"
-                      value={proofSettingsZ3Path}
-                      onChange={(e) => setProofSettingsZ3Path(e.target.value)}
-                      disabled={isRunning || savingProofSettings}
-                      placeholder="Optional explicit z3 path"
-                    />
+                    <div>
+                      <strong>{proofStatus?.z3_path || 'System PATH lookup'}</strong>
+                      <small className="settings-hint" style={{ display: 'block', marginTop: '0.35rem' }}>
+                        Configure this only through trusted startup environment settings.
+                      </small>
+                    </div>
                   </div>
 
                   <div className="settings-row">
@@ -2340,6 +2364,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           </div>
         )}
       </div>
+        </>
+      )}
     </div>
     </div>
   );
diff --git a/frontend/src/components/autonomous/BrainstormList.jsx b/frontend/src/components/autonomous/BrainstormList.jsx
index 6633a7c..df5b1f8 100644
--- a/frontend/src/components/autonomous/BrainstormList.jsx
+++ b/frontend/src/components/autonomous/BrainstormList.jsx
@@ -267,17 +267,14 @@ const BrainstormList = ({ brainstorms, onRefresh, api }) => {
                     : proofCheckState?.status === 'running'
                       ? `Proof Check Running${proofCheckState.candidateCount ? ` (${proofCheckState.candidateCount})` : '...'}`
                       : 'Try to prove with Lean 4 theorem prover';
-                  const disabledReason = brainstorm.status !== 'complete'
-                    ? 'Manual proof checks require a completed brainstorm.'
-                    : manualCheckReason;
                   return (
                     <button
                       className="btn-download-small"
                       onClick={(e) => handleProofCheck(e, brainstorm)}
-                      disabled={!manualCheckEnabled || Boolean(proofCheckState) || brainstorm.status !== 'complete'}
+                      disabled={!manualCheckEnabled || Boolean(proofCheckState)}
                       title={proofCheckState?.status === 'running'
                         ? 'A proof verification is already running for this brainstorm.'
-                        : disabledReason || 'Queue a manual proof check for this brainstorm.'}
+                        : manualCheckReason || 'Queue a manual proof check for this brainstorm.'}
                     >
                       {proofCheckLabel}
                     </button>
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.css b/frontend/src/components/autonomous/FinalAnswerLibrary.css
index 84fa075..4beda71 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.css
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.css
@@ -222,6 +222,83 @@
   box-shadow: 0 8px 24px rgba(30, 255, 28, 0.12);
 }
 
+.pruned-papers-expansion { /* Wrapper for a run's pruned-papers section, set off by a top rule */
+  margin-top: 16px;
+  border-top: 1px solid rgba(156, 163, 175, 0.18);
+  padding-top: 14px;
+}
+
+.pruned-papers-toggle { /* Full-width button that expands/collapses the pruned-papers list */
+  width: 100%;
+  text-align: left;
+  padding: 10px 14px;
+  border-radius: 8px;
+  border: 1px solid rgba(156, 163, 175, 0.28);
+  background: rgba(75, 85, 99, 0.22);
+  color: #d1d5db;
+  cursor: pointer;
+  font-weight: 700;
+}
+
+.pruned-papers-list { /* Vertical stack of pruned-paper cards */
+  display: flex;
+  flex-direction: column;
+  gap: 10px;
+  margin-top: 10px;
+}
+
+.pruned-paper-card { /* Clickable card for one pruned paper; grey palette, dimmed by default */
+  padding: 14px;
+  border-radius: 10px;
+  border: 1px solid rgba(156, 163, 175, 0.26);
+  background: linear-gradient(180deg, rgba(75, 85, 99, 0.2) 0%, rgba(31, 41, 55, 0.6) 100%);
+  color: #d1d5db;
+  cursor: pointer;
+  opacity: 0.78;
+}
+
+.pruned-paper-card.expanded { /* Expanded card: brighter border and nearly full opacity */
+  border-color: rgba(209, 213, 219, 0.45);
+  opacity: 0.95;
+}
+
+.pruned-paper-card h4 { /* Paper title */
+  margin: 8px 0;
+  color: #e5e7eb;
+}
+
+.pruned-paper-card p { /* Note text shown under the title */
+  margin: 0 0 10px;
+  color: #cbd5e1;
+  font-size: 0.86rem;
+}
+
+.pruned-paper-card-header { /* Wrapping row holding the badge, paper id and word count */
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  flex-wrap: wrap;
+  font-size: 0.78rem;
+}
+
+.stage2-history-pruned-badge { /* Pill-shaped uppercase "Pruned Paper" label */
+  display: inline-flex;
+  align-items: center;
+  padding: 0.18rem 0.5rem;
+  border-radius: 999px;
+  background: rgba(156, 163, 175, 0.18);
+  border: 1px solid rgba(156, 163, 175, 0.34);
+  color: #d1d5db;
+  font-size: 0.7rem;
+  font-weight: 700;
+  text-transform: uppercase;
+  letter-spacing: 0.04em;
+}
+
+.pruned-paper-content { /* Spacing above the inline content preview of an expanded card */
+  margin-top: 12px;
+}
+
 .run-history-group .answer-list {
   gap: 14px;
 }
diff --git a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
index 8b700e5..949047e 100644
--- a/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
+++ b/frontend/src/components/autonomous/FinalAnswerLibrary.jsx
@@ -24,6 +24,7 @@ import './FinalAnswerLibrary.css';
 function FinalAnswerLibrary() {
   const [finalAnswers, setFinalAnswers] = useState([]);
   const [stage2Papers, setStage2Papers] = useState([]);
+  const [prunedPapers, setPrunedPapers] = useState([]);
   const [sessionsResponse, setSessionsResponse] = useState(null);
   const [loading, setLoading] = useState(true);
   const [error, setError] = useState(null);
@@ -33,6 +34,10 @@ function FinalAnswerLibrary() {
   const [filterFormat, setFilterFormat] = useState('all'); // 'all', 'short_form', 'long_form'
   const [showLatex, setShowLatex] = useState(false); // Raw text by default for performance with large docs
   const [downloadingPDF, setDownloadingPDF] = useState(null); // Track which answer is generating PDF
+  const [expandedPrunedRuns, setExpandedPrunedRuns] = useState({});
+  const [expandedPrunedPaperId, setExpandedPrunedPaperId] = useState(null);
+  const [expandedPrunedContent, setExpandedPrunedContent] = useState(null);
+  const [downloadingPrunedPDF, setDownloadingPrunedPDF] = useState(null);
   
   // Critique modal state
   const [critiqueModalOpen, setCritiqueModalOpen] = useState(false);
@@ -47,7 +52,7 @@ function FinalAnswerLibrary() {
       setLoading(true);
       setError(null);
 
-      const [answersResult, sessionsResult, papersResult] = await Promise.allSettled([
+      const [answersResult, sessionsResult, papersResult, prunedPapersResult] = await Promise.allSettled([
         fetch('/api/auto-research/final-answer-library').then(async (response) => {
           if (!response.ok) {
             throw new Error('Failed to load final answer library');
@@ -56,6 +61,7 @@ function FinalAnswerLibrary() {
         }),
         autonomousAPI.getSessions(),
         autonomousAPI.getPaperHistory(),
+        autonomousAPI.getPrunedPaperHistory(),
       ]);
 
       if (answersResult.status !== 'fulfilled') {
@@ -81,6 +87,13 @@ function FinalAnswerLibrary() {
         setStage2Papers([]);
         console.warn('Stage 3 history: failed to load Stage 2 paper metadata', papersResult.reason);
       }
+
+      if (prunedPapersResult.status === 'fulfilled') {
+        setPrunedPapers(prunedPapersResult.value.papers || []);
+      } else {
+        setPrunedPapers([]);
+        console.warn('Stage 3 history: failed to load pruned paper metadata', prunedPapersResult.reason);
+      }
     } catch (err) {
       setError(`Error loading library: ${err.message}`);
       console.error('Failed to load final answer library:', err);
@@ -196,6 +209,65 @@ function FinalAnswerLibrary() {
     }
   };
 
+  const loadPrunedPaperContent = async (paper) => {
+    if (expandedPrunedPaperId === paper.history_id) {
+      setExpandedPrunedPaperId(null);
+      setExpandedPrunedContent(null);
+      return;
+    }
+
+    const data = await autonomousAPI.getPrunedHistoryPaper(paper.session_id, paper.paper_id);
+    setExpandedPrunedPaperId(paper.history_id);
+    setExpandedPrunedContent(data);
+  };
+
+  const downloadPrunedRaw = async (e, paper) => { // Fetch a pruned paper and pass its text to downloadRawText.
+    e.stopPropagation(); // Keep the click from reaching the enclosing card's onClick (which toggles the preview).
+    try {
+      const data = await autonomousAPI.getPrunedHistoryPaper(paper.session_id, paper.paper_id);
+      const filename = sanitizeFilename(`pruned_${paper.session_id}_${paper.paper_id}_${paper.title}`);
+      downloadRawText(data.content || '', filename, data.outline || ''); // Missing content/outline fall back to ''.
+    } catch (err) { // Fetch and download failures are logged and surfaced to the user.
+      console.error('Pruned paper download failed:', err);
+      alert(`Download failed: ${err.message}`);
+    }
+  };
+
+  const downloadPrunedPDF = async (e, paper) => { // Fetch a pruned paper and hand it to downloadPDFViaBackend.
+    e.stopPropagation(); // Keep the click from reaching the enclosing card's onClick (which toggles the preview).
+    if (downloadingPrunedPDF) { // Refuse a second request while any pruned-paper PDF is flagged as in progress.
+      alert('Already preparing a PDF, please wait...');
+      return;
+    }
+
+    try { // NOTE(review): the in-progress flag is only set by a callback below, i.e. after this fetch resolves.
+      const data = await autonomousAPI.getPrunedHistoryPaper(paper.session_id, paper.paper_id);
+      const filename = sanitizeFilename(`pruned_${paper.session_id}_${paper.paper_id}_${paper.title}`);
+      await downloadPDFViaBackend(
+        data.content || '',
+        { // Metadata passed along with the content; values come from the list entry, title prefers the fetched one.
+          title: data.title || paper.title,
+          wordCount: paper.word_count,
+          date: paper.created_at ? new Date(paper.created_at).toLocaleDateString() : new Date().toLocaleDateString(),
+          models: paper.model_usage ? Object.keys(paper.model_usage).join(', ') : null,
+        },
+        filename,
+        data.outline || null,
+        () => setDownloadingPrunedPDF(paper.history_id), // presumably the "started" callback; confirm against downloadPDFViaBackend
+        () => setDownloadingPrunedPDF(null), // presumably the "finished" callback; confirm against downloadPDFViaBackend
+        (error) => { // presumably the failure callback; confirm against downloadPDFViaBackend
+          setDownloadingPrunedPDF(null);
+          console.error('Pruned paper PDF generation failed:', error);
+          alert(`PDF generation failed: ${error.message}`);
+        },
+      );
+    } catch (error) { // Covers a failed fetch or a rejection from downloadPDFViaBackend; always clears the flag.
+      setDownloadingPrunedPDF(null);
+      console.error('Pruned paper PDF generation failed:', error);
+      alert(`Failed to generate PDF: ${error.message}`);
+    }
+  };
+
   const getCertaintyBadgeColor = (level) => {
     switch (level) {
       case 'total_answer': return '#2d5f2d';
@@ -254,6 +326,16 @@ function FinalAnswerLibrary() {
       .filter((runGroup) => runGroup.visibleStage3Answers.length > 0);
   }, [runGroups, filterFormat, searchTerm]);
 
+  const prunedPapersBySession = useMemo(() => {
+    const grouped = new Map();
+    for (const paper of prunedPapers) {
+      const sessionPapers = grouped.get(paper.session_id) || [];
+      sessionPapers.push(paper);
+      grouped.set(paper.session_id, sessionPapers);
+    }
+    return grouped;
+  }, [prunedPapers]);
+
   if (loading) {
     return (
       <div className="final-answer-library">
@@ -523,6 +605,63 @@ function FinalAnswerLibrary() {
                     </div>
                   ))}
                 </div>
+                {(prunedPapersBySession.get(runGroup.sessionId) || []).length > 0 && (
+                  <div className="pruned-papers-expansion">
+                    <button
+                      className="pruned-papers-toggle"
+                      onClick={() => setExpandedPrunedRuns((prev) => ({
+                        ...prev,
+                        [runGroup.sessionId]: !prev[runGroup.sessionId],
+                      }))}
+                    >
+                      {expandedPrunedRuns[runGroup.sessionId] ? '▼' : '▶'} Pruned Papers ({prunedPapersBySession.get(runGroup.sessionId).length})
+                    </button>
+                    {expandedPrunedRuns[runGroup.sessionId] && (
+                      <div className="pruned-papers-list">
+                        {prunedPapersBySession.get(runGroup.sessionId).map((paper) => (
+                          <div
+                            key={paper.history_id}
+                            className={`pruned-paper-card ${expandedPrunedPaperId === paper.history_id ? 'expanded' : ''}`}
+                            onClick={() => loadPrunedPaperContent(paper)}
+                          >
+                            <div className="pruned-paper-card-header">
+                              <span className="stage2-history-pruned-badge">Pruned Paper</span>
+                              <span>{paper.paper_id}</span>
+                              <span>{paper.word_count?.toLocaleString()} words</span>
+                            </div>
+                            <h4>{paper.title}</h4>
+                            <p>{paper.pruned_note || 'The system decided autonomously that this paper hurt context cumulation.'}</p>
+                            <div className="quick-download-buttons" onClick={(e) => e.stopPropagation()}>
+                              <button className="quick-download-raw" onClick={(e) => downloadPrunedRaw(e, paper)}>
+                                Download Raw
+                              </button>
+                              <button
+                                className="quick-download-pdf"
+                                onClick={(e) => downloadPrunedPDF(e, paper)}
+                                disabled={downloadingPrunedPDF === paper.history_id}
+                              >
+                                {downloadingPrunedPDF === paper.history_id ? 'Preparing PDF...' : 'Download PDF'}
+                              </button>
+                            </div>
+                            {expandedPrunedPaperId === paper.history_id && expandedPrunedContent && (
+                              <div className="full-content pruned-paper-content">
+                                <LatexRenderer
+                                  content={
+                                    expandedPrunedContent.outline
+                                      ? `${expandedPrunedContent.outline}\n\n${'='.repeat(80)}\n\n${expandedPrunedContent.content || ''}`
+                                      : expandedPrunedContent.content || ''
+                                  }
+                                  showToggle={true}
+                                  defaultRaw={true}
+                                />
+                              </div>
+                            )}
+                          </div>
+                        ))}
+                      </div>
+                    )}
+                  </div>
+                )}
               </div>
             </section>
           ))}
diff --git a/frontend/src/components/autonomous/MathematicalProofs.css b/frontend/src/components/autonomous/MathematicalProofs.css
index 12e8e01..6386800 100644
--- a/frontend/src/components/autonomous/MathematicalProofs.css
+++ b/frontend/src/components/autonomous/MathematicalProofs.css
@@ -173,6 +173,25 @@
   color: #86efac;
 }
 
+.math-proofs-filter--platinum.active { /* Active state of the platinum-tier filter button */
+  position: relative; /* Positioning context for the ::before shimmer overlay */
+  overflow: hidden; /* Clip the overlay as it slides across the button */
+  background: linear-gradient(120deg, rgba(226, 232, 240, 0.12), rgba(255, 255, 255, 0.24), rgba(148, 163, 184, 0.12));
+  border-color: rgba(226, 232, 240, 0.65);
+  color: #f8fafc;
+  box-shadow: 0 0 16px rgba(226, 232, 240, 0.18);
+}
+
+.math-proofs-filter--platinum.active::before { /* Highlight band animated by platinum-shimmer */
+  content: '';
+  position: absolute;
+  inset: 0;
+  background: linear-gradient(110deg, transparent 0%, rgba(255, 255, 255, 0.38) 48%, transparent 100%);
+  transform: translateX(-130%); /* Resting position: fully off the left edge */
+  animation: platinum-shimmer 2.6s ease-in-out infinite;
+  pointer-events: none; /* The overlay must not intercept clicks on the button */
+}
+
 .math-proofs-filter--gold.active {
   background: rgba(255, 214, 92, 0.14);
   color: #ffd65c;
@@ -229,6 +248,31 @@
   border-color: rgba(96, 165, 250, 0.28);
 }
 
+.math-proof-card.platinum { /* Platinum-tier proof card: light border, layered gradients and a soft glow */
+  position: relative; /* Positioning context for the ::before shimmer overlay */
+  overflow: hidden; /* Clip the overlay to the card */
+  border-color: rgba(226, 232, 240, 0.7);
+  background:
+    linear-gradient(180deg, rgba(15, 23, 42, 0.96), rgba(17, 24, 39, 0.98)),
+    linear-gradient(120deg, rgba(226, 232, 240, 0.2), rgba(255, 255, 255, 0.08), rgba(148, 163, 184, 0.16));
+  box-shadow: 0 12px 36px rgba(0, 0, 0, 0.25), 0 0 24px rgba(226, 232, 240, 0.18);
+}
+
+.math-proof-card.platinum::before { /* Highlight band animated by platinum-shimmer */
+  content: '';
+  position: absolute;
+  inset: 0;
+  background: linear-gradient(110deg, transparent 0%, rgba(255, 255, 255, 0.12) 45%, transparent 70%);
+  transform: translateX(-120%); /* Resting position: off the left edge */
+  animation: platinum-shimmer 3.4s ease-in-out infinite;
+  pointer-events: none; /* The overlay must not intercept clicks on card content */
+}
+
+.math-proof-card.platinum > * { /* Stack the card's direct children above the shimmer overlay */
+  position: relative;
+  z-index: 1;
+}
+
 .math-proof-card.gold {
   border-color: rgba(255, 214, 92, 0.45);
 }
@@ -248,6 +292,14 @@
   align-items: flex-start;
 }
 
+.math-proof-card-actions { /* Right-aligned, wrapping row for a proof card's action controls */
+  display: flex;
+  align-items: flex-start;
+  gap: 0.6rem;
+  flex-wrap: wrap;
+  justify-content: flex-end;
+}
+
 .math-proof-card-topline {
   display: flex;
   gap: 0.65rem;
@@ -276,6 +328,25 @@
   border-color: rgba(96, 165, 250, 0.35);
 }
 
+.math-proof-badge.platinum { /* Platinum-tier badge: light gradient with a soft glow */
+  position: relative; /* Positioning context for the ::after shimmer overlay */
+  overflow: hidden; /* Clip the overlay to the badge */
+  color: #f8fafc;
+  border-color: rgba(226, 232, 240, 0.65);
+  background: linear-gradient(120deg, rgba(226, 232, 240, 0.14), rgba(255, 255, 255, 0.26), rgba(148, 163, 184, 0.14));
+  box-shadow: 0 0 14px rgba(226, 232, 240, 0.18);
+}
+
+.math-proof-badge.platinum::after { /* Highlight band animated by platinum-shimmer */
+  content: '';
+  position: absolute;
+  inset: 0;
+  background: linear-gradient(110deg, transparent 0%, rgba(255, 255, 255, 0.45) 48%, transparent 100%);
+  transform: translateX(-130%); /* Resting position: fully off the left edge */
+  animation: platinum-shimmer 2.4s ease-in-out infinite;
+  pointer-events: none; /* Decorative only */
+}
+
 .math-proof-badge.gold {
   color: #ffd65c;
   border-color: rgba(255, 214, 92, 0.5);
@@ -294,6 +365,24 @@
   background: rgba(205, 127, 50, 0.08);
 }
 
+@keyframes platinum-shimmer { /* Slide from off the left edge to off the right edge, then hold there */
+  0% {
+    transform: translateX(-130%);
+  }
+  55%, /* The sweep finishes at 55% of the cycle; the remainder is a pause */
+  100% {
+    transform: translateX(130%);
+  }
+}
+
+@media (prefers-reduced-motion: reduce) { /* Turn the shimmer off when reduced motion is requested */
+  .math-proofs-filter--platinum.active::before,
+  .math-proof-card.platinum::before,
+  .math-proof-badge.platinum::after {
+    animation: none;
+  }
+}
+
 .math-proof-source {
   color: var(--text-secondary, #9ca3af);
 }
@@ -343,20 +432,33 @@
 .math-proof-download {
   display: inline-flex;
   align-items: center;
+  justify-content: center;
   border-radius: 0.8rem;
   border: 1px solid rgba(34, 197, 94, 0.28);
   background: rgba(34, 197, 94, 0.08);
   color: #86efac;
   padding: 0.55rem 0.8rem;
+  font: inherit;
+  cursor: pointer;
   text-decoration: none;
   transition: border-color 0.2s ease, transform 0.2s ease;
 }
 
-.math-proof-download:hover {
+.math-proof-download--compact {
+  white-space: nowrap;
+}
+
+.math-proof-download:hover:not(:disabled) {
   border-color: rgba(34, 197, 94, 0.5);
   transform: translateY(-1px);
 }
 
+.math-proof-download:disabled {
+  cursor: not-allowed;
+  opacity: 0.55;
+  transform: none;
+}
+
 .math-proof-detail-block {
   border: 1px solid rgba(148, 163, 184, 0.16);
   border-radius: 0.85rem;
@@ -439,7 +541,9 @@
     flex-direction: column;
   }
 
-  .math-proof-expand {
+  .math-proof-card-actions,
+  .math-proof-expand,
+  .math-proof-download--compact {
     width: 100%;
   }
 }
diff --git a/frontend/src/components/autonomous/MathematicalProofs.jsx b/frontend/src/components/autonomous/MathematicalProofs.jsx
index 829f44c..4dfca8a 100644
--- a/frontend/src/components/autonomous/MathematicalProofs.jsx
+++ b/frontend/src/components/autonomous/MathematicalProofs.jsx
@@ -1,6 +1,10 @@
 import React, { useEffect, useMemo, useState } from 'react';
 import './MathematicalProofs.css';
 import ProofGraph from './ProofGraph';
+import {
+  buildCurrentProofRuntimeConfig,
+  isProofRuntimeConfigComplete,
+} from '../../hooks/useProofCheckRuntime';
 
 function formatDate(isoString) {
   if (!isoString) {
@@ -49,8 +53,11 @@ function createEmptyGraphState() {
 
 function getTierBadge(proof) {
   const tier = proof.novelty_tier;
+  if (tier === 'major_mathematical_discovery') {
+    return { cardClass: 'platinum', badgeClass: 'platinum', label: 'Major Mathematical Discovery' };
+  }
   if (tier === 'mathematical_discovery') {
-    return { cardClass: 'gold', badgeClass: 'gold', label: 'Mathematical Discovery' };
+    return { cardClass: 'gold', badgeClass: 'gold', label: 'Minor Mathematical Discovery' };
   }
   if (tier === 'novel_variant') {
     return { cardClass: 'silver', badgeClass: 'silver', label: 'Novel Reformulation' };
@@ -299,7 +306,7 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
   }, [api, proofGraphState.loaded, proofGraphState.loading, proofStatus?.lean4_enabled, viewMode]);
 
   const availableBrainstorms = useMemo(
-    () => brainstorms.filter((brainstorm) => brainstorm.status === 'complete'),
+    () => brainstorms,
     [brainstorms]
   );
 
@@ -328,14 +335,16 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
 
   const counts = useMemo(() => {
     const novel = proofs.filter((proof) => proof.novel).length;
+    const majorDiscovery = proofs.filter((proof) => proof.novelty_tier === 'major_mathematical_discovery').length;
     const discovery = proofs.filter((proof) => proof.novelty_tier === 'mathematical_discovery').length;
     const variant = proofs.filter((proof) => proof.novelty_tier === 'novel_variant').length;
     const formulation = proofs.filter((proof) => proof.novelty_tier === 'novel_formulation').length;
-    const legacyNovel = novel - discovery - variant - formulation;
+    const legacyNovel = novel - majorDiscovery - discovery - variant - formulation;
     return {
       total: proofs.length,
       novel,
       known: proofs.length - novel,
+      majorDiscovery,
       discovery,
       variant,
       formulation,
@@ -347,6 +356,9 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
     if (filter === 'novel') {
       return proofs.filter((proof) => proof.novel);
     }
+    if (filter === 'major_mathematical_discovery') {
+      return proofs.filter((proof) => proof.novelty_tier === 'major_mathematical_discovery');
+    }
     if (filter === 'mathematical_discovery') {
       return proofs.filter((proof) => proof.novelty_tier === 'mathematical_discovery');
     }
@@ -363,15 +375,21 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
     [visibleProofs]
   );
   const showManualPanel = Boolean(proofStatus?.lean4_path);
-  const manualChecksDisabled = !proofStatus?.lean4_enabled || !proofStatus?.manual_check_ready || availableSources.length === 0;
+  const currentProofRuntimeConfig = buildCurrentProofRuntimeConfig();
+  const hasCurrentProofRuntimeConfig = isProofRuntimeConfigComplete(currentProofRuntimeConfig);
+  const manualChecksDisabled = (
+    !proofStatus?.lean4_enabled ||
+    (!proofStatus?.manual_check_ready && !hasCurrentProofRuntimeConfig) ||
+    availableSources.length === 0
+  );
   const manualChecksDisabledReason = !proofStatus
     ? 'Loading proof runtime status...'
     : !proofStatus?.lean4_enabled
       ? 'Lean 4 proof checks are disabled.'
-    : !proofStatus?.manual_check_ready
+    : !proofStatus?.manual_check_ready && !hasCurrentProofRuntimeConfig
       ? (proofStatus?.manual_check_message || 'Manual proof checks are not ready yet.')
       : availableSources.length === 0
-        ? 'No completed sources are available yet.'
+        ? (manualSourceType === 'brainstorm' ? 'No brainstorms are available yet.' : 'No completed papers are available yet.')
         : '';
 
   const handleSelectGraphProof = (proofId) => {
@@ -387,9 +405,11 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
     try {
       setManualCheckPending(true);
       setManualCheckMessage('');
+      const proofRuntimeConfig = buildCurrentProofRuntimeConfig();
       await api.runProofCheck({
         sourceType: manualSourceType,
         sourceId: manualSourceId,
+        proofRuntimeConfig: isProofRuntimeConfigComplete(proofRuntimeConfig) ? proofRuntimeConfig : null,
       });
       setManualCheckMessage(`Queued proof check for ${manualSourceType} ${manualSourceId}.`);
     } catch (err) {
@@ -431,11 +451,17 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
             >
               All Novel ({counts.novel || 0})
             </button>
+            <button
+              className={`math-proofs-filter math-proofs-filter--platinum ${filter === 'major_mathematical_discovery' ? 'active' : ''}`}
+              onClick={() => setFilter('major_mathematical_discovery')}
+            >
+              Major Discovery ({counts.majorDiscovery || 0})
+            </button>
             <button
               className={`math-proofs-filter math-proofs-filter--gold ${filter === 'mathematical_discovery' ? 'active' : ''}`}
               onClick={() => setFilter('mathematical_discovery')}
             >
-              Discovery ({counts.discovery || 0})
+              Minor Mathematical Discovery ({counts.discovery || 0})
             </button>
             <button
               className={`math-proofs-filter math-proofs-filter--silver ${filter === 'novel_variant' ? 'active' : ''}`}
@@ -496,7 +522,7 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
         <div className="math-proofs-manual-panel">
           <div className="math-proofs-manual-copy">
             <strong>Manual proof check</strong>
-            <span>Queue a Lean 4 proof pass for any completed brainstorm or paper.</span>
+            <span>Queue a Lean 4 proof pass for any brainstorm or completed paper.</span>
           </div>
           <div className="math-proofs-manual-controls">
             <select
@@ -512,7 +538,11 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
               onChange={(event) => setManualSourceId(event.target.value)}
               disabled={manualCheckPending || availableSources.length === 0}
             >
-              {availableSources.length === 0 && <option value="">No completed sources available</option>}
+              {availableSources.length === 0 && (
+                <option value="">
+                  {manualSourceType === 'brainstorm' ? 'No brainstorms available' : 'No completed papers available'}
+                </option>
+              )}
               {manualSourceType === 'brainstorm' &&
                 availableBrainstorms.map((brainstorm) => (
                   <option key={brainstorm.topic_id} value={brainstorm.topic_id}>
@@ -615,12 +645,21 @@ function MathematicalProofs({ api, refreshToken = 0, selectedProofId = null, lat
                     </p>
                   </div>
 
-                  <button
-                    className="math-proof-expand"
-                    onClick={() => setExpandedProofId(isExpanded ? null : proof.proof_id)}
-                  >
-                    {isExpanded ? 'Hide Details' : 'View Details'}
-                  </button>
+                  <div className="math-proof-card-actions">
+                    <a
+                      className="math-proof-download math-proof-download--compact"
+                      href={api.getProofLeanDownloadUrl(proof.proof_id)}
+                      download={`${proof.proof_id}.lean`}
+                    >
+                      Download .lean
+                    </a>
+                    <button
+                      className="math-proof-expand"
+                      onClick={() => setExpandedProofId(isExpanded ? null : proof.proof_id)}
+                    >
+                      {isExpanded ? 'Hide Details' : 'View Details'}
+                    </button>
+                  </div>
                 </div>
 
                 <div className="math-proof-meta">
diff --git a/frontend/src/components/autonomous/PaperLibrary.jsx b/frontend/src/components/autonomous/PaperLibrary.jsx
index 5ea4a56..1bd2f24 100644
--- a/frontend/src/components/autonomous/PaperLibrary.jsx
+++ b/frontend/src/components/autonomous/PaperLibrary.jsx
@@ -18,6 +18,8 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
   const [showLibraryTooltip, setShowLibraryTooltip] = useState(false);
   const [deleteConfirm, setDeleteConfirm] = useState(null);
   const [deleting, setDeleting] = useState(false);
+  const [deleteAllPrunedConfirm, setDeleteAllPrunedConfirm] = useState(false);
+  const [deletingAllPruned, setDeletingAllPruned] = useState(false);
   const [isGeneratingPDF, setIsGeneratingPDF] = useState(false);
   
   // Critique modal state
@@ -100,6 +102,21 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
     }
   };
 
+  const handleDeleteAllPrunedConfirm = async () => { // Run the confirmed "delete all pruned papers" action.
+    if (!api.deleteAllPrunedPapers) return; // The api object may not provide this method; do nothing then.
+    setDeletingAllPruned(true); // Disables the Yes/Cancel buttons while the request is in flight.
+    try {
+      await api.deleteAllPrunedPapers();
+      setDeleteAllPrunedConfirm(false); // Close the inline confirmation only after a successful delete.
+      onRefresh();
+    } catch (error) { // On failure the confirmation stays open and the error is shown to the user.
+      console.error('Failed to delete pruned papers:', error);
+      alert(`Failed to delete pruned papers: ${error.message}`);
+    } finally {
+      setDeletingAllPruned(false); // Re-enable the buttons on both success and failure.
+    }
+  };
+
   const handleDeleteCancel = (e) => {
     e.stopPropagation();
     setDeleteConfirm(null);
@@ -206,6 +223,33 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
         <div className="paper-library-pruned-counter">
           Pruned Papers: {archivedCount}
         </div>
+        {archivedCount > 0 && api.deleteAllPrunedPapers && (
+          <div className="paper-library-pruned-actions">
+            {deleteAllPrunedConfirm ? (
+              <div className="delete-confirm-inline">
+                <span>Delete all pruned papers permanently?</span>
+                <button
+                  className="btn-delete-confirm"
+                  onClick={handleDeleteAllPrunedConfirm}
+                  disabled={deletingAllPruned}
+                >
+                  {deletingAllPruned ? 'Deleting...' : 'Yes'}
+                </button>
+                <button
+                  className="btn-delete-cancel"
+                  onClick={() => setDeleteAllPrunedConfirm(false)}
+                  disabled={deletingAllPruned}
+                >
+                  Cancel
+                </button>
+              </div>
+            ) : (
+              <button className="btn-delete-paper" onClick={() => setDeleteAllPrunedConfirm(true)}>
+                Delete All Pruned Papers
+              </button>
+            )}
+          </div>
+        )}
         <div className="auto-empty-state">
           No papers completed yet. Autonomous research will generate papers from brainstorm databases.
         </div>
@@ -255,6 +299,33 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
       <div className="paper-library-pruned-counter">
         Pruned Papers: {archivedCount}
       </div>
+      {archivedCount > 0 && api.deleteAllPrunedPapers && (
+        <div className="paper-library-pruned-actions">
+          {deleteAllPrunedConfirm ? (
+            <div className="delete-confirm-inline">
+              <span>Delete all pruned papers permanently?</span>
+              <button
+                className="btn-delete-confirm"
+                onClick={handleDeleteAllPrunedConfirm}
+                disabled={deletingAllPruned}
+              >
+                {deletingAllPruned ? 'Deleting...' : 'Yes'}
+              </button>
+              <button
+                className="btn-delete-cancel"
+                onClick={() => setDeleteAllPrunedConfirm(false)}
+                disabled={deletingAllPruned}
+              >
+                Cancel
+              </button>
+            </div>
+          ) : (
+            <button className="btn-delete-paper" onClick={() => setDeleteAllPrunedConfirm(true)}>
+              Delete All Pruned Papers
+            </button>
+          )}
+        </div>
+      )}
 
       {proofActionMessage && (
         <div className={`test-result-banner ${proofActionMessage.startsWith('Failed') ? 'test-result-banner--error' : 'test-result-banner--success'}`}>
@@ -374,7 +445,7 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
                   
                   {deleteConfirm === paper.paper_id ? (
                     <div className="delete-confirm-inline" onClick={(e) => e.stopPropagation()}>
-                      <span>Delete this paper?</span>
+                      <span>Prune this paper from model context?</span>
                       <button 
                         className="btn-delete-confirm" 
                         onClick={() => handleDeleteConfirm(paper.paper_id)}
@@ -394,9 +465,9 @@ const PaperLibrary = ({ papers, onRefresh, api, archivedCount = 0 }) => {
                     <button
                       className="btn-delete-paper"
                       onClick={(e) => handleDeleteClick(e, paper.paper_id)}
-                      title="Delete this paper"
+                      title="Prune this paper from future model context"
                     >
-                      Delete
+                      Prune
                     </button>
                   )}
                 </div>
diff --git a/frontend/src/components/autonomous/ProofGraph.css b/frontend/src/components/autonomous/ProofGraph.css
index f370021..d1175fa 100644
--- a/frontend/src/components/autonomous/ProofGraph.css
+++ b/frontend/src/components/autonomous/ProofGraph.css
@@ -119,6 +119,11 @@
   stroke: rgba(96, 165, 250, 0.32);
 }
 
+.proof-graph-node-group.platinum .proof-graph-node-frame { /* Platinum-tier graph node frame */
+  stroke: rgba(226, 232, 240, 0.85);
+  filter: drop-shadow(0 0 5px rgba(226, 232, 240, 0.45)); /* Soft glow around the frame */
+}
+
 .proof-graph-node-group.gold .proof-graph-node-frame {
   stroke: rgba(255, 214, 92, 0.55);
 }
diff --git a/frontend/src/components/autonomous/ProofGraph.jsx b/frontend/src/components/autonomous/ProofGraph.jsx
index bb27fa9..5fec97b 100644
--- a/frontend/src/components/autonomous/ProofGraph.jsx
+++ b/frontend/src/components/autonomous/ProofGraph.jsx
@@ -3,6 +3,7 @@ import './ProofGraph.css';
 
 function getGraphNodeTierClass(node) {
   const tier = node.novelty_tier;
+  if (tier === 'major_mathematical_discovery') return 'platinum';
   if (tier === 'mathematical_discovery') return 'gold';
   if (tier === 'novel_variant') return 'silver';
   if (tier === 'novel_formulation') return 'bronze';
diff --git a/frontend/src/components/autonomous/ProofLibrary.css b/frontend/src/components/autonomous/ProofLibrary.css
index affd3d4..3d900e4 100644
--- a/frontend/src/components/autonomous/ProofLibrary.css
+++ b/frontend/src/components/autonomous/ProofLibrary.css
@@ -14,6 +14,11 @@
 }
 
 /* Tier-specific card accents */
+.proof-card--platinum { /* Platinum tier accent: light left border plus an inset glow along it */
+  border-left: 3px solid #e2e8f0;
+  box-shadow: inset 3px 0 12px rgba(226, 232, 240, 0.16);
+}
+
 .proof-card--gold {
   border-left: 3px solid #ffd65c;
 }
@@ -38,6 +43,24 @@
 }
 
 /* Tier-specific badges */
+.proof-badge--platinum { /* Platinum tier badge: metallic gradient with dark text */
+  position: relative; /* Positioning context for the ::after shimmer overlay */
+  overflow: hidden; /* Clip the overlay to the badge */
+  background: linear-gradient(135deg, #e2e8f0 0%, #ffffff 45%, #94a3b8 100%);
+  color: #0f172a;
+  box-shadow: 0 0 14px rgba(226, 232, 240, 0.35);
+}
+
+.proof-badge--platinum::after { /* Highlight band animated by proof-library-platinum-shimmer */
+  content: '';
+  position: absolute;
+  inset: 0;
+  background: linear-gradient(110deg, transparent 0%, rgba(255, 255, 255, 0.65) 48%, transparent 100%);
+  transform: translateX(-130%); /* Resting position: fully off the left edge */
+  animation: proof-library-platinum-shimmer 2.5s ease-in-out infinite;
+  pointer-events: none; /* Decorative only */
+}
+
 .proof-badge--gold {
   background: linear-gradient(135deg, #ffd65c 0%, #ffe99a 100%);
   color: #1a1a00;
@@ -53,11 +76,60 @@
   color: #1a0a00;
 }
 
+@keyframes proof-library-platinum-shimmer { /* one left-to-right sweep per animation cycle */
+  0% { /* start: highlight shifted left by 130% of its own width */
+    transform: translateX(-130%);
+  }
+  55%,
+  100% { /* sweep is finished at 55%; the end position is held for the rest of the cycle */
+    transform: translateX(130%);
+  }
+}
+
+@media (prefers-reduced-motion: reduce) {
+  .proof-badge--platinum::after {
+    animation: none;
+  }
+}
+
 .proof-title {
   font-family: 'Courier New', monospace;
   letter-spacing: 0.02em;
 }
 
+.proof-card-actions {
+  display: flex;
+  align-items: center;
+  justify-content: flex-end;
+  gap: 8px;
+  flex-wrap: wrap;
+  flex-shrink: 0;
+}
+
+.proof-header-download {
+  padding: 7px 12px;
+  border: 1px solid rgba(30, 255, 28, 0.32);
+  border-radius: 999px;
+  background: rgba(30, 255, 28, 0.1);
+  color: #b7ffb6;
+  font-size: 0.82rem;
+  font-weight: 700;
+  cursor: pointer;
+  white-space: nowrap;
+  transition: border-color 0.2s ease, background 0.2s ease, transform 0.2s ease;
+}
+
+.proof-header-download:hover:not(:disabled) {
+  border-color: rgba(30, 255, 28, 0.56);
+  background: rgba(30, 255, 28, 0.16);
+  transform: translateY(-1px);
+}
+
+.proof-header-download:disabled {
+  cursor: not-allowed;
+  opacity: 0.55;
+}
+
 .proof-statement {
   color: #b9b9c6;
   font-size: 0.92rem;
@@ -164,3 +236,15 @@
 .proof-code-block::-webkit-scrollbar-thumb:hover {
   background: #666;
 }
+
+@media (max-width: 700px) {
+  .proof-library .answer-title-row {
+    align-items: flex-start;
+    flex-direction: column;
+  }
+
+  .proof-card-actions,
+  .proof-header-download {
+    width: 100%;
+  }
+}
diff --git a/frontend/src/components/autonomous/ProofLibrary.jsx b/frontend/src/components/autonomous/ProofLibrary.jsx
index 324e161..41679dd 100644
--- a/frontend/src/components/autonomous/ProofLibrary.jsx
+++ b/frontend/src/components/autonomous/ProofLibrary.jsx
@@ -1,7 +1,7 @@
 import React, { useState, useEffect, useMemo } from 'react';
 import { autonomousAPI } from '../../services/api';
 import { buildResearchRunGroups } from '../../utils/researchRunHistory';
-import { downloadRawText } from '../../utils/downloadHelpers';
+import { downloadTextFile } from '../../utils/downloadHelpers';
 import './FinalAnswerLibrary.css';
 import './ProofLibrary.css';
 
@@ -21,8 +21,11 @@ function truncate(text, maxLength = 220) {
 
 function getTierBadge(proof) {
   const tier = proof.novelty_tier;
+  if (tier === 'major_mathematical_discovery') {
+    return { cssClass: 'proof-badge--platinum', label: 'Major Mathematical Discovery' };
+  }
   if (tier === 'mathematical_discovery') {
-    return { cssClass: 'proof-badge--gold', label: 'Mathematical Discovery' };
+    return { cssClass: 'proof-badge--gold', label: 'Minor Mathematical Discovery' };
   }
   if (tier === 'novel_variant') {
     return { cssClass: 'proof-badge--silver', label: 'Novel Reformulation' };
@@ -38,6 +41,7 @@ function getTierBadge(proof) {
 
 function getCardClass(proof) {
   const tier = proof.novelty_tier;
+  if (tier === 'major_mathematical_discovery') return 'proof-card--platinum';
   if (tier === 'mathematical_discovery') return 'proof-card--gold';
   if (tier === 'novel_variant') return 'proof-card--silver';
   if (tier === 'novel_formulation') return 'proof-card--bronze';
@@ -152,11 +156,23 @@ export default function ProofLibrary() {
     }
   };
 
-  const handleDownloadLean = (proof) => {
-    const leanCode = proof.lean_code || '';
+  // Download a proof's Lean source; when the given proof object has no lean_code, fetch the full proof first.
+  const handleDownloadLean = async (proof, event) => {
+    event?.stopPropagation(); // the button sits inside a clickable card header; do not toggle the card
+    let proofForDownload = proof;
+    let leanCode = proof.lean_code || '';
+    if (!leanCode && proof.session_id && proof.proof_id) {
+      try {
+        proofForDownload = await autonomousAPI.getLibraryProof(proof.session_id, proof.proof_id);
+        leanCode = proofForDownload.lean_code || '';
+      } catch (err) {
+        console.error('Failed to load Lean code for download:', err); // leave a trace instead of failing silently
+        return;
+      }
+    }
     if (!leanCode) return;
-    const filename = `${proof.theorem_name || proof.proof_id}.lean`;
-    downloadRawText(leanCode, filename);
+    const filename = `${proofForDownload.theorem_name || proof.theorem_name || proof.proof_id}.lean`;
+    downloadTextFile(leanCode, filename);
   };
 
   const novelCount = proofs.filter((p) => p.novel).length;
@@ -288,9 +304,18 @@ export default function ProofLibrary() {
                               <h4 className="answer-title proof-title">
                                 {proof.theorem_name || proof.proof_id}
                               </h4>
-                              <button className="expand-button">
-                                {isExpanded ? '\u25B2' : '\u25BC'}
-                              </button>
+                              <div className="proof-card-actions">
+                                <button
+                                  type="button"
+                                  className="proof-header-download"
+                                  onClick={(event) => handleDownloadLean(proof, event)}
+                                >
+                                  Download .lean
+                                </button>
+                                <button className="expand-button">
+                                  {isExpanded ? '\u25B2' : '\u25BC'}
+                                </button>
+                              </div>
                             </div>
 
                             <div className="answer-metadata">
@@ -423,7 +448,16 @@ export default function ProofLibrary() {
             return (
               <div key={id} className="answer-card proof-card">
                 <div className="answer-header" onClick={() => handleExpand(proof)}>
-                  <h4 className="answer-title">{proof.theorem_name || proof.proof_id}</h4>
+                  <div className="answer-title-row">
+                    <h4 className="answer-title">{proof.theorem_name || proof.proof_id}</h4>
+                    <button
+                      type="button"
+                      className="proof-header-download"
+                      onClick={(event) => handleDownloadLean(proof, event)}
+                    >
+                      Download .lean
+                    </button>
+                  </div>
                 </div>
               </div>
             );
diff --git a/frontend/src/components/autonomous/ProofNotificationStack.jsx b/frontend/src/components/autonomous/ProofNotificationStack.jsx
index b4cda04..0ad1411 100644
--- a/frontend/src/components/autonomous/ProofNotificationStack.jsx
+++ b/frontend/src/components/autonomous/ProofNotificationStack.jsx
@@ -14,6 +14,16 @@ function truncate(text, maxLength = 120) {
 }
 
 const TIER_STYLES = {
+  major_mathematical_discovery: {
+    borderColor: '#f8fafc',
+    glowColor: 'rgba(226, 232, 240, 0.55)',
+    glowInset: 'rgba(255, 255, 255, 0.32)',
+    labelColor: '#f8fafc',
+    background: 'linear-gradient(135deg, rgba(30, 41, 59, 0.98), rgba(15, 23, 42, 0.96), rgba(226, 232, 240, 0.16))',
+    label: 'Congratulations!\nMajor Mathematical Discovery Found!',
+    subLabel:
+      'Your validator deemed this may be competitive for a major prize or medal in a related field.',
+  },
   novel_formulation: {
     borderColor: '#cd7f32',
     glowColor: 'rgba(205, 127, 50, 0.35)',
@@ -37,7 +47,7 @@ const TIER_STYLES = {
     glowColor: 'rgba(255, 214, 92, 0.35)',
     glowInset: 'rgba(255, 194, 57, 0.25)',
     labelColor: '#ffd65c',
-    label: 'Congratulations!\nMathematical Discovery Found!',
+    label: 'Minor Mathematical Discovery Found!',
     subLabel:
       'Your validator has determined this proof is a mathematical discovery or a novel alternative proof that changes our understanding.',
   },
@@ -85,7 +95,7 @@ export default function ProofNotificationStack({ notifications, onDismiss, onCli
               textAlign: 'left',
               borderRadius: scalePx(14),
               border: `1.5px solid ${tier.borderColor}`,
-              background: 'linear-gradient(135deg, rgba(8, 35, 22, 0.96), rgba(15, 23, 42, 0.96))',
+              background: tier.background || 'linear-gradient(135deg, rgba(8, 35, 22, 0.96), rgba(15, 23, 42, 0.96))',
               boxShadow: `0 16px 36px rgba(0, 0, 0, 0.35), 0 0 12px ${tier.glowColor}, inset 0 0 0 1px ${tier.glowInset}`,
               padding: `${scalePx(14)} ${scalePx(14)} ${scalePx(12)} ${scalePx(14)}`,
               color: '#f8fafc',
diff --git a/frontend/src/components/autonomous/Stage2PaperHistory.css b/frontend/src/components/autonomous/Stage2PaperHistory.css
index a740f36..8780c82 100644
--- a/frontend/src/components/autonomous/Stage2PaperHistory.css
+++ b/frontend/src/components/autonomous/Stage2PaperHistory.css
@@ -49,3 +49,46 @@
 .stage2-history-prompt strong {
   color: #1eff1c;
 }
+
+.stage2-history-card--pruned {
+  opacity: 0.68;
+  filter: grayscale(0.65);
+  border-color: rgba(156, 163, 175, 0.32) !important;
+  background: linear-gradient(180deg, rgba(75, 85, 99, 0.22) 0%, rgba(31, 41, 55, 0.62) 100%) !important;
+}
+
+.stage2-history-pruned-badge {
+  display: inline-flex;
+  align-items: center;
+  padding: 0.18rem 0.5rem;
+  border-radius: 999px;
+  background: rgba(156, 163, 175, 0.18);
+  border: 1px solid rgba(156, 163, 175, 0.34);
+  color: #d1d5db;
+  font-size: 0.7rem;
+  font-weight: 700;
+  text-transform: uppercase;
+  letter-spacing: 0.04em;
+}
+
+.stage2-history-pruned-note {
+  margin-top: 0.75rem;
+  padding: 0.65rem 0.75rem;
+  border-radius: 8px;
+  background: rgba(156, 163, 175, 0.12);
+  border: 1px solid rgba(156, 163, 175, 0.22);
+  color: #d1d5db;
+  font-size: 0.82rem;
+  line-height: 1.45;
+}
+
+.stat-badge--pruned {
+  color: #d1d5db;
+  border-color: rgba(156, 163, 175, 0.28);
+}
+
+.pruned-delete-control {
+  display: flex;
+  align-items: center;
+  gap: 0.5rem;
+}
diff --git a/frontend/src/components/autonomous/Stage2PaperHistory.jsx b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
index fd415f6..93d4633 100644
--- a/frontend/src/components/autonomous/Stage2PaperHistory.jsx
+++ b/frontend/src/components/autonomous/Stage2PaperHistory.jsx
@@ -30,6 +30,7 @@ function truncateAbstract(abstract, maxLength = 220) {
 
 export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
   const [papers, setPapers] = useState([]);
+  const [prunedPapers, setPrunedPapers] = useState([]);
   const [finalAnswers, setFinalAnswers] = useState([]);
   const [sessionsResponse, setSessionsResponse] = useState(null);
   const [loading, setLoading] = useState(true);
@@ -40,6 +41,8 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
   const [searchTerm, setSearchTerm] = useState('');
   const [deleteConfirmId, setDeleteConfirmId] = useState(null);
   const [deletingId, setDeletingId] = useState(null);
+  const [deleteAllPrunedConfirm, setDeleteAllPrunedConfirm] = useState(false);
+  const [deletingAllPruned, setDeletingAllPruned] = useState(false);
   const [generatingPdfId, setGeneratingPdfId] = useState(null);
   const [critiqueModalOpen, setCritiqueModalOpen] = useState(false);
   const [critiquePaper, setCritiquePaper] = useState(null);
@@ -88,8 +91,9 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
       setLoading(true);
       setError(null);
 
-      const [papersResult, sessionsResult, finalAnswersResult] = await Promise.allSettled([
+      const [papersResult, prunedPapersResult, sessionsResult, finalAnswersResult] = await Promise.allSettled([
         autonomousAPI.getPaperHistory(),
+        autonomousAPI.getPrunedPaperHistory(),
         autonomousAPI.getSessions(),
         fetch('/api/auto-research/final-answer-library').then(async (response) => {
           if (!response.ok) {
@@ -103,7 +107,16 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
         throw papersResult.reason;
       }
 
-      setPapers(papersResult.value.papers || []);
+      const activePapers = papersResult.value.papers || [];
+      const prunedHistoryPapers = prunedPapersResult.status === 'fulfilled'
+        ? (prunedPapersResult.value.papers || [])
+        : [];
+      setPrunedPapers(prunedHistoryPapers);
+      setPapers([...activePapers, ...prunedHistoryPapers]);
+
+      if (prunedPapersResult.status !== 'fulfilled') {
+        console.warn('Stage 2 history: failed to load pruned paper history', prunedPapersResult.reason);
+      }
 
       if (sessionsResult.status === 'fulfilled') {
         setSessionsResponse(sessionsResult.value);
@@ -187,7 +200,9 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
     setLoadingContentId(paper.history_id);
 
     try {
-      const data = await autonomousAPI.getHistoryPaper(paper.session_id, paper.paper_id);
+      const data = paper.is_pruned
+        ? await autonomousAPI.getPrunedHistoryPaper(paper.session_id, paper.paper_id)
+        : await autonomousAPI.getHistoryPaper(paper.session_id, paper.paper_id);
       setExpandedContent(data);
     } catch (err) {
       console.error('Failed to load history paper content:', err);
@@ -210,7 +225,8 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
       return;
     }
 
-    const filename = sanitizeFilename(`${paper.session_id}_${paper.paper_id}_${paper.title}`);
+    const filenamePrefix = paper.is_pruned ? 'pruned_' : '';
+    const filename = sanitizeFilename(`${filenamePrefix}${paper.session_id}_${paper.paper_id}_${paper.title}`);
     downloadRawText(
       expandedContent.content || '',
       filename,
@@ -226,7 +242,8 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
       return;
     }
 
-    const filename = sanitizeFilename(`${paper.session_id}_${paper.paper_id}_${paper.title}`);
+    const filenamePrefix = paper.is_pruned ? 'pruned_' : '';
+    const filename = sanitizeFilename(`${filenamePrefix}${paper.session_id}_${paper.paper_id}_${paper.title}`);
     const metadata = {
       title: expandedContent.title || paper.title,
       wordCount: paper.word_count,
@@ -290,6 +307,24 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
     }
   };
 
+  // Permanently delete all pruned papers (one request per session), then refresh the history list.
+  const handleDeleteAllPrunedConfirm = async () => {
+    setDeletingAllPruned(true);
+    try {
+      const sessionIds = Array.from(new Set(prunedPapers.map((paper) => paper.session_id)));
+      const results = await Promise.allSettled(sessionIds.map((sessionId) => autonomousAPI.deleteAllPrunedPapers(sessionId)));
+      await loadPaperHistory(); // refresh even after a partial failure so deleted papers disappear from the list
+      await onCurrentSessionDataChanged?.();
+      results.forEach((result) => { if (result.status === 'rejected') throw result.reason; }); // first failure goes to catch
+      setDeleteAllPrunedConfirm(false); // close the prompt only when every session was deleted
+    } catch (err) {
+      console.error('Failed to delete pruned papers:', err);
+      alert(`Failed to delete pruned papers: ${err.message}`);
+    } finally {
+      setDeletingAllPruned(false);
+    }
+  };
+
   if (loading) {
     return (
       <div className="final-answer-library stage2-paper-history">
@@ -326,10 +361,13 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
     <div className="final-answer-library stage2-paper-history">
       <div className="library-header">
         <h2>Stage 2 Final Answer History</h2>
-        <p>Browse completed Stage 2 papers from all autonomous research sessions. This history excludes pruned and archived papers.</p>
+        <p>Browse completed Stage 2 papers from all autonomous research sessions. Pruned papers are preserved here for user review but are excluded from model context.</p>
         <div className="library-stats">
           <span className="stat-badge">
-            {papers.length} {papers.length === 1 ? 'Paper' : 'Papers'}
+            {papers.filter((paper) => !paper.is_pruned).length} Active {papers.filter((paper) => !paper.is_pruned).length === 1 ? 'Paper' : 'Papers'}
+          </span>
+          <span className="stat-badge stat-badge--pruned">
+            {prunedPapers.length} Pruned {prunedPapers.length === 1 ? 'Paper' : 'Papers'}
           </span>
           <span className="stat-badge">
             {runGroups.length} {runGroups.length === 1 ? 'Research Run' : 'Research Runs'}
@@ -354,6 +392,37 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
           onChange={(e) => setSearchTerm(e.target.value)}
           className="search-input"
         />
+        {prunedPapers.length > 0 && (
+          <div className="pruned-delete-control">
+            {deleteAllPrunedConfirm ? (
+              <div className="delete-confirm-inline">
+                <span>Delete all pruned papers permanently?</span>
+                <button
+                  className="btn-delete-confirm"
+                  onClick={handleDeleteAllPrunedConfirm}
+                  disabled={deletingAllPruned}
+                >
+                  {deletingAllPruned ? 'Deleting...' : 'Yes'}
+                </button>
+                <button
+                  className="btn-delete-cancel"
+                  onClick={() => setDeleteAllPrunedConfirm(false)}
+                  disabled={deletingAllPruned}
+                >
+                  Cancel
+                </button>
+              </div>
+            ) : (
+              <button
+                className="btn-delete-paper"
+                onClick={() => setDeleteAllPrunedConfirm(true)}
+                title="Permanently delete all pruned paper files"
+              >
+                Delete All Pruned Papers
+              </button>
+            )}
+          </div>
+        )}
       </div>
 
       {visibleRunGroups.length === 0 ? (
@@ -363,7 +432,7 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
           <p>
             {searchTerm
               ? 'Try adjusting your search.'
-              : 'Completed non-archived Stage 2 papers will appear here.'}
+              : 'Completed and pruned Stage 2 papers will appear here.'}
           </p>
         </div>
       ) : (
@@ -409,7 +478,7 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
                   {runGroup.visibleStage2Papers.map((paper) => (
                     <div
                       key={paper.history_id}
-                      className={`paper-card stage2-history-card ${expandedId === paper.history_id ? 'expanded' : ''}`}
+                      className={`paper-card stage2-history-card ${paper.is_pruned ? 'stage2-history-card--pruned' : ''} ${expandedId === paper.history_id ? 'expanded' : ''}`}
                       onClick={() => handleCardClick(paper)}
                     >
                       <div className="paper-card-header">
@@ -418,6 +487,9 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
                           <span className="stage2-history-session-badge">
                             {paper.session_id === 'legacy' ? 'Legacy' : paper.session_id}
                           </span>
+                          {paper.is_pruned && (
+                            <span className="stage2-history-pruned-badge">Pruned Paper</span>
+                          )}
                         </div>
                         <span className="paper-word-count">{paper.word_count?.toLocaleString()} words</span>
                       </div>
@@ -439,6 +511,12 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
                         {truncateAbstract(paper.abstract)}
                       </div>
 
+                      {paper.is_pruned && (
+                        <div className="stage2-history-pruned-note">
+                          {paper.pruned_note || 'The system decided autonomously that this paper hurt context cumulation.'}
+                        </div>
+                      )}
+
                       <div className="stage2-history-prompt">
                         <strong>Research Question:</strong> {paper.user_prompt}
                       </div>
@@ -457,7 +535,7 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
                       {expandedId === paper.history_id && (
                         <>
                           <div className="paper-actions">
-                            {(() => {
+                            {!paper.is_pruned && (() => {
                               const proofCheckState = getSourceState('paper', paper.history_id);
                               const proofCheckLabel = proofCheckState?.status === 'queued'
                                 ? 'Queueing Proof Check...'
@@ -497,27 +575,29 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
                               Download Raw
                             </button>
 
-                            <button
-                              className="btn-critique"
-                              onClick={(e) => handleOpenCritique(e, paper)}
-                              title="Ask validator to critique this paper"
-                              style={{
-                                background: 'linear-gradient(135deg, #1eff1c 0%, #0fcc0d 100%)',
-                                border: 'none',
-                                color: '#0b2e0b',
-                                padding: '0.35rem 0.7rem',
-                                borderRadius: '4px',
-                                cursor: 'pointer',
-                                fontWeight: '500',
-                                fontSize: '0.75rem',
-                              }}
-                            >
-                              ⭐ Critique
-                            </button>
+                            {!paper.is_pruned && (
+                              <button
+                                className="btn-critique"
+                                onClick={(e) => handleOpenCritique(e, paper)}
+                                title="Ask validator to critique this paper"
+                                style={{
+                                  background: 'linear-gradient(135deg, #1eff1c 0%, #0fcc0d 100%)',
+                                  border: 'none',
+                                  color: '#0b2e0b',
+                                  padding: '0.35rem 0.7rem',
+                                  borderRadius: '4px',
+                                  cursor: 'pointer',
+                                  fontWeight: '500',
+                                  fontSize: '0.75rem',
+                                }}
+                              >
+                                ⭐ Critique
+                              </button>
+                            )}
 
-                            {deleteConfirmId === paper.history_id ? (
+                            {!paper.is_pruned && (deleteConfirmId === paper.history_id ? (
                               <div className="delete-confirm-inline" onClick={(e) => e.stopPropagation()}>
-                                <span>Delete this paper?</span>
+                                <span>Prune this paper from model context?</span>
                                 <button
                                   className="btn-delete-confirm"
                                   onClick={() => handleDeleteConfirm(paper)}
@@ -537,11 +617,11 @@ export default function Stage2PaperHistory({ onCurrentSessionDataChanged }) {
                               <button
                                 className="btn-delete-paper"
                                 onClick={(e) => handleDeleteClick(e, paper)}
-                                title="Delete this paper"
+                                title="Prune this paper from future model context"
                               >
-                                Delete
+                                Prune
                               </button>
-                            )}
+                            ))}
                           </div>
 
                           <div className="paper-full-content">
diff --git a/frontend/src/components/compiler/CompilerInterface.jsx b/frontend/src/components/compiler/CompilerInterface.jsx
index 4b53975..9949eaa 100644
--- a/frontend/src/components/compiler/CompilerInterface.jsx
+++ b/frontend/src/components/compiler/CompilerInterface.jsx
@@ -1,18 +1,29 @@
 import React, { useState, useEffect } from 'react';
 import { compilerAPI } from '../../services/api';
 import { websocket } from '../../services/websocket';
+import {
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+} from '../../utils/openRouterSelection';
 import TextFileUploader from '../TextFileUploader';
 import { getRuntimeDataPath } from '../../utils/runtimeConfig';
+import '../autonomous/AutonomousResearch.css';
 
-function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false }) {
+function CompilerInterface({
+  activeTab,
+  capabilities,
+  anyWorkflowRunning = false,
+  onWorkflowRunningChange = null,
+  developerModeEnabled = false,
+}) {
   const [compilerPrompt, setCompilerPrompt] = useState('');
   const [status, setStatus] = useState({ is_running: false });
   const [isStarting, setIsStarting] = useState(false);
   const [error, setError] = useState(null);
-  const [validatorContextSize, setValidatorContextSize] = useState(131072);
-  const [highContextContextSize, setHighContextContextSize] = useState(131072);
-  const [highParamContextSize, setHighParamContextSize] = useState(131072);
-  const [critiqueSubmitterContextSize, setCritiqueSubmitterContextSize] = useState(131072);
+  const [validatorContextSize, setValidatorContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [highContextContextSize, setHighContextContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [highParamContextSize, setHighParamContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [critiqueSubmitterContextSize, setCritiqueSubmitterContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
   const [critiquePhaseActive, setCritiquePhaseActive] = useState(false);
   const [critiqueAcceptances, setCritiqueAcceptances] = useState(0);
   const [paperVersion, setPaperVersion] = useState(1);
@@ -75,16 +86,10 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
       // Skip worked! Keep skipQueued=true to show checkmark
     };
     
-    const handleBodyRewriteStarted = (data) => {
-      setPaperVersion(data.version || 1);
-      setSkipQueued(false);  // Reset skip state for new paper version
-    };
-    
     websocket.on('critique_phase_started', handleCritiquePhaseStarted);
     websocket.on('critique_progress', handleCritiqueProgress);
     websocket.on('critique_phase_ended', handleCritiquePhaseEnded);
     websocket.on('critique_phase_skipped', handleCritiquePhaseSkipped);
-    websocket.on('body_rewrite_started', handleBodyRewriteStarted);
     
     return () => {
       clearInterval(interval);
@@ -92,7 +97,6 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
       websocket.off('critique_progress', handleCritiqueProgress);
       websocket.off('critique_phase_ended', handleCritiquePhaseEnded);
       websocket.off('critique_phase_skipped', handleCritiquePhaseSkipped);
-      websocket.off('body_rewrite_started', handleBodyRewriteStarted);
     };
   }, []);
 
@@ -127,6 +131,9 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
     try {
       const response = await compilerAPI.getStatus();
       setStatus(response.data);
+      if (response.data.is_running) {
+        onWorkflowRunningChange?.(true);
+      }
       // Update critique phase state from status
       if (response.data.in_critique_phase !== undefined) {
         setCritiquePhaseActive(response.data.in_critique_phase);
@@ -181,35 +188,44 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
         validator_provider: lmStudioEnabled ? (settings.validatorProvider || 'lm_studio') : 'openrouter',
         validator_model: settings.validatorModel,
         validator_openrouter_provider: settings.validatorOpenrouterProvider || null,
+        validator_openrouter_reasoning_effort: settings.validatorOpenrouterReasoningEffort || 'auto',
         validator_lm_studio_fallback: lmStudioEnabled ? (settings.validatorLmStudioFallback || null) : null,
         validator_context_size: settings.validatorContextSize || validatorContextSize,
-        validator_max_output_tokens: settings.validatorMaxOutput || 25000,
+        validator_max_output_tokens: settings.validatorMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS,
+        validator_supercharge_enabled: developerModeEnabled && Boolean(settings.validatorSuperchargeEnabled),
         // High-context submitter config with OpenRouter support
         high_context_provider: lmStudioEnabled ? (settings.highContextProvider || 'lm_studio') : 'openrouter',
         high_context_model: settings.highContextModel,
         high_context_openrouter_provider: settings.highContextOpenrouterProvider || null,
+        high_context_openrouter_reasoning_effort: settings.highContextOpenrouterReasoningEffort || 'auto',
         high_context_lm_studio_fallback: lmStudioEnabled ? (settings.highContextLmStudioFallback || null) : null,
         high_context_context_size: settings.highContextContextSize || highContextContextSize,
-        high_context_max_output_tokens: settings.highContextMaxOutput || 25000,
+        high_context_max_output_tokens: settings.highContextMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS,
+        high_context_supercharge_enabled: developerModeEnabled && Boolean(settings.highContextSuperchargeEnabled),
         // High-param submitter config with OpenRouter support
         high_param_provider: lmStudioEnabled ? (settings.highParamProvider || 'lm_studio') : 'openrouter',
         high_param_model: settings.highParamModel,
         high_param_openrouter_provider: settings.highParamOpenrouterProvider || null,
+        high_param_openrouter_reasoning_effort: settings.highParamOpenrouterReasoningEffort || 'auto',
         high_param_lm_studio_fallback: lmStudioEnabled ? (settings.highParamLmStudioFallback || null) : null,
         high_param_context_size: settings.highParamContextSize || highParamContextSize,
-        high_param_max_output_tokens: settings.highParamMaxOutput || 25000,
+        high_param_max_output_tokens: settings.highParamMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS,
+        high_param_supercharge_enabled: developerModeEnabled && Boolean(settings.highParamSuperchargeEnabled),
         // Critique submitter config with OpenRouter support
         critique_submitter_provider: lmStudioEnabled
           ? (settings.critiqueSubmitterProvider || 'lm_studio')
           : 'openrouter',
         critique_submitter_model: settings.critiqueSubmitterModel,
         critique_submitter_openrouter_provider: settings.critiqueSubmitterOpenrouterProvider || null,
+        critique_submitter_openrouter_reasoning_effort: settings.critiqueSubmitterOpenrouterReasoningEffort || 'auto',
         critique_submitter_lm_studio_fallback: lmStudioEnabled
           ? (settings.critiqueSubmitterLmStudioFallback || null)
           : null,
         critique_submitter_context_window: settings.critiqueSubmitterContextSize || critiqueSubmitterContextSize,
-        critique_submitter_max_tokens: settings.critiqueSubmitterMaxOutput || 25000
+        critique_submitter_max_tokens: settings.critiqueSubmitterMaxOutput || DEFAULT_MAX_OUTPUT_TOKENS,
+        critique_submitter_supercharge_enabled: developerModeEnabled && Boolean(settings.critiqueSubmitterSuperchargeEnabled)
       });
+      onWorkflowRunningChange?.(true);
       
       await loadStatus();
     } catch (err) {
@@ -240,6 +256,7 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
     try {
       await compilerAPI.stop();
       setSkipQueued(false);  // Reset skip state when compiler stops
+      onWorkflowRunningChange?.(false);
       await loadStatus();
     } catch (error) {
       console.error('Failed to stop compiler:', error);
@@ -274,16 +291,50 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
   };
 
   return (
-    <div className="compiler-interface">
-      <h2>Compiler Interface</h2>
-      
-      <div className="status-indicator">
-        <span className={`status-badge ${status.is_running ? 'running' : 'stopped'}`}>
-          {status.is_running ? '● Running' : '○ Stopped'}
-        </span>
-        {status.current_mode && status.current_mode !== 'idle' && (
-          <span className="mode-badge">Mode: {status.current_mode}</span>
-        )}
+    <div className={`autonomous-interface compiler-interface workflow-main-interface ${status.is_running ? 'workflow-main-interface--running' : ''}`}>
+      <div className="autonomous-header">
+        <div>
+          <h2>Single Paper Writer</h2>
+          <p className="settings-hint">
+            Compile the accepted aggregator database into one live mathematical paper.
+          </p>
+        </div>
+        <div className="autonomous-controls">
+          {!status.is_running ? (
+            <button
+              onClick={handleStart}
+              className="btn-start"
+              disabled={isStarting || (anyWorkflowRunning && !status.is_running)}
+            >
+              {isStarting ? 'Starting...' : 'Start Writer'}
+            </button>
+          ) : (
+            <>
+              <span className="runtime-indicator" role="status" aria-live="polite" title="Single paper writer is running">
+                <span className="runtime-indicator-dot" aria-hidden="true"></span>
+                <span className="runtime-indicator-label">Running</span>
+              </span>
+              <button
+                onClick={handleStop}
+                className="btn-stop"
+              >
+                Stop Writer
+              </button>
+            </>
+          )}
+        </div>
+      </div>
+
+      <div className="status-section">
+        <div className="status-tier">
+          <span className="status-label">Current Status:</span>
+          <span className={`status-value ${status.is_running ? 'status-running' : 'status-idle'}`}>
+            {status.is_running ? 'Paper Writing' : 'Not Running'}
+          </span>
+          {status.current_mode && status.current_mode !== 'idle' && (
+            <span className="mode-badge">Mode: {status.current_mode}</span>
+          )}
+        </div>
       </div>
 
       {status.is_running && (
@@ -345,13 +396,13 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
           </div>
           {error.suggestion && (
             <div className="error-suggestion">
-              <p><strong>💡 Suggestion:</strong> {error.suggestion}</p>
+              <p><strong>Suggestion:</strong> {error.suggestion}</p>
             </div>
           )}
         </div>
       )}
 
-      <div className="form-group">
+      <div className="research-prompt-section">
         <label htmlFor="compilerPrompt">Compiler-Directing Prompt:</label>
         <textarea
           id="compilerPrompt"
@@ -372,39 +423,26 @@ function CompilerInterface({ activeTab, capabilities, anyWorkflowRunning = false
         <small>This prompt directs the compiler on what kind of mathematical document to create from the aggregated database. View your in-progress and final answer in the "Live Paper" tab.</small>
       </div>
 
-      <div className="form-group">
-        <label htmlFor="contextSizeDisplay">Context Window Sizes:</label>
-        <div className="context-size-display">
-          <div><strong>Validator:</strong> {validatorContextSize.toLocaleString()} tokens</div>
-          <div><strong>High-Context:</strong> {highContextContextSize.toLocaleString()} tokens</div>
-          <div><strong>High-Parameter:</strong> {highParamContextSize.toLocaleString()} tokens</div>
-          <div><strong>Critique Submitter:</strong> {critiqueSubmitterContextSize.toLocaleString()} tokens</div>
-          <small style={{marginTop: '0.5rem', display: 'block', color: '#666'}}>
-            (Change these in the Compiler Settings tab)
-          </small>
+      <div className="stats-section">
+        <div className="stat-item">
+          <span className="stat-value">{validatorContextSize.toLocaleString()}</span>
+          <span className="stat-label">Validator Tokens</span>
+        </div>
+        <div className="stat-item">
+          <span className="stat-value">{highContextContextSize.toLocaleString()}</span>
+          <span className="stat-label">High-Context Tokens</span>
+        </div>
+        <div className="stat-item">
+          <span className="stat-value">{highParamContextSize.toLocaleString()}</span>
+          <span className="stat-label">High-Param Tokens</span>
+        </div>
+        <div className="stat-item">
+          <span className="stat-value">{critiqueSubmitterContextSize.toLocaleString()}</span>
+          <span className="stat-label">Critique Tokens</span>
         </div>
       </div>
 
-      <div className="button-group">
-        {!status.is_running ? (
-          <button 
-            onClick={handleStart} 
-            className="btn btn-primary"
-            disabled={isStarting || (anyWorkflowRunning && !status.is_running)}
-          >
-            {isStarting ? 'Starting...' : 'Start Compiler'}
-          </button>
-        ) : (
-          <button 
-            onClick={handleStop} 
-            className="btn btn-danger"
-          >
-            Stop Compiler
-          </button>
-        )}
-      </div>
-
-      <div className="info-section">
+      <div className="status-section">
         <h3>Aggregator Database</h3>
         <p>The compiler will read from the aggregator's accepted submissions database.</p>
         <p>Location: <code>{getRuntimeDataPath('rag_shared_training.txt')}</code></p>
diff --git a/frontend/src/components/compiler/CompilerLogs.jsx b/frontend/src/components/compiler/CompilerLogs.jsx
index 0d56f57..fde1cb5 100644
--- a/frontend/src/components/compiler/CompilerLogs.jsx
+++ b/frontend/src/components/compiler/CompilerLogs.jsx
@@ -1,6 +1,9 @@
 import React, { useState, useEffect } from 'react';
 import { compilerAPI } from '../../services/api';
 import { websocket } from '../../services/websocket';
+import LiveActivityFeed from '../LiveActivityFeed';
+import { getActivityClass, getActivityIcon } from '../../utils/activityStyles';
+import '../autonomous/AutonomousResearch.css';
 
 function CompilerLogs() {
   const [metrics, setMetrics] = useState({
@@ -128,11 +131,7 @@ function CompilerLogs() {
     websocket.on('critique_removed', handleCompilerEvent);
     websocket.on('critique_phase_ended', handleCritiquePhaseEnded);
     websocket.on('critique_phase_skipped', handleCompilerEvent);
-
-    // Rewrite events
-    websocket.on('rewrite_decision_rejected', handleCompilerEvent);
-    websocket.on('rewrite_decision_max_retries_exceeded', handleCompilerEvent);
-    websocket.on('body_rewrite_started', handleCompilerEvent);
+    websocket.on('self_review_appended', handleCompilerEvent);
 
     // Phase transition events
     websocket.on('phase_transition', handleCompilerEvent);
@@ -167,11 +166,7 @@ function CompilerLogs() {
       websocket.off('critique_removed', handleCompilerEvent);
       websocket.off('critique_phase_ended', handleCritiquePhaseEnded);
       websocket.off('critique_phase_skipped', handleCompilerEvent);
-
-      // Rewrite events cleanup
-      websocket.off('rewrite_decision_rejected', handleCompilerEvent);
-      websocket.off('rewrite_decision_max_retries_exceeded', handleCompilerEvent);
-      websocket.off('body_rewrite_started', handleCompilerEvent);
+      websocket.off('self_review_appended', handleCompilerEvent);
 
       // Phase transition events cleanup
       websocket.off('phase_transition', handleCompilerEvent);
@@ -263,13 +258,13 @@ function CompilerLogs() {
 
     // Critique phase events
     if (type === 'critique_phase_started') {
-      return `Critique phase started (paper v${data.paper_version || 1}, target: ${data.target_critiques || 5} attempts)`;
+      return `Critique phase started (paper v${data.paper_version || 1}, target: ${data.target_critiques || 3} attempts)`;
     }
     if (type === 'critique_progress') {
-      return `Progress: ${data.acceptances || 0} accepted, ${data.rejections || 0} rejected, ${data.total_attempts || 0}/5 total`;
+      return `Progress: ${data.acceptances || 0} accepted, ${data.rejections || 0} rejected, ${data.total_attempts || 0}/${data.target || 3} total`;
     }
     if (type === 'critique_accepted') {
-      return `Critique ACCEPTED (${data.count || '?'}/5): ${(data.preview || '').substring(0, 80)}...`;
+      return `Critique ACCEPTED (${data.count || '?'}/${data.target || 3}): ${(data.preview || '').substring(0, 80)}...`;
     }
     if (type === 'critique_rejected') {
       return `Critique REJECTED: ${(data.reasoning || '').substring(0, 100)}...`;
@@ -284,21 +279,13 @@ function CompilerLogs() {
       return `Critique #${data.critique_number} removed via cleanup`;
     }
     if (type === 'critique_phase_ended') {
-      return `Critique phase ended (rewrite: ${data.rewrite ? 'YES' : 'NO'})`;
+      return `Critique phase ended (self-review appended: ${data.self_review_appended ? 'YES' : 'NO'})`;
     }
     if (type === 'critique_phase_skipped') {
       return `Critique phase skipped: ${data.reason || 'no critiques accepted'}`;
     }
-
-    // Rewrite events
-    if (type === 'rewrite_decision_rejected') {
-      return `Rewrite decision rejected (attempt ${data.attempt || '?'}/${data.max_retries || 5})`;
-    }
-    if (type === 'rewrite_decision_max_retries_exceeded') {
-      return `Rewrite decision failed after max retries - defaulting to ${data.action || 'continue'}`;
-    }
-    if (type === 'body_rewrite_started') {
-      return `Body REWRITE started (v${data.version || '?'}) - title changed: ${data.title_changed ? 'YES' : 'NO'}`;
+    if (type === 'self_review_appended') {
+      return `AI self-review appended (${data.critique_count || 0} accepted critique${data.critique_count === 1 ? '' : 's'})`;
     }
 
     // Phase transitions
@@ -351,7 +338,7 @@ function CompilerLogs() {
     if (type?.includes('rejected') || type?.includes('rejection') || type === 'compiler_error') {
       return 'event-error';
     }
-    if (type?.includes('critique') || type?.includes('phase') || type?.includes('rewrite')) {
+    if (type?.includes('critique') || type?.includes('phase') || type?.includes('self_review')) {
       return 'event-info';
     }
     if (type === 'compiler_wolfram_call') {
@@ -363,9 +350,13 @@ function CompilerLogs() {
     return '';
   };
 
+  const chronologicalEvents = events.slice().reverse(); // reverse a shallow copy: Array.prototype.reverse works in place, so slice() keeps the original `events` array unmodified
+
   return (
-    <div className="compiler-logs">
-      <h2>Compiler Logs</h2>
+    <div className="autonomous-logs compiler-logs">
+      <div className="autonomous-header">
+        <h2>Single Paper Writer Logs</h2>
+      </div>
 
       {/* Error Alert */}
       {error && (
@@ -489,32 +480,21 @@ function CompilerLogs() {
             )}
           </div>
 
-          <div className="events-section">
-            <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center', marginBottom: '1rem' }}>
-              <h3>Recent Events (Last 10,000 - Persistent)</h3>
-              <button onClick={clearEventsLog} className="clear-log-btn" style={{ padding: '0.5rem 1rem', cursor: 'pointer' }}>
+          <LiveActivityFeed
+            title={`Live Activity${events.length > 0 ? ` (${events.length} saved)` : ''}`}
+            items={chronologicalEvents}
+            emptyMessage="No events yet"
+            getEventName={(event) => event.type || ''}
+            getMessage={formatEventDisplay}
+            getTimestamp={(event) => event.fullTimestamp || event.timestamp}
+            getClassName={getActivityClass}
+            getIcon={getActivityIcon}
+            headerAction={(
+              <button onClick={clearEventsLog} className="btn-clear">
                 Clear Events Log
               </button>
-            </div>
-            <div className="events-list">
-              {events.length === 0 ? (
-                <p className="no-events">No events yet</p>
-              ) : (
-                <>
-                  <div style={{ marginBottom: '0.5rem', color: '#aaa', fontSize: '0.9rem' }}>
-                    Showing {events.length} events (saved to browser storage)
-                  </div>
-                  {events.map((event, index) => (
-                    <div key={index} className={`event-item event-${event.type} ${getEventClass(event.type)}`}>
-                      <span className="event-time">{event.timestamp}</span>
-                      <span className="event-type">{(event.type || '').replace(/_/g, ' ')}</span>
-                      <span className="event-data">{formatEventDisplay(event)}</span>
-                    </div>
-                  ))}
-                </>
-              )}
-            </div>
-          </div>
+            )}
+          />
 
           <div className="info-section">
             <h4>Convergence Indicators</h4>
diff --git a/frontend/src/components/compiler/CompilerSettings.jsx b/frontend/src/components/compiler/CompilerSettings.jsx
index 37de78e..9aaf1de 100644
--- a/frontend/src/components/compiler/CompilerSettings.jsx
+++ b/frontend/src/components/compiler/CompilerSettings.jsx
@@ -2,16 +2,29 @@ import React, { useState, useEffect } from 'react';
 import { openRouterAPI, api, aggregatorAPI, compilerAPI } from '../../services/api';
 import {
   computeOpenRouterAutoSettings,
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+  DEFAULT_OPENROUTER_REASONING_EFFORT,
   findOpenRouterModel,
   getProviderNames,
+  getReasoningSupportInfo,
   hasEndpointMetadata,
+  normalizeOpenRouterReasoningEffort,
+  OPENROUTER_REASONING_EFFORT_OPTIONS,
 } from '../../utils/openRouterSelection';
 import HelpTooltip from '../HelpTooltip';
+import HighlightedModelsSidebar from '../HighlightedModelsSidebar';
+import ProofStrengthBadge from '../ProofStrengthBadge';
+import RawSettingsEditor from '../RawSettingsEditor';
+import '../autonomous/AutonomousResearch.css';
 import '../settings-common.css';
 
 const SETTINGS_KEY = 'compiler_settings';
+const RAW_VIEW_EXIT_WARNING = 'Switching back to the GUI view will restore your last GUI settings/profile and discard raw-only changes. Continue?';
+const formatRawSettings = (value) => JSON.stringify(value, null, 2); // serialize a settings value as pretty-printed JSON with 2-space indentation
+const SUPERCHARGE_TOOLTIP = 'Supercharge makes this role generate 4 full answer attempts, then run a 5th same-model call to choose or synthesize the best final answer. It uses 5x the API calls, so it is about 5x slower and 5x more costly, but can produce more intelligent answers.';
 
-function CompilerSettings({ capabilities }) {
+function CompilerSettings({ capabilities, developerModeEnabled = false }) {
   // LM Studio and OpenRouter models
   const [lmStudioModels, setLmStudioModels] = useState([]);
   const [openRouterModels, setOpenRouterModels] = useState([]);
@@ -26,36 +39,48 @@ function CompilerSettings({ capabilities }) {
   const [validatorProvider, setValidatorProvider] = useState('lm_studio');
   const [validatorModel, setValidatorModel] = useState('');
   const [validatorOpenrouterProvider, setValidatorOpenrouterProvider] = useState(null);
+  const [validatorOpenrouterReasoningEffort, setValidatorOpenrouterReasoningEffort] = useState(DEFAULT_OPENROUTER_REASONING_EFFORT);
   const [validatorLmStudioFallback, setValidatorLmStudioFallback] = useState(null);
-  const [validatorContextSize, setValidatorContextSize] = useState(131072);
-  const [validatorMaxOutput, setValidatorMaxOutput] = useState(25000);
+  const [validatorContextSize, setValidatorContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [validatorMaxOutput, setValidatorMaxOutput] = useState(DEFAULT_MAX_OUTPUT_TOKENS);
+  const [validatorSuperchargeEnabled, setValidatorSuperchargeEnabled] = useState(false);
 
   // High-Context settings
   const [highContextProvider, setHighContextProvider] = useState('lm_studio');
   const [highContextModel, setHighContextModel] = useState('');
   const [highContextOpenrouterProvider, setHighContextOpenrouterProvider] = useState(null);
+  const [highContextOpenrouterReasoningEffort, setHighContextOpenrouterReasoningEffort] = useState(DEFAULT_OPENROUTER_REASONING_EFFORT);
   const [highContextLmStudioFallback, setHighContextLmStudioFallback] = useState(null);
-  const [highContextContextSize, setHighContextContextSize] = useState(131072);
-  const [highContextMaxOutput, setHighContextMaxOutput] = useState(25000);
+  const [highContextContextSize, setHighContextContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [highContextMaxOutput, setHighContextMaxOutput] = useState(DEFAULT_MAX_OUTPUT_TOKENS);
+  const [highContextSuperchargeEnabled, setHighContextSuperchargeEnabled] = useState(false);
 
   // High-Param settings
   const [highParamProvider, setHighParamProvider] = useState('lm_studio');
   const [highParamModel, setHighParamModel] = useState('');
   const [highParamOpenrouterProvider, setHighParamOpenrouterProvider] = useState(null);
+  const [highParamOpenrouterReasoningEffort, setHighParamOpenrouterReasoningEffort] = useState(DEFAULT_OPENROUTER_REASONING_EFFORT);
   const [highParamLmStudioFallback, setHighParamLmStudioFallback] = useState(null);
-  const [highParamContextSize, setHighParamContextSize] = useState(131072);
-  const [highParamMaxOutput, setHighParamMaxOutput] = useState(25000);
+  const [highParamContextSize, setHighParamContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [highParamMaxOutput, setHighParamMaxOutput] = useState(DEFAULT_MAX_OUTPUT_TOKENS);
+  const [highParamSuperchargeEnabled, setHighParamSuperchargeEnabled] = useState(false);
 
   // Critique Submitter settings
   const [critiqueSubmitterProvider, setCritiqueSubmitterProvider] = useState('lm_studio');
   const [critiqueSubmitterModel, setCritiqueSubmitterModel] = useState('');
   const [critiqueSubmitterOpenrouterProvider, setCritiqueSubmitterOpenrouterProvider] = useState(null);
+  const [critiqueSubmitterOpenrouterReasoningEffort, setCritiqueSubmitterOpenrouterReasoningEffort] = useState(DEFAULT_OPENROUTER_REASONING_EFFORT);
   const [critiqueSubmitterLmStudioFallback, setCritiqueSubmitterLmStudioFallback] = useState(null);
-  const [critiqueSubmitterContextSize, setCritiqueSubmitterContextSize] = useState(131072);
-  const [critiqueSubmitterMaxOutput, setCritiqueSubmitterMaxOutput] = useState(25000);
+  const [critiqueSubmitterContextSize, setCritiqueSubmitterContextSize] = useState(DEFAULT_CONTEXT_WINDOW);
+  const [critiqueSubmitterMaxOutput, setCritiqueSubmitterMaxOutput] = useState(DEFAULT_MAX_OUTPUT_TOKENS);
+  const [critiqueSubmitterSuperchargeEnabled, setCritiqueSubmitterSuperchargeEnabled] = useState(false);
 
   const [saveStatus, setSaveStatus] = useState('');
   const [isLoaded, setIsLoaded] = useState(false);
+  const [editRawSettings, setEditRawSettings] = useState(false);
+  const [rawSettingsText, setRawSettingsText] = useState('');
+  const [rawSettingsMessage, setRawSettingsMessage] = useState('');
+  const [guiSettingsBeforeRaw, setGuiSettingsBeforeRaw] = useState(null);
 
   // Wolfram Alpha settings
   const [wolframEnabled, setWolframEnabled] = useState(false);
@@ -72,12 +97,20 @@ function CompilerSettings({ capabilities }) {
   const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
   const genericMode = Boolean(capabilities?.genericMode);
 
-  const normalizeRoleState = (provider, model, openrouterProvider) => {
+  useEffect(() => { // Leave the raw-settings view whenever developer mode is switched off while it is open.
+    if (!developerModeEnabled && editRawSettings) {
+      setEditRawSettings(false);
+      setRawSettingsMessage(''); // also drop any message left over from the raw view
+    }
+  }, [developerModeEnabled, editRawSettings]);
+
+  const normalizeRoleState = (provider, model, openrouterProvider, reasoningEffort) => { // Returns a role state forced onto OpenRouter; model and OpenRouter provider survive only if the role was already on OpenRouter.
     const keepOpenRouterState = provider === 'openrouter';
     return {
       provider: 'openrouter',
       model: keepOpenRouterState ? (model || '') : '',
       openrouterProvider: keepOpenRouterState ? (openrouterProvider || null) : null,
+      openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(reasoningEffort), // normalized and kept regardless of the previous provider
       lmStudioFallback: null,
     };
   };
@@ -117,30 +150,38 @@ function CompilerSettings({ capabilities }) {
           if (settings.validatorProvider) setValidatorProvider(settings.validatorProvider);
           if (settings.validatorModel) setValidatorModel(settings.validatorModel);
           if (settings.validatorOpenrouterProvider) setValidatorOpenrouterProvider(settings.validatorOpenrouterProvider);
+          if (settings.validatorOpenrouterReasoningEffort) setValidatorOpenrouterReasoningEffort(normalizeOpenRouterReasoningEffort(settings.validatorOpenrouterReasoningEffort));
           if (settings.validatorLmStudioFallback) setValidatorLmStudioFallback(settings.validatorLmStudioFallback);
           if (settings.validatorContextSize) setValidatorContextSize(settings.validatorContextSize);
           if (settings.validatorMaxOutput) setValidatorMaxOutput(settings.validatorMaxOutput);
+          if (settings.validatorSuperchargeEnabled !== undefined) setValidatorSuperchargeEnabled(settings.validatorSuperchargeEnabled);
           // High-Context
           if (settings.highContextProvider) setHighContextProvider(settings.highContextProvider);
           if (settings.highContextModel) setHighContextModel(settings.highContextModel);
           if (settings.highContextOpenrouterProvider) setHighContextOpenrouterProvider(settings.highContextOpenrouterProvider);
+          if (settings.highContextOpenrouterReasoningEffort) setHighContextOpenrouterReasoningEffort(normalizeOpenRouterReasoningEffort(settings.highContextOpenrouterReasoningEffort));
           if (settings.highContextLmStudioFallback) setHighContextLmStudioFallback(settings.highContextLmStudioFallback);
           if (settings.highContextContextSize) setHighContextContextSize(settings.highContextContextSize);
           if (settings.highContextMaxOutput) setHighContextMaxOutput(settings.highContextMaxOutput);
+          if (settings.highContextSuperchargeEnabled !== undefined) setHighContextSuperchargeEnabled(settings.highContextSuperchargeEnabled);
           // High-Param
           if (settings.highParamProvider) setHighParamProvider(settings.highParamProvider);
           if (settings.highParamModel) setHighParamModel(settings.highParamModel);
           if (settings.highParamOpenrouterProvider) setHighParamOpenrouterProvider(settings.highParamOpenrouterProvider);
+          if (settings.highParamOpenrouterReasoningEffort) setHighParamOpenrouterReasoningEffort(normalizeOpenRouterReasoningEffort(settings.highParamOpenrouterReasoningEffort));
           if (settings.highParamLmStudioFallback) setHighParamLmStudioFallback(settings.highParamLmStudioFallback);
           if (settings.highParamContextSize) setHighParamContextSize(settings.highParamContextSize);
           if (settings.highParamMaxOutput) setHighParamMaxOutput(settings.highParamMaxOutput);
+          if (settings.highParamSuperchargeEnabled !== undefined) setHighParamSuperchargeEnabled(settings.highParamSuperchargeEnabled);
           // Critique Submitter
           if (settings.critiqueSubmitterProvider) setCritiqueSubmitterProvider(settings.critiqueSubmitterProvider);
           if (settings.critiqueSubmitterModel) setCritiqueSubmitterModel(settings.critiqueSubmitterModel);
           if (settings.critiqueSubmitterOpenrouterProvider) setCritiqueSubmitterOpenrouterProvider(settings.critiqueSubmitterOpenrouterProvider);
+          if (settings.critiqueSubmitterOpenrouterReasoningEffort) setCritiqueSubmitterOpenrouterReasoningEffort(normalizeOpenRouterReasoningEffort(settings.critiqueSubmitterOpenrouterReasoningEffort));
           if (settings.critiqueSubmitterLmStudioFallback) setCritiqueSubmitterLmStudioFallback(settings.critiqueSubmitterLmStudioFallback);
           if (settings.critiqueSubmitterContextSize) setCritiqueSubmitterContextSize(settings.critiqueSubmitterContextSize);
           if (settings.critiqueSubmitterMaxOutput) setCritiqueSubmitterMaxOutput(settings.critiqueSubmitterMaxOutput);
+          if (settings.critiqueSubmitterSuperchargeEnabled !== undefined) setCritiqueSubmitterSuperchargeEnabled(settings.critiqueSubmitterSuperchargeEnabled);
           // Wolfram Alpha
           if (settings.wolframEnabled !== undefined) setWolframEnabled(settings.wolframEnabled);
           // Free-only toggle
@@ -183,22 +224,26 @@ function CompilerSettings({ capabilities }) {
     const nextValidator = normalizeRoleState(
       validatorProvider,
       validatorModel,
-      validatorOpenrouterProvider
+      validatorOpenrouterProvider,
+      validatorOpenrouterReasoningEffort
     );
     const nextHighContext = normalizeRoleState(
       highContextProvider,
       highContextModel,
-      highContextOpenrouterProvider
+      highContextOpenrouterProvider,
+      highContextOpenrouterReasoningEffort
     );
     const nextHighParam = normalizeRoleState(
       highParamProvider,
       highParamModel,
-      highParamOpenrouterProvider
+      highParamOpenrouterProvider,
+      highParamOpenrouterReasoningEffort
     );
     const nextCritique = normalizeRoleState(
       critiqueSubmitterProvider,
       critiqueSubmitterModel,
-      critiqueSubmitterOpenrouterProvider
+      critiqueSubmitterOpenrouterProvider,
+      critiqueSubmitterOpenrouterReasoningEffort
     );
 
     if (validatorProvider !== nextValidator.provider) setValidatorProvider(nextValidator.provider);
@@ -206,6 +251,9 @@ function CompilerSettings({ capabilities }) {
     if (validatorOpenrouterProvider !== nextValidator.openrouterProvider) {
       setValidatorOpenrouterProvider(nextValidator.openrouterProvider);
     }
+    if (validatorOpenrouterReasoningEffort !== nextValidator.openrouterReasoningEffort) {
+      setValidatorOpenrouterReasoningEffort(nextValidator.openrouterReasoningEffort);
+    }
     if (validatorLmStudioFallback !== null) setValidatorLmStudioFallback(null);
 
     if (highContextProvider !== nextHighContext.provider) setHighContextProvider(nextHighContext.provider);
@@ -213,6 +261,9 @@ function CompilerSettings({ capabilities }) {
     if (highContextOpenrouterProvider !== nextHighContext.openrouterProvider) {
       setHighContextOpenrouterProvider(nextHighContext.openrouterProvider);
     }
+    if (highContextOpenrouterReasoningEffort !== nextHighContext.openrouterReasoningEffort) {
+      setHighContextOpenrouterReasoningEffort(nextHighContext.openrouterReasoningEffort);
+    }
     if (highContextLmStudioFallback !== null) setHighContextLmStudioFallback(null);
 
     if (highParamProvider !== nextHighParam.provider) setHighParamProvider(nextHighParam.provider);
@@ -220,6 +271,9 @@ function CompilerSettings({ capabilities }) {
     if (highParamOpenrouterProvider !== nextHighParam.openrouterProvider) {
       setHighParamOpenrouterProvider(nextHighParam.openrouterProvider);
     }
+    if (highParamOpenrouterReasoningEffort !== nextHighParam.openrouterReasoningEffort) {
+      setHighParamOpenrouterReasoningEffort(nextHighParam.openrouterReasoningEffort);
+    }
     if (highParamLmStudioFallback !== null) setHighParamLmStudioFallback(null);
 
     if (critiqueSubmitterProvider !== nextCritique.provider) {
@@ -229,24 +283,31 @@ function CompilerSettings({ capabilities }) {
     if (critiqueSubmitterOpenrouterProvider !== nextCritique.openrouterProvider) {
       setCritiqueSubmitterOpenrouterProvider(nextCritique.openrouterProvider);
     }
+    if (critiqueSubmitterOpenrouterReasoningEffort !== nextCritique.openrouterReasoningEffort) {
+      setCritiqueSubmitterOpenrouterReasoningEffort(nextCritique.openrouterReasoningEffort);
+    }
     if (critiqueSubmitterLmStudioFallback !== null) setCritiqueSubmitterLmStudioFallback(null);
   }, [
     lmStudioEnabled,
     validatorProvider,
     validatorModel,
     validatorOpenrouterProvider,
+    validatorOpenrouterReasoningEffort,
     validatorLmStudioFallback,
     highContextProvider,
     highContextModel,
     highContextOpenrouterProvider,
+    highContextOpenrouterReasoningEffort,
     highContextLmStudioFallback,
     highParamProvider,
     highParamModel,
     highParamOpenrouterProvider,
+    highParamOpenrouterReasoningEffort,
     highParamLmStudioFallback,
     critiqueSubmitterProvider,
     critiqueSubmitterModel,
     critiqueSubmitterOpenrouterProvider,
+    critiqueSubmitterOpenrouterReasoningEffort,
     critiqueSubmitterLmStudioFallback,
   ]);
 
@@ -280,14 +341,14 @@ function CompilerSettings({ capabilities }) {
     if (!isLoaded) return;
     
     const settings = {
-      validatorProvider, validatorModel, validatorOpenrouterProvider, validatorLmStudioFallback,
-      validatorContextSize, validatorMaxOutput,
-      highContextProvider, highContextModel, highContextOpenrouterProvider, highContextLmStudioFallback,
-      highContextContextSize, highContextMaxOutput,
-      highParamProvider, highParamModel, highParamOpenrouterProvider, highParamLmStudioFallback,
-      highParamContextSize, highParamMaxOutput,
-      critiqueSubmitterProvider, critiqueSubmitterModel, critiqueSubmitterOpenrouterProvider, critiqueSubmitterLmStudioFallback,
-      critiqueSubmitterContextSize, critiqueSubmitterMaxOutput,
+      validatorProvider, validatorModel, validatorOpenrouterProvider, validatorOpenrouterReasoningEffort, validatorLmStudioFallback,
+      validatorContextSize, validatorMaxOutput, validatorSuperchargeEnabled,
+      highContextProvider, highContextModel, highContextOpenrouterProvider, highContextOpenrouterReasoningEffort, highContextLmStudioFallback,
+      highContextContextSize, highContextMaxOutput, highContextSuperchargeEnabled,
+      highParamProvider, highParamModel, highParamOpenrouterProvider, highParamOpenrouterReasoningEffort, highParamLmStudioFallback,
+      highParamContextSize, highParamMaxOutput, highParamSuperchargeEnabled,
+      critiqueSubmitterProvider, critiqueSubmitterModel, critiqueSubmitterOpenrouterProvider, critiqueSubmitterOpenrouterReasoningEffort, critiqueSubmitterLmStudioFallback,
+      critiqueSubmitterContextSize, critiqueSubmitterMaxOutput, critiqueSubmitterSuperchargeEnabled,
       wolframEnabled,
       freeOnly,
       freeModelLooping,
@@ -299,14 +360,14 @@ function CompilerSettings({ capabilities }) {
     const timer = setTimeout(() => setSaveStatus(''), 2000);
     return () => clearTimeout(timer);
   }, [
-    isLoaded, validatorProvider, validatorModel, validatorOpenrouterProvider, validatorLmStudioFallback,
-    validatorContextSize, validatorMaxOutput,
-    highContextProvider, highContextModel, highContextOpenrouterProvider, highContextLmStudioFallback,
-    highContextContextSize, highContextMaxOutput,
-    highParamProvider, highParamModel, highParamOpenrouterProvider, highParamLmStudioFallback,
-    highParamContextSize, highParamMaxOutput,
-    critiqueSubmitterProvider, critiqueSubmitterModel, critiqueSubmitterOpenrouterProvider, critiqueSubmitterLmStudioFallback,
-    critiqueSubmitterContextSize, critiqueSubmitterMaxOutput,
+    isLoaded, validatorProvider, validatorModel, validatorOpenrouterProvider, validatorOpenrouterReasoningEffort, validatorLmStudioFallback,
+    validatorContextSize, validatorMaxOutput, validatorSuperchargeEnabled,
+    highContextProvider, highContextModel, highContextOpenrouterProvider, highContextOpenrouterReasoningEffort, highContextLmStudioFallback,
+    highContextContextSize, highContextMaxOutput, highContextSuperchargeEnabled,
+    highParamProvider, highParamModel, highParamOpenrouterProvider, highParamOpenrouterReasoningEffort, highParamLmStudioFallback,
+    highParamContextSize, highParamMaxOutput, highParamSuperchargeEnabled,
+    critiqueSubmitterProvider, critiqueSubmitterModel, critiqueSubmitterOpenrouterProvider, critiqueSubmitterOpenrouterReasoningEffort, critiqueSubmitterLmStudioFallback,
+    critiqueSubmitterContextSize, critiqueSubmitterMaxOutput, critiqueSubmitterSuperchargeEnabled,
     wolframEnabled,
     freeOnly, freeModelLooping, freeModelAutoSelector, modelProviders
   ]);
@@ -491,21 +552,25 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         setValidatorProvider('lm_studio');
         setValidatorModel(settings.validator_model || settings.submitter_model);
         setValidatorOpenrouterProvider(null);
+        setValidatorOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
         setValidatorLmStudioFallback(null);
         
         setHighContextProvider('lm_studio');
         setHighContextModel(settings.submitter_model);
         setHighContextOpenrouterProvider(null);
+        setHighContextOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
         setHighContextLmStudioFallback(null);
         
         setHighParamProvider('lm_studio');
         setHighParamModel(settings.submitter_model);
         setHighParamOpenrouterProvider(null);
+        setHighParamOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
         setHighParamLmStudioFallback(null);
         
         setCritiqueSubmitterProvider('lm_studio');
         setCritiqueSubmitterModel(settings.submitter_model);
         setCritiqueSubmitterOpenrouterProvider(null);
+        setCritiqueSubmitterOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
         setCritiqueSubmitterLmStudioFallback(null);
         
         alert('Successfully loaded aggregator models for all roles!');
@@ -518,6 +583,187 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     }
   };
 
+  // Snapshot every compiler setting currently held in component state as one
+  // plain object; the raw editor is seeded from this shape (see handleRawEditToggle).
+  const getCompilerRawSettings = () => ({
+    validatorProvider,
+    validatorModel,
+    validatorOpenrouterProvider,
+    validatorOpenrouterReasoningEffort,
+    validatorLmStudioFallback,
+    validatorContextSize,
+    validatorMaxOutput,
+    validatorSuperchargeEnabled,
+    highContextProvider,
+    highContextModel,
+    highContextOpenrouterProvider,
+    highContextOpenrouterReasoningEffort,
+    highContextLmStudioFallback,
+    highContextContextSize,
+    highContextMaxOutput,
+    highContextSuperchargeEnabled,
+    highParamProvider,
+    highParamModel,
+    highParamOpenrouterProvider,
+    highParamOpenrouterReasoningEffort,
+    highParamLmStudioFallback,
+    highParamContextSize,
+    highParamMaxOutput,
+    highParamSuperchargeEnabled,
+    critiqueSubmitterProvider,
+    critiqueSubmitterModel,
+    critiqueSubmitterOpenrouterProvider,
+    critiqueSubmitterOpenrouterReasoningEffort,
+    critiqueSubmitterLmStudioFallback,
+    critiqueSubmitterContextSize,
+    critiqueSubmitterMaxOutput,
+    critiqueSubmitterSuperchargeEnabled,
+    wolframEnabled,
+    freeOnly,
+    freeModelLooping,
+    freeModelAutoSelector,
+    modelProviders,
+  });
+
+  // Coerce a numeric raw setting. Missing, empty, zero, or non-numeric input
+  // (e.g. "abc" typed into the raw editor) yields the fallback, so NaN never
+  // reaches the controlled number inputs.
+  const coerceRawSettingNumber = (value, fallback) => {
+    const parsed = Number(value || fallback);
+    return Number.isFinite(parsed) ? parsed : Number(fallback);
+  };
+
+  // Apply a raw settings object to component state. Each known key is
+  // defaulted/coerced exactly once, so the values pushed into state and the
+  // raw editor text (rewritten only when updateRawText is true) always agree.
+  // Unknown keys are carried through to the raw text unchanged.
+  const applyCompilerRawSettings = (rawSettings, { updateRawText = true } = {}) => {
+    const normalized = {
+      ...rawSettings,
+      validatorProvider: rawSettings.validatorProvider || 'lm_studio',
+      validatorModel: rawSettings.validatorModel || '',
+      validatorOpenrouterProvider: rawSettings.validatorOpenrouterProvider || null,
+      validatorOpenrouterReasoningEffort: normalizeOpenRouterReasoningEffort(rawSettings.validatorOpenrouterReasoningEffort),
+      validatorLmStudioFallback: rawSettings.validatorLmStudioFallback || null,
+      validatorContextSize: coerceRawSettingNumber(rawSettings.validatorContextSize, DEFAULT_CONTEXT_WINDOW),
+      validatorMaxOutput: coerceRawSettingNumber(rawSettings.validatorMaxOutput, DEFAULT_MAX_OUTPUT_TOKENS),
+      validatorSuperchargeEnabled: Boolean(rawSettings.validatorSuperchargeEnabled),
+      highContextProvider: rawSettings.highContextProvider || 'lm_studio',
+      highContextModel: rawSettings.highContextModel || '',
+      highContextOpenrouterProvider: rawSettings.highContextOpenrouterProvider || null,
+      highContextOpenrouterReasoningEffort: normalizeOpenRouterReasoningEffort(rawSettings.highContextOpenrouterReasoningEffort),
+      highContextLmStudioFallback: rawSettings.highContextLmStudioFallback || null,
+      highContextContextSize: coerceRawSettingNumber(rawSettings.highContextContextSize, DEFAULT_CONTEXT_WINDOW),
+      highContextMaxOutput: coerceRawSettingNumber(rawSettings.highContextMaxOutput, DEFAULT_MAX_OUTPUT_TOKENS),
+      highContextSuperchargeEnabled: Boolean(rawSettings.highContextSuperchargeEnabled),
+      highParamProvider: rawSettings.highParamProvider || 'lm_studio',
+      highParamModel: rawSettings.highParamModel || '',
+      highParamOpenrouterProvider: rawSettings.highParamOpenrouterProvider || null,
+      highParamOpenrouterReasoningEffort: normalizeOpenRouterReasoningEffort(rawSettings.highParamOpenrouterReasoningEffort),
+      highParamLmStudioFallback: rawSettings.highParamLmStudioFallback || null,
+      highParamContextSize: coerceRawSettingNumber(rawSettings.highParamContextSize, DEFAULT_CONTEXT_WINDOW),
+      highParamMaxOutput: coerceRawSettingNumber(rawSettings.highParamMaxOutput, DEFAULT_MAX_OUTPUT_TOKENS),
+      highParamSuperchargeEnabled: Boolean(rawSettings.highParamSuperchargeEnabled),
+      critiqueSubmitterProvider: rawSettings.critiqueSubmitterProvider || 'lm_studio',
+      critiqueSubmitterModel: rawSettings.critiqueSubmitterModel || '',
+      critiqueSubmitterOpenrouterProvider: rawSettings.critiqueSubmitterOpenrouterProvider || null,
+      critiqueSubmitterOpenrouterReasoningEffort: normalizeOpenRouterReasoningEffort(rawSettings.critiqueSubmitterOpenrouterReasoningEffort),
+      critiqueSubmitterLmStudioFallback: rawSettings.critiqueSubmitterLmStudioFallback || null,
+      critiqueSubmitterContextSize: coerceRawSettingNumber(rawSettings.critiqueSubmitterContextSize, DEFAULT_CONTEXT_WINDOW),
+      critiqueSubmitterMaxOutput: coerceRawSettingNumber(rawSettings.critiqueSubmitterMaxOutput, DEFAULT_MAX_OUTPUT_TOKENS),
+      critiqueSubmitterSuperchargeEnabled: Boolean(rawSettings.critiqueSubmitterSuperchargeEnabled),
+      wolframEnabled: rawSettings.wolframEnabled ?? false,
+      freeOnly: rawSettings.freeOnly ?? false,
+      freeModelLooping: rawSettings.freeModelLooping ?? true,
+      freeModelAutoSelector: rawSettings.freeModelAutoSelector ?? true,
+      modelProviders: rawSettings.modelProviders || {},
+    };
+
+    setValidatorProvider(normalized.validatorProvider);
+    setValidatorModel(normalized.validatorModel);
+    setValidatorOpenrouterProvider(normalized.validatorOpenrouterProvider);
+    setValidatorOpenrouterReasoningEffort(normalized.validatorOpenrouterReasoningEffort);
+    setValidatorLmStudioFallback(normalized.validatorLmStudioFallback);
+    setValidatorContextSize(normalized.validatorContextSize);
+    setValidatorMaxOutput(normalized.validatorMaxOutput);
+    setValidatorSuperchargeEnabled(normalized.validatorSuperchargeEnabled);
+    setHighContextProvider(normalized.highContextProvider);
+    setHighContextModel(normalized.highContextModel);
+    setHighContextOpenrouterProvider(normalized.highContextOpenrouterProvider);
+    setHighContextOpenrouterReasoningEffort(normalized.highContextOpenrouterReasoningEffort);
+    setHighContextLmStudioFallback(normalized.highContextLmStudioFallback);
+    setHighContextContextSize(normalized.highContextContextSize);
+    setHighContextMaxOutput(normalized.highContextMaxOutput);
+    setHighContextSuperchargeEnabled(normalized.highContextSuperchargeEnabled);
+    setHighParamProvider(normalized.highParamProvider);
+    setHighParamModel(normalized.highParamModel);
+    setHighParamOpenrouterProvider(normalized.highParamOpenrouterProvider);
+    setHighParamOpenrouterReasoningEffort(normalized.highParamOpenrouterReasoningEffort);
+    setHighParamLmStudioFallback(normalized.highParamLmStudioFallback);
+    setHighParamContextSize(normalized.highParamContextSize);
+    setHighParamMaxOutput(normalized.highParamMaxOutput);
+    setHighParamSuperchargeEnabled(normalized.highParamSuperchargeEnabled);
+    setCritiqueSubmitterProvider(normalized.critiqueSubmitterProvider);
+    setCritiqueSubmitterModel(normalized.critiqueSubmitterModel);
+    setCritiqueSubmitterOpenrouterProvider(normalized.critiqueSubmitterOpenrouterProvider);
+    setCritiqueSubmitterOpenrouterReasoningEffort(normalized.critiqueSubmitterOpenrouterReasoningEffort);
+    setCritiqueSubmitterLmStudioFallback(normalized.critiqueSubmitterLmStudioFallback);
+    setCritiqueSubmitterContextSize(normalized.critiqueSubmitterContextSize);
+    setCritiqueSubmitterMaxOutput(normalized.critiqueSubmitterMaxOutput);
+    setCritiqueSubmitterSuperchargeEnabled(normalized.critiqueSubmitterSuperchargeEnabled);
+    setWolframEnabled(normalized.wolframEnabled);
+    setFreeOnly(normalized.freeOnly);
+    setFreeModelLooping(normalized.freeModelLooping);
+    setFreeModelAutoSelector(normalized.freeModelAutoSelector);
+    setModelProviders(normalized.modelProviders);
+
+    if (updateRawText) {
+      setRawSettingsText(formatRawSettings(normalized));
+    }
+  };
+
+  // Toggle the "Edit Raw" view. Turning it on snapshots the current GUI
+  // settings and seeds the editor with them. Turning it off asks for
+  // confirmation, then re-applies that snapshot, so anything applied via Save
+  // while the raw view was open is overwritten as well.
+  // NOTE(review): confirm RAW_VIEW_EXIT_WARNING tells the user about that.
+  const handleRawEditToggle = (checked) => {
+    if (checked) {
+      const currentSettings = getCompilerRawSettings();
+      setGuiSettingsBeforeRaw(currentSettings);
+      setRawSettingsText(formatRawSettings(currentSettings));
+      setRawSettingsMessage('');
+      setEditRawSettings(true);
+      return;
+    }
+
+    if (!confirm(RAW_VIEW_EXIT_WARNING)) {
+      return;
+    }
+
+    if (guiSettingsBeforeRaw) {
+      applyCompilerRawSettings(guiSettingsBeforeRaw, { updateRawText: false });
+    }
+    setRawSettingsMessage('');
+    setEditRawSettings(false);
+  };
+
+  // Parse the raw editor text and apply it. Only a top-level JSON object is
+  // accepted: null would throw on the first property read, and an array or
+  // primitive would silently reset every setting to its default.
+  const saveRawSettings = () => {
+    try {
+      const parsed = JSON.parse(rawSettingsText);
+      if (parsed === null || typeof parsed !== 'object' || Array.isArray(parsed)) {
+        throw new Error('top-level value must be an object');
+      }
+      applyCompilerRawSettings(parsed);
+      setRawSettingsMessage('Saved raw settings.');
+    } catch (error) {
+      setRawSettingsMessage(`Invalid JSON: ${error.message}`);
+    }
+  };
+
   // Reusable Role Configuration Component
   const RoleConfig = ({ 
     title, 
@@ -525,30 +724,39 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
     provider, setProvider,
     model, setModel,
     openrouterProv, setOpenrouterProv,
+    openrouterReasoningEffort, setOpenrouterReasoningEffort,
     fallback, setFallback,
     contextSize, setContextSize,
     maxOutput, setMaxOutput,
-    borderColor = '#333'
+    superchargeEnabled, setSuperchargeEnabled,
+    borderColor = '#333',
+    showProofStrengthBadge = false
   }) => {
     const effectiveProvider = lmStudioEnabled ? provider : 'openrouter';
     const models = effectiveProvider === 'openrouter' ? openRouterModels : lmStudioModels;
     const providers = model && effectiveProvider === 'openrouter'
       ? getProviderNames(modelProviders[model])
       : [];
+    const reasoningInfo = effectiveProvider === 'openrouter'
+      ? getReasoningSupportInfo(modelProviders[model], openrouterProv || null)
+      : { hasEndpointMetadata: false, supportsReasoning: false };
 
     return (
       <div
-        className={`role-config-card role-config-card--highlight${effectiveProvider === 'openrouter' ? ' role-config-card--openrouter' : ''}`}
-        style={{ borderColor: effectiveProvider === 'openrouter' ? undefined : borderColor, padding: '1.5rem' }}
+        className={`submitter-config-section${effectiveProvider === 'openrouter' ? ' role-config-card--openrouter-orange' : ''}`}
+        style={{ borderColor: effectiveProvider === 'openrouter' ? undefined : borderColor }}
       >
-        <h3 style={{ margin: '0 0 0.5rem 0', color: effectiveProvider === 'openrouter' ? '#18cc17' : borderColor }}>
-          {title}
+        <h5 className={effectiveProvider === 'openrouter' ? 'card-title--orange' : ''} style={effectiveProvider === 'openrouter' ? undefined : { color: borderColor }}>
+          <span className="role-title-with-badges">
+            <span>{title}</span>
+            {showProofStrengthBadge && <ProofStrengthBadge />}
+          </span>
           {effectiveProvider === 'openrouter' && <span className="provider-badge-inline">[OpenRouter]</span>}
-        </h3>
-        <small className="role-description">{description}</small>
+        </h5>
+        <p className="settings-hint">{description}</p>
 
         {/* Provider Toggle */}
-        <div className="form-group">
+        <div className="settings-row">
           <label>Provider</label>
           {lmStudioEnabled ? (
             <div className="provider-toggle-group">
@@ -558,6 +766,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                   setProvider('lm_studio');
                   setModel('');
                   setOpenrouterProv(null);
+                  setOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
                   setFallback(null);
                 }}
                 className={`provider-toggle-btn${provider === 'lm_studio' ? ' active-lm' : ''}`}
@@ -571,25 +780,26 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                     setProvider('openrouter');
                     setModel('');
                     setOpenrouterProv(null);
+                    setOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
                     setFallback(null);
                   }
                 }}
                 disabled={!hasOpenRouterKey}
-                className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or' : ''}`}
+                className={`provider-toggle-btn${provider === 'openrouter' ? ' active-or-orange' : ''}`}
                 title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
               >
                 OpenRouter
               </button>
             </div>
           ) : (
-            <small className="hint-text hint-text--dim">
+            <small className="settings-hint">
               OpenRouter is required in this deployment.
             </small>
           )}
         </div>
 
         {/* Model Selection */}
-        <div className="form-group">
+        <div className="settings-row">
           <label>Model</label>
           <select
             value={model || ''}
@@ -597,6 +807,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               const m = e.target.value;
               setModel(m);
               setOpenrouterProv(null);
+              setOpenrouterReasoningEffort(DEFAULT_OPENROUTER_REASONING_EFFORT);
               if (effectiveProvider === 'openrouter' && m) {
                 const autoSettings = await getAutoSettingsForModel(m, null);
                 if (autoSettings) {
@@ -629,7 +840,7 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
 
         {/* OpenRouter Provider (if OpenRouter) */}
         {effectiveProvider === 'openrouter' && model && (
-          <div className="form-group">
+          <div className="settings-row">
             <label>Host Provider (optional)</label>
             <select
               value={openrouterProv || ''}
@@ -655,9 +866,28 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           </div>
         )}
 
+        {effectiveProvider === 'openrouter' && model && (
+          <div className="settings-row">
+            <label>Reasoning Effort</label>
+            <select
+              value={normalizeOpenRouterReasoningEffort(openrouterReasoningEffort)}
+              onChange={(e) => setOpenrouterReasoningEffort(e.target.value)}
+            >
+              {OPENROUTER_REASONING_EFFORT_OPTIONS.map(option => (
+                <option key={option.value} value={option.value}>{option.label}</option>
+              ))}
+            </select>
+            <small className="settings-hint">
+              {reasoningInfo.hasEndpointMetadata && !reasoningInfo.supportsReasoning
+                ? 'This selected host does not advertise reasoning support; OpenRouter may ignore the setting.'
+                : 'Auto sends OpenRouter max reasoning effort by default.'}
+            </small>
+          </div>
+        )}
+
         {/* LM Studio Fallback (if OpenRouter) */}
         {effectiveProvider === 'openrouter' && lmStudioEnabled && (
-          <div className="form-group">
+          <div className="settings-row">
             <label className="label--muted">LM Studio Fallback (optional)</label>
             <select
               value={fallback || ''}
@@ -668,41 +898,60 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                 <option key={m.id} value={m.id}>{m.id}</option>
               ))}
             </select>
-            <small>Used if OpenRouter credits run out</small>
+            <small className="settings-hint">Used if OpenRouter credits run out</small>
           </div>
         )}
 
-        <div className="config-grid config-grid--2col">
-          <div className="form-group form-group--compact">
-            <label>Context Window (tokens)</label>
-            <input
-              type="number"
-              value={contextSize}
-              onChange={(e) => {
-                const parsed = parseInt(e.target.value);
-                setContextSize(isNaN(parsed) ? 131072 : parsed);
-              }}
-              min={4096}
-              max={50000000}
-              step={1024}
-            />
-          </div>
+        <div className="settings-row">
+          <label>Context Window</label>
+          <input
+            type="number"
+            value={contextSize}
+            onChange={(e) => {
+              const parsed = parseInt(e.target.value, 10);
+              setContextSize(isNaN(parsed) ? DEFAULT_CONTEXT_WINDOW : parsed);
+            }}
+            min={4096}
+            max={50000000}
+            step={1024}
+          />
+        </div>
 
-          <div className="form-group form-group--compact">
-            <label>Max Output Tokens</label>
-            <input
-              type="number"
-              value={maxOutput}
-              onChange={(e) => {
-                const parsed = parseInt(e.target.value);
-                setMaxOutput(isNaN(parsed) ? 25000 : parsed);
-              }}
-              min={1000}
-              max={50000000}
-              step={1000}
-            />
-          </div>
+        <div className="settings-row">
+          <label>Max Output Tokens</label>
+          <input
+            type="number"
+            value={maxOutput}
+            onChange={(e) => {
+              const parsed = parseInt(e.target.value, 10);
+              setMaxOutput(isNaN(parsed) ? DEFAULT_MAX_OUTPUT_TOKENS : parsed);
+            }}
+            min={1000}
+            max={50000000}
+            step={1000}
+          />
         </div>
+
+        {developerModeEnabled && (
+          <div className="settings-row settings-row--inline-checkbox">
+            <label className="settings-checkbox-label settings-checkbox-label--supercharge">
+              <input
+                type="checkbox"
+                checked={Boolean(superchargeEnabled)}
+                onChange={(e) => setSuperchargeEnabled(e.target.checked)}
+              />
+              <HelpTooltip
+                label="Learn about Supercharge"
+                buttonContent="Supercharge"
+                buttonClassName="help-tooltip-btn--text"
+                popupClassName="help-tooltip-popup--fixed"
+                useFixedPosition
+              >
+                {SUPERCHARGE_TOOLTIP}
+              </HelpTooltip>
+            </label>
+          </div>
+        )}
       </div>
     );
   };
@@ -712,8 +961,10 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
   }
 
   return (
-    <div className="compiler-settings">
-      <h2>Compiler Settings</h2>
+    <div className="autonomous-settings-layout">
+      <HighlightedModelsSidebar />
+      <div className="autonomous-settings">
+          <h2>Compiler Settings</h2>
 
       {saveStatus && (
         <div className="save-message" style={{ marginBottom: '1rem' }}>
@@ -730,8 +981,78 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         </div>
       )}
 
-      <div className="settings-section">
-        <h3 className="section-heading--bordered">Model Configuration</h3>
+      <div className="model-refresh-controls">
+        {lmStudioEnabled && (
+          <>
+            <button
+              onClick={handleUseAggregatorModels}
+              className="secondary"
+            >
+              Use Aggregator Models
+            </button>
+            <button
+              onClick={async () => {
+                const models = await api.getModels();
+                setLmStudioModels(models.models || models || []);
+              }}
+              className="secondary"
+            >
+              Refresh LM Studio Models
+            </button>
+          </>
+        )}
+        {hasOpenRouterKey && (
+          <>
+            <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary">
+              Refresh OpenRouter Models
+            </button>
+            <button
+              className="secondary"
+              onClick={() => window.open('https://openrouter.ai/models', '_blank', 'noopener,noreferrer')}
+              title="Browse all available OpenRouter models"
+            >
+              🔗 OpenRouter Model List
+            </button>
+            <label className="settings-checkbox-label model-refresh-controls__toggle">
+              <input
+                type="checkbox"
+                checked={freeOnly}
+                onChange={(e) => setFreeOnly(e.target.checked)}
+              />
+              Free models only
+            </label>
+          </>
+        )}
+        {developerModeEnabled ? (
+          <label className="settings-checkbox-label model-refresh-controls__toggle">
+            <input
+              type="checkbox"
+              checked={editRawSettings}
+              onChange={(e) => handleRawEditToggle(e.target.checked)}
+            />
+            Edit Raw
+          </label>
+        ) : (
+          <span className="settings-developer-mode-hint">
+            Developer mode: press Shift + Z + X to toggle raw JSON settings.
+          </span>
+        )}
+      </div>
+
+      {editRawSettings ? (
+        <RawSettingsEditor
+          value={rawSettingsText}
+          onChange={setRawSettingsText}
+          onSave={saveRawSettings}
+          message={rawSettingsMessage}
+        />
+      ) : (
+        <>
+      <div className="settings-group">
+        <h4>Model Configuration</h4>
+        <p className="settings-info">
+          Configure the validator and compiler roles used by manual paper compilation.
+        </p>
         
         <RoleConfig
           title="Validator"
@@ -740,9 +1061,11 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           provider={validatorProvider} setProvider={setValidatorProvider}
           model={validatorModel} setModel={setValidatorModel}
           openrouterProv={validatorOpenrouterProvider} setOpenrouterProv={setValidatorOpenrouterProvider}
+          openrouterReasoningEffort={validatorOpenrouterReasoningEffort} setOpenrouterReasoningEffort={setValidatorOpenrouterReasoningEffort}
           fallback={validatorLmStudioFallback} setFallback={setValidatorLmStudioFallback}
           contextSize={validatorContextSize} setContextSize={setValidatorContextSize}
           maxOutput={validatorMaxOutput} setMaxOutput={setValidatorMaxOutput}
+          superchargeEnabled={validatorSuperchargeEnabled} setSuperchargeEnabled={setValidatorSuperchargeEnabled}
         />
 
         <RoleConfig
@@ -752,9 +1075,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           provider={highContextProvider} setProvider={setHighContextProvider}
           model={highContextModel} setModel={setHighContextModel}
           openrouterProv={highContextOpenrouterProvider} setOpenrouterProv={setHighContextOpenrouterProvider}
+          openrouterReasoningEffort={highContextOpenrouterReasoningEffort} setOpenrouterReasoningEffort={setHighContextOpenrouterReasoningEffort}
           fallback={highContextLmStudioFallback} setFallback={setHighContextLmStudioFallback}
           contextSize={highContextContextSize} setContextSize={setHighContextContextSize}
           maxOutput={highContextMaxOutput} setMaxOutput={setHighContextMaxOutput}
+          superchargeEnabled={highContextSuperchargeEnabled} setSuperchargeEnabled={setHighContextSuperchargeEnabled}
+          showProofStrengthBadge
         />
 
         <RoleConfig
@@ -764,70 +1090,47 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
           provider={highParamProvider} setProvider={setHighParamProvider}
           model={highParamModel} setModel={setHighParamModel}
           openrouterProv={highParamOpenrouterProvider} setOpenrouterProv={setHighParamOpenrouterProvider}
+          openrouterReasoningEffort={highParamOpenrouterReasoningEffort} setOpenrouterReasoningEffort={setHighParamOpenrouterReasoningEffort}
           fallback={highParamLmStudioFallback} setFallback={setHighParamLmStudioFallback}
           contextSize={highParamContextSize} setContextSize={setHighParamContextSize}
           maxOutput={highParamMaxOutput} setMaxOutput={setHighParamMaxOutput}
+          superchargeEnabled={highParamSuperchargeEnabled} setSuperchargeEnabled={setHighParamSuperchargeEnabled}
+          showProofStrengthBadge
         />
 
         <RoleConfig
           title="Critique Submitter"
-          description="Generates peer review critiques and decides on rewrites after body completion."
+          description="Generates validated peer review critiques for the paper's AI self-review section."
           borderColor="#e74c3c"
           provider={critiqueSubmitterProvider} setProvider={setCritiqueSubmitterProvider}
           model={critiqueSubmitterModel} setModel={setCritiqueSubmitterModel}
           openrouterProv={critiqueSubmitterOpenrouterProvider} setOpenrouterProv={setCritiqueSubmitterOpenrouterProvider}
+          openrouterReasoningEffort={critiqueSubmitterOpenrouterReasoningEffort} setOpenrouterReasoningEffort={setCritiqueSubmitterOpenrouterReasoningEffort}
           fallback={critiqueSubmitterLmStudioFallback} setFallback={setCritiqueSubmitterLmStudioFallback}
           contextSize={critiqueSubmitterContextSize} setContextSize={setCritiqueSubmitterContextSize}
           maxOutput={critiqueSubmitterMaxOutput} setMaxOutput={setCritiqueSubmitterMaxOutput}
+          superchargeEnabled={critiqueSubmitterSuperchargeEnabled} setSuperchargeEnabled={setCritiqueSubmitterSuperchargeEnabled}
         />
       </div>
 
-      {/* Model Refresh Controls */}
-      <div className="settings-panel settings-panel--blue">
-        <h3 style={{ marginBottom: '1rem' }}>Model Management</h3>
-        <div className="model-refresh-controls">
-          {lmStudioEnabled && (
-            <>
-              <button 
-                onClick={handleUseAggregatorModels}
-                className="secondary btn-primary-blue"
-              >
-                Use Aggregator Models
-              </button>
-              <button 
-                onClick={async () => {
-                  const models = await api.getModels();
-                  setLmStudioModels(models.models || models || []);
-                }} 
-                className="secondary"
-              >
-                Refresh LM Studio Models
-              </button>
-            </>
-          )}
-          {hasOpenRouterKey && (
-            <>
-              <button onClick={() => fetchOpenRouterModels(freeOnly)} className="secondary">
-                Refresh OpenRouter Models
-              </button>
-              <label className="settings-checkbox-label">
-                <input
-                  type="checkbox"
-                  checked={freeOnly}
-                  onChange={(e) => setFreeOnly(e.target.checked)}
-                />
-                Show only free models
-              </label>
-              <div className="checkbox-group-col">
-                <label className="settings-checkbox-label">
-                  <input
-                    type="checkbox"
-                    checked={freeModelLooping}
-                    onChange={(e) => {
-                      setFreeModelLooping(e.target.checked);
-                      openRouterAPI.setFreeModelSettings(e.target.checked, freeModelAutoSelector).catch(() => {});
-                    }}
-                  />
+      {hasOpenRouterKey && (
+        <div className="settings-group">
+          <h4>OpenRouter Fallback</h4>
+          <p className="settings-info">
+            Fallback behavior for OpenRouter free-model rate limits.
+          </p>
+          <div className="checkbox-group-col">
+            <label className="settings-checkbox-label settings-checkbox-label--stacked">
+              <input
+                type="checkbox"
+                checked={freeModelLooping}
+                onChange={(e) => {
+                  setFreeModelLooping(e.target.checked);
+                  openRouterAPI.setFreeModelSettings(e.target.checked, freeModelAutoSelector).catch(() => {});
+                }}
+              />
+              <span className="settings-option-copy">
+                <span className="settings-option-title">
                   Enable Free Model Looping
                   <HelpTooltip
                     label="Learn about free model looping"
@@ -835,16 +1138,23 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                   >
                     When a free model is rate-limited, automatically try the next available free model sorted by highest context limit. Prevents workflow stalls from rate limits.
                   </HelpTooltip>
-                </label>
-                <label className="settings-checkbox-label">
-                  <input
-                    type="checkbox"
-                    checked={freeModelAutoSelector}
-                    onChange={(e) => {
-                      setFreeModelAutoSelector(e.target.checked);
-                      openRouterAPI.setFreeModelSettings(freeModelLooping, e.target.checked).catch(() => {});
-                    }}
-                  />
+                </span>
+                <span className="settings-option-description">
+                  Automatically rotate to the next selected free model when one hits a rate limit.
+                </span>
+              </span>
+            </label>
+            <label className="settings-checkbox-label settings-checkbox-label--stacked">
+              <input
+                type="checkbox"
+                checked={freeModelAutoSelector}
+                onChange={(e) => {
+                  setFreeModelAutoSelector(e.target.checked);
+                  openRouterAPI.setFreeModelSettings(freeModelLooping, e.target.checked).catch(() => {});
+                }}
+              />
+              <span className="settings-option-copy">
+                <span className="settings-option-title">
                   Use OpenRouter Free Models Auto-Selector as Backup
                   <HelpTooltip
                     label="Learn about the free models auto-selector backup"
@@ -852,27 +1162,25 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
                   >
                     When all selected free models are rate-limited, use OpenRouter&apos;s Free Models Router (`openrouter/free`) as a last resort backup. Works independently of Free Model Looping.
                   </HelpTooltip>
-                </label>
-              </div>
-            </>
-          )}
+                </span>
+                <span className="settings-option-description">
+                  Falls back to OpenRouter&apos;s free router when every selected free model is temporarily exhausted.
+                </span>
+              </span>
+            </label>
+          </div>
         </div>
-        <small className="hint-text" style={{ marginTop: '0.75rem' }}>
-          {lmStudioEnabled
-            ? '"Use Aggregator Models" copies your aggregator\'s model selection to all compiler roles.'
-            : 'LM Studio tools are hidden in hosted mode. Configure compiler roles directly with OpenRouter models below.'}
-        </small>
-      </div>
+      )}
 
       {/* Wolfram Alpha Integration */}
-      <div className="settings-section">
-        <h3>Wolfram Alpha Integration (Optional)</h3>
-        <small className="hint-text" style={{ marginBottom: '1rem' }}>
+      <div className="settings-group">
+        <h4>Wolfram Alpha Integration (Optional)</h4>
+        <p className="settings-info">
           Enable Wolfram Alpha API for computational verification in rigor mode. 
           Get your API key from <a href="https://products.wolframalpha.com/api" target="_blank" rel="noopener noreferrer">developer.wolframalpha.com</a>
-        </small>
+        </p>
         
-        <label className="settings-checkbox-label" style={{ marginBottom: '1rem' }}>
+        <label className="settings-checkbox-label settings-checkbox-label--stacked" style={{ marginBottom: '1rem' }}>
           <input
             type="checkbox"
             checked={wolframEnabled}
@@ -885,7 +1193,12 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               }
             }}
           />
-          <span className="label-medium">Enable Wolfram Alpha Verification in Rigor Mode</span>
+          <span className="settings-option-copy">
+            <span className="settings-option-title">Enable Wolfram Alpha Verification in Rigor Mode</span>
+            <span className="settings-option-description">
+              Lets rigor mode request computational verification for equations, properties, and theorem checks.
+            </span>
+          </span>
         </label>
         
         {wolframEnabled && (
@@ -952,8 +1265,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
         )}
       </div>
 
-      <div className="settings-section">
-        <h3>Workflow Configuration</h3>
+      <div className="settings-group">
+        <h4>Workflow Configuration</h4>
         
         <div className="info-box">
           <h4>Sequential Markov Chain</h4>
@@ -969,24 +1282,27 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       </div>
 
       {/* Validator Critique Prompt Editor */}
-      <div className="settings-panel settings-panel--blue">
+      <div className="settings-group">
         <div 
           onClick={() => setCritiquePromptExpanded(!critiquePromptExpanded)}
-          className="collapsible-trigger"
-          style={{ padding: '0.5rem 0', background: 'transparent', border: 'none' }}
+          className="collapsible-trigger settings-trigger--multiline"
         >
-          <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
-            <span style={{ fontSize: '1.1rem' }}>📝</span>
-            <h3 style={{ margin: 0 }}>Edit Validator Critique Prompt</h3>
-            {isUsingCustomCritiquePrompt && (
-              <span className="tag-badge tag-badge--purple">CUSTOM</span>
-            )}
+          <div className="settings-trigger-copy">
+            <div className="settings-trigger-title-row">
+              <h4 className="form-group--compact settings-trigger-title">Edit Validator Critique Prompt</h4>
+              {isUsingCustomCritiquePrompt && (
+                <span className="tag-badge tag-badge--purple">CUSTOM</span>
+              )}
+            </div>
+            <p className="settings-subsection-description">
+              Optional prompt customization for the user-facing paper critique mode.
+            </p>
           </div>
           <span className={`collapse-chevron${critiquePromptExpanded ? ' collapse-chevron--open' : ''}`}>▼</span>
         </div>
 
         {critiquePromptExpanded && (
-          <div style={{ marginTop: '1rem' }}>
+          <div className="collapsible-body" style={{ marginTop: '1rem' }}>
             <p className="text-muted-sm">
               Customize the prompt sent to your validator when requesting a paper critique. 
               The JSON output schema is automatically appended and cannot be modified.
@@ -1025,8 +1341,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
       </div>
 
       {/* Configuration Summary */}
-      <div className="settings-panel" style={{ marginTop: '2rem' }}>
-        <h3>Current Configuration Summary</h3>
+      <div className="settings-group">
+        <h4>Current Configuration Summary</h4>
         <pre className="config-summary-pre">
           {JSON.stringify({
             validator: {
@@ -1035,7 +1351,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               host: validatorProvider === 'openrouter' ? (validatorOpenrouterProvider || 'Auto') : 'N/A',
               fallback: validatorProvider === 'openrouter' ? (validatorLmStudioFallback?.split('/').pop() || 'None') : 'N/A',
               context: validatorContextSize,
-              maxOutput: validatorMaxOutput
+              maxOutput: validatorMaxOutput,
+              supercharge: validatorSuperchargeEnabled
             },
             highContext: {
               provider: highContextProvider,
@@ -1043,7 +1360,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               host: highContextProvider === 'openrouter' ? (highContextOpenrouterProvider || 'Auto') : 'N/A',
               fallback: highContextProvider === 'openrouter' ? (highContextLmStudioFallback?.split('/').pop() || 'None') : 'N/A',
               context: highContextContextSize,
-              maxOutput: highContextMaxOutput
+              maxOutput: highContextMaxOutput,
+              supercharge: highContextSuperchargeEnabled
             },
             highParam: {
               provider: highParamProvider,
@@ -1051,7 +1369,8 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               host: highParamProvider === 'openrouter' ? (highParamOpenrouterProvider || 'Auto') : 'N/A',
               fallback: highParamProvider === 'openrouter' ? (highParamLmStudioFallback?.split('/').pop() || 'None') : 'N/A',
               context: highParamContextSize,
-              maxOutput: highParamMaxOutput
+              maxOutput: highParamMaxOutput,
+              supercharge: highParamSuperchargeEnabled
             },
             critiqueSubmitter: {
               provider: critiqueSubmitterProvider,
@@ -1059,11 +1378,15 @@ Be honest and constructive. Identify both strengths and weaknesses.`;
               host: critiqueSubmitterProvider === 'openrouter' ? (critiqueSubmitterOpenrouterProvider || 'Auto') : 'N/A',
               fallback: critiqueSubmitterProvider === 'openrouter' ? (critiqueSubmitterLmStudioFallback?.split('/').pop() || 'None') : 'N/A',
               context: critiqueSubmitterContextSize,
-              maxOutput: critiqueSubmitterMaxOutput
+              maxOutput: critiqueSubmitterMaxOutput,
+              supercharge: critiqueSubmitterSuperchargeEnabled
             }
           }, null, 2)}
         </pre>
       </div>
+        </>
+      )}
+      </div>
     </div>
   );
 }
diff --git a/frontend/src/components/compiler/LivePaper.jsx b/frontend/src/components/compiler/LivePaper.jsx
index b3c4c8a..7888ca1 100644
--- a/frontend/src/components/compiler/LivePaper.jsx
+++ b/frontend/src/components/compiler/LivePaper.jsx
@@ -14,8 +14,6 @@ function LivePaper() {
   const [version, setVersion] = useState(0);
   const [autoScroll, setAutoScroll] = useState(true);
   const [isSaving, setIsSaving] = useState(false);
-  const [previousVersions, setPreviousVersions] = useState([]);
-  const [showVersions, setShowVersions] = useState(false);
   const [showLatex, setShowLatex] = useState(true);
   const [isGeneratingPDF, setIsGeneratingPDF] = useState(false);
   const paperContainerRef = useRef(null);
@@ -37,22 +35,20 @@ function LivePaper() {
   useEffect(() => {
     loadPaper();
     loadStatus();
-    loadPreviousVersions();
     
     const interval = setInterval(() => {
       loadPaper();
       loadStatus();
-      loadPreviousVersions();
     }, 10000);
 
     websocket.on('paper_updated', debouncedLoadPaper);
-    websocket.on('body_rewrite_started', handleBodyRewrite);
+    websocket.on('self_review_appended', debouncedLoadPaper);
 
     return () => {
       clearInterval(interval);
       if (wsDebounceRef.current) clearTimeout(wsDebounceRef.current);
       websocket.off('paper_updated', debouncedLoadPaper);
-      websocket.off('body_rewrite_started', handleBodyRewrite);
+      websocket.off('self_review_appended', debouncedLoadPaper);
     };
   }, []);
 
@@ -93,21 +89,6 @@ function LivePaper() {
     }
   };
 
-  const handleBodyRewrite = (event) => {
-    // Reload previous versions when rewrite starts
-    loadPreviousVersions();
-    loadPaper();
-  };
-
-  const loadPreviousVersions = async () => {
-    try {
-      const response = await compilerAPI.getPreviousVersions();
-      setPreviousVersions(response.data.previous_versions || []);
-    } catch (error) {
-      console.error('Failed to load previous versions:', error);
-    }
-  };
-
   const handleSaveDraft = async () => {
     setIsSaving(true);
     try {
@@ -330,62 +311,6 @@ function LivePaper() {
         )}
       </div>
 
-      {previousVersions.length > 0 && (
-        <div className="previous-versions-section">
-          <button 
-            className="btn btn-secondary mt-1"
-            onClick={() => setShowVersions(!showVersions)}
-            style={{ marginBottom: '0.5rem' }}
-          >
-            📜 Previous Versions ({previousVersions.length})
-          </button>
-          
-          {showVersions && (
-            <div className="versions-list">
-              {previousVersions.map(v => (
-                <div key={v.version} className="version-card" style={{
-                  border: '1px solid #444',
-                  borderRadius: '4px',
-                  padding: '1rem',
-                  marginBottom: '1rem',
-                  backgroundColor: '#2a2a2a'
-                }}>
-                  <h3 style={{ color: '#1eff1c', marginBottom: '0.5rem' }}>
-                    Version {v.version}: {v.title}
-                  </h3>
-                  
-                  <div className="version-body" style={{ marginBottom: '1rem' }}>
-                    <h4 style={{ color: '#4CAF50', marginBottom: '0.5rem' }}>Body Section:</h4>
-                    <pre style={{
-                      backgroundColor: '#1a1a1a',
-                      padding: '1rem',
-                      borderRadius: '4px',
-                      maxHeight: '400px',
-                      overflow: 'auto',
-                      fontSize: '0.85rem',
-                      whiteSpace: 'pre-wrap'
-                    }}>{v.body}</pre>
-                  </div>
-                  
-                  <div className="version-critique">
-                    <h4 style={{ color: '#ff6b6b', marginBottom: '0.5rem' }}>Critique Feedback (triggered rewrite):</h4>
-                    <pre style={{
-                      backgroundColor: '#1a1a1a',
-                      padding: '1rem',
-                      borderRadius: '4px',
-                      maxHeight: '300px',
-                      overflow: 'auto',
-                      fontSize: '0.85rem',
-                      whiteSpace: 'pre-wrap'
-                    }}>{v.critique_feedback}</pre>
-                  </div>
-                </div>
-              ))}
-            </div>
-          )}
-        </div>
-      )}
-
       <div className="paper-footer">
         <p className="info-text">
           This paper is being constructed in real-time from the aggregator database.
diff --git a/frontend/src/components/leanoj/LeanOJBrainstorms.jsx b/frontend/src/components/leanoj/LeanOJBrainstorms.jsx
new file mode 100644
index 0000000..c8e5669
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJBrainstorms.jsx
@@ -0,0 +1,265 @@
+import React, { useMemo, useState } from 'react';
+import '../autonomous/AutonomousResearch.css';
+
+const BRAINSTORM_PHASES = [ // display order of the phase cards; each `key` is matched against a record's `phase`
+  {
+    key: 'initial_brainstorm',
+    title: 'Initial Brainstorm',
+    description: 'Accepted proof ideas gathered before the first path decision.',
+  },
+  {
+    key: 'recursive_brainstorm',
+    title: 'Recursive Brainstorm',
+    description: 'Accepted proof ideas gathered when the solver returns for more context.',
+  },
+];
+
+function toNumber(value, fallback = 0) {
+  // Number(null) and Number('') are both 0; treat them as missing so the fallback applies.
+  return value !== null && value !== '' && Number.isFinite(Number(value)) ? Number(value) : fallback;
+}
+
+function formatDate(isoString) {
+  if (!isoString) return '';
+  // Unparseable input yields an Invalid Date instead of throwing, so check the
+  // timestamp explicitly and fall back to the raw value.
+  const date = new Date(isoString);
+  if (Number.isNaN(date.getTime())) return isoString;
+  return date.toLocaleString();
+}
+
+function hasValue(value) {
+  return !(value == null || value === ''); // `== null` matches both null and undefined
+}
+
+function dateValue(value) {
+  const parsedMs = Date.parse(value || ''); // NaN when the input cannot be parsed as a date
+  return Number.isNaN(parsedMs) ? 0 : parsedMs;
+}
+
+function sortEvent(record) {
+  const eventNumber = Number(record.acceptanceEvent); // NaN fails both range checks below
+  return eventNumber > 0 && eventNumber < Infinity ? eventNumber : record.fallbackIndex;
+}
+
+function compareRecordsChronologically(a, b) {
+  // Order by acceptance event first, then creation time, then input position.
+  const byEvent = sortEvent(a) - sortEvent(b);
+  if (byEvent !== 0) return byEvent;
+
+  const byCreated = dateValue(a.createdAt) - dateValue(b.createdAt);
+  if (byCreated !== 0) return byCreated;
+
+  // Final tiebreak keeps the result deterministic when event and time both match.
+  return a.fallbackIndex - b.fallbackIndex;
+}
+
+function pluralize(count, singular, plural = `${singular}s`) {
+  return String(count).concat(' ', count === 1 ? singular : plural); // e.g. "1 Idea", "2 Ideas"
+}
+
+function normalizeRecords(status) {
+  const plainIdeas = Array.isArray(status?.accepted_ideas) ? status.accepted_ideas : [];
+  const richRecords = Array.isArray(status?.accepted_idea_records) ? status.accepted_idea_records : [];
+
+  if (richRecords.length === 0) { // no detailed records: synthesize minimal ones from the plain idea list
+    return plainIdeas
+      .map((content, position) => ({
+        content,
+        phase: 'initial_brainstorm',
+        submitterIndex: null,
+        createdAt: '',
+        acceptanceEvent: position + 1,
+        pruneAdd: false,
+        reasoning: '',
+        fallbackIndex: position + 1,
+      }))
+      .sort(compareRecordsChronologically);
+  }
+
+  return richRecords
+    .map((raw, position) => ({
+      content: raw.content || plainIdeas[position] || '',
+      phase: raw.phase || 'initial_brainstorm',
+      submitterIndex: raw.submitter_index,
+      createdAt: raw.created_at,
+      editedAt: raw.edited_at,
+      acceptanceEvent: raw.acceptance_event,
+      pruneAdd: Boolean(raw.prune_add),
+      reasoning: raw.reasoning || raw.edit_reasoning || '',
+      fallbackIndex: position + 1,
+    }))
+    .sort(compareRecordsChronologically);
+}
+
+// Collapsible per-phase list of the Proof Solver's accepted brainstorm ideas, with prune metrics.
+export default function LeanOJBrainstorms({ status }) {
+  const [expandedPhase, setExpandedPhase] = useState('initial_brainstorm');
+
+  const summary = useMemo(() => {
+    const records = normalizeRecords(status);
+    const acceptedCount = toNumber(status?.accepted_brainstorm_count, records.length);
+    const acceptanceEvents = toNumber(status?.brainstorm_acceptance_events, Math.max(acceptedCount, records.length));
+    const prunedCount = Math.max(0, acceptanceEvents - acceptedCount);
+
+    const grouped = BRAINSTORM_PHASES.reduce((acc, phase) => {
+      acc[phase.key] = [];
+      return acc;
+    }, {});
+
+    // normalizeRecords() returns records in chronological order, so pushing them
+    // in sequence leaves every phase group sorted without a second sort pass.
+    records.forEach((record) => {
+      const phaseKey = Array.isArray(grouped[record.phase]) ? record.phase : 'initial_brainstorm';
+      grouped[phaseKey].push(record);
+    });
+
+    return {
+      records,
+      grouped,
+      acceptedCount,
+      acceptanceEvents,
+      prunedCount,
+      pruneOperations: toNumber(status?.brainstorm_prune_operations_applied),
+    };
+  }, [status]);
+
+  return (
+    <div className="brainstorm-list leanoj-brainstorms">
+      <div className="brainstorm-list-header">
+        <div>
+          <h3>Proof Solver Brainstorms ({summary.records.length})</h3>
+          <p className="settings-hint">
+            Review the two Proof Solver brainstorm memories and track how many accepted ideas were pruned from the current working context.
+          </p>
+        </div>
+      </div>
+
+      <div className="brainstorm-list-warning">
+        (WARNING: Any given brainstorm idea may be pruned/deleted if the AI deems it to hurt the collective database quality. These Lean brainstorm memories are the working context used to build the final proof.)
+      </div>
+
+      <div className="logs-metrics leanoj-brainstorms__metrics">
+        <div className="metric-card">
+          <span className="metric-value">{summary.acceptedCount}</span>
+          <span className="metric-label">Current Ideas</span>
+        </div>
+        <div className="metric-card">
+          <span className="metric-value">{summary.acceptanceEvents}</span>
+          <span className="metric-label">Accepted Events</span>
+        </div>
+        <div className="metric-card">
+          <span className="metric-value">{summary.prunedCount}</span>
+          <span className="metric-label">Pruned</span>
+        </div>
+        <div className="metric-card">
+          <span className="metric-value">{summary.pruneOperations}</span>
+          <span className="metric-label">Prune Operations</span>
+        </div>
+      </div>
+
+      {BRAINSTORM_PHASES.map((phase) => {
+        const records = summary.grouped[phase.key] || [];
+        const isExpanded = expandedPhase === phase.key;
+        const pruneAddedCount = records.filter((record) => record.pruneAdd).length;
+        const latestActivityTime = Math.max(
+          0,
+          ...records.map((record) => Math.max(dateValue(record.createdAt), dateValue(record.editedAt))),
+        );
+        const latestActivity = latestActivityTime ? formatDate(new Date(latestActivityTime).toISOString()) : '';
+
+        return (
+          <div
+            key={phase.key}
+            className={`brainstorm-card ${isExpanded ? 'expanded' : ''}`}
+          >
+            <div
+              className="brainstorm-card-clickable"
+              onClick={() => setExpandedPhase(isExpanded ? '' : phase.key)}
+              role="button"
+              tabIndex={0}
+              aria-expanded={isExpanded}
+              onKeyDown={(event) => {
+                if (event.key === 'Enter' || event.key === ' ') {
+                  event.preventDefault();
+                  setExpandedPhase(isExpanded ? '' : phase.key);
+                }
+              }}
+            >
+              <div className="brainstorm-card-header">
+                <span className="brainstorm-card-id">{phase.title}</span>
+                <span className={`brainstorm-status ${records.length > 0 ? 'complete' : 'in-progress'}`}>
+                  {isExpanded ? '▼' : '▶'} {pluralize(records.length, 'Idea')}
+                </span>
+              </div>
+
+              <div className="brainstorm-card-prompt">
+                {phase.description}
+              </div>
+
+              <div className="brainstorm-card-meta">
+                <span>{pluralize(records.length, 'current idea')}</span>
+                <span>{pluralize(pruneAddedCount, 'prune-added idea')}</span>
+                <span>Last: {latestActivity || 'N/A'}</span>
+              </div>
+            </div>
+
+            {isExpanded && (
+              <div className="brainstorm-submissions-container">
+                <div className="file-content">
+                  <div className="submissions-list-header">
+                    <h4>Accepted Ideas</h4>
+                  </div>
+
+                  {records.length === 0 ? (
+                    <div className="auto-empty-state">
+                      No accepted ideas in this brainstorm yet.
+                    </div>
+                  ) : (
+                    <div className="submissions-list leanoj-brainstorms__ideas">
+                      {records.map((record) => {
+                        const ideaNumber = sortEvent(record);
+                        const createdAt = formatDate(record.createdAt);
+                        const editedAt = formatDate(record.editedAt);
+                        const meta = [
+                          hasValue(record.submitterIndex) ? `Submitter ${record.submitterIndex}` : '',
+                          editedAt ? `Edited: ${editedAt}` : createdAt,
+                        ].filter(Boolean);
+
+                        return (
+                          <article
+                            key={`${phase.key}-${ideaNumber}-${record.fallbackIndex}`}
+                            className="submission-item leanoj-brainstorms__idea-card"
+                          >
+                            <div className="submission-header leanoj-brainstorms__idea-header">
+                              <span className="submission-number">Idea #{ideaNumber}</span>
+                              <span className="submission-timestamp">
+                                {meta.join(' | ') || phase.title}
+                              </span>
+                              {record.pruneAdd && (
+                                <span className="brainstorm-status complete">Prune Added</span>
+                              )}
+                            </div>
+                            <div className="submission-content">
+                              <pre>{record.content || 'No brainstorm content recorded.'}</pre>
+                              {record.reasoning && (
+                                <div className="leanoj-brainstorms__reasoning">
+                                  <strong>Reasoning</strong>
+                                  <span>{record.reasoning}</span>
+                                </div>
+                              )}
+                            </div>
+                          </article>
+                        );
+                      })}
+                    </div>
+                  )}
+                </div>
+              </div>
+            )}
+          </div>
+        );
+      })}
+    </div>
+  );
+}
diff --git a/frontend/src/components/leanoj/LeanOJInterface.jsx b/frontend/src/components/leanoj/LeanOJInterface.jsx
new file mode 100644
index 0000000..48bc849
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJInterface.jsx
@@ -0,0 +1,170 @@
+import React, { useEffect, useState } from 'react';
+import { persistLeanOJSettings, settingsToLeanOJRequest } from '../../utils/leanojProfiles';
+import LiveActivityFeed from '../LiveActivityFeed';
+import '../autonomous/AutonomousResearch.css';
+
+export default function LeanOJInterface({ // Proof Solver panel: prompt/template inputs, run controls, status, stats, activity feed
+  isRunning,
+  anyWorkflowRunning,
+  status,
+  activity,
+  settings,
+  onSettingsChange,
+  onStart,
+  onStop,
+  onClear,
+  onSkipBrainstorm,
+  onForceBrainstorm,
+}) {
+  const [prompt, setPrompt] = useState(settings.prompt || '');
+  const [leanTemplate, setLeanTemplate] = useState(settings.leanTemplate || '');
+
+  useEffect(() => { // re-sync the local drafts whenever the incoming settings values change
+    setPrompt(settings.prompt || '');
+    setLeanTemplate(settings.leanTemplate || '');
+  }, [settings.prompt, settings.leanTemplate]);
+
+  const persistDraft = (nextPrompt, nextLeanTemplate) => { // passes merged settings through persistLeanOJSettings, then to onSettingsChange
+    const nextSettings = persistLeanOJSettings({
+      ...settings,
+      prompt: nextPrompt,
+      leanTemplate: nextLeanTemplate,
+    });
+    onSettingsChange(nextSettings);
+    return nextSettings;
+  };
+
+  const handlePromptChange = (value) => {
+    setPrompt(value);
+    persistDraft(value, leanTemplate);
+  };
+
+  const handleLeanTemplateChange = (value) => {
+    setLeanTemplate(value);
+    persistDraft(prompt, value);
+  };
+
+  const handleStart = async () => { // persist the current drafts first, then build the start request from them
+    const nextSettings = persistDraft(prompt, leanTemplate);
+    await onStart(settingsToLeanOJRequest(nextSettings, prompt, leanTemplate));
+  };
+
+  const canStart = !isRunning && !anyWorkflowRunning && prompt.trim() && leanTemplate.trim(); // truthy only when idle and both fields are non-blank
+  const disabledReason = anyWorkflowRunning && !isRunning // tooltip text for the disabled Start button
+    ? 'Another workflow is already running.'
+    : 'Enter a problem prompt and Lean template.';
+
+  return (
+    <div className={`autonomous-interface workflow-main-interface ${isRunning ? 'workflow-main-interface--running' : ''}`}>
+      <div className="autonomous-header leanoj-header">
+        <div className="leanoj-header-copy">
+          <h2>Proof Solver</h2>
+          <p className="settings-hint leanoj-proof-solver-intro">
+            Paste a proof problem statement and Lean template. MOTO will build cumulative brainstorm context, allow Lean-verified proof fragments during brainstorming, and keep trying the final Lean 4 submission until Lean verifies it or you stop the run.
+          </p>
+        </div>
+        <div className="autonomous-controls">
+          {!isRunning ? (
+            <button className="btn-start" onClick={handleStart} disabled={!canStart} title={!canStart ? disabledReason : ''}>
+              Start Proof Solver
+            </button>
+          ) : (
+            <>
+              <span className="runtime-indicator" role="status" aria-live="polite" title="Proof Solver is running">
+                <span className="runtime-indicator-dot" aria-hidden="true"></span>
+                <span className="runtime-indicator-label">Running</span>
+              </span>
+              <button className="btn-stop" onClick={onStop}>
+                Stop Proof Solver
+              </button>
+            </>
+          )}
+          <button className="btn-clear" onClick={onSkipBrainstorm} disabled={!isRunning}>
+            Skip Brainstorm
+          </button>
+          <button className="btn-clear" onClick={onForceBrainstorm} disabled={!isRunning}>
+            Force Brainstorm
+          </button>
+          <button className="btn-clear" onClick={onClear} disabled={isRunning}>
+            Clear Progress
+          </button>
+        </div>
+      </div>
+
+      <div className="research-prompt-section">
+        <label htmlFor="leanoj-problem-prompt">Problem Prompt</label>
+        <textarea
+          id="leanoj-problem-prompt"
+          value={prompt}
+          onChange={(event) => handlePromptChange(event.target.value)}
+          disabled={isRunning}
+          rows={6}
+          placeholder="Describe the proof problem, constraints, and what the template expects."
+        />
+      </div>
+
+      <div className="research-prompt-section">
+        <label htmlFor="leanoj-template">Lean Template</label>
+        <textarea
+          id="leanoj-template"
+          value={leanTemplate}
+          onChange={(event) => handleLeanTemplateChange(event.target.value)}
+          disabled={isRunning}
+          rows={14}
+          spellCheck={false}
+          placeholder={'import Mathlib\n\nexample ... := by\n  sorry'}
+        />
+      </div>
+
+      <div className="status-section">
+        <div className="status-tier">
+          <span className="status-label">Current Status:</span>
+          <span className={`status-value ${isRunning ? 'status-running' : 'status-idle'}`}>
+            {isRunning ? status?.phase || 'running' : 'Not Running'}
+          </span>
+        </div>
+        {status?.current_path_decision && (
+          <div className="current-brainstorm">
+            <span className="status-label">Current Path:</span>
+            <p className="brainstorm-prompt">{status.current_path_decision}</p>
+          </div>
+        )}
+        {status?.last_error && (
+          <div className="error-message">{status.last_error}</div>
+        )}
+      </div>
+
+      <div className="stats-section">
+        <div className="stat-item">
+          <span className="stat-value">{status?.accepted_brainstorm_count || 0}</span>
+          <span className="stat-label">Accepted Ideas</span>
+        </div>
+        <div className="stat-item">
+          <span className="stat-value">{(status?.validated_topics || []).length}</span>
+          <span className="stat-label">Validated Topics</span>
+        </div>
+        <div className="stat-item">
+          <span className="stat-value">{(status?.verified_subproofs || []).length}</span>
+          <span className="stat-label">Verified Proof Fragments</span>
+        </div>
+        <div className="stat-item">
+          <span className="stat-value">{status?.final_attempt_count || 0}</span>
+          <span className="stat-label">Final Attempts</span>
+        </div>
+      </div>
+
+      {status?.final_solution && (
+        <div className="status-section">
+          <h3>Verified Proof Solver Submission</h3>
+          <pre className="code-block">{status.final_solution}</pre>
+        </div>
+      )}
+
+      <LiveActivityFeed
+        title="Live Activity"
+        items={activity || []}
+        emptyMessage="No activity yet."
+      />
+    </div>
+  );
+}
diff --git a/frontend/src/components/leanoj/LeanOJLogs.jsx b/frontend/src/components/leanoj/LeanOJLogs.jsx
new file mode 100644
index 0000000..45c78b0
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJLogs.jsx
@@ -0,0 +1,20 @@
+import React from 'react';
+import { autonomousAPI } from '../../services/api';
+import ApiCallLogs from '../ApiCallLogs';
+import '../autonomous/AutonomousResearch.css';
+
+export default function LeanOJLogs() { // wraps the shared ApiCallLogs viewer, scoped to the "leanoj" workflow
+  return (
+    <div className="autonomous-logs">
+      <div className="autonomous-header">
+        <h2>API Call Logs</h2>
+      </div>
+
+      <ApiCallLogs
+        api={autonomousAPI}
+        workflow="leanoj"
+        emptyHint="Run Proof Solver and make model calls to see request/response logs here."
+      />
+    </div>
+  );
+}
diff --git a/frontend/src/components/leanoj/LeanOJMasterProof.css b/frontend/src/components/leanoj/LeanOJMasterProof.css
new file mode 100644
index 0000000..ae23a9f
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJMasterProof.css
@@ -0,0 +1,167 @@
+.leanoj-master-proof { /* root container: padded vertical flex stack */
+  padding: 1.5rem;
+  display: flex;
+  flex-direction: column;
+  gap: 1rem;
+  color: var(--text-primary, #e5e7eb); /* second var() argument is the fallback when the property is unset */
+}
+
+.leanoj-master-proof__header,
+.leanoj-master-proof__panel-header,
+.leanoj-master-proof__actions,
+.leanoj-master-proof__edit-topline { /* shared wrapping flex-row layout */
+  display: flex;
+  gap: 0.75rem;
+  align-items: center;
+  flex-wrap: wrap;
+}
+
+.leanoj-master-proof__header,
+.leanoj-master-proof__panel-header {
+  justify-content: space-between;
+}
+
+.leanoj-master-proof__header h2,
+.leanoj-master-proof__panel h3 {
+  margin: 0;
+}
+
+.leanoj-master-proof__header p {
+  margin: 0.35rem 0 0;
+  color: var(--text-secondary, #9ca3af);
+  max-width: 62rem;
+}
+
+.leanoj-master-proof__actions button,
+.leanoj-master-proof__panel-header button,
+.leanoj-master-proof__edit-card button { /* shared button appearance */
+  border-radius: 0.8rem;
+  border: 1px solid var(--border-default, #374151);
+  background: var(--surface-2, #111827);
+  color: var(--text-primary, #f3f4f6);
+  padding: 0.6rem 0.85rem;
+  cursor: pointer;
+}
+
+.leanoj-master-proof__actions button:disabled { /* disabled styling applies to the actions row only */
+  opacity: 0.55;
+  cursor: not-allowed;
+}
+
+.leanoj-master-proof__stats { /* responsive grid: as many 140px-minimum columns as fit */
+  display: grid;
+  grid-template-columns: repeat(auto-fit, minmax(140px, 1fr));
+  gap: 0.75rem;
+}
+
+.leanoj-master-proof__stat,
+.leanoj-master-proof__panel,
+.leanoj-master-proof__meta,
+.leanoj-master-proof__edit-card,
+.leanoj-master-proof__empty,
+.leanoj-master-proof__error { /* shared bordered, rounded card surface */
+  border: 1px solid var(--border-default, #374151);
+  background: rgba(255, 255, 255, 0.025);
+  border-radius: 1rem;
+}
+
+.leanoj-master-proof__stat {
+  padding: 0.9rem 1rem;
+  display: flex;
+  flex-direction: column;
+  gap: 0.2rem;
+}
+
+.leanoj-master-proof__stat span {
+  font-size: 1.35rem;
+  font-weight: 700;
+}
+
+.leanoj-master-proof__stat label,
+.leanoj-master-proof__meta strong,
+.leanoj-master-proof__panel-header span,
+.leanoj-master-proof__edit-topline { /* small secondary-colored caption text */
+  color: var(--text-secondary, #9ca3af);
+  font-size: 0.88rem;
+}
+
+.leanoj-master-proof__meta {
+  padding: 1rem;
+  display: grid;
+  grid-template-columns: repeat(auto-fit, minmax(260px, 1fr));
+  gap: 0.9rem;
+}
+
+.leanoj-master-proof__meta div {
+  display: flex;
+  flex-direction: column;
+  gap: 0.25rem;
+  min-width: 0;
+}
+
+.leanoj-master-proof__meta span {
+  overflow-wrap: anywhere;
+}
+
+.leanoj-master-proof__panel {
+  padding: 1rem;
+}
+
+.leanoj-master-proof__code,
+.leanoj-master-proof__edit-details pre { /* scrollable code area capped at 70vh; long lines wrap */
+  margin: 0.85rem 0 0;
+  padding: 1rem;
+  border-radius: 0.8rem;
+  background: var(--surface-1, #0b1120);
+  border: 1px solid rgba(148, 163, 184, 0.22);
+  color: var(--text-primary, #e5e7eb);
+  overflow: auto;
+  white-space: pre-wrap;
+  max-height: 70vh;
+  font-size: 0.86rem;
+  line-height: 1.45;
+}
+
+.leanoj-master-proof__edits {
+  display: flex;
+  flex-direction: column;
+  gap: 0.75rem;
+  margin-top: 0.85rem;
+}
+
+.leanoj-master-proof__edit-card {
+  padding: 0.9rem 1rem;
+}
+
+.leanoj-master-proof__edit-card p {
+  margin: 0.65rem 0;
+  color: var(--text-primary, #e5e7eb);
+}
+
+.leanoj-master-proof__badge { /* pill-shaped outlined badge */
+  border-radius: 999px;
+  border: 1px solid rgba(96, 165, 250, 0.45);
+  color: #bfdbfe;
+  padding: 0.25rem 0.6rem;
+}
+
+.leanoj-master-proof__edit-details {
+  display: grid;
+  gap: 0.75rem;
+  margin-top: 0.75rem;
+}
+
+.leanoj-master-proof__edit-details strong {
+  color: var(--text-secondary, #9ca3af);
+}
+
+.leanoj-master-proof__empty,
+.leanoj-master-proof__error {
+  padding: 1rem;
+  color: var(--text-secondary, #9ca3af);
+}
+
+.leanoj-master-proof__error { /* later rule overrides the shared text and border colors for errors */
+  color: #fecaca;
+  border-color: rgba(248, 113, 113, 0.4);
+}
diff --git a/frontend/src/components/leanoj/LeanOJMasterProof.jsx b/frontend/src/components/leanoj/LeanOJMasterProof.jsx
new file mode 100644
index 0000000..1b8457d
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJMasterProof.jsx
@@ -0,0 +1,207 @@
+import React, { useEffect, useMemo, useState } from 'react';
+import { downloadTextFile } from '../../utils/downloadHelpers';
+import './LeanOJMasterProof.css';
+
+function formatDate(isoString) {
+  // Format a timestamp for display; missing input is shown as 'Unknown'.
+  if (!isoString) return 'Unknown';
+  const parsed = new Date(isoString);
+  // Unparseable input yields an Invalid Date rather than an exception, so
+  // check the timestamp explicitly and fall back to the raw value.
+  return Number.isNaN(parsed.getTime()) ? isoString : parsed.toLocaleString();
+}
+
+function formatNumber(value) {
+  const parsed = Number(value || 0); // falsy input (null, undefined, '') counts as zero
+  return !Number.isFinite(parsed) ? '0' : parsed.toLocaleString(); // NaN and Infinity render as '0'
+}
+
+function metadataValue(metadata, key, fallback = 'N/A') {
+  const raw = metadata?.[key];
+  // Only undefined, null and '' are treated as missing; 0 and false are kept.
+  return [undefined, null, ''].includes(raw) ? fallback : raw;
+}
+
+export default function LeanOJMasterProof({ api, status, refreshToken = 0 }) {
+  const [draft, setDraft] = useState(null);
+  const [edits, setEdits] = useState([]);
+  const [totalEdits, setTotalEdits] = useState(0);
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState('');
+  const [showFullProof, setShowFullProof] = useState(false);
+  const [expandedEditIndex, setExpandedEditIndex] = useState(null);
+
+  const loadMasterProof = async () => { // fetch the draft and its edit history, updating loading/error state
+    try {
+      setLoading(true);
+      setError(''); // clear any message left by a previous failed load
+      const [draftResponse, editsResponse] = await Promise.all([ // both requests run concurrently; a rejection from either lands in catch
+        api.getMasterProof(),
+        api.getMasterProofEdits(75), // presumably the maximum number of edit records to return; confirm against the API client
+      ]);
+      setDraft(draftResponse || null);
+      setEdits(editsResponse?.edits || []);
+      setTotalEdits(editsResponse?.total_edits || 0);
+    } catch (err) {
+      setError(err.message || 'Failed to load Proof Solver master proof draft');
+    } finally {
+      setLoading(false); // runs on success and failure alike
+    }
+  };
+
+  useEffect(() => {
+    loadMasterProof();
+  }, [refreshToken, status?.master_proof_version, status?.master_proof_hash]); // reload on mount and whenever the token, version or hash changes
+
+  const metadata = draft?.metadata || {}; // always an object, so reads below are safe before the first load
+  const proofContent = draft?.content || '';
+  const proofPreview = useMemo(() => { // text shown in the viewer: full content, or the first 20000 characters plus a notice
+    if (showFullProof || proofContent.length <= 20000) return proofContent;
+    return `${proofContent.slice(0, 20000)}\n\n-- Preview truncated in UI. Download the .lean file or expand full proof to inspect all ${formatNumber(proofContent.length)} characters.`;
+  }, [proofContent, showFullProof]);
+
+  const handleDownload = () => { // passes the complete proof, not the truncated preview, to downloadTextFile
+    if (!proofContent) return;
+    downloadTextFile(proofContent, `leanoj_master_proof_${metadataValue(metadata, 'version', 'draft')}.lean`); // file name carries the draft version, or 'draft' when none is recorded
+  };
+
+  return (
+    <div className="leanoj-master-proof">
+      <div className="leanoj-master-proof__header">
+        <div>
+          <h2>Master Proof Draft</h2>
+          <p>
+            Inspect the durable Proof Solver draft that the final solver edits with exact-string operations before Lean verification.
+          </p>
+        </div>
+        <div className="leanoj-master-proof__actions">
+          <button type="button" onClick={loadMasterProof} disabled={loading}>
+            {loading ? 'Refreshing...' : 'Refresh'}
+          </button>
+          <button type="button" onClick={handleDownload} disabled={!proofContent}>
+            Download .lean
+          </button>
+        </div>
+      </div>
+
+      {loading && <div className="leanoj-master-proof__empty">Loading master proof draft...</div>}
+      {!loading && error && <div className="leanoj-master-proof__error">{error}</div>}
+
+      {!loading && !error && (
+        <>
+          <div className="leanoj-master-proof__stats">
+            <div className="leanoj-master-proof__stat">
+              <span>{metadataValue(metadata, 'version', 0)}</span>
+              <label>Version</label>
+            </div>
+            <div className="leanoj-master-proof__stat">
+              <span>{formatNumber(metadata?.line_count)}</span>
+              <label>Lines</label>
+            </div>
+            <div className="leanoj-master-proof__stat">
+              <span>{formatNumber(metadata?.char_count)}</span>
+              <label>Characters</label>
+            </div>
+            <div className="leanoj-master-proof__stat">
+              <span>{formatNumber(totalEdits)}</span>
+              <label>Edit Records</label>
+            </div>
+          </div>
+
+          <div className="leanoj-master-proof__meta">
+            <div>
+              <strong>Session</strong>
+              <span>{draft?.session_id || status?.session_id || 'No session loaded'}</span>
+            </div>
+            <div>
+              <strong>Hash</strong>
+              <span>{metadataValue(metadata, 'sha256')}</span>
+            </div>
+            <div>
+              <strong>Last Edit</strong>
+              <span>{metadataValue(metadata, 'last_edit_summary', 'No master proof edit recorded yet.')}</span>
+            </div>
+            {metadata?.last_stuck_reason && (
+              <div>
+                <strong>Last Stuck Reason</strong>
+                <span>{metadata.last_stuck_reason}</span>
+              </div>
+            )}
+          </div>
+
+          {!draft?.exists ? (
+            <div className="leanoj-master-proof__empty">
+              No master proof draft exists yet. Start or resume Proof Solver and enter the final proof loop to initialize it.
+            </div>
+          ) : (
+            <section className="leanoj-master-proof__panel">
+              <div className="leanoj-master-proof__panel-header">
+                <h3>Current Master Proof</h3>
+                {proofContent.length > 20000 && (
+                  <button type="button" onClick={() => setShowFullProof((value) => !value)}>
+                    {showFullProof ? 'Show Preview' : 'Show Full Proof'}
+                  </button>
+                )}
+              </div>
+              <pre className="leanoj-master-proof__code">{proofPreview}</pre>
+            </section>
+          )}
+
+          <section className="leanoj-master-proof__panel">
+            <div className="leanoj-master-proof__panel-header">
+              <h3>Recent Edit History</h3>
+              <span>{edits.length} shown</span>
+            </div>
+
+            {edits.length === 0 ? (
+              <div className="leanoj-master-proof__empty">No edit history recorded yet.</div>
+            ) : (
+              <div className="leanoj-master-proof__edits">
+                {[...edits].reverse().map((edit, index) => {
+                  const key = `${edit.master_proof_version || 'v'}-${edit.created_at || index}-${index}`;
+                  const expanded = expandedEditIndex === index;
+                  return (
+                    <article key={key} className="leanoj-master-proof__edit-card">
+                      <div className="leanoj-master-proof__edit-topline">
+                        <span className="leanoj-master-proof__badge">{edit.action || 'edit'}</span>
+                        {edit.operation && <span>{edit.operation}</span>}
+                        <span>v{edit.master_proof_version || '?'}</span>
+                        <span>{formatDate(edit.created_at)}</span>
+                      </div>
+                      <p>{edit.reasoning || edit.error_summary || edit.stuck_reason || 'No edit summary provided.'}</p>
+                      <button type="button" onClick={() => setExpandedEditIndex(expanded ? null : index)}>
+                        {expanded ? 'Hide Details' : 'Show Details'}
+                      </button>
+                      {expanded && (
+                        <div className="leanoj-master-proof__edit-details">
+                          {edit.old_string_preview && (
+                            <div>
+                              <strong>Old String Preview</strong>
+                              <pre>{edit.old_string_preview}</pre>
+                            </div>
+                          )}
+                          {edit.new_string_preview && (
+                            <div>
+                              <strong>New String Preview</strong>
+                              <pre>{edit.new_string_preview}</pre>
+                            </div>
+                          )}
+                          {edit.error_summary && (
+                            <div>
+                              <strong>Error</strong>
+                              <pre>{edit.error_summary}</pre>
+                            </div>
+                          )}
+                        </div>
+                      )}
+                    </article>
+                  );
+                })}
+              </div>
+            )}
+          </section>
+        </>
+      )}
+    </div>
+  );
+}
diff --git a/frontend/src/components/leanoj/LeanOJMathematicalProofs.jsx b/frontend/src/components/leanoj/LeanOJMathematicalProofs.jsx
new file mode 100644
index 0000000..a77f667
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJMathematicalProofs.jsx
@@ -0,0 +1,312 @@
+import React, { useEffect, useMemo, useState } from 'react';
+import { downloadTextFile } from '../../utils/downloadHelpers';
+import '../autonomous/MathematicalProofs.css';
+
+function formatDate(isoString) {
+  // Format a timestamp for display; missing input is shown as 'Unknown'.
+  if (!isoString) return 'Unknown';
+  const parsed = new Date(isoString);
+  // Unparseable input yields an Invalid Date rather than an exception, so
+  // check the timestamp explicitly and fall back to the raw value.
+  return Number.isNaN(parsed.getTime()) ? isoString : parsed.toLocaleString();
+}
+
+function truncate(text, maxLength = 220) { // shorten text to at most maxLength characters plus a '...' marker
+  if (!text) return ''; // null, undefined and '' all become an empty string
+  return text.length > maxLength ? `${text.slice(0, maxLength)}...` : text; // text at or under the limit is returned unchanged
+}
+
+function getProofBadge(proof) {
+  // Pick the card/badge styling and the label for a proof.
+  // Recognised novelty tiers mapped to [css class, label]; the one class name
+  // serves as both cardClass and badgeClass.
+  const tierStyles = {
+    major_mathematical_discovery: ['platinum', 'Major Mathematical Discovery'],
+    mathematical_discovery: ['gold', 'Minor Mathematical Discovery'],
+    novel_variant: ['silver', 'Novel Reformulation'],
+    novel_formulation: ['bronze', 'Novel Formalization'],
+  };
+  const tier = proof.novelty_tier;
+  // Own-property check on a string key, so only exact tier names match.
+  const hasTier = typeof tier === 'string' && Object.prototype.hasOwnProperty.call(tierStyles, tier);
+  let style = hasTier ? tierStyles[tier] : null;
+  // Without a recognised tier, fall back to the boolean novel flag.
+  if (!style) style = proof.novel ? ['gold', 'Novel Proof'] : ['known', 'Known Proof'];
+  const [cssClass, label] = style;
+  return { cardClass: cssClass, badgeClass: cssClass, label };
+}
+
+function getStatusLabel(status) {
+  if (!status?.session_id) return 'No Proof Solver Session Loaded'; // no session takes precedence over every other state
+  const { phase, is_running: running } = status;
+  if (phase === 'verified') return 'Final Submission Verified'; // verified wins even while is_running is set
+  return running ? `Proof Solver Running: ${phase || 'running'}` : `Proof Solver ${phase || 'idle'}`;
+}
+
+function formatSolverName(solver) { // display name for a solver; a missing value becomes 'Proof Solver'
+  return String(solver || 'Proof Solver').replace(/^LeanOJ\b/, 'Proof Solver'); // swap a leading whole-word 'LeanOJ' for 'Proof Solver'
+}
+
+export default function LeanOJMathematicalProofs({ api, status, refreshToken = 0 }) {
+  const [proofs, setProofs] = useState([]);
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState('');
+  const [filter, setFilter] = useState('all');
+  const [expandedProofId, setExpandedProofId] = useState(null);
+
+  const loadProofs = async () => { // fetch the proof list and update loading/error state
+    try {
+      setLoading(true);
+      setError('');
+      const response = await api.getProofs();
+      setProofs(response?.proofs || []); // tolerate an empty or null response body
+    } catch (err) {
+      if (err?.status === 404) { // a 404 is shown as an empty list rather than an error
+        setProofs([]);
+        setError('');
+        return; // the finally block below still clears the loading flag
+      }
+      setError(err?.message || 'Failed to load Proof Solver proofs'); // a non-object rejection falls back to the default text
+    } finally {
+      setLoading(false);
+    }
+  };
+
+  useEffect(() => {
+    loadProofs();
+  }, [refreshToken]); // reload on mount and whenever refreshToken changes
+
+  const counts = useMemo(() => ({ // totals displayed in the header and on the filter buttons
+    total: proofs.length,
+    final: proofs.filter((proof) => proof.proof_kind === 'final').length,
+    subproof: proofs.filter((proof) => proof.proof_kind === 'subproof').length,
+    novel: proofs.filter((proof) => proof.novel).length, // based on the boolean flag, independent of novelty_tier
+    majorDiscovery: proofs.filter((proof) => proof.novelty_tier === 'major_mathematical_discovery').length,
+    discovery: proofs.filter((proof) => proof.novelty_tier === 'mathematical_discovery').length,
+    variant: proofs.filter((proof) => proof.novelty_tier === 'novel_variant').length,
+    formulation: proofs.filter((proof) => proof.novelty_tier === 'novel_formulation').length,
+    known: proofs.filter((proof) => !proof.novel).length, // complement of `novel`
+  }), [proofs]); // recomputed only when the proofs array changes
+
+  const visibleProofs = useMemo(() => {
+    // Proofs that pass the currently selected filter.
+    // One predicate per filter name; the four tier filters share a comparison
+    // against novelty_tier. Any other value (e.g. 'all') keeps every proof.
+    const matchesTier = (proof) => proof.novelty_tier === filter;
+    const predicates = new Map([
+      ['novel', (proof) => proof.novel],
+      ['major_mathematical_discovery', matchesTier],
+      ['mathematical_discovery', matchesTier],
+      ['novel_variant', matchesTier],
+      ['novel_formulation', matchesTier],
+      ['known', (proof) => !proof.novel],
+      ['final', (proof) => proof.proof_kind === 'final'],
+      ['subproof', (proof) => proof.proof_kind === 'subproof'],
+    ]);
+    const predicate = predicates.get(filter);
+    return predicate ? proofs.filter(predicate) : proofs;
+  }, [filter, proofs]);
+
+  const handleDownloadLean = (proof) => { // hand the proof's Lean source to downloadTextFile
+    if (!proof.lean_code) return; // nothing to download
+    downloadTextFile(proof.lean_code, `${proof.theorem_name || proof.proof_id}.lean`); // named after the theorem, else the proof id
+  };
+
+  return (
+    <div className="math-proofs-view">
+      <div className="math-proofs-header">
+        <div>
+          <h2>Mathematical Proofs</h2>
+          <p>
+            Verified Lean 4 proofs from the active Proof Solver run, including brainstorm proof fragments and the final solved submission.
+          </p>
+        </div>
+
+        <div className="math-proofs-status-group">
+          <span className={`math-proofs-status ${status?.phase === 'verified' ? 'ready' : 'pending'}`}>
+            {getStatusLabel(status)}
+          </span>
+          <span className="math-proofs-count">
+            {counts.novel} novel / {counts.total} total
+          </span>
+          <button className="math-proofs-refresh" onClick={loadProofs}>
+            Refresh
+          </button>
+        </div>
+      </div>
+
+      <div className="math-proofs-toolbar">
+        <div className="math-proofs-filters">
+          <button
+            className={`math-proofs-filter ${filter === 'novel' ? 'active' : ''}`}
+            onClick={() => setFilter('novel')}
+          >
+            All Novel ({counts.novel})
+          </button>
+          <button
+            className={`math-proofs-filter math-proofs-filter--platinum ${filter === 'major_mathematical_discovery' ? 'active' : ''}`}
+            onClick={() => setFilter('major_mathematical_discovery')}
+          >
+            Major Discovery ({counts.majorDiscovery})
+          </button>
+          <button
+            className={`math-proofs-filter math-proofs-filter--gold ${filter === 'mathematical_discovery' ? 'active' : ''}`}
+            onClick={() => setFilter('mathematical_discovery')}
+          >
+            Minor Mathematical Discovery ({counts.discovery})
+          </button>
+          <button
+            className={`math-proofs-filter math-proofs-filter--silver ${filter === 'novel_variant' ? 'active' : ''}`}
+            onClick={() => setFilter('novel_variant')}
+          >
+            Reformulation ({counts.variant})
+          </button>
+          <button
+            className={`math-proofs-filter math-proofs-filter--bronze ${filter === 'novel_formulation' ? 'active' : ''}`}
+            onClick={() => setFilter('novel_formulation')}
+          >
+            Formalization ({counts.formulation})
+          </button>
+          <button
+            className={`math-proofs-filter ${filter === 'known' ? 'active' : ''}`}
+            onClick={() => setFilter('known')}
+          >
+            Known ({counts.known})
+          </button>
+          <button
+            className={`math-proofs-filter ${filter === 'all' ? 'active' : ''}`}
+            onClick={() => setFilter('all')}
+          >
+            All Verified ({counts.total})
+          </button>
+          <button
+            className={`math-proofs-filter math-proofs-filter--gold ${filter === 'final' ? 'active' : ''}`}
+            onClick={() => setFilter('final')}
+          >
+            Final Verified Submissions ({counts.final})
+          </button>
+          <button
+            className={`math-proofs-filter math-proofs-filter--silver ${filter === 'subproof' ? 'active' : ''}`}
+            onClick={() => setFilter('subproof')}
+          >
+            Verified Proof Fragments ({counts.subproof})
+          </button>
+        </div>
+      </div>
+
+      {loading && <div className="math-proofs-empty">Loading Proof Solver proofs...</div>}
+      {!loading && error && <div className="math-proofs-error">{error}</div>}
+
+      {!loading && !error && visibleProofs.length === 0 && (
+        <div className="math-proofs-empty">
+          {proofs.length === 0
+            ? 'No Proof Solver proofs yet. This tab will populate as brainstorm proof fragments and final submissions pass Lean 4.'
+            : 'No Proof Solver proofs match the selected filter.'}
+        </div>
+      )}
+
+      {!loading && !error && visibleProofs.length > 0 && (
+        <div className="math-proofs-list">
+          {visibleProofs.map((proof) => {
+            const isExpanded = expandedProofId === proof.library_id;
+            const badge = getProofBadge(proof);
+            return (
+              <article key={proof.library_id} className={`math-proof-card ${badge.cardClass}`}>
+                <div className="math-proof-card-header">
+                  <div>
+                    <div className="math-proof-card-topline">
+                      <span className={`math-proof-badge ${badge.badgeClass}`}>
+                        {badge.label}
+                      </span>
+                      <span className="math-proof-source">
+                        {proof.session_id}
+                      </span>
+                    </div>
+                    <h3>{proof.theorem_statement}</h3>
+                    <p className="math-proof-summary">
+                      {truncate(proof.source_title || proof.user_prompt || 'Lean 4 verified this Proof Solver proof.')}
+                    </p>
+                  </div>
+
+                  <div className="math-proof-card-actions">
+                    <button
+                      type="button"
+                      className="math-proof-download math-proof-download--compact"
+                      onClick={() => handleDownloadLean(proof)}
+                      disabled={!proof.lean_code}
+                    >
+                      Download .lean
+                    </button>
+                    <button
+                      className="math-proof-expand"
+                      onClick={() => setExpandedProofId(isExpanded ? null : proof.library_id)}
+                    >
+                      {isExpanded ? 'Hide Details' : 'View Details'}
+                    </button>
+                  </div>
+                </div>
+
+                <div className="math-proof-meta">
+                  <span>Solver: {formatSolverName(proof.solver)}</span>
+                  <span>Attempts: {proof.attempt_count || 0}</span>
+                  <span>Verified: {formatDate(proof.created_at)}</span>
+                </div>
+
+                {isExpanded && (
+                  <div className="math-proof-details">
+                    <div className="math-proof-actions">
+                      <button
+                        type="button"
+                        className="math-proof-download"
+                        onClick={() => handleDownloadLean(proof)}
+                        disabled={!proof.lean_code}
+                      >
+                        Download .lean
+                      </button>
+                    </div>
+
+                    <div className="math-proof-detail-block">
+                      <strong>Proof Work</strong>
+                      <div>{proof.theorem_name || proof.proof_id}</div>
+                    </div>
+
+                    {proof.shared_proof_id && (
+                      <div className="math-proof-detail-block">
+                        <strong>Shared Proof ID</strong>
+                        <div>{proof.shared_proof_id}</div>
+                      </div>
+                    )}
+
+                    {proof.novelty_reasoning && (
+                      <div className="math-proof-detail-block">
+                        <strong>Novelty Reasoning</strong>
+                        <div>{proof.novelty_reasoning}</div>
+                      </div>
+                    )}
+
+                    <div className="math-proof-detail-block">
+                      <strong>Proof Solver Proof Kind</strong>
+                      <div>{proof.proof_kind === 'final' ? 'Final verified submission' : 'Verified proof fragment'}</div>
+                    </div>
+
+                    {proof.role && (
+                      <div className="math-proof-detail-block">
+                        <strong>Proof Fragment Role</strong>
+                        <div>{proof.role}</div>
+                      </div>
+                    )}
+
+                    <div className="math-proof-detail-block">
+                      <strong>Lean 4 Code</strong>
+                      <pre className="math-proof-code">{proof.lean_code}</pre>
+                    </div>
+                  </div>
+                )}
+              </article>
+            );
+          })}
+        </div>
+      )}
+    </div>
+  );
+}
diff --git a/frontend/src/components/leanoj/LeanOJProofLibrary.jsx b/frontend/src/components/leanoj/LeanOJProofLibrary.jsx
new file mode 100644
index 0000000..a2b3eb0
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJProofLibrary.jsx
@@ -0,0 +1,352 @@
+import React, { useEffect, useMemo, useState } from 'react';
+import { downloadTextFile } from '../../utils/downloadHelpers';
+import '../autonomous/FinalAnswerLibrary.css';
+import '../autonomous/ProofLibrary.css';
+
+function formatDate(isoString) {
+  // Format a timestamp for display; missing input is shown as 'N/A'.
+  if (!isoString) return 'N/A';
+  const parsed = new Date(isoString);
+  // Unparseable input yields an Invalid Date rather than an exception, so
+  // check the timestamp explicitly and fall back to the raw value.
+  return Number.isNaN(parsed.getTime()) ? isoString : parsed.toLocaleString();
+}
+
+function truncate(text, maxLength = 260) { // shorten text to at most maxLength characters plus a '...' marker
+  if (!text) return ''; // null, undefined and '' all become an empty string
+  return text.length > maxLength ? `${text.slice(0, maxLength)}...` : text; // text at or under the limit is returned unchanged
+}
+
+function getProofBadge(proof) {
+  const isFinal = proof.proof_kind === 'final'; // every kind other than 'final' is presented as a fragment
+  const cssClass = isFinal ? 'proof-badge--gold' : 'proof-badge--silver';
+  const cardClass = isFinal ? 'proof-card--gold' : 'proof-card--silver';
+  return { cssClass, cardClass, label: isFinal ? 'Final Verified Submission' : 'Verified Proof Fragment' };
+}
+
+function formatSolverName(solver) { // display name for a solver; a missing value becomes 'Proof Solver'
+  return String(solver || 'Proof Solver').replace(/^LeanOJ\b/, 'Proof Solver'); // swap a leading whole-word 'LeanOJ' for 'Proof Solver'
+}
+
+export default function LeanOJProofLibrary({ api, refreshToken = 0 }) {
+  const [proofs, setProofs] = useState([]);
+  const [sessions, setSessions] = useState([]);
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState('');
+  const [expandedId, setExpandedId] = useState(null);
+  const [expandedProof, setExpandedProof] = useState(null);
+  const [loadingContentId, setLoadingContentId] = useState(null);
+  const [searchTerm, setSearchTerm] = useState('');
+  const [filterKind, setFilterKind] = useState('all');
+
+  const loadProofLibrary = async () => {
+    try {
+      setLoading(true);
+      setError('');
+      const response = await api.getProofLibrary(true);
+      setProofs(response.proofs || []);
+      setSessions(response.sessions || []);
+    } catch (err) {
+      if (err.status === 404) {
+        setProofs([]);
+        setSessions([]);
+        setError('');
+        return;
+      }
+      setError(err.message || 'Failed to load Proof Solver proof works library');
+    } finally {
+      setLoading(false);
+    }
+  };
+
+  useEffect(() => {
+    loadProofLibrary();
+  }, [refreshToken]);
+
+  const filteredProofs = useMemo(() => {
+    const lowerSearch = searchTerm.trim().toLowerCase();
+    return proofs.filter((proof) => {
+      const kindMatches = filterKind === 'all' || proof.proof_kind === filterKind;
+      if (!kindMatches) return false;
+      if (!lowerSearch) return true;
+      return (
+        (proof.theorem_name || '').toLowerCase().includes(lowerSearch) ||
+        (proof.theorem_statement || '').toLowerCase().includes(lowerSearch) ||
+        (proof.source_title || '').toLowerCase().includes(lowerSearch) ||
+        (proof.user_prompt || '').toLowerCase().includes(lowerSearch) ||
+        (proof.session_id || '').toLowerCase().includes(lowerSearch)
+      );
+    });
+  }, [filterKind, proofs, searchTerm]);
+
+  const proofsBySession = useMemo(() => {
+    const map = new Map();
+    for (const proof of filteredProofs) {
+      const sessionId = proof.session_id || 'unknown';
+      if (!map.has(sessionId)) map.set(sessionId, []);
+      map.get(sessionId).push(proof);
+    }
+    return map;
+  }, [filteredProofs]);
+
+  const visibleSessions = useMemo(() => {
+    return sessions.filter((session) => proofsBySession.has(session.session_id));
+  }, [proofsBySession, sessions]);
+
+  const counts = useMemo(() => ({
+    total: proofs.length,
+    final: proofs.filter((proof) => proof.proof_kind === 'final').length,
+    subproof: proofs.filter((proof) => proof.proof_kind === 'subproof').length,
+  }), [proofs]);
+
+  const handleExpand = async (proof) => {
+    const id = proof.library_id || `${proof.session_id}:${proof.proof_id}`;
+    if (expandedId === id) {
+      setExpandedId(null);
+      setExpandedProof(null);
+      return;
+    }
+
+    setExpandedId(id);
+    setLoadingContentId(id);
+    try {
+      const fullProof = await api.getLibraryProof(proof.session_id, proof.proof_id);
+      setExpandedProof(fullProof);
+    } catch {
+      setExpandedProof(proof);
+    } finally {
+      setLoadingContentId(null);
+    }
+  };
+
+  const handleDownloadLean = async (proof, event) => {
+    event?.stopPropagation();
+
+    let proofForDownload = proof;
+    let leanCode = proof.lean_code || '';
+    if (!leanCode && proof.session_id && proof.proof_id) {
+      try {
+        proofForDownload = await api.getLibraryProof(proof.session_id, proof.proof_id);
+        leanCode = proofForDownload.lean_code || '';
+      } catch {
+        return;
+      }
+    }
+
+    if (!leanCode) return;
+    downloadTextFile(leanCode, `${proofForDownload.theorem_name || proof.theorem_name || proof.proof_id}.lean`);
+  };
+
+  if (loading) {
+    return (
+      <div className="final-answer-library proof-library">
+        <div className="library-loading">
+          <span className="library-loading__icon">&#x21BB;</span>
+          <span className="library-loading__text">Loading Proof Solver proof works...</span>
+        </div>
+      </div>
+    );
+  }
+
+  if (error) {
+    return (
+      <div className="final-answer-library proof-library">
+        <div className="error-message">
+          <span>&#x26A0;</span>
+          <p>{error}</p>
+          <button className="retry-button" onClick={loadProofLibrary}>
+            Retry
+          </button>
+        </div>
+      </div>
+    );
+  }
+
+  return (
+    <div className="final-answer-library proof-library">
+      <div className="library-header">
+        <h2>Your Completed Proof Works Library</h2>
+        <p>
+          Browse verified Proof Solver final submissions and brainstorm proof fragments saved across proof-solver sessions.
+        </p>
+        <div className="library-stats">
+          <span className="stat-badge">{counts.total} Proof Work{counts.total !== 1 ? 's' : ''}</span>
+          <span className="stat-badge">{counts.final} Final Submission{counts.final !== 1 ? 's' : ''}</span>
+          <span className="stat-badge">{counts.subproof} Proof Fragment{counts.subproof !== 1 ? 's' : ''}</span>
+        </div>
+      </div>
+
+      <div className="library-controls">
+        <input
+          className="search-input"
+          type="text"
+          placeholder="Search by theorem, problem, session, or Proof Solver source..."
+          value={searchTerm}
+          onChange={(event) => setSearchTerm(event.target.value)}
+        />
+        <div className="filter-buttons">
+          <button className={filterKind === 'all' ? 'active' : ''} onClick={() => setFilterKind('all')}>
+            All
+          </button>
+          <button className={filterKind === 'final' ? 'active' : ''} onClick={() => setFilterKind('final')}>
+            Final
+          </button>
+          <button className={filterKind === 'subproof' ? 'active' : ''} onClick={() => setFilterKind('subproof')}>
+            Proof Fragments
+          </button>
+        </div>
+      </div>
+
+      {filteredProofs.length === 0 ? (
+        <div className="fal-empty-state">
+          <span className="empty-icon">&#x1D7D9;</span>
+          <h3>{proofs.length === 0 ? 'No Proof Solver Proofs Yet' : 'No Proof Solver Proof Works Found'}</h3>
+          <p>
+            {proofs.length === 0
+              ? 'No Proof Solver proofs yet. Completed final submissions and verified brainstorm proof fragments will appear here.'
+              : 'No proof works match your search criteria.'}
+          </p>
+        </div>
+      ) : (
+        <div className="run-history-groups">
+          {visibleSessions.map((session) => {
+            const sessionProofs = proofsBySession.get(session.session_id) || [];
+            return (
+              <div key={session.session_id} className="run-history-group">
+                <div className="run-history-group-header">
+                  <div className="run-history-group-heading">
+                    <h3 className="run-history-group-title">{session.user_prompt}</h3>
+                    <p className="run-history-group-subtitle">
+                      {sessionProofs.length} proof work{sessionProofs.length !== 1 ? 's' : ''} - {formatDate(session.updated_at)}
+                    </p>
+                  </div>
+                  <div className="run-history-group-badges">
+                    {session.is_current && (
+                      <span className="run-history-group-badge run-history-group-badge--current">
+                        Current Session
+                      </span>
+                    )}
+                    {session.phase && (
+                      <span className="run-history-group-badge">{session.phase}</span>
+                    )}
+                  </div>
+                </div>
+
+                <div className="run-history-group-body">
+                  <div className="answer-list">
+                    {sessionProofs.map((proof) => {
+                      const id = proof.library_id || `${proof.session_id}:${proof.proof_id}`;
+                      const isExpanded = expandedId === id;
+                      const badge = getProofBadge(proof);
+
+                      return (
+                        <div key={id} className={`answer-card proof-card ${isExpanded ? 'expanded' : ''} ${badge.cardClass}`}>
+                          <div className="answer-header" onClick={() => handleExpand(proof)}>
+                            <div className="answer-title-row">
+                              <h4 className="answer-title proof-title">
+                                {proof.theorem_name || proof.proof_id}
+                              </h4>
+                              <div className="proof-card-actions">
+                                <button
+                                  type="button"
+                                  className="proof-header-download"
+                                  onClick={(event) => handleDownloadLean(proof, event)}
+                                >
+                                  Download .lean
+                                </button>
+                                <button className="expand-button">
+                                  {isExpanded ? 'Hide' : 'View'}
+                                </button>
+                              </div>
+                            </div>
+
+                            <div className="answer-metadata">
+                              <span className={`format-badge ${badge.cssClass}`}>
+                                {badge.label}
+                              </span>
+                              <span className="word-count">
+                                {formatSolverName(proof.solver)}
+                              </span>
+                              <span className="word-count">
+                                {proof.attempt_count || 0} attempt{(proof.attempt_count || 0) !== 1 ? 's' : ''}
+                              </span>
+                            </div>
+
+                            <p className="proof-statement">
+                              {truncate(proof.theorem_statement, 320)}
+                            </p>
+
+                            {proof.source_title && (
+                              <p className="answer-prompt">
+                                <strong>Source:</strong> {truncate(proof.source_title, 220)}
+                              </p>
+                            )}
+
+                            <div className="answer-footer-info">
+                              <span className="completion-date">
+                                Verified: {formatDate(proof.created_at)}
+                              </span>
+                            </div>
+                          </div>
+
+                          {isExpanded && (
+                            <div className="answer-content">
+                              {loadingContentId === id ? (
+                                <div className="library-loading" style={{ padding: '20px' }}>
+                                  <span className="library-loading__icon">&#x21BB;</span>
+                                  <span className="library-loading__text">Loading proof work details...</span>
+                                </div>
+                              ) : expandedProof ? (
+                                <div className="proof-expanded-content">
+                                  <div className="proof-detail-section">
+                                    <h4>Proof Work</h4>
+                                    <p>{expandedProof.theorem_statement}</p>
+                                  </div>
+
+                                  {expandedProof.lean_template && (
+                                    <div className="proof-detail-section">
+                                      <h4>Original Proof Solver Template</h4>
+                                      <pre className="proof-code-block">{expandedProof.lean_template}</pre>
+                                    </div>
+                                  )}
+
+                                  {expandedProof.lean_code && (
+                                    <div className="proof-detail-section">
+                                      <h4>Lean 4 Source Code</h4>
+                                      <pre className="proof-code-block proof-lean-code">{expandedProof.lean_code}</pre>
+                                    </div>
+                                  )}
+
+                                  <div className="quick-download-buttons">
+                                    {expandedProof.lean_code && (
+                                      <button
+                                        className="quick-download-raw"
+                                        onClick={() => handleDownloadLean(expandedProof)}
+                                      >
+                                        Download .lean
+                                      </button>
+                                    )}
+                                  </div>
+                                </div>
+                              ) : null}
+                            </div>
+                          )}
+                        </div>
+                      );
+                    })}
+                  </div>
+                </div>
+              </div>
+            );
+          })}
+        </div>
+      )}
+
+      <div className="library-footer">
+        <button className="refresh-button" onClick={loadProofLibrary}>
+          Refresh Proof Works Library
+        </button>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/leanoj/LeanOJSettings.jsx b/frontend/src/components/leanoj/LeanOJSettings.jsx
new file mode 100644
index 0000000..a5a8bc1
--- /dev/null
+++ b/frontend/src/components/leanoj/LeanOJSettings.jsx
@@ -0,0 +1,840 @@
+import React, { useEffect, useState } from 'react';
+import { api, openRouterAPI } from '../../services/api';
+import {
+  computeOpenRouterAutoSettings,
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+  DEFAULT_OPENROUTER_REASONING_EFFORT,
+  findOpenRouterModel,
+  getProviderNames,
+  getReasoningSupportInfo,
+  hasEndpointMetadata,
+  normalizeOpenRouterReasoningEffort,
+  OPENROUTER_REASONING_EFFORT_OPTIONS,
+} from '../../utils/openRouterSelection';
+import {
+  LEANOJ_PROFILES_STORAGE_KEY,
+  LEANOJ_RECOMMENDED_PROFILES,
+  applyLeanOJProfileSelection,
+  persistLeanOJSettings,
+} from '../../utils/leanojProfiles';
+import HelpTooltip from '../HelpTooltip';
+import HighlightedModelsSidebar from '../HighlightedModelsSidebar';
+import RawSettingsEditor from '../RawSettingsEditor';
+import '../settings-common.css';
+
+const RAW_VIEW_EXIT_WARNING = 'Switching back to the GUI view will restore your last GUI settings/profile and discard raw-only changes. Continue?'; // confirm() text shown when the raw view is switched off
+const formatRawSettings = (value) => JSON.stringify(value, null, 2); // serialize settings as JSON with 2-space indentation
+const SUPERCHARGE_TOOLTIP = 'Supercharge makes this role generate 4 full answer attempts, then run a 5th same-model call to choose or synthesize the best final answer. It uses 5x the API calls, so it is about 5x slower and 5x more costly, but can produce more intelligent answers.'; // body text of the Supercharge HelpTooltip
+
+const ROLE_EDITOR_GROUPS = [ // each entry: group key, display title, and the role keys listed under it
+  { key: 'validator', title: 'Validator', roleKeys: ['topic_validator', 'brainstorm_validator'] },
+  { key: 'final_solver', title: 'Final Proof Solver', roleKeys: ['final_solver'] },
+];
+
+// Drop the submitter-only `submitterId` field; every other field is returned as the role config.
+const toRoleConfig = ({ submitterId: _submitterId, ...roleFields } = {}) => (
+  roleFields
+);
+
+/**
+ * Provider, model, host-provider, reasoning-effort and LM Studio fallback pickers for one role config.
+ * Controlled component: every control calls `onChange` with a full replacement config object.
+ * With `lmStudioEnabled` false, OpenRouter is used no matter what `config.provider` says.
+ */
+function ModelSelector(props) {
+  const {
+    config, onChange, lmStudioModels, openRouterModels,
+    modelProviders, hasOpenRouterKey, isRunning, lmStudioEnabled,
+  } = props;
+  const activeProvider = lmStudioEnabled ? (config.provider || 'lm_studio') : 'openrouter';
+  const usingOpenRouter = activeProvider === 'openrouter';
+  const modelOptions = usingOpenRouter ? openRouterModels : lmStudioModels;
+  const hostProviders = usingOpenRouter && config.modelId
+    ? getProviderNames(modelProviders[config.modelId])
+    : [];
+  const reasoning = usingOpenRouter
+    ? getReasoningSupportInfo(modelProviders[config.modelId], config.openrouterProvider || null)
+    : { hasEndpointMetadata: false, supportsReasoning: false };
+  const hasOpenRouterModel = usingOpenRouter && config.modelId;
+  // Report a copy of the current config with `patch` layered on top.
+  const emit = (patch) => onChange({ ...config, ...patch });
+  // Picking a provider also puts the reasoning effort back to its default.
+  const chooseProvider = (nextProvider) => emit({ provider: nextProvider, openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT });
+  // Picking a model clears the pinned host provider and resets the reasoning effort.
+  const chooseModel = (event) => emit({
+    provider: activeProvider, modelId: event.target.value,
+    openrouterProvider: null, openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
+  });
+  // Option label is "<name or id> (<context length in K>) [FREE]"; the FREE tag is OpenRouter-only.
+  const renderModelOption = (model) => {
+    const isFree = usingOpenRouter && model.pricing?.prompt === '0' && model.pricing?.completion === '0';
+    const contextTag = model.context_length ? ` (${Math.round(model.context_length / 1000)}K)` : '';
+    return (
+      <option key={model.id} value={model.id}>
+        {(model.name || model.id)}{contextTag}{isFree ? ' [FREE]' : ''}
+      </option>
+    );
+  };
+  const providerControl = lmStudioEnabled ? (
+    <div className="provider-toggle-group">
+      <button
+        type="button"
+        className={`provider-toggle-btn${activeProvider === 'lm_studio' ? ' active-lm' : ''}`}
+        disabled={isRunning}
+        onClick={() => chooseProvider('lm_studio')}
+      >
+        LM Studio
+      </button>
+      <button
+        type="button"
+        className={`provider-toggle-btn${usingOpenRouter ? ' active-or-orange' : ''}`}
+        disabled={isRunning || !hasOpenRouterKey}
+        onClick={() => chooseProvider('openrouter')}
+        title={!hasOpenRouterKey ? 'Set OpenRouter API key first' : 'Use OpenRouter'}
+      >
+        OpenRouter
+      </button>
+    </div>
+  ) : (
+    <small className="settings-hint">OpenRouter is required in this deployment.</small>
+  );
+
+  return (
+    <>
+      <div className="settings-row">
+        <label>Provider</label>
+        {providerControl}
+      </div>
+      <div className="settings-row">
+        <label>Model</label>
+        <select value={config.modelId || ''} disabled={isRunning} onChange={chooseModel}>
+          <option value="">Select model...</option>
+          {modelOptions.map((model) => renderModelOption(model))}
+        </select>
+      </div>
+      {hasOpenRouterModel && (
+        <div className="settings-row">
+          <label>Host Provider</label>
+          <select
+            value={config.openrouterProvider || ''}
+            disabled={isRunning}
+            onChange={(event) => emit({ provider: activeProvider, openrouterProvider: event.target.value || null })}
+          >
+            <option value="">Auto</option>
+            {hostProviders.map((hostName) => <option key={hostName} value={hostName}>{hostName}</option>)}
+          </select>
+        </div>
+      )}
+      {hasOpenRouterModel && (
+        <div className="settings-row">
+          <label>Reasoning Effort</label>
+          <select
+            value={normalizeOpenRouterReasoningEffort(config.openrouterReasoningEffort)}
+            disabled={isRunning}
+            onChange={(event) => emit({ provider: activeProvider, openrouterReasoningEffort: event.target.value })}
+          >
+            {OPENROUTER_REASONING_EFFORT_OPTIONS.map((option) => <option key={option.value} value={option.value}>{option.label}</option>)}
+          </select>
+          <small className="settings-hint">
+            {reasoning.hasEndpointMetadata && !reasoning.supportsReasoning
+              ? 'This selected host does not advertise reasoning support; OpenRouter may ignore the setting.'
+              : 'Auto sends OpenRouter max reasoning effort by default.'}
+          </small>
+        </div>
+      )}
+      {usingOpenRouter && lmStudioEnabled && (
+        <div className="settings-row">
+          <label>LM Studio Fallback</label>
+          <select
+            value={config.lmStudioFallbackId || ''}
+            disabled={isRunning}
+            onChange={(event) => emit({ provider: activeProvider, lmStudioFallbackId: event.target.value || null })}
+          >
+            <option value="">No fallback</option>
+            {lmStudioModels.map((model) => <option key={model.id} value={model.id}>{model.id}</option>)}
+          </select>
+        </div>
+      )}
+    </>
+  );
+}
+// Settings card for one role: the model pickers (all props are forwarded to ModelSelector), the
+// context-window and max-output-token inputs, and the Supercharge toggle when developer mode is on.
+function RoleEditor(props) {
+  const { title, config, onChange, isRunning, lmStudioEnabled, developerModeEnabled = false } = props;
+  // Resolve the provider exactly as ModelSelector does so the OpenRouter card styling matches the pickers.
+  const effectiveProvider = lmStudioEnabled ? (config.provider || 'lm_studio') : 'openrouter';
+  // Store a positive integer under `key`; empty, non-numeric or non-positive input stores `fallback`.
+  const updateNumber = (key, value, fallback) => {
+    const parsed = parseInt(value, 10);
+    onChange({ ...config, [key]: Number.isFinite(parsed) && parsed > 0 ? parsed : fallback });
+  };
+  return (
+    <div className={`submitter-config-section${effectiveProvider === 'openrouter' ? ' role-config-card--openrouter-orange' : ''}`}>
+      <h4>{title}</h4>
+      <ModelSelector {...props} />
+      <div className="settings-row">
+        <label>Context Window</label>
+        <input
+          type="number" min={4096} step={1024}
+          value={config.contextWindow || DEFAULT_CONTEXT_WINDOW}
+          disabled={isRunning}
+          onChange={(event) => updateNumber('contextWindow', event.target.value, DEFAULT_CONTEXT_WINDOW)}
+        />
+      </div>
+      <div className="settings-row">
+        <label>Max Output Tokens</label>
+        <input
+          type="number" min={1000} step={1000}
+          value={config.maxOutputTokens || DEFAULT_MAX_OUTPUT_TOKENS}
+          disabled={isRunning}
+          onChange={(event) => updateNumber('maxOutputTokens', event.target.value, DEFAULT_MAX_OUTPUT_TOKENS)}
+        />
+      </div>
+      {developerModeEnabled && (
+        <div className="settings-row settings-row--inline-checkbox">
+          <label className="settings-checkbox-label settings-checkbox-label--supercharge">
+            <input
+              type="checkbox"
+              checked={Boolean(config.superchargeEnabled)}
+              disabled={isRunning}
+              onChange={(event) => onChange({ ...config, superchargeEnabled: event.target.checked })}
+            />
+            <HelpTooltip
+              label="Learn about Supercharge"
+              buttonContent="Supercharge"
+              buttonClassName="help-tooltip-btn--text"
+              popupClassName="help-tooltip-popup--fixed"
+              useFixedPosition
+            >
+              {SUPERCHARGE_TOOLTIP}
+            </HelpTooltip>
+          </label>
+        </div>
+      )}
+    </div>
+  );
+}
+export default function LeanOJSettings({
+  settings,
+  onSettingsChange,
+  capabilities,
+  isRunning,
+  developerModeEnabled = false,
+}) {
+  const [lmStudioModels, setLmStudioModels] = useState([]);
+  const [openRouterModels, setOpenRouterModels] = useState([]);
+  const [modelProviders, setModelProviders] = useState(settings.modelProviders || {});
+  const [hasOpenRouterKey, setHasOpenRouterKey] = useState(false);
+  const [userProfiles, setUserProfiles] = useState({});
+  const [selectedProfile, setSelectedProfile] = useState(settings.selectedProfile || '');
+  const [showSaveDialog, setShowSaveDialog] = useState(false);
+  const [newProfileName, setNewProfileName] = useState('');
+  const [advancedSettingsExpanded, setAdvancedSettingsExpanded] = useState(false);
+  const [editRawSettings, setEditRawSettings] = useState(false);
+  const [rawSettingsText, setRawSettingsText] = useState('');
+  const [rawSettingsMessage, setRawSettingsMessage] = useState('');
+  const [guiSettingsBeforeRaw, setGuiSettingsBeforeRaw] = useState(null);
+  const lmStudioEnabled = capabilities?.lmStudioEnabled !== false;
+
+  useEffect(() => {
+    if (!developerModeEnabled && editRawSettings) {
+      setEditRawSettings(false);
+      setRawSettingsMessage('');
+    }
+  }, [developerModeEnabled, editRawSettings]);
+
+  useEffect(() => {
+    const load = async () => {
+      try {
+        const status = await openRouterAPI.getApiKeyStatus();
+        setHasOpenRouterKey(Boolean(status.has_key));
+        if (status.has_key) {
+          const openRouter = await openRouterAPI.getModels(null, settings.freeOnly);
+          setOpenRouterModels(openRouter.models || []);
+        }
+      } catch (error) {
+        console.error('Failed to load OpenRouter state for Proof Solver:', error);
+      }
+
+      if (lmStudioEnabled) {
+        try {
+          const models = await api.getModels();
+          setLmStudioModels(models.models || models || []);
+        } catch (error) {
+          console.error('Failed to load LM Studio models for Proof Solver:', error);
+        }
+      }
+
+      try {
+        setUserProfiles(JSON.parse(localStorage.getItem(LEANOJ_PROFILES_STORAGE_KEY) || '{}'));
+      } catch {
+        setUserProfiles({});
+      }
+    };
+    load();
+  }, [lmStudioEnabled, settings.freeOnly]);
+
+  useEffect(() => {
+    setSelectedProfile(settings.selectedProfile || '');
+  }, [settings.selectedProfile]);
+
+  const persistSettings = (nextSettings, { markCustom = false } = {}) => {
+    const finalSettings = markCustom
+      ? { ...nextSettings, selectedProfile: '' }
+      : nextSettings;
+    const next = persistLeanOJSettings(finalSettings);
+    if (markCustom && selectedProfile) {
+      setSelectedProfile('');
+    } else {
+      setSelectedProfile(next.selectedProfile || '');
+    }
+    onSettingsChange(next);
+    return next;
+  };
+
+  const updateSettings = (patch) => persistSettings({
+    ...settings,
+    ...patch,
+    modelProviders,
+  }, { markCustom: true });
+
+  const shouldAutoFillRole = (previousConfig = {}, config = {}) => (
+    config.provider === 'openrouter' && config.modelId && (
+      previousConfig.provider !== config.provider ||
+      previousConfig.modelId !== config.modelId ||
+      previousConfig.openrouterProvider !== config.openrouterProvider
+    )
+  );
+
+  const updateRoles = (roleKeys, config) => {
+    const shouldAutoFill = roleKeys.some((roleKey) => shouldAutoFillRole(settings.roles[roleKey], config));
+    const roles = { ...settings.roles };
+    roleKeys.forEach((roleKey) => {
+      roles[roleKey] = config;
+    });
+    const nextSettings = updateSettings({
+      roles,
+    });
+    if (shouldAutoFill) {
+      maybeApplyAutoSettingsToRoles(roleKeys, config, nextSettings);
+    }
+  };
+
+  // Replace submitter `index` with `config` (stamping submitterId = index + 1) and persist the change.
+  // Index 0 also feeds the topic_generator role, so that role config is refreshed in the same patch.
+  const updateSubmitter = (index, config) => {
+    // Shared rule with updateRoles: auto-fill only when the OpenRouter provider, model or host selection changed.
+    const shouldAutoFill = shouldAutoFillRole(settings.submitterConfigs[index] || {}, config);
+    // Work on a copy so the settings object received through props is never mutated.
+    const submitterConfigs = [...settings.submitterConfigs];
+    submitterConfigs[index] = { ...config, submitterId: index + 1 };
+    const patch = { submitterConfigs };
+    if (index === 0) {
+      patch.roles = {
+        ...settings.roles,
+        topic_generator: toRoleConfig(submitterConfigs[index]),
+      };
+    }
+    const nextSettings = updateSettings(patch);
+    if (shouldAutoFill) {
+      // Fire-and-forget async lookup; it persists its own follow-up update when auto-settings resolve.
+      maybeApplyAutoSettingsToSubmitter(index, submitterConfigs[index], nextSettings);
+    }
+  };
+
+  const fetchProvidersForModel = async (modelId, baseSettings = settings) => {
+    if (!modelId) return null;
+    if (hasEndpointMetadata(modelProviders[modelId])) {
+      return modelProviders[modelId];
+    }
+    try {
+      const result = await openRouterAPI.getProviders(modelId);
+      const nextProviders = {
+        ...modelProviders,
+        [modelId]: {
+          providers: result.providers || [],
+          endpoints: result.endpoints || [],
+        },
+      };
+      setModelProviders(nextProviders);
+      persistSettings({ ...baseSettings, modelProviders: nextProviders });
+      return nextProviders[modelId];
+    } catch (error) {
+      console.error('Failed to fetch Proof Solver provider list:', error);
+      return null;
+    }
+  };
+
+  const getAutoSettingsForModel = async (modelId, selectedProvider = null, baseSettings = settings) => {
+    const model = findOpenRouterModel(openRouterModels, modelId);
+    if (!model) {
+      console.debug('[ProofSolverAutoFill] model not in loaded list, skipping auto-fill', { modelId });
+      return null;
+    }
+    const providerData = await fetchProvidersForModel(modelId, baseSettings);
+    const autoSettings = computeOpenRouterAutoSettings(model, providerData, selectedProvider);
+    if (autoSettings?.warnings?.length) {
+      console.warn('[ProofSolverAutoFill] auto-settings fallback used:', autoSettings.warnings);
+    }
+    return autoSettings;
+  };
+
+  // Resolve to `config` with contextWindow / maxOutputTokens overridden by whichever auto-settings are known,
+  // or to null when nothing applies (non-OpenRouter config, no model selected, or no auto-settings returned).
+  const applyAutoSettingsToConfig = async (config, baseSettings = settings) => {
+    if (config.provider !== 'openrouter' || !config.modelId) return null;
+    const auto = await getAutoSettingsForModel(config.modelId, config.openrouterProvider || null, baseSettings);
+    if (!auto) return null;
+    const contextPatch = auto.contextWindowKnown ? { contextWindow: auto.contextWindow } : {};
+    const outputPatch = auto.outputCapKnown ? { maxOutputTokens: auto.maxOutputTokens } : {};
+    return { ...config, ...contextPatch, ...outputPatch };
+  };
+
+  const maybeApplyAutoSettingsToRoles = async (roleKeys, config, baseSettings) => {
+    const nextConfig = await applyAutoSettingsToConfig(config, baseSettings);
+    if (!nextConfig) return;
+    const roles = { ...baseSettings.roles };
+    roleKeys.forEach((roleKey) => {
+      roles[roleKey] = nextConfig;
+    });
+    persistSettings({
+      ...baseSettings,
+      roles,
+    });
+  };
+
+  const maybeApplyAutoSettingsToSubmitter = async (index, config, baseSettings) => {
+    const nextConfig = await applyAutoSettingsToConfig(config, baseSettings);
+    if (!nextConfig) return;
+    const submitterConfigs = [...baseSettings.submitterConfigs];
+    submitterConfigs[index] = { ...nextConfig, submitterId: index + 1 };
+    const nextSettings = {
+      ...baseSettings,
+      submitterConfigs,
+    };
+    if (index === 0) {
+      nextSettings.roles = {
+        ...baseSettings.roles,
+        topic_generator: toRoleConfig(submitterConfigs[index]),
+      };
+    }
+    persistSettings(nextSettings);
+  };
+
+  const handleProfileSelect = async (profileKey) => { // '' is the "Custom Settings" option; any other key applies that profile
+    if (!profileKey) {
+      setSelectedProfile('');
+      persistSettings({ ...settings, selectedProfile: '' });
+      return;
+    }
+    if (!hasOpenRouterKey) { // profiles are only applied when an OpenRouter key is set and its model list has loaded
+      alert('OpenRouter API key required to use profiles. Please set your API key first.');
+      return;
+    }
+    if (openRouterModels.length === 0) {
+      alert('Please wait for OpenRouter models to load, or refresh OpenRouter models in settings.');
+      return;
+    }
+    try {
+      const { settings: nextSettings } = await applyLeanOJProfileSelection(profileKey, userProfiles);
+      setSelectedProfile(nextSettings.selectedProfile || profileKey);
+      onSettingsChange(nextSettings);
+      setModelProviders(nextSettings.modelProviders || {});
+    } catch (error) {
+      console.error('Failed to apply Proof Solver profile:', error); // context label first, as in the other handlers
+    }
+  };
+
+  const saveCurrentAsProfile = () => {
+    if (!newProfileName.trim()) {
+      alert('Please enter a profile name');
+      return;
+    }
+    const key = `user_${Date.now()}`;
+    const nextProfiles = {
+      ...userProfiles,
+      [key]: {
+        name: newProfileName.trim(),
+        numSubmitters: settings.submitterConfigs.length,
+        submitters: settings.submitterConfigs.map((config) => ({
+          modelId: config.modelId,
+          provider: config.provider,
+          openrouterProvider: config.openrouterProvider,
+          lmStudioFallbackId: config.lmStudioFallbackId,
+          contextWindow: config.contextWindow,
+          maxOutputTokens: config.maxOutputTokens,
+          superchargeEnabled: Boolean(config.superchargeEnabled),
+        })),
+        roles: settings.roles,
+        maxInitialBrainstormAccepts: settings.maxInitialBrainstormAccepts,
+        maxRecursiveBrainstormAccepts: settings.maxRecursiveBrainstormAccepts,
+        finalAttemptsPerCycle: settings.finalAttemptsPerCycle,
+      },
+    };
+    localStorage.setItem(LEANOJ_PROFILES_STORAGE_KEY, JSON.stringify(nextProfiles));
+    setUserProfiles(nextProfiles);
+    const nextSettings = persistLeanOJSettings({ ...settings, selectedProfile: key });
+    setSelectedProfile(key);
+    onSettingsChange(nextSettings);
+    setShowSaveDialog(false);
+    setNewProfileName('');
+  };
+
+  const deleteProfile = (profileKey) => {
+    if (!profileKey.startsWith('user_')) {
+      alert('Cannot delete recommended profiles');
+      return;
+    }
+    const profileToDelete = userProfiles[profileKey];
+    if (!profileToDelete) {
+      console.error(`Proof Solver profile ${profileKey} not found`);
+      return;
+    }
+    if (!confirm(`Delete profile "${profileToDelete.name}"?`)) {
+      return;
+    }
+    const nextProfiles = { ...userProfiles };
+    delete nextProfiles[profileKey];
+    localStorage.setItem(LEANOJ_PROFILES_STORAGE_KEY, JSON.stringify(nextProfiles));
+    setUserProfiles(nextProfiles);
+    if (selectedProfile === profileKey) {
+      setSelectedProfile('');
+      onSettingsChange(persistLeanOJSettings({ ...settings, selectedProfile: '' }));
+    }
+  };
+
+  // Resize the submitter list to `count` (whole number, clamped to 1..10) and renumber submitterId from 1.
+  const setSubmitterCount = (count) => {
+    // Truncate before clamping so numSubmitters and the sliced list length cannot disagree on fractional input.
+    const nextCount = Math.max(1, Math.min(10, Math.trunc(Number(count)) || 1));
+    const submitterConfigs = [...settings.submitterConfigs];
+    while (submitterConfigs.length < nextCount) {
+      // New slots clone the last submitter, or the final_solver role when the list is empty.
+      const template = submitterConfigs[submitterConfigs.length - 1] || settings.roles.final_solver;
+      submitterConfigs.push({ ...template, submitterId: submitterConfigs.length + 1 });
+    }
+    updateSettings({
+      numSubmitters: nextCount,
+      submitterConfigs: submitterConfigs.slice(0, nextCount).map((config, index) => ({ ...config, submitterId: index + 1 })),
+    });
+  };
+
+  const toggleAdvancedSettings = () => {
+    setAdvancedSettingsExpanded((expanded) => !expanded);
+  };
+
+  const refreshLmStudioModels = async () => {
+    if (!lmStudioEnabled) return;
+    try {
+      const models = await api.getModels();
+      setLmStudioModels(models.models || models || []);
+    } catch (error) {
+      console.error('Failed to refresh LM Studio models for Proof Solver:', error);
+    }
+  };
+
+  const refreshOpenRouterModels = async (freeFilter = settings.freeOnly) => {
+    if (!hasOpenRouterKey) return;
+    try {
+      const openRouter = await openRouterAPI.getModels(null, freeFilter);
+      setOpenRouterModels(openRouter.models || []);
+    } catch (error) {
+      console.error('Failed to refresh OpenRouter models for Proof Solver:', error);
+    }
+  };
+
+  const getLeanOJRawSettings = () => ({
+    ...settings,
+    modelProviders,
+  });
+
+  const applyLeanOJRawSettings = (rawSettings, { updateRawText = true } = {}) => {
+    const nextSettings = persistLeanOJSettings({
+      ...settings,
+      ...rawSettings,
+    });
+    setModelProviders(nextSettings.modelProviders || {});
+    setSelectedProfile(nextSettings.selectedProfile || '');
+    onSettingsChange(nextSettings);
+    if (updateRawText) {
+      setRawSettingsText(formatRawSettings(nextSettings));
+    }
+  };
+
+  const handleRawEditToggle = (checked) => {
+    if (checked) {
+      const currentSettings = getLeanOJRawSettings();
+      setGuiSettingsBeforeRaw(currentSettings);
+      setRawSettingsText(formatRawSettings(currentSettings));
+      setRawSettingsMessage('');
+      setEditRawSettings(true);
+      return;
+    }
+
+    if (!confirm(RAW_VIEW_EXIT_WARNING)) {
+      return;
+    }
+
+    if (guiSettingsBeforeRaw) {
+      applyLeanOJRawSettings(guiSettingsBeforeRaw, { updateRawText: false });
+    }
+    setRawSettingsMessage('');
+    setEditRawSettings(false);
+  };
+
+  const saveRawSettings = () => { // parse the raw editor text and apply it as the new settings
+    try {
+      const parsed = JSON.parse(rawSettingsText);
+      // Spreading an array or string into the settings would add index keys, so only a JSON object is accepted.
+      if (parsed === null || typeof parsed !== 'object' || Array.isArray(parsed)) throw new Error('top-level value must be a JSON object');
+      applyLeanOJRawSettings(parsed);
+      setRawSettingsMessage('Saved raw settings.');
+    } catch (error) { setRawSettingsMessage(`Invalid JSON: ${error.message}`); }
+  };
+
+  const handleAdvancedSettingsKeyDown = (event) => {
+    if (event.key === 'Enter' || event.key === ' ') {
+      event.preventDefault();
+      toggleAdvancedSettings();
+    }
+  };
+
+  return (
+    <div className="settings-with-model-sidebar">
+      <HighlightedModelsSidebar />
+      <div className="settings-with-model-sidebar__main">
+        <div className="settings-panel">
+          <h2>Proof Solver Model Selection & Settings</h2>
+          <p className="settings-hint">These profiles are dedicated to Proof Solver runs and do not change Autonomous, Aggregator, or Compiler profiles.</p>
+
+      <div className="settings-section">
+        <h3>Proof Solver Profiles</h3>
+        <div className="settings-row">
+          <label>Apply Profile</label>
+          <select value={selectedProfile} disabled={isRunning} onChange={(event) => handleProfileSelect(event.target.value)}>
+            <option value="">-- Custom Settings --</option>
+            <optgroup label="Recommended Profiles">
+              {Object.keys(LEANOJ_RECOMMENDED_PROFILES).map((key) => (
+                <option key={key} value={key}>{LEANOJ_RECOMMENDED_PROFILES[key].name}</option>
+              ))}
+            </optgroup>
+            {Object.keys(userProfiles).length > 0 && (
+              <optgroup label="My Profiles">
+                {Object.keys(userProfiles)
+                  .sort((a, b) => userProfiles[a].name.localeCompare(userProfiles[b].name))
+                  .map((key) => (
+                    <option key={key} value={key}>{userProfiles[key].name}</option>
+                  ))}
+              </optgroup>
+            )}
+          </select>
+        </div>
+        <div className="settings-row">
+          <button type="button" className="secondary" disabled={isRunning} onClick={() => setShowSaveDialog(true)}>
+            Save as Profile
+          </button>
+          {selectedProfile && selectedProfile.startsWith('user_') && (
+            <button
+              type="button"
+              className="secondary"
+              disabled={isRunning}
+              onClick={() => deleteProfile(selectedProfile)}
+              style={{ marginLeft: '0.5rem', backgroundColor: '#e74c3c' }}
+            >
+              Delete Profile
+            </button>
+          )}
+        </div>
+      </div>
+
+      {showSaveDialog && (
+        <div className="inline-modal-overlay">
+          <div className="inline-modal-content">
+            <h3 style={{ marginTop: 0 }}>Save Proof Solver Profile</h3>
+            <p className="label--muted">
+              Enter a name for this profile. Current Proof Solver model settings will be saved.
+            </p>
+            <input
+              type="text"
+              value={newProfileName}
+              onChange={(event) => setNewProfileName(event.target.value)}
+              placeholder="Profile name..."
+              className="input-dark"
+              onKeyPress={(event) => {
+                if (event.key === 'Enter') {
+                  saveCurrentAsProfile();
+                }
+              }}
+              autoFocus
+            />
+            <div style={{ display: 'flex', gap: '0.5rem', justifyContent: 'flex-end' }}>
+              <button
+                className="secondary"
+                onClick={() => {
+                  setShowSaveDialog(false);
+                  setNewProfileName('');
+                }}
+              >
+                Cancel
+              </button>
+              <button className="btn-success-sm" onClick={saveCurrentAsProfile}>
+                Save Profile
+              </button>
+            </div>
+          </div>
+        </div>
+      )}
+
+      <div className="model-refresh-controls">
+        {lmStudioEnabled && (
+          <button type="button" className="secondary" disabled={isRunning} onClick={refreshLmStudioModels}>
+            Refresh LM Studio Models
+          </button>
+        )}
+        {hasOpenRouterKey && (
+          <>
+            <button type="button" className="secondary" disabled={isRunning} onClick={() => refreshOpenRouterModels(settings.freeOnly)}>
+              Refresh OpenRouter Models
+            </button>
+            <button
+              type="button"
+              className="secondary"
+              onClick={() => window.open('https://openrouter.ai/models', '_blank', 'noopener,noreferrer')}
+              title="Browse all available OpenRouter models"
+            >
+              🔗 OpenRouter Model List
+            </button>
+            <label className="settings-checkbox-label model-refresh-controls__toggle" style={{ cursor: isRunning ? 'not-allowed' : 'pointer' }}>
+              <input
+                type="checkbox"
+                checked={settings.freeOnly}
+                onChange={(event) => updateSettings({ freeOnly: event.target.checked })}
+                disabled={isRunning}
+              />
+              Free models only
+            </label>
+          </>
+        )}
+        {developerModeEnabled ? (
+          <label className="settings-checkbox-label model-refresh-controls__toggle" style={{ cursor: isRunning ? 'not-allowed' : 'pointer' }}>
+            <input
+              type="checkbox"
+              checked={editRawSettings}
+              onChange={(event) => handleRawEditToggle(event.target.checked)}
+              disabled={isRunning}
+            />
+            Edit Raw
+          </label>
+        ) : (
+          <span className="settings-developer-mode-hint">
+            Developer mode: press Shift + Z + X to toggle raw JSON settings.
+          </span>
+        )}
+      </div>
+
+      {editRawSettings ? (
+        <RawSettingsEditor
+          value={rawSettingsText}
+          onChange={setRawSettingsText}
+          onSave={saveRawSettings}
+          message={rawSettingsMessage}
+          disabled={isRunning}
+        />
+      ) : (
+        <>
+      <div className="settings-section">
+        <h3>Brainstorm Submitters</h3>
+        <div className="settings-row">
+          <label>Number of Submitters</label>
+          <input type="number" min={1} max={10} disabled={isRunning} value={settings.submitterConfigs.length} onChange={(event) => setSubmitterCount(event.target.value)} />
+        </div>
+        {settings.submitterConfigs.map((submitter, index) => (
+          <RoleEditor
+            key={submitter.submitterId || index}
+            title={index === 0 ? 'Brainstorm Submitter 1 + Topic Generator' : `Brainstorm Submitter ${index + 1}`}
+            config={submitter}
+            onChange={(next) => updateSubmitter(index, next)}
+            lmStudioModels={lmStudioModels}
+            openRouterModels={openRouterModels}
+            modelProviders={modelProviders}
+            hasOpenRouterKey={hasOpenRouterKey}
+            isRunning={isRunning}
+            lmStudioEnabled={lmStudioEnabled}
+            developerModeEnabled={developerModeEnabled}
+          />
+        ))}
+      </div>
+
+      <div className="settings-section">
+        <h3>Proof Solver Roles</h3>
+        {ROLE_EDITOR_GROUPS.map((group) => (
+          <div key={group.key}>
+            <RoleEditor
+              title={group.title}
+              config={settings.roles[group.roleKeys[0]]}
+              onChange={(next) => updateRoles(group.roleKeys, next)}
+              lmStudioModels={lmStudioModels}
+              openRouterModels={openRouterModels}
+              modelProviders={modelProviders}
+              hasOpenRouterKey={hasOpenRouterKey}
+              isRunning={isRunning}
+              lmStudioEnabled={lmStudioEnabled}
+              developerModeEnabled={developerModeEnabled}
+            />
+          </div>
+        ))}
+      </div>
+
+      <div className="settings-section">
+        <div
+          className="collapsible-trigger settings-trigger--multiline"
+          onClick={toggleAdvancedSettings}
+          onKeyDown={handleAdvancedSettingsKeyDown}
+          role="button"
+          tabIndex={0}
+          aria-expanded={advancedSettingsExpanded}
+          aria-controls="leanoj-advanced-settings-panel"
+          style={{ marginBottom: advancedSettingsExpanded ? '1rem' : 0 }}
+        >
+          <div className="settings-heading-stack">
+            <h3 className="settings-trigger-title">Advanced Settings</h3>
+            <p className="settings-subsection-description">
+              Tune Proof Solver run limits and proof-search loop budgets.
+            </p>
+          </div>
+          <span className={`collapse-chevron${advancedSettingsExpanded ? ' collapse-chevron--open' : ''}`}>▼</span>
+        </div>
+
+        {advancedSettingsExpanded && (
+          <div className="collapsible-body settings-advanced-content" id="leanoj-advanced-settings-panel">
+            <div className="settings-subsection">
+              <div className="settings-subsection-header">
+                <h3 className="settings-subsection-title">Run Limits</h3>
+                <p className="settings-subsection-description">
+                  Control how many brainstorm ideas and final proof attempts Proof Solver will run. Inline brainstorm proof candidates use a fixed 5-attempt Lean repair gate.
+                </p>
+              </div>
+              <div className="settings-row">
+                <label>Initial Brainstorm Accepts</label>
+                <input type="number" min={1} max={200} disabled={isRunning} value={settings.maxInitialBrainstormAccepts} onChange={(event) => updateSettings({ maxInitialBrainstormAccepts: Number(event.target.value) || 30 })} />
+              </div>
+              <div className="settings-row">
+                <label>Recursive Brainstorm Accepts</label>
+                <input type="number" min={1} max={100} disabled={isRunning} value={settings.maxRecursiveBrainstormAccepts} onChange={(event) => updateSettings({ maxRecursiveBrainstormAccepts: Number(event.target.value) || 10 })} />
+              </div>
+              <div className="settings-row">
+                <label>Final Attempts Per Cycle</label>
+                <input type="number" min={30} max={200} disabled={isRunning} value={settings.finalAttemptsPerCycle} onChange={(event) => updateSettings({ finalAttemptsPerCycle: Math.max(30, Number(event.target.value) || 30) })} />
+              </div>
+            </div>
+          </div>
+        )}
+      </div>
+        </>
+      )}
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/leanoj/index.js b/frontend/src/components/leanoj/index.js
new file mode 100644
index 0000000..ee19d6b
--- /dev/null
+++ b/frontend/src/components/leanoj/index.js
@@ -0,0 +1,7 @@
+export { default as LeanOJInterface } from './LeanOJInterface';
+export { default as LeanOJBrainstorms } from './LeanOJBrainstorms';
+export { default as LeanOJLogs } from './LeanOJLogs';
+export { default as LeanOJMasterProof } from './LeanOJMasterProof';
+export { default as LeanOJSettings } from './LeanOJSettings';
+export { default as LeanOJMathematicalProofs } from './LeanOJMathematicalProofs';
+export { default as LeanOJProofLibrary } from './LeanOJProofLibrary';
diff --git a/frontend/src/components/settings-common.css b/frontend/src/components/settings-common.css
index 2d62893..3e15f13 100644
--- a/frontend/src/components/settings-common.css
+++ b/frontend/src/components/settings-common.css
@@ -217,6 +217,101 @@
   margin-left: 0.5rem;
 }
 
+/* Proof strength badge */
+.ps-badge-anchor {
+  position: relative;
+  display: inline-flex;
+  align-items: center;
+  vertical-align: middle;
+  z-index: 1000;
+}
+
+.ps-badge-anchor--model {
+  position: absolute;
+  top: 2.3rem;
+  right: 0.35rem;
+  z-index: 4;
+}
+
+.ps-badge-anchor--model-only {
+  position: absolute;
+  top: 0.35rem;
+  right: 0.35rem;
+  z-index: 4;
+}
+
+.ps-badge {
+  padding: 0.15rem 0.35rem;
+  border-radius: 3px;
+  font-size: 0.58rem;
+  font-weight: 800;
+  line-height: 1;
+  color: #2c1700;
+  letter-spacing: 0.04em;
+  background:
+    linear-gradient(120deg, rgba(255, 255, 255, 0.72) 0%, rgba(255, 255, 255, 0.22) 18%, rgba(255, 255, 255, 0.02) 34%),
+    linear-gradient(135deg, #fff7bf 0%, #ffe27a 18%, #ffc93b 46%, #d58d00 100%);
+  box-shadow:
+    0 0 0 1px rgba(255, 219, 96, 0.78),
+    0 0 12px rgba(255, 200, 40, 0.34),
+    inset 0 1px 0 rgba(255, 255, 255, 0.55),
+    inset 0 -1px 0 rgba(120, 70, 0, 0.2);
+  text-shadow: 0 1px 0 rgba(255, 255, 255, 0.35);
+  user-select: none;
+  cursor: default;
+}
+
+.ps-badge-tooltip {
+  display: none;
+  position: absolute;
+  top: calc(100% + 7px);
+  width: min(310px, 70vw);
+  background: #241700;
+  border: 1px solid rgba(255, 219, 96, 0.62);
+  border-radius: 6px;
+  padding: 0.6rem 0.75rem;
+  color: #ffe9a8;
+  font-size: 0.72rem;
+  font-weight: 500;
+  line-height: 1.45;
+  box-shadow: 0 8px 22px rgba(0, 0, 0, 0.5);
+  pointer-events: none;
+  white-space: normal;
+  text-transform: none;
+  letter-spacing: normal;
+  text-shadow: none;
+  z-index: 100000;
+}
+
+.ps-badge-anchor--role .ps-badge-tooltip {
+  left: 0;
+  right: auto;
+  width: min(330px, 48vw);
+}
+
+.ps-badge-anchor--leaderboard .ps-badge-tooltip {
+  right: 0;
+  width: 235px;
+  max-width: calc(322px - 3rem);
+}
+
+.ps-badge-anchor:hover .ps-badge-tooltip,
+.ps-badge-anchor:focus .ps-badge-tooltip {
+  display: block;
+}
+
+.ps-badge-anchor:hover,
+.ps-badge-anchor:focus {
+  z-index: 100000;
+}
+
+.role-title-with-badges {
+  display: inline-flex;
+  align-items: center;
+  gap: 0.45rem;
+  flex-wrap: wrap;
+}
+
 /* Apply-to-all button */
 .btn-apply-all {
   font-size: 0.8rem;
@@ -246,6 +341,25 @@
   cursor: pointer;
 }
 
+.settings-developer-mode-hint {
+  color: var(--text-muted);
+  font-size: 0.85rem;
+  line-height: 1.4;
+}
+
+.settings-row--inline-checkbox {
+  grid-template-columns: 1fr;
+}
+
+.settings-checkbox-label--supercharge {
+  gap: 0.5rem;
+  width: fit-content;
+}
+
+.settings-checkbox-label--supercharge input[type="checkbox"] {
+  margin-right: 0;
+}
+
 .settings-checkbox-label--stacked {
   display: grid;
   grid-template-columns: auto minmax(0, 1fr);
diff --git a/frontend/src/hooks/useProofCheckRuntime.js b/frontend/src/hooks/useProofCheckRuntime.js
index 32f6a82..465f535 100644
--- a/frontend/src/hooks/useProofCheckRuntime.js
+++ b/frontend/src/hooks/useProofCheckRuntime.js
@@ -1,11 +1,99 @@
 import { useCallback, useEffect, useMemo, useState } from 'react';
 import { autonomousAPI } from '../services/api';
 import { websocket } from '../services/websocket';
+import {
+  getStoredAutonomousSettings,
+  settingsToAutonomousConfig,
+} from '../utils/autonomousProfiles';
+
+// Fallbacks used when a role's stored value is not a usable positive number.
+const DEFAULT_CONTEXT_WINDOW = 131072;
+const DEFAULT_MAX_OUTPUT_TOKENS = 25000;
+// localStorage key of the developer-mode flag (compared against the string 'true').
+const DEVELOPER_MODE_STORAGE_KEY = 'developerModeSettingsEnabled';
+
+// True only when the developer-mode flag in localStorage is exactly 'true'.
+function isDeveloperModeEnabled() {
+  return localStorage.getItem(DEVELOPER_MODE_STORAGE_KEY) === 'true';
+}
 
 function buildSourceKey(sourceType, sourceId) {
   return `${sourceType}:${sourceId}`;
 }
 
+// Any provider value other than 'openrouter' is treated as 'lm_studio'.
+function normalizeProvider(provider) {
+  return provider === 'openrouter' ? 'openrouter' : 'lm_studio';
+}
+
+// Coerce `value` to a whole number >= 1, otherwise return `fallback`.
+// Flooring happens before the positivity check so fractions below 1 (e.g. 0.5)
+// fall back instead of collapsing to 0.
+function toPositiveInteger(value, fallback) {
+  const parsed = Math.floor(Number(value));
+  return Number.isFinite(parsed) && parsed > 0 ? parsed : fallback;
+}
+
+// Build a snake_case role payload from one submitter config. Each field reads the
+// camelCase key first and the snake_case key second. `supercharge_enabled` can only
+// be true while developer mode is on.
+function roleFromSubmitterConfig(config = {}) {
+  const superchargeAllowed = isDeveloperModeEnabled();
+  return {
+    provider: normalizeProvider(config.provider),
+    model_id: config.modelId || config.model_id || '',
+    openrouter_provider: config.openrouterProvider ?? config.openrouter_provider ?? null,
+    openrouter_reasoning_effort: config.openrouterReasoningEffort ?? config.openrouter_reasoning_effort ?? 'auto',
+    lm_studio_fallback_id: config.lmStudioFallbackId ?? config.lm_studio_fallback_id ?? null,
+    context_window: toPositiveInteger(config.contextWindow ?? config.context_window, DEFAULT_CONTEXT_WINDOW),
+    max_output_tokens: toPositiveInteger(config.maxOutputTokens ?? config.max_output_tokens, DEFAULT_MAX_OUTPUT_TOKENS),
+    supercharge_enabled: superchargeAllowed && Boolean(config.superchargeEnabled ?? config.supercharge_enabled),
+  };
+}
+
+// Build the same role payload from a flat config keyed as `${rolePrefix}_<field>`.
+// `fallbackModelId` is used when the role has no model of its own.
+function roleFromAutonomousConfig(config, rolePrefix, fallbackModelId = '') {
+  const superchargeAllowed = isDeveloperModeEnabled();
+  return {
+    provider: normalizeProvider(config[`${rolePrefix}_provider`]),
+    model_id: config[`${rolePrefix}_model`] || fallbackModelId || '',
+    openrouter_provider: config[`${rolePrefix}_openrouter_provider`] ?? null,
+    openrouter_reasoning_effort: config[`${rolePrefix}_openrouter_reasoning_effort`] ?? 'auto',
+    lm_studio_fallback_id: config[`${rolePrefix}_lm_studio_fallback`] ?? null,
+    context_window: toPositiveInteger(config[`${rolePrefix}_context_window`], DEFAULT_CONTEXT_WINDOW),
+    max_output_tokens: toPositiveInteger(config[`${rolePrefix}_max_tokens`], DEFAULT_MAX_OUTPUT_TOKENS),
+    supercharge_enabled: superchargeAllowed && Boolean(config[`${rolePrefix}_supercharge_enabled`]),
+  };
+}
+
+// Assemble the { brainstorm, paper, validator } role configs from the stored autonomous
+// settings. `paper` reads the `high_context` role and falls back to the first submitter's
+// model. Returns null (after a console warning) if anything throws.
+export function buildCurrentProofRuntimeConfig() {
+  try {
+    const config = settingsToAutonomousConfig(getStoredAutonomousSettings());
+    const firstSubmitter = roleFromSubmitterConfig(config.submitter_configs?.[0]);
+    return {
+      brainstorm: firstSubmitter,
+      paper: roleFromAutonomousConfig(config, 'high_context', firstSubmitter.model_id),
+      validator: roleFromAutonomousConfig(config, 'validator'),
+    };
+  } catch (error) {
+    console.warn('Failed to build current proof runtime config:', error);
+    return null;
+  }
+}
+
+// True when all three roles carry a non-empty model_id.
+export function isProofRuntimeConfigComplete(config) {
+  return Boolean(
+    config?.brainstorm?.model_id &&
+    config?.paper?.model_id &&
+    config?.validator?.model_id
+  );
+}
+
 export function useProofCheckRuntime() {
   const [proofStatus, setProofStatus] = useState(null);
   const [runtimeError, setRuntimeError] = useState('');
@@ -95,7 +167,12 @@ export function useProofCheckRuntime() {
     }));
 
     try {
-      return await autonomousAPI.runProofCheck({ sourceType, sourceId });
+      const proofRuntimeConfig = buildCurrentProofRuntimeConfig();
+      return await autonomousAPI.runProofCheck({
+        sourceType,
+        sourceId,
+        proofRuntimeConfig: isProofRuntimeConfigComplete(proofRuntimeConfig) ? proofRuntimeConfig : null,
+      });
     } catch (err) {
       setQueuedChecks((prev) => {
         if (!prev[sourceKey]) {
@@ -127,6 +204,9 @@ export function useProofCheckRuntime() {
     return Boolean(getSourceState(sourceType, sourceId));
   }, [getSourceState]);
 
+  const currentProofRuntimeConfig = buildCurrentProofRuntimeConfig();
+  const hasCurrentProofRuntimeConfig = isProofRuntimeConfigComplete(currentProofRuntimeConfig);
+
   const manualCheckReason = useMemo(() => {
     if (!proofStatus) {
       return 'Loading proof runtime status...';
@@ -134,11 +214,11 @@ export function useProofCheckRuntime() {
     if (!proofStatus.lean4_enabled) {
       return 'Lean 4 proof checks are disabled.';
     }
-    if (!proofStatus.manual_check_ready) {
+    if (!proofStatus.manual_check_ready && !hasCurrentProofRuntimeConfig) {
       return proofStatus.manual_check_message || 'Manual proof checks are not ready yet.';
     }
     return '';
-  }, [proofStatus]);
+  }, [proofStatus, hasCurrentProofRuntimeConfig]);
 
   return {
     proofStatus,
@@ -147,7 +227,10 @@ export function useProofCheckRuntime() {
     queueManualProofCheck,
     getSourceState,
     isSourceBusy,
-    manualCheckEnabled: Boolean(proofStatus?.lean4_enabled && proofStatus?.manual_check_ready),
+    manualCheckEnabled: Boolean(
+      proofStatus?.lean4_enabled &&
+      (proofStatus?.manual_check_ready || hasCurrentProofRuntimeConfig)
+    ),
     manualCheckReason,
   };
 }
diff --git a/frontend/src/index.css b/frontend/src/index.css
index 9054c22..f6c6986 100644
--- a/frontend/src/index.css
+++ b/frontend/src/index.css
@@ -196,6 +196,24 @@ code {
   backface-visibility: hidden;
 }
 
+.banner-mode-subtitle {
+  color: #1eff1c;
+  font-size: 0.9rem;
+  line-height: 1.25;
+  min-height: 1.125rem;
+  margin: 0.35rem 0 0 0;
+  font-weight: 700;
+  letter-spacing: 0.08em;
+  text-transform: uppercase;
+  text-shadow:
+    0 0 10px rgba(30, 255, 28, 0.35),
+    0 0 18px rgba(30, 255, 28, 0.18);
+}
+
+.banner-mode-subtitle--hidden {
+  visibility: hidden;
+}
+
 .banner-company {
   color: #ffffff;
   font-size: 0.85rem;
@@ -223,6 +241,10 @@ code {
     font-size: 0.85rem;
     margin-top: 0.65rem;
   }
+
+  .banner-mode-subtitle {
+    font-size: 0.78rem;
+  }
   
   .banner-company {
     font-size: 0.8rem;
@@ -374,6 +396,21 @@ code {
   color: #4caf50;
 }
 
+.help-tooltip-btn--text {
+  width: auto;
+  height: auto;
+  padding: 0;
+  border: 0;
+  border-radius: 0;
+  background: transparent;
+  color: var(--text-secondary, #888);
+  box-shadow: none;
+  font-size: 0.9rem;
+  font-weight: 500;
+  line-height: 1.35;
+  text-decoration: none;
+}
+
 .app-header-help-btn:hover,
 .app-header-help-btn:focus-visible,
 .help-tooltip-btn:hover,
@@ -384,6 +421,15 @@ code {
   box-shadow: 0 10px 20px rgba(0, 0, 0, 0.26);
 }
 
+.help-tooltip-btn--text:hover,
+.help-tooltip-btn--text:focus-visible {
+  border-color: transparent;
+  filter: brightness(1.15);
+  transform: none;
+  box-shadow: none;
+  color: var(--text-primary, #e0e0e0);
+}
+
 .app-header-help-btn:focus-visible,
 .help-tooltip-btn:focus-visible {
   outline: 1px solid rgba(30, 255, 28, 0.45);
@@ -542,6 +588,11 @@ button.header-status-chip:focus-visible {
   row-gap: 0.5rem;
 }
 
+.tabs.tabs-leanoj {
+  flex-wrap: wrap;
+  row-gap: 0.5rem;
+}
+
 .tab {
   padding: 0.8rem 1.25rem;
   min-height: 58px;
@@ -613,6 +664,25 @@ button.header-status-chip:focus-visible {
   padding: 0 1rem;
 }
 
+.workflow-main-interface > * {
+  transition:
+    filter var(--transition-normal),
+    opacity var(--transition-normal);
+}
+
+.workflow-main-interface--running > :not(.autonomous-header):not(.button-group):not(.activity-section):not(.tier3-dialog-overlay) {
+  filter: brightness(0.72);
+  opacity: 0.78;
+}
+
+.workflow-main-interface--running > .autonomous-header,
+.workflow-main-interface--running > .button-group,
+.workflow-main-interface--running > .activity-section,
+.workflow-main-interface--running > .tier3-dialog-overlay {
+  filter: none;
+  opacity: 1;
+}
+
 h1 {
   font-size: 1.8rem;
   margin-bottom: 1rem;
diff --git a/frontend/src/index.jsx b/frontend/src/index.jsx
index ca42421..d87156a 100644
--- a/frontend/src/index.jsx
+++ b/frontend/src/index.jsx
@@ -2,9 +2,10 @@ import React from 'react'
 import ReactDOM from 'react-dom/client'
 import App from './App'
 import './index.css'
-import { installNamespacedLocalStorage } from './utils/runtimeConfig'
+import { installAuthenticatedFetch, installNamespacedLocalStorage } from './utils/runtimeConfig'
 
 installNamespacedLocalStorage()
+installAuthenticatedFetch()
 
 ReactDOM.createRoot(document.getElementById('root')).render(
   <React.StrictMode>
diff --git a/frontend/src/services/api.js b/frontend/src/services/api.js
index f0a3223..62a2223 100644
--- a/frontend/src/services/api.js
+++ b/frontend/src/services/api.js
@@ -73,6 +73,22 @@ async function throwFromResponse(response, fallbackMessage) {
 
 // Aggregator API
 export const api = {
+  // JSON GET helper. Absolute http(s) URLs are fetched unchanged; any other path is
+  // appended to API_BASE (minus a trailing slash), adding a leading "/" when missing.
+  async get(path) {
+    let url = path;
+    if (!/^https?:\/\//i.test(path)) {
+      const base = API_BASE.replace(/\/$/, '');
+      let suffix = path.startsWith('/') ? path : `/${path}`;
+      // Drop the path's "/api" prefix when the base already ends with it, so it is not doubled.
+      if (path.startsWith('/api/') && base.endsWith('/api')) suffix = path.slice(4);
+      url = `${base}${suffix}`;
+    }
+    const response = await fetch(url);
+    if (!response.ok) throw new Error(`Failed to fetch ${path}`);
+    return response.json();
+  },
+
   // Get available models from LM Studio
   async getModels() {
     const response = await fetch(`${API_BASE}/aggregator/models`);
@@ -288,13 +304,6 @@ export const compilerAPI = {
     return { data: await response.json() };
   },
 
-  // Get previous versions
-  async getPreviousVersions() {
-    const response = await fetch(`${API_BASE}/compiler/previous-versions`);
-    if (!response.ok) throw new Error('Failed to get previous versions');
-    return { data: await response.json() };
-  },
-
   // Save paper
   async savePaper() {
     const response = await fetch(`${API_BASE}/compiler/save-paper`, {
@@ -345,6 +354,7 @@ export const compilerAPI = {
       body.validator_max_tokens = validatorConfig.validator_max_tokens;
       body.validator_provider = validatorConfig.validator_provider;
       body.validator_openrouter_provider = validatorConfig.validator_openrouter_provider;
+      body.validator_openrouter_reasoning_effort = validatorConfig.validator_openrouter_reasoning_effort || 'auto';
     }
 
     const response = await fetch(`${API_BASE}/compiler/critique-paper`, {
@@ -477,6 +487,20 @@ export const autonomousAPI = {
     return response.json();
   },
 
+  async getPrunedPaperHistory() {
+    const response = await fetch(`${API_BASE}/auto-research/paper-history/pruned`);
+    if (!response.ok) throw new Error('Failed to get pruned Stage 2 paper history');
+    return response.json();
+  },
+
+  async getPrunedHistoryPaper(sessionId, paperId) {
+    const response = await fetch(
+      `${API_BASE}/auto-research/paper-history/pruned/${encodeURIComponent(sessionId)}/${encodeURIComponent(paperId)}`
+    );
+    if (!response.ok) throw new Error(`Failed to get pruned history paper ${sessionId}/${paperId}`);
+    return response.json();
+  },
+
   // Get statistics
   async getStats() {
     const response = await fetch(`${API_BASE}/auto-research/stats`);
@@ -520,14 +544,19 @@ export const autonomousAPI = {
   },
 
   // Queue a manual proof check for one brainstorm or paper
-  async runProofCheck({ sourceType, sourceId }) {
+  async runProofCheck({ sourceType, sourceId, proofRuntimeConfig = null }) {
+    const body = {
+      source_type: sourceType,
+      source_id: sourceId,
+    };
+    if (proofRuntimeConfig) {
+      body.proof_runtime_config = proofRuntimeConfig;
+    }
+
     const response = await fetch(`${API_BASE}/proofs/check`, {
       method: 'POST',
       headers: { 'Content-Type': 'application/json' },
-      body: JSON.stringify({
-        source_type: sourceType,
-        source_id: sourceId,
-      }),
+      body: JSON.stringify(body),
     });
     if (!response.ok) {
       const errorData = await response.json().catch(() => ({}));
@@ -681,6 +710,18 @@ export const autonomousAPI = {
     return response.json();
   },
 
+  // Delete all pruned papers: the session-scoped history endpoint when sessionId is given, else the unscoped one.
+  async deleteAllPrunedPapers(sessionId = null) {
+    const endpoint = sessionId
+      ? `${API_BASE}/auto-research/paper-history/pruned/${encodeURIComponent(sessionId)}?confirm=true`
+      : `${API_BASE}/auto-research/pruned-papers?confirm=true`;
+    const response = await fetch(endpoint, { method: 'DELETE' });
+    if (response.ok) return response.json();
+    // Error bodies are not always JSON; fall back to the generic message rather than a SyntaxError.
+    const errorData = await response.json().catch(() => ({}));
+    throw new Error(errorData.detail || 'Failed to delete pruned papers');
+  },
+
   // Delete Stage 2 history paper by session-aware identifier
   async deleteHistoryPaper(sessionId, paperId) {
     const response = await fetch(
@@ -756,16 +797,38 @@ export const autonomousAPI = {
 
   // Get API logs
   async getApiLogs(limit = 100, options = {}) {
-    const response = await fetch(`${API_BASE}/auto-research/api-logs?limit=${limit}`, {
+    const params = new URLSearchParams({ limit: String(limit) });
+    if (options.workflow) {
+      params.append('workflow', options.workflow);
+    }
+    const response = await fetch(`${API_BASE}/auto-research/api-logs?${params.toString()}`, {
       signal: options.signal,
     });
     if (!response.ok) throw new Error('Failed to get API logs');
     return response.json();
   },
 
+  // Get one full API log entry on demand
+  async getApiLogDetail(logKey, options = {}) {
+    const params = new URLSearchParams();
+    if (options.workflow) {
+      params.append('workflow', options.workflow);
+    }
+    const response = await fetch(
+      `${API_BASE}/auto-research/api-logs/detail/${encodeURIComponent(logKey)}${params.toString() ? `?${params.toString()}` : ''}`,
+      { signal: options.signal }
+    );
+    if (!response.ok) throw new Error('Failed to get API log detail');
+    return response.json();
+  },
+
   // Clear API logs
-  async clearApiLogs() {
-    const response = await fetch(`${API_BASE}/auto-research/api-logs/clear`, {
+  async clearApiLogs(options = {}) {
+    const params = new URLSearchParams();
+    if (options.workflow) {
+      params.append('workflow', options.workflow);
+    }
+    const response = await fetch(`${API_BASE}/auto-research/api-logs/clear${params.toString() ? `?${params.toString()}` : ''}`, {
       method: 'POST',
     });
     if (!response.ok) throw new Error('Failed to clear API logs');
@@ -773,8 +836,12 @@ export const autonomousAPI = {
   },
 
   // Get API stats
-  async getApiStats() {
-    const response = await fetch(`${API_BASE}/auto-research/api-logs/stats`);
+  async getApiStats(options = {}) {
+    const params = new URLSearchParams();
+    if (options.workflow) {
+      params.append('workflow', options.workflow);
+    }
+    const response = await fetch(`${API_BASE}/auto-research/api-logs/stats${params.toString() ? `?${params.toString()}` : ''}`);
     if (!response.ok) throw new Error('Failed to get API stats');
     return response.json();
   },
@@ -797,6 +864,7 @@ export const autonomousAPI = {
       body.validator_max_tokens = validatorConfig.validator_max_tokens;
       body.validator_provider = validatorConfig.validator_provider;
       body.validator_openrouter_provider = validatorConfig.validator_openrouter_provider;
+      body.validator_openrouter_reasoning_effort = validatorConfig.validator_openrouter_reasoning_effort || 'auto';
     }
     
     const response = await fetch(`${API_BASE}/auto-research/paper/${paperId}/critique`, {
@@ -840,6 +908,7 @@ export const autonomousAPI = {
       body.validator_max_tokens = validatorConfig.validator_max_tokens;
       body.validator_provider = validatorConfig.validator_provider;
       body.validator_openrouter_provider = validatorConfig.validator_openrouter_provider;
+      body.validator_openrouter_reasoning_effort = validatorConfig.validator_openrouter_reasoning_effort || 'auto';
     }
 
     const response = await fetch(
@@ -882,6 +951,7 @@ export const autonomousAPI = {
       body.validator_max_tokens = validatorConfig.validator_max_tokens;
       body.validator_provider = validatorConfig.validator_provider;
       body.validator_openrouter_provider = validatorConfig.validator_openrouter_provider;
+      body.validator_openrouter_reasoning_effort = validatorConfig.validator_openrouter_reasoning_effort || 'auto';
     }
     
     const response = await fetch(`${API_BASE}/auto-research/final-answer-library/${answerId}/critique`, {
@@ -1057,6 +1127,99 @@ export const boostAPI = {
   },
 };
 
+// LeanOJ Proof Solver API
+export const leanojAPI = {
+  async start(config) {
+    const response = await fetch(`${API_BASE}/leanoj/start`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify(config),
+    });
+    if (!response.ok) {
+      const errorData = await response.json().catch(() => ({}));
+      const error = new Error('Failed to start Proof Solver');
+      error.details = errorData.detail;
+      throw error;
+    }
+    return response.json();
+  },
+
+  async stop() {
+    const response = await fetch(`${API_BASE}/leanoj/stop`, { method: 'POST' });
+    if (!response.ok) throw new Error('Failed to stop Proof Solver');
+    return response.json();
+  },
+
+  async clear() {
+    const response = await fetch(`${API_BASE}/leanoj/clear?confirm=true`, { method: 'POST' });
+    if (!response.ok) {
+      const errorData = await response.json().catch(() => ({}));
+      throw new Error(errorData.detail || 'Failed to clear Proof Solver progress');
+    }
+    return response.json();
+  },
+
+  async getStatus() {
+    const response = await fetch(`${API_BASE}/leanoj/status`);
+    if (!response.ok) throw new Error('Failed to get Proof Solver status');
+    return response.json();
+  },
+
+  async getMasterProof() {
+    const response = await fetch(`${API_BASE}/leanoj/master-proof`);
+    if (!response.ok) throw new Error('Failed to get Proof Solver master proof');
+    return response.json();
+  },
+
+  async getMasterProofEdits(limit = 50) {
+    const response = await fetch(`${API_BASE}/leanoj/master-proof/edits?limit=${encodeURIComponent(limit)}`);
+    if (!response.ok) throw new Error('Failed to get Proof Solver master proof edit history');
+    return response.json();
+  },
+
+  async getProofs() {
+    const response = await fetch(`${API_BASE}/leanoj/proofs`);
+    if (response.status === 204) {
+      return { proofs: [], counts: { total: 0, final: 0, subproof: 0 } };
+    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to get Proof Solver proofs');
+    return response.json();
+  },
+
+  async getProofLibrary(includeSubproofs = true) {
+    const response = await fetch(`${API_BASE}/leanoj/library?include_subproofs=${includeSubproofs}`);
+    if (response.status === 204) {
+      return { proofs: [], sessions: [] };
+    }
+    if (!response.ok) await throwFromResponse(response, 'Failed to get Proof Solver proof works library');
+    return response.json();
+  },
+
+  async getLibraryProof(sessionId, proofId) {
+    const response = await fetch(`${API_BASE}/leanoj/library/${encodeURIComponent(sessionId)}/${encodeURIComponent(proofId)}`);
+    if (!response.ok) throw new Error(`Failed to get Proof Solver proof work ${proofId}`);
+    return response.json();
+  },
+
+  async skipBrainstorm() {
+    const response = await fetch(`${API_BASE}/leanoj/skip-brainstorm`, { method: 'POST' });
+    if (!response.ok) {
+      const errorData = await response.json().catch(() => ({}));
+      throw new Error(errorData.detail || 'Failed to skip Proof Solver brainstorming');
+    }
+    return response.json();
+  },
+
+  async forceBrainstorm() {
+    const response = await fetch(`${API_BASE}/leanoj/force-brainstorm`, { method: 'POST' });
+    if (!response.ok) {
+      const errorData = await response.json().catch(() => ({}));
+      throw new Error(errorData.detail || 'Failed to force Proof Solver recursive brainstorming');
+    }
+    return response.json();
+  },
+};
+
 // Workflow API
 export const workflowAPI = {
   // Get workflow predictions
@@ -1131,11 +1294,12 @@ export const openRouterAPI = {
   // Get available OpenRouter models (uses stored key or provided key)
   async getModels(apiKey = null, freeOnly = false) {
     const params = new URLSearchParams();
-    if (apiKey) params.append('api_key', apiKey);
     if (freeOnly) params.append('free_only', 'true');
     
     const url = `${API_BASE}/openrouter/models${params.toString() ? '?' + params.toString() : ''}`;
-    const response = await fetch(url);
+    const response = await fetch(url, {
+      headers: apiKey ? { 'Authorization': `Bearer ${apiKey}` } : {}
+    });
     if (!response.ok) await throwFromResponse(response, 'Failed to fetch models');
     return response.json();
   },
diff --git a/frontend/src/services/websocket.js b/frontend/src/services/websocket.js
index 55d36c7..dea8d0a 100644
--- a/frontend/src/services/websocket.js
+++ b/frontend/src/services/websocket.js
@@ -1,6 +1,7 @@
 /**
  * WebSocket service for real-time updates
  */
+import { getDesktopApiToken } from '../utils/runtimeConfig';
 
 class WebSocketService {
   constructor() {
@@ -8,14 +9,38 @@ class WebSocketService {
     this.listeners = new Map();
     this.reconnectInterval = 3000;
     this.reconnectTimer = null;
+    this.connectAttempt = 0;
   }
 
-  connect() {
+  async connect() {
+    const attemptId = ++this.connectAttempt;
     const protocol = window.location.protocol === 'https:' ? 'wss:' : 'ws:';
     const wsPath = import.meta.env.VITE_MOTO_WS_PATH || '/ws';
-    const wsUrl = `${protocol}//${window.location.host}${wsPath}`;
+    const wsUrl = new URL(`${protocol}//${window.location.host}${wsPath}`);
+    const desktopApiToken = getDesktopApiToken();
+    if (desktopApiToken) {
+      try {
+        const response = await fetch('/api/ws-ticket', { method: 'POST' });
+        if (!response.ok) {
+          throw new Error(`WebSocket ticket request failed: ${response.status}`);
+        }
+        const payload = await response.json();
+        if (!payload.ticket) {
+          throw new Error('WebSocket ticket response did not include a ticket');
+        }
+        wsUrl.searchParams.set('ticket', payload.ticket);
+      } catch (error) {
+        console.error('Failed to create WebSocket ticket:', error);
+        this.scheduleReconnect();
+        return;
+      }
+    }
+
+    if (attemptId !== this.connectAttempt) {
+      return;
+    }
     
-    this.ws = new WebSocket(wsUrl);
+    this.ws = new WebSocket(wsUrl.toString());
     
     this.ws.onopen = () => {
       console.log('WebSocket connected');
@@ -82,6 +107,7 @@ class WebSocketService {
   }
 
   disconnect() {
+    this.connectAttempt += 1;
     if (this.reconnectTimer) {
       clearTimeout(this.reconnectTimer);
       this.reconnectTimer = null;
diff --git a/frontend/src/utils/activityStyles.js b/frontend/src/utils/activityStyles.js
new file mode 100644
index 0000000..bbb68da
--- /dev/null
+++ b/frontend/src/utils/activityStyles.js
@@ -0,0 +1,320 @@
+// Glyphs for activity events: each entry pairs one glyph with every event name
+// that displays it. Event names absent from this table get the '•' fallback.
+const ICON_GROUPS = [
+  ['✓', [
+    'brainstorm_submission_accepted',
+    'submission_accepted',
+    'compiler_acceptance',
+    'outline_locked',
+    'topic_exploration_complete',
+    'paper_title_exploration_complete',
+    'critique_phase_ended',
+    'reference_selection_complete',
+    'tier3_chapter_complete',
+    'tier3_short_form_complete',
+    'tier3_long_form_complete',
+    'proof_verified',
+    'known_proof_verified',
+    'proof_check_complete',
+    'leanoj_recursive_brainstorm_completed',
+    'leanoj_topic_validated',
+    'leanoj_model_call_completed',
+    'leanoj_brainstorm_accepted',
+    'leanoj_sufficiency_checked',
+    'leanoj_brainstorm_prune_applied',
+    'leanoj_brainstorm_proof_verified',
+    'leanoj_master_proof_edit_applied',
+    'leanoj_final_verified',
+  ]],
+  ['✗', [
+    'brainstorm_submission_rejected',
+    'submission_rejected',
+    'compiler_rejection',
+    'leanoj_brainstorm_rejected',
+    'leanoj_brainstorm_submitter_failed',
+    'leanoj_brainstorm_prune_rejected',
+    'leanoj_brainstorm_prune_apply_failed',
+    'leanoj_brainstorm_prune_error',
+    'leanoj_brainstorm_proof_failed',
+    'leanoj_brainstorm_proof_registration_failed',
+    'leanoj_model_call_failed',
+    'leanoj_master_proof_edit_rejected',
+    'leanoj_final_attempt_failed',
+    'leanoj_final_attempt_cycle_exhausted',
+    'leanoj_master_proof_stuck',
+    'leanoj_master_proof_progress_watchdog',
+    'leanoj_error',
+  ]],
+  ['»', [
+    'topic_selected',
+  ]],
+  ['⚠', [
+    'topic_selection_rejected',
+    'topic_exploration_rejected',
+    'tier3_rejection',
+    'proof_integrity_rejected',
+    'proof_attempt_failed',
+    'proof_attempts_exhausted',
+  ]],
+  ['◉', [
+    'topic_exploration_started',
+    'paper_title_exploration_started',
+  ]],
+  ['◈', [
+    'topic_exploration_progress',
+    'paper_title_exploration_progress',
+    'self_review_appended',
+  ]],
+  ['◎', [
+    'completion_review_started',
+    'critique_phase_started',
+    'brainstorm_continuation_started',
+    'leanoj_recursive_brainstorm_started',
+  ]],
+  ['□', [
+    'completion_review_result',
+    'phase_transition',
+    'leanoj_phase_changed',
+    'leanoj_path_decided',
+    'leanoj_path_validated',
+    'leanoj_role_json_retrying',
+    'leanoj_model_call_started',
+    'leanoj_brainstorm_submitters_started',
+    'leanoj_brainstorm_submission_queued',
+    'leanoj_brainstorm_batch_validation_started',
+    'leanoj_sufficiency_check_started',
+    'leanoj_brainstorm_phase_limit_reached',
+  ]],
+  ['▶', [
+    'manual_paper_writing_triggered',
+    'tier3_forced',
+    'leanoj_started',
+  ]],
+  ['⊘', [
+    'brainstorm_hard_limit_reached',
+    'brainstorm_paper_limit_reached',
+  ]],
+  ['▬', [
+    'paper_writing_started',
+    'paper_writing_resumed',
+    'tier3_format_selected',
+    'tier3_paper_started',
+  ]],
+  ['⊟', [
+    'critique_progress',
+    'paper_completed',
+    'tier3_result',
+  ]],
+  ['↷', [
+    'critique_phase_skipped',
+    'compiler_decline',
+    'leanoj_skip_brainstorm_requested',
+    'leanoj_brainstorm_skip_deferred',
+    'leanoj_brainstorm_skipped',
+    'leanoj_force_brainstorm_requested',
+    'leanoj_brainstorm_forced',
+  ]],
+  ['◇', [
+    'paper_redundancy_review',
+    'leanoj_brainstorm_prune_review_complete',
+  ]],
+  ['⊞', [
+    'brainstorm_continuation_decided',
+  ]],
+  ['▭', [
+    'reference_selection_started',
+    'tier3_volume_organized',
+    'leanoj_partial_proof_saved',
+  ]],
+  ['↻', [
+    'auto_research_resumed',
+    'tier3_phase_changed',
+    'proof_retry_started',
+  ]],
+  ['★', [
+    'tier3_started',
+  ]],
+  ['✎', [
+    'tier3_chapter_started',
+    'leanoj_master_proof_edit_started',
+    'leanoj_master_proof_edit_validation_started',
+  ]],
+  ['◆', [
+    'tier3_complete',
+    'final_answer_complete',
+    'novel_proof_discovered',
+  ]],
+  ['P', [
+    'proof_framing_decided',
+    'leanoj_master_proof_initialized',
+  ]],
+  ['◌', [
+    'proof_check_started',
+  ]],
+  ['↺', [
+    'proof_retry_scheduled',
+  ]],
+  ['#', [
+    'proof_check_candidates_found',
+  ]],
+  ['-', [
+    'proof_check_no_candidates',
+  ]],
+  ['S', [
+    'smt_check_started',
+  ]],
+  ['!', [
+    'smt_check_error',
+  ]],
+  ['Z', [
+    'smt_check_complete',
+  ]],
+  ['>', [
+    'proof_attempt_started',
+    'proof_lean_accepted',
+    'leanoj_final_attempt_started',
+  ]],
+  ['↗', [
+    'proof_dependency_added',
+  ]],
+  ['■', [
+    'leanoj_stopped',
+  ]],
+];
+
+// Flattened event-name -> glyph index, built once when the module is evaluated.
+const ICON_BY_EVENT = new Map(
+  ICON_GROUPS.flatMap(([glyph, names]) => names.map((name) => [name, glyph]))
+);
+
+/**
+ * Return the glyph displayed for an activity event.
+ * @param {string} [event=''] - Activity event name.
+ * @returns {string} The mapped glyph, or '•' when the event is not listed.
+ */
+export const getActivityIcon = (event = '') => ICON_BY_EVENT.get(event) ?? '•';
+
+// Exact-match event names per class; substring rules are applied in getActivityClass.
+const SUCCESS_EVENTS = new Set([
+  'compiler_acceptance',
+  'outline_locked',
+  'paper_completed',
+  'self_review_appended',
+  'topic_exploration_complete',
+  'paper_title_exploration_complete',
+  'tier3_chapter_complete',
+  'tier3_short_form_complete',
+  'tier3_long_form_complete',
+  'reference_selection_complete',
+  'proof_verified',
+  'proof_lean_accepted',
+  'novel_proof_discovered',
+  'known_proof_verified',
+  'proof_check_complete',
+  'smt_check_complete',
+  'leanoj_model_call_completed',
+  'leanoj_recursive_brainstorm_completed',
+  'leanoj_topic_validated',
+  'leanoj_brainstorm_prune_applied',
+  'leanoj_brainstorm_proof_verified',
+  'leanoj_master_proof_edit_applied',
+  'leanoj_final_verified',
+]);
+const REJECT_EVENTS = new Set([
+  'compiler_rejection',
+  'tier3_rejection',
+  'proof_attempt_failed',
+  'proof_attempts_exhausted',
+  'proof_integrity_rejected',
+  'smt_check_error',
+  'leanoj_brainstorm_rejected',
+  'leanoj_brainstorm_submitter_failed',
+  'leanoj_brainstorm_prune_rejected',
+  'leanoj_brainstorm_prune_apply_failed',
+  'leanoj_brainstorm_prune_error',
+  'leanoj_brainstorm_proof_failed',
+  'leanoj_brainstorm_proof_registration_failed',
+  'leanoj_model_call_failed',
+  'leanoj_master_proof_edit_rejected',
+  'leanoj_final_attempt_failed',
+  'leanoj_final_attempt_cycle_exhausted',
+  'leanoj_master_proof_stuck',
+  'leanoj_master_proof_progress_watchdog',
+  'leanoj_error',
+]);
+const INFO_EVENTS = new Set([
+  'manual_paper_writing_triggered',
+  'brainstorm_hard_limit_reached',
+  'tier3_forced',
+  'tier3_phase_changed',
+  'tier3_result',
+  'tier3_format_selected',
+  'tier3_volume_organized',
+  'topic_selected',
+  'reference_selection_started',
+  'compiler_decline',
+  'critique_phase_ended',
+  'critique_phase_skipped',
+  'brainstorm_continuation_decided',
+  'brainstorm_paper_limit_reached',
+  'proof_framing_decided',
+  'proof_retry_scheduled',
+  'proof_retry_started',
+  'proof_check_candidates_found',
+  'proof_check_no_candidates',
+  'proof_attempt_started',
+  'smt_check_started',
+  'leanoj_started',
+  'leanoj_stopped',
+  'leanoj_phase_changed',
+  'leanoj_model_call_started',
+  'leanoj_recursive_brainstorm_started',
+  'leanoj_brainstorm_submitters_started',
+  'leanoj_brainstorm_submission_queued',
+  'leanoj_brainstorm_batch_validation_started',
+  'leanoj_sufficiency_check_started',
+  'leanoj_brainstorm_phase_limit_reached',
+  'leanoj_role_json_retrying',
+  'leanoj_skip_brainstorm_requested',
+  'leanoj_brainstorm_skip_deferred',
+  'leanoj_brainstorm_skipped',
+  'leanoj_force_brainstorm_requested',
+  'leanoj_brainstorm_forced',
+  'leanoj_path_decided',
+  'leanoj_partial_proof_saved',
+  'leanoj_master_proof_initialized',
+  'leanoj_master_proof_edit_started',
+  'leanoj_brainstorm_prune_review_complete',
+  'leanoj_final_attempt_started',
+]);
+
+/**
+ * Return the style class name for an activity event.
+ * @param {string} [event=''] - Event name; null or other non-string values are treated as ''.
+ * @param {object} [item={}] - Entry whose `data` (or the entry itself) holds `validated` / `enough`.
+ * @returns {string} One of the 'activity-*' class names; 'activity-neutral' when nothing matches.
+ */
+export const getActivityClass = (event = '', item = {}) => {
+  const name = typeof event === 'string' ? event : ''; // .includes() below would throw on null/non-strings
+  const data = item?.data || item || {};
+
+  if (name === 'leanoj_path_validated') {
+    return data.validated === false ? 'activity-reject' : 'activity-success';
+  }
+  if (name === 'leanoj_sufficiency_checked') {
+    return data.enough ? 'activity-success' : 'activity-info';
+  }
+  if (name === 'tier3_complete' || name === 'final_answer_complete') {
+    return 'activity-tier3-complete';
+  }
+  if (name.includes('accepted') || SUCCESS_EVENTS.has(name)) {
+    return 'activity-success';
+  }
+  if (name.includes('rejected') || REJECT_EVENTS.has(name)) {
+    return 'activity-reject';
+  }
+  if (/review|started|resumed|progress|transition/.test(name) || INFO_EVENTS.has(name)) {
+    return 'activity-info';
+  }
+  return 'activity-neutral';
+};
diff --git a/frontend/src/utils/autonomousProfiles.js b/frontend/src/utils/autonomousProfiles.js
index 9ec3fd3..b24c196 100644
--- a/frontend/src/utils/autonomousProfiles.js
+++ b/frontend/src/utils/autonomousProfiles.js
@@ -1,4 +1,10 @@
 import { loadModelCache, getModelApiId } from './modelCache';
+import {
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+  DEFAULT_OPENROUTER_REASONING_EFFORT,
+  normalizeOpenRouterReasoningEffort,
+} from './openRouterSelection';
 
 export const AUTONOMOUS_SETTINGS_STORAGE_KEY = 'autonomous_research_settings';
 export const AUTONOMOUS_PROFILES_STORAGE_KEY = 'autonomous_research_profiles';
@@ -8,11 +14,9 @@ export const RECOMMENDED_PROFILE_KEY = 'recommended_slower_affordable_higher_kno
 export const RECOMMENDED_ALTERNATE_PROFILE_KEY = 'recommended_fast_affordable_mid';
 export const RECOMMENDED_LAB_FAST_PROFILE_KEY = 'recommended_lab_fast_costly_extra_high';
 export const RECOMMENDED_LAB_MAX_PROFILE_KEY = 'recommended_lab_slow_costly_max';
-export const RECOMMENDED_ENTRY_LAB_PROFILE_KEY = 'recommended_entry_lab_fast_less_affordable';
 export const RECOMMENDED_PROFILE_KEYS = [
-  RECOMMENDED_PROFILE_KEY,
   RECOMMENDED_ALTERNATE_PROFILE_KEY,
-  RECOMMENDED_ENTRY_LAB_PROFILE_KEY,
+  RECOMMENDED_PROFILE_KEY,
   RECOMMENDED_LAB_FAST_PROFILE_KEY,
   RECOMMENDED_LAB_MAX_PROFILE_KEY,
 ];
@@ -22,9 +26,11 @@ const DEFAULT_SUBMITTER_CONFIG = {
   provider: 'lm_studio',
   modelId: '',
   openrouterProvider: null,
+  openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
   lmStudioFallbackId: null,
-  contextWindow: 131072,
-  maxOutputTokens: 25000,
+  contextWindow: DEFAULT_CONTEXT_WINDOW,
+  maxOutputTokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  superchargeEnabled: false,
 };
 
 // NOTE: DEFAULT_OPENROUTER_SUBMITTER_CONFIGS and DEFAULT_LOCAL_CONFIG are derived
@@ -32,31 +38,48 @@ const DEFAULT_SUBMITTER_CONFIG = {
 // startup configuration and the selectable recommended profile stay in sync.
 // Update the recommended profile below to change what a fresh install runs with.
 
+const GEMINI_FLASH_LATEST_PROFILE_CONFIG = {
+  modelId: '~google/gemini-flash-latest',
+  provider: 'openrouter',
+  openrouterProvider: null,
+  lmStudioFallbackId: null,
+  contextWindow: 1048576,
+  maxOutputTokens: 65536,
+};
+
 const DEFAULT_LM_LOCAL_CONFIG = {
   validator_provider: 'lm_studio',
   validator_model: '',
   validator_openrouter_provider: null,
+  validator_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
   validator_lm_studio_fallback: null,
-  validator_context_window: 131072,
-  validator_max_tokens: 25000,
+  validator_context_window: DEFAULT_CONTEXT_WINDOW,
+  validator_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  validator_supercharge_enabled: false,
   high_context_provider: 'lm_studio',
   high_context_model: '',
   high_context_openrouter_provider: null,
+  high_context_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
   high_context_lm_studio_fallback: null,
-  high_context_context_window: 131072,
-  high_context_max_tokens: 25000,
+  high_context_context_window: DEFAULT_CONTEXT_WINDOW,
+  high_context_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  high_context_supercharge_enabled: false,
   high_param_provider: 'lm_studio',
   high_param_model: '',
   high_param_openrouter_provider: null,
+  high_param_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
   high_param_lm_studio_fallback: null,
-  high_param_context_window: 131072,
-  high_param_max_tokens: 25000,
+  high_param_context_window: DEFAULT_CONTEXT_WINDOW,
+  high_param_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  high_param_supercharge_enabled: false,
   critique_submitter_provider: 'lm_studio',
   critique_submitter_model: '',
   critique_submitter_openrouter_provider: null,
+  critique_submitter_openrouter_reasoning_effort: DEFAULT_OPENROUTER_REASONING_EFFORT,
   critique_submitter_lm_studio_fallback: null,
-  critique_submitter_context_window: 131072,
-  critique_submitter_max_tokens: 25000,
+  critique_submitter_context_window: DEFAULT_CONTEXT_WINDOW,
+  critique_submitter_max_tokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  critique_submitter_supercharge_enabled: false,
 };
 
 const createDefaultSubmitterConfigs = (modelId = '') => (
@@ -168,12 +191,7 @@ export const RECOMMENDED_PROFILES = {
       },
     ],
     validator: {
-      modelId: 'qwen/qwen3.5-flash-02-23',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 1048576,
-      maxOutputTokens: 65500,
+      ...GEMINI_FLASH_LATEST_PROFILE_CONFIG,
     },
     highContext: {
       modelId: 'moonshotai/kimi-k2.6',
@@ -200,68 +218,6 @@ export const RECOMMENDED_PROFILES = {
       maxOutputTokens: 65500,
     },
   },
-  [RECOMMENDED_ENTRY_LAB_PROFILE_KEY]: {
-    name: 'Fast, less affordable, higher knowledge',
-    numSubmitters: 3,
-    submitters: [
-      {
-        modelId: 'x-ai/grok-4.3',
-        provider: 'openrouter',
-        openrouterProvider: null,
-        lmStudioFallbackId: null,
-        contextWindow: 1000000,
-        maxOutputTokens: 128000,
-      },
-      {
-        modelId: 'moonshotai/kimi-k2.6',
-        provider: 'openrouter',
-        openrouterProvider: null,
-        lmStudioFallbackId: null,
-        contextWindow: 262000,
-        maxOutputTokens: 40000,
-      },
-      {
-        modelId: 'x-ai/grok-4.3',
-        provider: 'openrouter',
-        openrouterProvider: null,
-        lmStudioFallbackId: null,
-        contextWindow: 1000000,
-        maxOutputTokens: 128000,
-      },
-    ],
-    validator: {
-      modelId: 'x-ai/grok-4.1-fast',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 2000000,
-      maxOutputTokens: 30000,
-    },
-    highContext: {
-      modelId: 'x-ai/grok-4.3',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 1000000,
-      maxOutputTokens: 128000,
-    },
-    highParam: {
-      modelId: 'x-ai/grok-4.3',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 1000000,
-      maxOutputTokens: 128000,
-    },
-    critique: {
-      modelId: 'google/gemini-3.1-pro-preview',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 1048576,
-      maxOutputTokens: 65500,
-    },
-  },
   [RECOMMENDED_LAB_FAST_PROFILE_KEY]: {
     name: 'Lab grade, fast, costly (starts at ~$10 per hour), extra-high knowledge',
     numSubmitters: 3,
@@ -292,12 +248,7 @@ export const RECOMMENDED_PROFILES = {
       },
     ],
     validator: {
-      modelId: 'x-ai/grok-4.1-fast',
-      provider: 'openrouter',
-      openrouterProvider: null,
-      lmStudioFallbackId: null,
-      contextWindow: 2000000,
-      maxOutputTokens: 30000,
+      ...GEMINI_FLASH_LATEST_PROFILE_CONFIG,
     },
     highContext: {
       modelId: 'openai/gpt-5.5',
@@ -420,27 +371,35 @@ const DEFAULT_LOCAL_CONFIG = {
   validator_provider: DEFAULT_RECOMMENDED_PROFILE.validator.provider || 'openrouter',
   validator_model: DEFAULT_RECOMMENDED_PROFILE.validator.modelId || '',
   validator_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.validator.openrouterProvider || null,
+  validator_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(DEFAULT_RECOMMENDED_PROFILE.validator.openrouterReasoningEffort),
   validator_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.validator.lmStudioFallbackId || null,
   validator_context_window: DEFAULT_RECOMMENDED_PROFILE.validator.contextWindow,
   validator_max_tokens: DEFAULT_RECOMMENDED_PROFILE.validator.maxOutputTokens,
+  validator_supercharge_enabled: Boolean(DEFAULT_RECOMMENDED_PROFILE.validator.superchargeEnabled),
   high_context_provider: DEFAULT_RECOMMENDED_PROFILE.highContext.provider || 'openrouter',
   high_context_model: DEFAULT_RECOMMENDED_PROFILE.highContext.modelId || '',
   high_context_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.highContext.openrouterProvider || null,
+  high_context_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(DEFAULT_RECOMMENDED_PROFILE.highContext.openrouterReasoningEffort),
   high_context_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.highContext.lmStudioFallbackId || null,
   high_context_context_window: DEFAULT_RECOMMENDED_PROFILE.highContext.contextWindow,
   high_context_max_tokens: DEFAULT_RECOMMENDED_PROFILE.highContext.maxOutputTokens,
+  high_context_supercharge_enabled: Boolean(DEFAULT_RECOMMENDED_PROFILE.highContext.superchargeEnabled),
   high_param_provider: DEFAULT_RECOMMENDED_PROFILE.highParam.provider || 'openrouter',
   high_param_model: DEFAULT_RECOMMENDED_PROFILE.highParam.modelId || '',
   high_param_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.highParam.openrouterProvider || null,
+  high_param_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(DEFAULT_RECOMMENDED_PROFILE.highParam.openrouterReasoningEffort),
   high_param_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.highParam.lmStudioFallbackId || null,
   high_param_context_window: DEFAULT_RECOMMENDED_PROFILE.highParam.contextWindow,
   high_param_max_tokens: DEFAULT_RECOMMENDED_PROFILE.highParam.maxOutputTokens,
+  high_param_supercharge_enabled: Boolean(DEFAULT_RECOMMENDED_PROFILE.highParam.superchargeEnabled),
   critique_submitter_provider: DEFAULT_RECOMMENDED_PROFILE.critique.provider || 'openrouter',
   critique_submitter_model: DEFAULT_RECOMMENDED_PROFILE.critique.modelId || '',
   critique_submitter_openrouter_provider: DEFAULT_RECOMMENDED_PROFILE.critique.openrouterProvider || null,
+  critique_submitter_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(DEFAULT_RECOMMENDED_PROFILE.critique.openrouterReasoningEffort),
   critique_submitter_lm_studio_fallback: DEFAULT_RECOMMENDED_PROFILE.critique.lmStudioFallbackId || null,
   critique_submitter_context_window: DEFAULT_RECOMMENDED_PROFILE.critique.contextWindow,
   critique_submitter_max_tokens: DEFAULT_RECOMMENDED_PROFILE.critique.maxOutputTokens,
+  critique_submitter_supercharge_enabled: Boolean(DEFAULT_RECOMMENDED_PROFILE.critique.superchargeEnabled),
 };
 
 const DEFAULT_AUTONOMOUS_SETTINGS = {
@@ -461,6 +420,7 @@ function normalizeStoredSettings(settings = {}) {
         ...DEFAULT_SUBMITTER_CONFIG,
         ...cfg,
         submitterId: cfg.submitterId || index + 1,
+        openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(cfg.openrouterReasoningEffort),
       }))
     : DEFAULT_AUTONOMOUS_SETTINGS.submitterConfigs;
 
@@ -472,6 +432,10 @@ function normalizeStoredSettings(settings = {}) {
     localConfig: {
       ...DEFAULT_LOCAL_CONFIG,
       ...(settings.localConfig || {}),
+      validator_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(settings.localConfig?.validator_openrouter_reasoning_effort),
+      high_context_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(settings.localConfig?.high_context_openrouter_reasoning_effort),
+      high_param_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(settings.localConfig?.high_param_openrouter_reasoning_effort),
+      critique_submitter_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(settings.localConfig?.critique_submitter_openrouter_reasoning_effort),
     },
     freeOnly: settings.freeOnly ?? DEFAULT_AUTONOMOUS_SETTINGS.freeOnly,
     freeModelLooping: settings.freeModelLooping ?? DEFAULT_AUTONOMOUS_SETTINGS.freeModelLooping,
@@ -507,31 +471,43 @@ export function settingsToAutonomousConfig(settings) {
   const localConfig = normalized.localConfig || {};
 
   return {
-    submitter_configs: normalized.submitterConfigs.slice(0, normalized.numSubmitters),
+    submitter_configs: normalized.submitterConfigs.slice(0, normalized.numSubmitters).map(cfg => ({
+      ...cfg,
+      openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(cfg.openrouterReasoningEffort),
+      supercharge_enabled: Boolean(cfg.superchargeEnabled),
+    })),
     validator_provider: localConfig.validator_provider,
     validator_model: localConfig.validator_model,
     validator_openrouter_provider: localConfig.validator_openrouter_provider,
+    validator_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(localConfig.validator_openrouter_reasoning_effort),
     validator_lm_studio_fallback: localConfig.validator_lm_studio_fallback,
     validator_context_window: localConfig.validator_context_window,
     validator_max_tokens: localConfig.validator_max_tokens,
+    validator_supercharge_enabled: Boolean(localConfig.validator_supercharge_enabled),
     high_context_provider: localConfig.high_context_provider,
     high_context_model: localConfig.high_context_model,
     high_context_openrouter_provider: localConfig.high_context_openrouter_provider,
+    high_context_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(localConfig.high_context_openrouter_reasoning_effort),
     high_context_lm_studio_fallback: localConfig.high_context_lm_studio_fallback,
     high_context_context_window: localConfig.high_context_context_window,
     high_context_max_tokens: localConfig.high_context_max_tokens,
+    high_context_supercharge_enabled: Boolean(localConfig.high_context_supercharge_enabled),
     high_param_provider: localConfig.high_param_provider,
     high_param_model: localConfig.high_param_model,
     high_param_openrouter_provider: localConfig.high_param_openrouter_provider,
+    high_param_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(localConfig.high_param_openrouter_reasoning_effort),
     high_param_lm_studio_fallback: localConfig.high_param_lm_studio_fallback,
     high_param_context_window: localConfig.high_param_context_window,
     high_param_max_tokens: localConfig.high_param_max_tokens,
+    high_param_supercharge_enabled: Boolean(localConfig.high_param_supercharge_enabled),
     critique_submitter_provider: localConfig.critique_submitter_provider,
     critique_submitter_model: localConfig.critique_submitter_model,
     critique_submitter_openrouter_provider: localConfig.critique_submitter_openrouter_provider,
+    critique_submitter_openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(localConfig.critique_submitter_openrouter_reasoning_effort),
     critique_submitter_lm_studio_fallback: localConfig.critique_submitter_lm_studio_fallback,
     critique_submitter_context_window: localConfig.critique_submitter_context_window,
     critique_submitter_max_tokens: localConfig.critique_submitter_max_tokens,
+    critique_submitter_supercharge_enabled: Boolean(localConfig.critique_submitter_supercharge_enabled),
     tier3_enabled: normalized.tier3Enabled ?? false,
   };
 }
@@ -589,9 +565,11 @@ export async function applyAutonomousProfileSelection(profileKey, userProfiles =
       ? convertToApiId(submitterProfile.modelId || '')
       : (submitterProfile.modelId || ''),
     openrouterProvider: submitterProfile.openrouterProvider || null,
+    openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(submitterProfile.openrouterReasoningEffort),
     lmStudioFallbackId: isRecommended ? null : (submitterProfile.lmStudioFallbackId || null),
     contextWindow: submitterProfile.contextWindow,
     maxOutputTokens: submitterProfile.maxOutputTokens,
+    superchargeEnabled: Boolean(submitterProfile.superchargeEnabled),
   }));
 
   const getModelId = (roleProfile = {}) => (
@@ -601,6 +579,7 @@ export async function applyAutonomousProfileSelection(profileKey, userProfiles =
   );
 
   const getOpenRouterProvider = (roleProfile = {}) => roleProfile.openrouterProvider || null;
+  const getOpenRouterReasoningEffort = (roleProfile = {}) => normalizeOpenRouterReasoningEffort(roleProfile.openrouterReasoningEffort);
 
   const currentSettings = getStoredAutonomousSettings();
   const nextSettings = persistAutonomousSettings({
@@ -612,27 +591,35 @@ export async function applyAutonomousProfileSelection(profileKey, userProfiles =
       validator_provider: isRecommended ? 'openrouter' : (profile.validator.provider || 'openrouter'),
       validator_model: getModelId(profile.validator),
       validator_openrouter_provider: getOpenRouterProvider(profile.validator),
+      validator_openrouter_reasoning_effort: getOpenRouterReasoningEffort(profile.validator),
       validator_lm_studio_fallback: isRecommended ? null : (profile.validator.lmStudioFallbackId || null),
       validator_context_window: profile.validator.contextWindow,
       validator_max_tokens: profile.validator.maxOutputTokens,
+      validator_supercharge_enabled: Boolean(profile.validator.superchargeEnabled),
       high_context_provider: isRecommended ? 'openrouter' : (profile.highContext.provider || 'openrouter'),
       high_context_model: getModelId(profile.highContext),
       high_context_openrouter_provider: getOpenRouterProvider(profile.highContext),
+      high_context_openrouter_reasoning_effort: getOpenRouterReasoningEffort(profile.highContext),
       high_context_lm_studio_fallback: isRecommended ? null : (profile.highContext.lmStudioFallbackId || null),
       high_context_context_window: profile.highContext.contextWindow,
       high_context_max_tokens: profile.highContext.maxOutputTokens,
+      high_context_supercharge_enabled: Boolean(profile.highContext.superchargeEnabled),
       high_param_provider: isRecommended ? 'openrouter' : (profile.highParam.provider || 'openrouter'),
       high_param_model: getModelId(profile.highParam),
       high_param_openrouter_provider: getOpenRouterProvider(profile.highParam),
+      high_param_openrouter_reasoning_effort: getOpenRouterReasoningEffort(profile.highParam),
       high_param_lm_studio_fallback: isRecommended ? null : (profile.highParam.lmStudioFallbackId || null),
       high_param_context_window: profile.highParam.contextWindow,
       high_param_max_tokens: profile.highParam.maxOutputTokens,
+      high_param_supercharge_enabled: Boolean(profile.highParam.superchargeEnabled),
       critique_submitter_provider: isRecommended ? 'openrouter' : (profile.critique.provider || 'openrouter'),
       critique_submitter_model: getModelId(profile.critique),
       critique_submitter_openrouter_provider: getOpenRouterProvider(profile.critique),
+      critique_submitter_openrouter_reasoning_effort: getOpenRouterReasoningEffort(profile.critique),
       critique_submitter_lm_studio_fallback: isRecommended ? null : (profile.critique.lmStudioFallbackId || null),
       critique_submitter_context_window: profile.critique.contextWindow,
       critique_submitter_max_tokens: profile.critique.maxOutputTokens,
+      critique_submitter_supercharge_enabled: Boolean(profile.critique.superchargeEnabled),
     },
     selectedProfile: profileKey,
   });
diff --git a/frontend/src/utils/downloadHelpers.js b/frontend/src/utils/downloadHelpers.js
index f630269..be5db46 100644
--- a/frontend/src/utils/downloadHelpers.js
+++ b/frontend/src/utils/downloadHelpers.js
@@ -31,11 +31,15 @@ export const downloadRawText = (content, filename, outline = null, disclaimerTyp
 
   fullContent += body;
 
-  const blob = new Blob([fullContent], { type: 'text/plain' });
+  downloadTextFile(fullContent, `${filename}.txt`);
+};
+
+export const downloadTextFile = (content, filename, mimeType = 'text/plain') => {
+  const blob = new Blob([content], { type: mimeType });
   const url = URL.createObjectURL(blob);
   const link = document.createElement('a');
   link.href = url;
-  link.download = `${filename}.txt`;
+  link.download = filename;
   document.body.appendChild(link);
   link.click();
   document.body.removeChild(link);
diff --git a/frontend/src/utils/leanojProfiles.js b/frontend/src/utils/leanojProfiles.js
new file mode 100644
index 0000000..4165b78
--- /dev/null
+++ b/frontend/src/utils/leanojProfiles.js
@@ -0,0 +1,278 @@
+import { loadModelCache, getModelApiId } from './modelCache';
+import {
+  DEFAULT_CONTEXT_WINDOW,
+  DEFAULT_MAX_OUTPUT_TOKENS,
+  DEFAULT_OPENROUTER_REASONING_EFFORT,
+  normalizeOpenRouterReasoningEffort,
+} from './openRouterSelection';
+
+export const LEANOJ_SETTINGS_STORAGE_KEY = 'leanoj_solver_settings';
+export const LEANOJ_PROFILES_STORAGE_KEY = 'leanoj_solver_profiles';
+export const LEANOJ_RECOMMENDED_PROFILE_KEY = 'leanoj_recommended_balanced_proof';
+export const LEANOJ_LAB_GRADE_PROFILE_KEY = 'leanoj_recommended_lab_grade_solver';
+
+export const LEANOJ_ROLE_KEYS = [
+  'topic_generator',
+  'topic_validator',
+  'brainstorm_validator',
+  'final_solver',
+];
+
+const GEMINI_FLASH_LATEST_MODEL = '~google/gemini-flash-latest';
+const GEMINI_FLASH_LATEST_CONTEXT_WINDOW = 1048576;
+const GEMINI_FLASH_LATEST_MAX_OUTPUT_TOKENS = 65536;
+
+const DEFAULT_ROLE_CONFIG = {
+  provider: 'lm_studio',
+  modelId: '',
+  openrouterProvider: null,
+  openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
+  lmStudioFallbackId: null,
+  contextWindow: DEFAULT_CONTEXT_WINDOW,
+  maxOutputTokens: DEFAULT_MAX_OUTPUT_TOKENS,
+  superchargeEnabled: false,
+};
+
+const DEFAULT_SUBMITTER_CONFIG = {
+  submitterId: 1,
+  ...DEFAULT_ROLE_CONFIG,
+};
+
+const role = (modelId, contextWindow = 262000, maxOutputTokens = 40000) => ({
+  provider: 'openrouter',
+  modelId,
+  openrouterProvider: null,
+  openrouterReasoningEffort: DEFAULT_OPENROUTER_REASONING_EFFORT,
+  lmStudioFallbackId: null,
+  contextWindow,
+  maxOutputTokens,
+});
+
+const geminiFlashLatestRole = () => role(
+  GEMINI_FLASH_LATEST_MODEL,
+  GEMINI_FLASH_LATEST_CONTEXT_WINDOW,
+  GEMINI_FLASH_LATEST_MAX_OUTPUT_TOKENS
+);
+
+export const LEANOJ_RECOMMENDED_PROFILES = {
+  [LEANOJ_RECOMMENDED_PROFILE_KEY]: {
+    name: 'Balanced Proof Solver',
+    numSubmitters: 3,
+    submitters: [
+      role('moonshotai/kimi-k2.6'),
+      role('deepseek/deepseek-v4-pro', 1048576, 65500),
+      role('google/gemini-3.1-pro-preview', 1048576, 65500),
+    ],
+    roles: {
+      topic_generator: role('moonshotai/kimi-k2.6'),
+      topic_validator: geminiFlashLatestRole(),
+      brainstorm_validator: geminiFlashLatestRole(),
+      final_solver: role('google/gemini-3.1-pro-preview', 1048576, 65500),
+    },
+  },
+  [LEANOJ_LAB_GRADE_PROFILE_KEY]: {
+    name: 'Lab Grade Solver',
+    numSubmitters: 3,
+    submitters: [
+      role('openai/gpt-5.5'),
+      role('deepseek/deepseek-v4-pro', 1048576, 65500),
+      role('anthropic/claude-opus-4.7', 1048576, 65500),
+    ],
+    roles: {
+      topic_generator: role('openai/gpt-5.5'),
+      topic_validator: geminiFlashLatestRole(),
+      brainstorm_validator: geminiFlashLatestRole(),
+      final_solver: role('anthropic/claude-opus-4.7', 1048576, 65500),
+    },
+  },
+};
+
+const DEFAULT_PROFILE = LEANOJ_RECOMMENDED_PROFILES[LEANOJ_RECOMMENDED_PROFILE_KEY];
+
+const createDefaultSubmitters = (modelId = '') => (
+  [1, 2, 3].map((submitterId) => ({
+    ...DEFAULT_SUBMITTER_CONFIG,
+    submitterId,
+    modelId,
+  }))
+);
+
+const createDefaultRoles = (modelId = '') => (
+  LEANOJ_ROLE_KEYS.reduce((acc, roleKey) => {
+    acc[roleKey] = {
+      ...DEFAULT_ROLE_CONFIG,
+      modelId,
+    };
+    return acc;
+  }, {})
+);
+
+const profileSubmitters = DEFAULT_PROFILE.submitters.map((submitter, index) => ({
+  ...DEFAULT_SUBMITTER_CONFIG,
+  ...submitter,
+  submitterId: index + 1,
+}));
+
+const DEFAULT_SETTINGS = {
+  prompt: '',
+  leanTemplate: '',
+  numSubmitters: DEFAULT_PROFILE.numSubmitters,
+  submitterConfigs: profileSubmitters,
+  roles: DEFAULT_PROFILE.roles,
+  maxInitialBrainstormAccepts: 30,
+  maxRecursiveBrainstormAccepts: 10,
+  finalAttemptsPerCycle: 30,
+  freeOnly: false,
+  freeModelLooping: true,
+  freeModelAutoSelector: true,
+  modelProviders: {},
+  selectedProfile: LEANOJ_RECOMMENDED_PROFILE_KEY,
+};
+
+function normalizeRoleConfig(config = {}) {
+  return {
+    ...DEFAULT_ROLE_CONFIG,
+    ...config,
+    openrouterProvider: config.openrouterProvider || null,
+    openrouterReasoningEffort: normalizeOpenRouterReasoningEffort(config.openrouterReasoningEffort),
+    lmStudioFallbackId: config.lmStudioFallbackId || null,
+  };
+}
+
+function normalizeSubmitterConfig(config = {}, index = 0) {
+  return {
+    ...DEFAULT_SUBMITTER_CONFIG,
+    ...normalizeRoleConfig(config),
+    submitterId: config.submitterId || index + 1,
+  };
+}
+
+// Merge stored/partial Proof Solver settings over DEFAULT_SETTINGS and normalize every submitter and role config.
+export function normalizeLeanOJSettings(settings = {}) {
+  const submitterConfigs = Array.isArray(settings.submitterConfigs) && settings.submitterConfigs.length > 0
+    ? settings.submitterConfigs.map(normalizeSubmitterConfig)
+    : DEFAULT_SETTINGS.submitterConfigs;
+  const roles = LEANOJ_ROLE_KEYS.reduce((acc, roleKey) => {
+    acc[roleKey] = normalizeRoleConfig((settings.roles || {})[roleKey] || DEFAULT_SETTINGS.roles[roleKey]);
+    return acc;
+  }, {});
+
+  return {
+    ...DEFAULT_SETTINGS,
+    ...settings,
+    numSubmitters: settings.numSubmitters || submitterConfigs.length || DEFAULT_SETTINGS.numSubmitters,
+    submitterConfigs,
+    roles,
+    maxInitialBrainstormAccepts: settings.maxInitialBrainstormAccepts ?? DEFAULT_SETTINGS.maxInitialBrainstormAccepts,
+    maxRecursiveBrainstormAccepts: settings.maxRecursiveBrainstormAccepts ?? DEFAULT_SETTINGS.maxRecursiveBrainstormAccepts,
+    finalAttemptsPerCycle: Math.max(30, Number(settings.finalAttemptsPerCycle) || DEFAULT_SETTINGS.finalAttemptsPerCycle), // `||` keeps NaN out of Math.max
+    modelProviders: settings.modelProviders || DEFAULT_SETTINGS.modelProviders,
+    selectedProfile: settings.selectedProfile ?? DEFAULT_SETTINGS.selectedProfile,
+  };
+}
+
+export function getStoredLeanOJSettings() {
+  try {
+    const raw = localStorage.getItem(LEANOJ_SETTINGS_STORAGE_KEY);
+    if (!raw) return normalizeLeanOJSettings();
+    return normalizeLeanOJSettings(JSON.parse(raw));
+  } catch (error) {
+    console.error('Failed to load Proof Solver settings:', error);
+    return normalizeLeanOJSettings();
+  }
+}
+
+export function persistLeanOJSettings(settings) {
+  const normalized = normalizeLeanOJSettings(settings);
+  localStorage.setItem(LEANOJ_SETTINGS_STORAGE_KEY, JSON.stringify(normalized));
+  return normalized;
+}
+
+const roleToApi = (config = {}) => ({
+  provider: config.provider || 'lm_studio',
+  model_id: config.modelId || '',
+  openrouter_provider: config.openrouterProvider || null,
+  openrouter_reasoning_effort: normalizeOpenRouterReasoningEffort(config.openrouterReasoningEffort),
+  lm_studio_fallback_id: config.lmStudioFallbackId || null,
+  context_window: Number(config.contextWindow || DEFAULT_CONTEXT_WINDOW),
+  max_output_tokens: Number(config.maxOutputTokens || DEFAULT_MAX_OUTPUT_TOKENS),
+  supercharge_enabled: Boolean(config.superchargeEnabled),
+});
+
+export function settingsToLeanOJRequest(settings, prompt, leanTemplate) {
+  const normalized = normalizeLeanOJSettings(settings);
+  const roles = normalized.roles;
+  const topicGenerator = normalized.submitterConfigs[0] || roles.topic_generator; // first submitter config wins; roles.topic_generator is only a fallback
+  return {
+    user_prompt: prompt ?? normalized.prompt ?? '',
+    lean_template: leanTemplate ?? normalized.leanTemplate ?? '',
+    topic_generator: roleToApi(topicGenerator),
+    topic_validator: roleToApi(roles.topic_validator),
+    brainstorm_submitters: normalized.submitterConfigs.map(roleToApi),
+    brainstorm_validator: roleToApi(roles.brainstorm_validator),
+    path_decider: roleToApi(roles.final_solver), // path decider is sent the final solver's config
+    final_solver: roleToApi(roles.final_solver),
+    max_initial_brainstorm_accepts: Number(normalized.maxInitialBrainstormAccepts || 30),
+    max_recursive_brainstorm_accepts: Number(normalized.maxRecursiveBrainstormAccepts || 10),
+    final_attempts_per_cycle: Number(normalized.finalAttemptsPerCycle || 30),
+  };
+}
+
+export function applyLeanOJLmStudioDefaults(modelId = '') {
+  const current = getStoredLeanOJSettings();
+  const next = persistLeanOJSettings({
+    ...current,
+    numSubmitters: 3,
+    submitterConfigs: createDefaultSubmitters(modelId),
+    roles: createDefaultRoles(modelId),
+    selectedProfile: '',
+  });
+  return next;
+}
+
+export async function applyLeanOJProfileSelection(profileKey, userProfiles = {}) {
+  const isRecommended = profileKey.startsWith('leanoj_recommended_');
+  const profile = isRecommended
+    ? LEANOJ_RECOMMENDED_PROFILES[profileKey]
+    : userProfiles[profileKey];
+  if (!profile) {
+    throw new Error(`Proof Solver profile not found: ${profileKey}`);
+  }
+
+  await loadModelCache();
+  const toModelId = (modelId = '') => (
+    isRecommended ? (getModelApiId(modelId) || modelId) : modelId
+  );
+  const convertRole = (config = {}) => ({
+    ...normalizeRoleConfig(config),
+    provider: isRecommended ? 'openrouter' : (config.provider || 'openrouter'),
+    modelId: toModelId(config.modelId || ''),
+    lmStudioFallbackId: isRecommended ? null : (config.lmStudioFallbackId || null),
+  });
+
+  const current = getStoredLeanOJSettings();
+  const roles = LEANOJ_ROLE_KEYS.reduce((acc, roleKey) => {
+    acc[roleKey] = convertRole((profile.roles || {})[roleKey]);
+    return acc;
+  }, {});
+  const submitterConfigs = (profile.submitters || []).map((submitter, index) => ({
+    ...convertRole(submitter),
+    submitterId: index + 1,
+  }));
+
+  const nextSettings = persistLeanOJSettings({
+    ...current,
+    numSubmitters: profile.numSubmitters || submitterConfigs.length,
+    submitterConfigs,
+    roles,
+    maxInitialBrainstormAccepts: profile.maxInitialBrainstormAccepts ?? current.maxInitialBrainstormAccepts,
+    maxRecursiveBrainstormAccepts: profile.maxRecursiveBrainstormAccepts ?? current.maxRecursiveBrainstormAccepts,
+    finalAttemptsPerCycle: profile.finalAttemptsPerCycle ?? current.finalAttemptsPerCycle,
+    selectedProfile: profileKey,
+  });
+
+  return {
+    profile,
+    settings: nextSettings,
+  };
+}
diff --git a/frontend/src/utils/openRouterSelection.js b/frontend/src/utils/openRouterSelection.js
index 4d08e33..98d82c6 100644
--- a/frontend/src/utils/openRouterSelection.js
+++ b/frontend/src/utils/openRouterSelection.js
@@ -1,8 +1,20 @@
-const DEFAULT_CONTEXT_WINDOW = 131072;
-const CONTEXT_BUFFER_TOKENS = 500;
-const KNOWN_NO_OUTPUT_CAP_DEFAULTS = {
-  'x-ai/grok-4.3': 128000,
-};
+export const DEFAULT_CONTEXT_WINDOW = 131072;
+export const DEFAULT_MAX_OUTPUT_TOKENS = 25000;
+export const DEFAULT_OPENROUTER_REASONING_EFFORT = 'auto';
+export const OPENROUTER_REASONING_EFFORT_OPTIONS = [
+  { value: 'auto', label: 'Auto (max supported)' },
+  { value: 'xhigh', label: 'xhigh (maximum)' },
+  { value: 'high', label: 'high' },
+  { value: 'medium', label: 'medium' },
+  { value: 'low', label: 'low' },
+  { value: 'minimal', label: 'minimal' },
+  { value: 'none', label: 'none / disabled' },
+];
+const AUTO_ENDPOINT_OUTLIER_RATIO = 0.75;
+const AUTO_MIN_CAPABLE_OUTPUT_TOKENS = 32768;
+const KNOWN_WEAK_AUTO_PROVIDERS = new Set([
+  'venice',
+]);
 
 function toPositiveInteger(value) {
   const parsed = Number(value);
@@ -12,9 +24,138 @@ function toPositiveInteger(value) {
   return Math.floor(parsed);
 }
 
-function getKnownNoOutputCapDefault(model) {
-  const modelId = typeof model?.id === 'string' ? model.id.toLowerCase() : '';
-  return KNOWN_NO_OUTPUT_CAP_DEFAULTS[modelId] || null;
+function getModelContext(model) {
+  return (
+    toPositiveInteger(model?.context_length) ||
+    toPositiveInteger(model?.top_provider?.context_length)
+  );
+}
+
+function normalizeProviderName(providerName) {
+  return typeof providerName === 'string' ? providerName.trim().toLowerCase() : '';
+}
+
+function getEndpointProviderName(endpoint) {
+  return (
+    endpoint?.provider_name ||
+    endpoint?.provider ||
+    endpoint?.name ||
+    endpoint?.id ||
+    ''
+  );
+}
+
+function uniqueSorted(values) {
+  return Array.from(new Set(values.filter(Boolean))).sort((a, b) => a.localeCompare(b));
+}
+
+function median(values) {
+  const sorted = values
+    .filter((value) => Number.isFinite(value))
+    .slice()
+    .sort((a, b) => a - b);
+  if (sorted.length === 0) {
+    return null;
+  }
+  const midpoint = Math.floor(sorted.length / 2);
+  if (sorted.length % 2 === 1) {
+    return sorted[midpoint];
+  }
+  return Math.floor((sorted[midpoint - 1] + sorted[midpoint]) / 2);
+}
+
+function buildEndpointMetric(endpoint) {
+  return {
+    endpoint,
+    providerName: getEndpointProviderName(endpoint),
+    normalizedProviderName: normalizeProviderName(getEndpointProviderName(endpoint)),
+    contextLength: toPositiveInteger(endpoint?.context_length),
+    outputCap: toPositiveInteger(endpoint?.max_completion_tokens),
+    promptCap: toPositiveInteger(endpoint?.max_prompt_tokens),
+  };
+}
+
+function selectAutoEndpointSet(endpoints, modelContext = null) {
+  if (!Array.isArray(endpoints) || endpoints.length <= 1) {
+    return {
+      endpoints: endpoints || [],
+      ignoredEndpoints: [],
+      recommendedProvider: null,
+      capableProviderNames: uniqueSorted((endpoints || []).map(getEndpointProviderName)),
+      ignoredProviderNames: [],
+      providerSelectionRecommended: false,
+    };
+  }
+
+  const metrics = endpoints.map(buildEndpointMetric);
+  const outputCaps = metrics.map((metric) => metric.outputCap).filter((value) => value !== null);
+  const contextLengths = metrics.map((metric) => metric.contextLength).filter((value) => value !== null);
+  const medianOutputCap = median(outputCaps);
+  const outputThreshold = medianOutputCap && medianOutputCap >= AUTO_MIN_CAPABLE_OUTPUT_TOKENS
+    ? Math.max(AUTO_MIN_CAPABLE_OUTPUT_TOKENS, Math.floor(medianOutputCap * AUTO_ENDPOINT_OUTLIER_RATIO))
+    : null;
+  const contextThresholdFromModel = modelContext && modelContext >= DEFAULT_CONTEXT_WINDOW * 2
+    ? Math.floor(modelContext * AUTO_ENDPOINT_OUTLIER_RATIO)
+    : null;
+  const hasEndpointNearModelContext = contextThresholdFromModel !== null && metrics.some(
+    (metric) => metric.contextLength !== null && metric.contextLength >= contextThresholdFromModel
+  );
+  const contextThreshold = hasEndpointNearModelContext ? contextThresholdFromModel : null;
+
+  const annotatedMetrics = metrics.map((metric) => {
+    const reasons = [];
+    if (KNOWN_WEAK_AUTO_PROVIDERS.has(metric.normalizedProviderName)) {
+      reasons.push('known weak auto-routing host');
+    }
+    if (outputThreshold !== null && metric.outputCap === null && outputCaps.length > 0) {
+      reasons.push('missing max_completion_tokens while other endpoints expose output caps');
+    }
+    if (outputThreshold !== null && metric.outputCap !== null && metric.outputCap < outputThreshold) {
+      reasons.push(`max_completion_tokens=${metric.outputCap} below capable threshold ${outputThreshold}`);
+    }
+    if (contextThreshold !== null && metric.contextLength !== null && metric.contextLength < contextThreshold) {
+      reasons.push(`context_length=${metric.contextLength} below capable threshold ${contextThreshold}`);
+    }
+    if (contextThreshold !== null && metric.contextLength === null && contextLengths.length > 0) {
+      reasons.push('missing context_length while other endpoints match model context');
+    }
+    return { ...metric, reasons };
+  });
+
+  const capableMetrics = annotatedMetrics.filter((metric) => metric.reasons.length === 0);
+  if (capableMetrics.length === 0) {
+    return {
+      endpoints,
+      ignoredEndpoints: [],
+      recommendedProvider: null,
+      capableProviderNames: uniqueSorted(metrics.map((metric) => metric.providerName)),
+      ignoredProviderNames: [],
+      providerSelectionRecommended: false,
+    };
+  }
+
+  const ignoredMetrics = annotatedMetrics.filter((metric) => metric.reasons.length > 0);
+  if (ignoredMetrics.length === 0) {
+    return {
+      endpoints,
+      ignoredEndpoints: [],
+      recommendedProvider: null,
+      capableProviderNames: uniqueSorted(capableMetrics.map((metric) => metric.providerName)),
+      ignoredProviderNames: [],
+      providerSelectionRecommended: false,
+    };
+  }
+
+  const capableProviderNames = uniqueSorted(capableMetrics.map((metric) => metric.providerName));
+
+  return {
+    endpoints: capableMetrics.map((metric) => metric.endpoint),
+    ignoredEndpoints: ignoredMetrics,
+    recommendedProvider: null,
+    capableProviderNames,
+    ignoredProviderNames: uniqueSorted(ignoredMetrics.map((metric) => metric.providerName)),
+    providerSelectionRecommended: false,
+  };
 }
 
 export function findOpenRouterModel(models, modelId) {
@@ -57,14 +198,46 @@ export function getProviderNames(providerData) {
   return normalizeProviderData(providerData).providers;
 }
 
+export function normalizeOpenRouterReasoningEffort(value) {
+  const normalized = typeof value === 'string' ? value.trim().toLowerCase() : '';
+  if (OPENROUTER_REASONING_EFFORT_OPTIONS.some((option) => option.value === normalized)) {
+    return normalized;
+  }
+  return DEFAULT_OPENROUTER_REASONING_EFFORT;
+}
+
+export function getReasoningSupportInfo(providerData, selectedProvider = null) {
+  const { endpoints } = normalizeProviderData(providerData);
+  const normalizedSelectedProvider = normalizeProviderName(selectedProvider);
+  const relevantEndpoints = selectedProvider
+    ? endpoints.filter((endpoint) => normalizeProviderName(getEndpointProviderName(endpoint)) === normalizedSelectedProvider)
+    : endpoints;
+  const supportedParameters = relevantEndpoints.flatMap((endpoint) => (
+    Array.isArray(endpoint?.supported_parameters) ? endpoint.supported_parameters : []
+  ));
+  const normalizedParams = supportedParameters.map((param) => String(param).toLowerCase());
+  const supportsReasoning = normalizedParams.some((param) => (
+    param === 'reasoning' ||
+    param === 'reasoning_effort' ||
+    param === 'reasoning.effort' ||
+    param === 'include_reasoning'
+  ));
+
+  return {
+    supportsReasoning,
+    hasEndpointMetadata: relevantEndpoints.length > 0,
+    supportedParameters,
+  };
+}
+
 /**
  * Compute auto-fill context window + max output tokens for an OpenRouter model.
  *
  * Returns a valid object and marks which values are metadata-backed:
- *   1. Best: full endpoint metadata for the relevant provider(s)
- *   2. Partial: use explicit `max_completion_tokens` when present
- *   3. No-cap: use vetted model-specific defaults for known no-cap models
- *   4. Unknown: fill context only and ask callers not to overwrite output
+ *   1. Context: OpenRouter model.context_length is the source of truth
+ *   2. Output: smallest capable endpoint max_completion_tokens in auto mode (largest when a provider is selected)
+ *   3. Safety: cap output at 20% of model.context_length
+ *   4. Unknown: ask callers not to overwrite values when metadata is missing
  *
  * The `source` field reports which tier produced the answer, and `warnings`
  * is a list of human-readable diagnostics for logging.
@@ -72,24 +245,43 @@ export function getProviderNames(providerData) {
 export function computeOpenRouterAutoSettings(model, providerData, selectedProvider = null) {
   const { endpoints } = normalizeProviderData(providerData);
   const warnings = [];
+  const modelContext = getModelContext(model);
 
-  const relevantEndpoints = selectedProvider
+  const initialRelevantEndpoints = selectedProvider
     ? endpoints.filter((endpoint) => endpoint?.provider_name === selectedProvider)
     : endpoints;
+  const autoEndpointSelection = selectedProvider
+    ? {
+        endpoints: initialRelevantEndpoints,
+        ignoredEndpoints: [],
+        recommendedProvider: null,
+        capableProviderNames: uniqueSorted(initialRelevantEndpoints.map(getEndpointProviderName)),
+        ignoredProviderNames: [],
+        providerSelectionRecommended: false,
+      }
+    : selectAutoEndpointSet(initialRelevantEndpoints, modelContext);
+  const relevantEndpoints = autoEndpointSelection.endpoints;
 
-  if (selectedProvider && relevantEndpoints.length === 0 && endpoints.length > 0) {
+  if (selectedProvider && initialRelevantEndpoints.length === 0 && endpoints.length > 0) {
     warnings.push(
       `Selected provider "${selectedProvider}" not present in endpoint list; falling back to model-level context.`
     );
   }
 
-  const modelContext = toPositiveInteger(model?.context_length);
-  const knownNoOutputCapDefault = getKnownNoOutputCapDefault(model);
+  if (!selectedProvider && autoEndpointSelection.ignoredEndpoints.length > 0) {
+    const ignoredSummary = autoEndpointSelection.ignoredEndpoints
+      .map((metric) => `${metric.providerName || 'unknown'} (${metric.reasons.join('; ')})`)
+      .join(', ');
+    warnings.push(
+      `Ignored weak OpenRouter auto-routing endpoint(s): ${ignoredSummary}.`
+    );
+  }
 
   if (relevantEndpoints.length === 0) {
     const contextWindow = modelContext || DEFAULT_CONTEXT_WINDOW;
     const contextWindowKnown = modelContext !== null;
-    const maxOutputTokens = knownNoOutputCapDefault;
+    const maxOutputTokens = null;
+    const outputCapSource = 'unknown';
 
     if (!modelContext) {
       warnings.push(
@@ -101,37 +293,33 @@ export function computeOpenRouterAutoSettings(model, providerData, selectedProvi
       );
     }
 
-    if (maxOutputTokens === null) {
-      warnings.push(
-        'No endpoint metadata exposed max_completion_tokens; preserving the current max output setting.'
-      );
-    } else {
-      warnings.push(
-        `No endpoint metadata exposed max_completion_tokens; using known no-cap default ${maxOutputTokens}.`
-      );
-    }
+    warnings.push(
+      'No endpoint metadata exposed max_completion_tokens; preserving the current max output setting.'
+    );
 
     return {
       contextWindow,
       contextWindowKnown,
       maxOutputTokens,
       outputCapKnown: maxOutputTokens !== null,
-      outputCapSource: maxOutputTokens !== null ? 'known-no-cap-default' : 'unknown',
+      outputCapSource,
       smallestEndpointOutputCap: null,
       smallestEndpointContext: null,
       smallestEndpointPromptCap: null,
+      largestEndpointOutputCap: null,
+      largestEndpointContext: null,
+      largestEndpointPromptCap: null,
+      recommendedProvider: autoEndpointSelection.recommendedProvider,
+      providerSelectionRecommended: autoEndpointSelection.providerSelectionRecommended,
+      capableProviderNames: autoEndpointSelection.capableProviderNames,
+      ignoredProviderNames: autoEndpointSelection.ignoredProviderNames,
       fallbackModelContext: modelContext || DEFAULT_CONTEXT_WINDOW,
       source: modelContext ? 'model-context-length' : 'hardcoded-default',
       warnings,
     };
   }
 
-  // Filter endpoints to only those that expose a usable context_length.
-  const endpointsWithContext = relevantEndpoints.filter(
-    (endpoint) => toPositiveInteger(endpoint?.context_length) !== null
-  );
-
-  const endpointContexts = endpointsWithContext
+  const endpointContexts = relevantEndpoints
     .map((endpoint) => toPositiveInteger(endpoint.context_length))
     .filter((value) => value !== null);
 
@@ -143,71 +331,53 @@ export function computeOpenRouterAutoSettings(model, providerData, selectedProvi
     .map((endpoint) => toPositiveInteger(endpoint?.max_prompt_tokens))
     .filter((value) => value !== null);
 
-  // Choose a base context: smallest endpoint context, then model context, then default.
-  let contextWindow;
-  let contextWindowKnown = true;
-  if (endpointContexts.length > 0) {
-    contextWindow = Math.min(...endpointContexts);
-    if (endpointContexts.length < relevantEndpoints.length) {
-      warnings.push(
-        `${relevantEndpoints.length - endpointContexts.length}/${relevantEndpoints.length} endpoints missing context_length; using min of remaining.`
-      );
-    }
-  } else if (modelContext) {
-    contextWindow = modelContext;
-    warnings.push(
-      'No endpoints exposed context_length; falling back to model.context_length.'
-    );
+  const smallestEndpointContext = endpointContexts.length > 0 ? Math.min(...endpointContexts) : null;
+  const smallestEndpointOutputCap = endpointOutputCaps.length > 0 ? Math.min(...endpointOutputCaps) : null;
+  const smallestEndpointPromptCap = endpointPromptCaps.length > 0 ? Math.min(...endpointPromptCaps) : null;
+  const largestEndpointContext = endpointContexts.length > 0 ? Math.max(...endpointContexts) : null;
+  const largestEndpointOutputCap = endpointOutputCaps.length > 0 ? Math.max(...endpointOutputCaps) : null;
+  const largestEndpointPromptCap = endpointPromptCaps.length > 0 ? Math.max(...endpointPromptCaps) : null;
+
+  // The model-level OpenRouter context is the total context source of truth.
+  // Endpoint context rows are provider diagnostics only; they must not shrink
+  // the configured model context after weak providers have been filtered out.
+  const contextWindow = modelContext || DEFAULT_CONTEXT_WINDOW;
+  const contextWindowKnown = modelContext !== null;
+  let contextSource;
+  if (modelContext) {
+    contextSource = 'model-context-length';
   } else {
-    contextWindow = DEFAULT_CONTEXT_WINDOW;
-    contextWindowKnown = false;
+    contextSource = 'hardcoded-default';
     warnings.push(
-      `No endpoint or model context_length; using default ${DEFAULT_CONTEXT_WINDOW}.`
+      `No OpenRouter model.context_length; preserving the current context setting unless callers need fallback ${DEFAULT_CONTEXT_WINDOW}.`
     );
   }
 
-  const smallestEndpointContext = endpointContexts.length > 0 ? Math.min(...endpointContexts) : null;
-  const smallestEndpointOutputCap = endpointOutputCaps.length > 0 ? Math.min(...endpointOutputCaps) : null;
-  const smallestEndpointPromptCap = endpointPromptCaps.length > 0 ? Math.min(...endpointPromptCaps) : null;
-
-  // Determine max output tokens.
-  // If at least one endpoint provides max_completion_tokens, honor the smallest.
-  // If none do, use only vetted model-specific defaults; otherwise preserve
-  // the user's current setting instead of guessing from context length.
+  // Determine max output tokens from non-outlier endpoint caps, capped at 20%
+  // of the OpenRouter model context. In OpenRouter auto mode, use the smallest
+  // capable endpoint cap so OpenRouter can choose any remaining host safely.
   let maxOutputTokens;
   let outputCapSource;
-  if (smallestEndpointOutputCap !== null) {
-    maxOutputTokens = smallestEndpointOutputCap;
+  const endpointOutputCap = selectedProvider ? largestEndpointOutputCap : smallestEndpointOutputCap;
+  const contextBasedOutputCap = modelContext ? Math.floor(modelContext * 0.2) : null;
+  if (endpointOutputCap !== null && contextBasedOutputCap !== null) {
+    maxOutputTokens = Math.min(contextBasedOutputCap, endpointOutputCap);
     outputCapSource = 'endpoint-metadata';
-    if (endpointOutputCaps.length < relevantEndpoints.length) {
-      warnings.push(
-        `${relevantEndpoints.length - endpointOutputCaps.length}/${relevantEndpoints.length} endpoints missing max_completion_tokens; using min of remaining.`
-      );
-    }
-  } else if (knownNoOutputCapDefault !== null) {
-    maxOutputTokens = knownNoOutputCapDefault;
-    outputCapSource = 'known-no-cap-default';
-    warnings.push(
-      `No endpoints exposed max_completion_tokens; using known no-cap default ${maxOutputTokens}.`
-    );
   } else {
     maxOutputTokens = null;
     outputCapSource = 'unknown';
-    warnings.push(
-      'No endpoints exposed max_completion_tokens; preserving the current max output setting.'
-    );
-  }
-
-  if (smallestEndpointPromptCap !== null && maxOutputTokens !== null) {
-    contextWindow = Math.min(
-      contextWindow,
-      smallestEndpointPromptCap + maxOutputTokens + CONTEXT_BUFFER_TOKENS
-    );
+    if (endpointOutputCap !== null && contextBasedOutputCap === null) {
+      warnings.push(
+        'Endpoint metadata exposed max_completion_tokens but model.context_length is unknown; preserving the current max output setting.'
+      );
+    } else {
+      warnings.push(
+        'No endpoints exposed max_completion_tokens; preserving the current max output setting.'
+      );
+    }
   }
 
-  const source = smallestEndpointContext !== null && smallestEndpointOutputCap !== null
-    ? 'endpoint-metadata'
-    : 'partial-endpoint-metadata';
+  const source = `${contextSource}+${outputCapSource}`;
 
   return {
     contextWindow,
@@ -218,6 +388,13 @@ export function computeOpenRouterAutoSettings(model, providerData, selectedProvi
     smallestEndpointOutputCap,
     smallestEndpointContext,
     smallestEndpointPromptCap,
+    largestEndpointOutputCap,
+    largestEndpointContext,
+    largestEndpointPromptCap,
+    recommendedProvider: autoEndpointSelection.recommendedProvider,
+    providerSelectionRecommended: autoEndpointSelection.providerSelectionRecommended,
+    capableProviderNames: autoEndpointSelection.capableProviderNames,
+    ignoredProviderNames: autoEndpointSelection.ignoredProviderNames,
     fallbackModelContext: modelContext || DEFAULT_CONTEXT_WINDOW,
     source,
     warnings,
diff --git a/frontend/src/utils/runtimeConfig.js b/frontend/src/utils/runtimeConfig.js
index 77f1818..17d558d 100644
--- a/frontend/src/utils/runtimeConfig.js
+++ b/frontend/src/utils/runtimeConfig.js
@@ -1,6 +1,9 @@
 const storagePrefix = (import.meta.env.VITE_MOTO_STORAGE_PREFIX || '').trim();
 const instanceId = (import.meta.env.VITE_MOTO_INSTANCE_ID || '').trim();
 const dataRootDisplay = (import.meta.env.VITE_MOTO_DATA_ROOT_DISPLAY || '').trim();
+const desktopApiToken = (import.meta.env.VITE_MOTO_DESKTOP_API_TOKEN || '').trim();
+const backendUrl = (import.meta.env.VITE_MOTO_BACKEND_URL || '').trim();
+const DESKTOP_TOKEN_HEADER = 'X-Moto-Desktop-Token';
 
 function toScopedKey(key) {
   if (!storagePrefix || typeof key !== 'string' || key.length === 0) {
@@ -47,6 +50,73 @@ export function installNamespacedLocalStorage() {
   window.__motoStorageNamespacePatched = true;
 }
 
+// Returns true only for `/api` requests aimed at this page's origin or the
+// configured backend origin; every other target is left without the token.
+function shouldAttachDesktopToken(input) {
+  if (!desktopApiToken || typeof window === 'undefined') {
+    return false;
+  }
+
+  try {
+    // fetch() accepts a string, a URL object, or a Request; read the target from each.
+    const rawUrl = typeof input === 'string'
+      ? input
+      : (input instanceof URL ? input.href : (input && typeof input.url === 'string' ? input.url : ''));
+    if (!rawUrl) {
+      return false;
+    }
+
+    const requestUrl = new URL(rawUrl, window.location.origin);
+    if (!requestUrl.pathname.startsWith('/api')) {
+      return false;
+    }
+    if (requestUrl.origin === window.location.origin) {
+      return true;
+    }
+    if (backendUrl) {
+      return requestUrl.origin === new URL(backendUrl, window.location.origin).origin;
+    }
+  } catch {
+    return false;
+  }
+  return false;
+}
+
+function withDesktopTokenHeaders(headers) {
+  const nextHeaders = new Headers(headers || {});
+  if (!nextHeaders.has(DESKTOP_TOKEN_HEADER)) {
+    nextHeaders.set(DESKTOP_TOKEN_HEADER, desktopApiToken);
+  }
+  return nextHeaders;
+}
+
+export function installAuthenticatedFetch() {
+  if (typeof window === 'undefined' || !desktopApiToken || window.__motoAuthFetchPatched) {
+    return;
+  }
+
+  const originalFetch = window.fetch.bind(window);
+  window.fetch = (input, init = {}) => {
+    if (!shouldAttachDesktopToken(input)) {
+      return originalFetch(input, init);
+    }
+
+    if (input instanceof Request) {
+      const request = new Request(input, {
+        ...init,
+        headers: withDesktopTokenHeaders(init.headers || input.headers),
+      });
+      return originalFetch(request);
+    }
+
+    return originalFetch(input, {
+      ...init,
+      headers: withDesktopTokenHeaders(init.headers),
+    });
+  };
+  window.__motoAuthFetchPatched = true;
+}
+
 export function getRuntimeDataPath(relativePath = '') {
   const normalizedRelativePath = String(relativePath || '').replace(/^[/\\]+/, '');
   const basePath = dataRootDisplay || 'this instance data root';
@@ -57,3 +127,7 @@ export function getRuntimeInstanceId() {
   return instanceId || 'default';
 }
 
+export function getDesktopApiToken() {
+  return desktopApiToken; // module-level token, the same value withDesktopTokenHeaders sends
+}
+
diff --git a/frontend/vite.config.js b/frontend/vite.config.js
index 63f7f2a..ecdb95e 100644
--- a/frontend/vite.config.js
+++ b/frontend/vite.config.js
@@ -7,7 +7,7 @@ export default defineConfig(({ mode }) => {
   const backendUrl = env.VITE_MOTO_BACKEND_URL || `http://localhost:${backendPort}`
   const backendWsUrl = env.VITE_MOTO_BACKEND_WS_URL || backendUrl.replace(/^http/i, 'ws')
   const frontendPort = Number(env.VITE_MOTO_FRONTEND_PORT || env.MOTO_FRONTEND_PORT || env.FRONTEND_PORT || 5173)
-  const frontendHost = env.VITE_MOTO_FRONTEND_HOST || '0.0.0.0'
+  const frontendHost = env.VITE_MOTO_FRONTEND_HOST || '127.0.0.1'
 
   const logger = createLogger()
   const originalError = logger.error.bind(logger)
diff --git a/Launch MOTO.sh b/linux-ubuntu-launcher.sh
similarity index 94%
rename from Launch MOTO.sh
rename to linux-ubuntu-launcher.sh
index 7c3dd23..6ede60d 100644
--- a/Launch MOTO.sh	
+++ b/linux-ubuntu-launcher.sh
@@ -40,5 +40,5 @@ if [[ ! -x "$PYTHON_BIN" ]]; then
     exit 1
 fi
 
-export MOTO_LAUNCHER_ENTRYPOINT="$SCRIPT_DIR/Launch MOTO.sh"
+export MOTO_LAUNCHER_ENTRYPOINT="$SCRIPT_DIR/linux-ubuntu-launcher.sh"
 exec "$PYTHON_BIN" "$SCRIPT_DIR/moto_launcher.py" "$@"
diff --git a/moto-update-manifest.json b/moto-update-manifest.json
index df18b1d..8d635ee 100644
--- a/moto-update-manifest.json
+++ b/moto-update-manifest.json
@@ -1,7 +1,7 @@
 {
   "manifest_version": 1,
-  "version": "1.0.7",
+  "version": "1.0.8",
   "build_commit": "d352090d687bd3475acfee17f29f7f0cfb17264e",
   "update_channel": "main",
-  "api_contract_version": "build5-v1"
+  "api_contract_version": "build5-v12"
 }
diff --git a/moto_launcher.py b/moto_launcher.py
index ce24dc9..53ad70d 100644
--- a/moto_launcher.py
+++ b/moto_launcher.py
@@ -1,6 +1,6 @@
 """
 MOTO System Launcher (Python)
-This is an internal script. Use "Click To Launch MOTO.bat" on Windows or "Launch MOTO.sh" on Ubuntu 24.04.
+This is an internal script. Use "Click To Launch MOTO.bat" on Windows or "linux-ubuntu-launcher.sh" on Ubuntu 24.04.
 """
 from __future__ import annotations
 
@@ -12,6 +12,7 @@
 import platform
 from random import randint
 import re
+import secrets
 import socket
 import shlex
 from shutil import rmtree, which
@@ -230,7 +231,7 @@ def resolve_instance_runtime() -> InstanceRuntime:
     explicit_secret = sanitize_instance_id(os.environ.get("MOTO_SECRET_NAMESPACE"))
     explicit_storage = sanitize_instance_id(os.environ.get("MOTO_FRONTEND_STORAGE_PREFIX"))
 
-    backend_host = os.environ.get("MOTO_BACKEND_HOST") or os.environ.get("HOST") or "0.0.0.0"
+    backend_host = os.environ.get("MOTO_BACKEND_HOST") or os.environ.get("HOST") or "127.0.0.1"
 
     explicit_backend_port = None
     for variable in ("MOTO_BACKEND_PORT", "PORT"):
@@ -648,7 +649,7 @@ def check_python_installation() -> None:
         cprint("============================================================", RED)
         print()
         if is_linux():
-            cprint("Install Python 3 and python3-venv, then launch via `Launch MOTO.sh`.", YELLOW)
+            cprint("Install Python 3 and python3-venv, then launch via `bash linux-ubuntu-launcher.sh`.", YELLOW)
             cprint("Example: sudo apt install python3 python3-venv", YELLOW)
         else:
             cprint("Please install Python 3.8+ from:", YELLOW)
@@ -664,7 +665,7 @@ def check_python_installation() -> None:
         if using_repo_local_venv():
             cprint("Using repo-local .venv for Ubuntu-safe package installs.", GREEN)
         else:
-            cprint("Tip: `Launch MOTO.sh` is the recommended Ubuntu 24.04 entrypoint because it keeps Python packages inside the repo-local .venv.", YELLOW)
+            cprint("Tip: `linux-ubuntu-launcher.sh` is the recommended Ubuntu 24.04 entrypoint because it keeps Python packages inside the repo-local .venv.", YELLOW)
     print()
 
 
@@ -771,6 +772,9 @@ def prepare_runtime_and_environment() -> tuple[InstanceRuntime, str, str, dict[s
     env["VITE_MOTO_BACKEND_URL"] = backend_url
     env["VITE_MOTO_INSTANCE_ID"] = runtime.instance_id
     env["VITE_MOTO_DATA_ROOT_DISPLAY"] = runtime.data_root
+    desktop_api_token = os.environ.get("MOTO_DESKTOP_API_TOKEN") or secrets.token_urlsafe(32)
+    env["MOTO_DESKTOP_API_TOKEN"] = desktop_api_token
+    env["VITE_MOTO_DESKTOP_API_TOKEN"] = desktop_api_token
 
     if runtime.storage_prefix:
         env["MOTO_FRONTEND_STORAGE_PREFIX"] = runtime.storage_prefix
@@ -808,7 +812,7 @@ def install_python_dependencies() -> None:
         cprint("- Internet connection is working", YELLOW)
         cprint("- You have permission to install packages", YELLOW)
         if is_linux():
-            cprint("- On Ubuntu 24.04, prefer launching via `Launch MOTO.sh` so installs stay inside the repo-local .venv", YELLOW)
+            cprint("- On Ubuntu 24.04, prefer launching via `bash linux-ubuntu-launcher.sh` so installs stay inside the repo-local .venv", YELLOW)
             cprint("- If venv creation fails, install `python3-venv` first", YELLOW)
         exit_with_pause(1)
     cprint("Python dependencies up to date", GREEN)
diff --git a/moto_updater.py b/moto_updater.py
index 7434c56..5233b2b 100644
--- a/moto_updater.py
+++ b/moto_updater.py
@@ -28,7 +28,7 @@
     "version": "0.0.0-dev",
     "build_commit": "dev",
     "update_channel": "main",
-    "api_contract_version": "build5-v1",
+    "api_contract_version": "build5-v12",
 }
 
 _DEFAULT_PRESERVED_ROOTS = {
diff --git a/package.json b/package.json
index 57dcba0..ab10b20 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "moto-math-variant",
-  "version": "1.0.7",
+  "version": "1.0.8",
   "description": "MOTO S.T.E.M. Mathematics Variant - Autonomous ASI Research System for Novel S.T.E.M. Mathematical Paper Generation",
   "scripts": {
     "dev:backend": "python -c \"import os, uvicorn; uvicorn.run('backend.api.main:app', host=os.getenv('MOTO_BACKEND_HOST', os.getenv('HOST', '0.0.0.0')), port=int(os.getenv('MOTO_BACKEND_PORT', os.getenv('PORT', '8000'))), reload=True, access_log=False)\"",
diff --git a/randomlog.txt b/randomlog.txt
deleted file mode 100644
index d5c1c74..0000000
--- a/randomlog.txt
+++ /dev/null
@@ -1,467 +0,0 @@
-2026-05-05 09:37:18.716 - backend.api.middleware - INFO - Using default CORS origins: ['http://localhost:5173', 'http://127.0.0.1:5173', 'http://localhost:8000', 'http://127.0.0.1:8000']
-2026-05-05 09:37:18.716 - backend.api.middleware - INFO - Middleware configured
-INFO:     Started server process [15848]
-INFO:     Waiting for application startup.
-2026-05-05 09:37:18.777 - backend.api.main - INFO - Starting ASI Aggregator System instance 'default' (data_dir=C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data, logs_dir=C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\logs)
-2026-05-05 09:37:18.783 - backend.api.main - INFO - Secret store active: namespaced_instance=False
-2026-05-05 09:37:20.433 - backend.shared.api_client_manager - INFO - OpenRouter client initialized
-2026-05-05 09:37:20.433 - backend.api.main - INFO - Restored OpenRouter API key from secure backend storage
-2026-05-05 09:37:20.446 - backend.api.main - INFO - No Wolfram Alpha API key found in secure backend storage for this namespace
-2026-05-05 09:37:20.465 - backend.shared.lm_studio_client - INFO - Successfully connected to LM Studio. Found 4 models.
-2026-05-05 09:37:20.465 - backend.api.main - INFO - No resumable session found - using legacy paths
-2026-05-05 09:37:20.465 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\proofs
-2026-05-05 09:37:20.465 - backend.api.main - INFO - ASI Aggregator System ready
-2026-05-05 09:37:20.497 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
-INFO:     Application startup complete.
-INFO:     Uvicorn running on http://0.0.0.0:8000 (Press CTRL+C to quit)
-INFO:     127.0.0.1:62649 - "WebSocket /ws" [accepted]
-2026-05-05 09:37:28.127 - backend.api.routes.websocket - INFO - WebSocket connected. Total connections: 1
-INFO:     connection open
-2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 1 (Main Submitter): model=x-ai/grok-4.3, context=1000000, max_tokens=128000
-2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 2 : model=moonshotai/kimi-k2.6, context=262000, max_tokens=40000
-2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Brainstorm Submitter 3 : model=x-ai/grok-4.3, context=1000000, max_tokens=128000
-2026-05-05 09:37:33.477 - backend.api.routes.autonomous - INFO - Validator: model=x-ai/grok-4.1-fast, context=2000000, max_tokens=30000
-2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous coordinator initializing with 3 submitters
-2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 1 (Main Submitter): model=x-ai/grok-4.3, context=1000000
-2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 2 : model=moonshotai/kimi-k2.6, context=262000
-2026-05-05 09:37:33.477 - backend.autonomous.core.autonomous_coordinator - INFO -   Submitter 3 : model=x-ai/grok-4.3, context=1000000
-2026-05-05 09:37:33.493 - backend.autonomous.memory.session_manager - INFO - Session initialized: explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
-2026-05-05 09:37:33.493 - backend.autonomous.memory.session_manager - INFO - Session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
-2026-05-05 09:37:33.493 - backend.autonomous.core.autonomous_coordinator - INFO - New session initialized: explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
-2026-05-05 09:37:33.493 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms
-2026-05-05 09:37:33.493 - backend.autonomous.memory.paper_library - INFO - Paper library using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\papers
-2026-05-05 09:37:33.493 - backend.autonomous.memory.research_metadata - INFO - Research metadata using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37
-2026-05-05 09:37:33.493 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory using session path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\final_answer
-2026-05-05 09:37:33.493 - backend.autonomous.memory.proof_database - INFO - Proof database using path: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\proofs
-2026-05-05 09:37:33.493 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms
-2026-05-05 09:37:33.509 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\papers
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'user_research_prompt' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'base_user_research_prompt' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_framing_active' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_framing_context' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_framing_reasoning' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'proof_runtime_config' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'brainstorms' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'papers' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'next_topic_id' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - Added missing key 'next_paper_id' to research metadata
-2026-05-05 09:37:33.510 - backend.autonomous.memory.research_metadata - INFO - User research prompt updated
-2026-05-05 09:37:33.527 - backend.autonomous.memory.research_metadata - INFO - Research metadata initialized
-2026-05-05 09:37:33.543 - backend.autonomous.memory.autonomous_rejection_logs - INFO - Autonomous rejection logs initialized
-2026-05-05 09:37:33.543 - backend.autonomous.core.autonomous_coordinator - INFO - Resetting RAG state for fresh autonomous research mode...
-2026-05-05 09:37:33.543 - backend.autonomous.core.autonomous_rag_manager - INFO - Resetting AutonomousRAGManager tracking state...
-2026-05-05 09:37:33.543 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager state reset
-2026-05-05 09:37:33.543 - backend.aggregator.core.rag_manager - INFO - Clearing all documents from RAG database...
-2026-05-05 09:37:33.560 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_256
-2026-05-05 09:37:33.576 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_512
-2026-05-05 09:37:33.577 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_768
-2026-05-05 09:37:33.593 - backend.aggregator.core.rag_manager - INFO - Deleted collection chunks_1024
-2026-05-05 09:37:33.610 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_256
-2026-05-05 09:37:33.610 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_512
-2026-05-05 09:37:33.626 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_768
-2026-05-05 09:37:33.677 - backend.aggregator.core.rag_manager - INFO - Recreated collection chunks_1024
-2026-05-05 09:37:33.677 - backend.aggregator.core.rag_manager - INFO - Successfully cleared all RAG documents
-2026-05-05 09:37:33.677 - backend.autonomous.core.autonomous_coordinator - INFO - RAG state reset and cleared for autonomous mode
-2026-05-05 09:37:33.677 - backend.autonomous.memory.brainstorm_memory - INFO - Brainstorm memory initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms
-2026-05-05 09:37:33.677 - backend.autonomous.memory.paper_library - INFO - Paper library initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\papers
-2026-05-05 09:37:33.677 - backend.autonomous.core.autonomous_rag_manager - INFO - AutonomousRAGManager initialized
-2026-05-05 09:37:33.677 - backend.autonomous.memory.final_answer_memory - INFO - Final answer memory initialized at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\final_answer
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_selector': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_completion_reviewer': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_reference_selector': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_title_selector': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_topic_validator': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_paper_redundancy_checker': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_brainstorm': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_brainstorm': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_framing_gate': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_brainstorm': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_paper': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_paper': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_paper': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_novelty': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_brainstorm': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_brainstorm': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_brainstorm': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.677 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_identification_manual_paper': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.692 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_lemma_search_manual_paper': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.692 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_proof_formalization_manual_paper': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.693 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_certainty_assessor': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.693 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_format_selector': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.693 - backend.shared.api_client_manager - INFO - Configured role 'autonomous_volume_organizer': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:33.693 - backend.autonomous.core.autonomous_coordinator - INFO - Configured Tier 3 Final Answer agents with api_client_manager
-2026-05-05 09:37:33.693 - backend.autonomous.core.autonomous_coordinator - INFO - No interrupted workflow found - checking for incomplete papers
-2026-05-05 09:37:33.693 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator initialized
-2026-05-05 09:37:33.710 - backend.shared.api_client_manager - INFO - Autonomous API logger callback set
-2026-05-05 09:37:33.710 - backend.autonomous.core.autonomous_coordinator - INFO - Autonomous API logging enabled
-2026-05-05 09:37:33.710 - backend.shared.token_tracker - INFO - TokenTracker reset
-2026-05-05 09:37:33.710 - backend.shared.token_tracker - INFO - TokenTracker timer started
-2026-05-05 09:37:33.710 - backend.autonomous.core.autonomous_coordinator - INFO - AutonomousCoordinator started
-2026-05-05 09:37:42.744 - backend.autonomous.core.autonomous_coordinator - INFO - Starting topic exploration phase (target: 5 candidates)
-2026-05-05 09:37:42.744 - backend.aggregator.memory.shared_training - INFO - Brainstorm database file doesn't exist yet: C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms\exploration_candidates.txt
-2026-05-05 09:37:42.744 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
-2026-05-05 09:37:42.759 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 1000000, Validator: 2000000
-2026-05-05 09:37:42.759 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 3 submitters with models ['x-ai/grok-4.3', 'moonshotai/kimi-k2.6', 'x-ai/grok-4.3'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
-2026-05-05 09:37:43.544 - backend.aggregator.core.coordinator - INFO - Currently loaded models: ['text-embedding-nomic-embed-text-v1.5']
-2026-05-05 09:37:43.544 - backend.aggregator.core.coordinator - INFO - Context window configuration:
-  - Submitter 1: 1000000 tokens (model: x-ai/grok-4.3)
-  - Submitter 2: 262000 tokens (model: moonshotai/kimi-k2.6)
-  - Submitter 3: 1000000 tokens (model: x-ai/grok-4.3)
-  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
-2026-05-05 09:37:43.544 - backend.aggregator.memory.shared_training - INFO - Created new shared training file
-2026-05-05 09:37:43.544 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
-2026-05-05 09:37:43.561 - backend.aggregator.memory.event_log - INFO - Created new event log file
-2026-05-05 09:37:43.561 - backend.aggregator.memory.local_training - INFO - Created new rejection log for submitter 1
-2026-05-05 09:37:43.561 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model x-ai/grok-4.3
-2026-05-05 09:37:43.561 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:43.561 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=x-ai/grok-4.3, provider=openrouter, context=1000000
-2026-05-05 09:37:43.561 - backend.aggregator.memory.local_training - INFO - Created new rejection log for submitter 2
-2026-05-05 09:37:43.570 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model moonshotai/kimi-k2.6
-2026-05-05 09:37:43.570 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=moonshotai/kimi-k2.6, provider=openrouter, context=262000
-2026-05-05 09:37:43.570 - backend.aggregator.memory.local_training - INFO - Created new rejection log for submitter 3
-2026-05-05 09:37:43.570 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model x-ai/grok-4.3
-2026-05-05 09:37:43.570 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=x-ai/grok-4.3, provider=openrouter, context=1000000
-2026-05-05 09:37:43.570 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
-2026-05-05 09:37:43.570 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
-2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 3 submitters
-2026-05-05 09:37:43.570 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
-2026-05-05 09:37:43.576 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
-2026-05-05 09:37:43.576 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
-2026-05-05 09:37:43.577 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
-2026-05-05 09:37:43.577 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
-2026-05-05 09:37:43.577 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
-2026-05-05 09:37:43.577 - backend.autonomous.core.autonomous_coordinator - INFO - Exploration aggregator started with parallel submitters
-2026-05-05 09:37:43.577 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
-2026-05-05 09:37:43.876 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
-2026-05-05 09:37:43.877 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
-2026-05-05 09:37:43.877 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
-2026-05-05 09:38:04.127 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 8ad7c7a9-5bac-4d75-b43b-d97e86b604bf (iteration 1)
-2026-05-05 09:38:04.976 - backend.aggregator.core.coordinator - INFO - Validator iteration 22 - batch validating 1 submissions: ['8ad7c7a9-5bac-4d75-b43b-d97e86b604bf']
-2026-05-05 09:38:13.593 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
-2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:38:13.593 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
-2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 1)
-2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:38:13.593 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-05-05 09:38:13.600 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 4 total chunks
-2026-05-05 09:38:13.611 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 1/5 candidates accepted
-2026-05-05 09:38:13.760 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-05-05 09:38:13.760 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
-2026-05-05 09:38:23.076 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission c4e0cff3-864a-4369-b923-c566bf2591af (iteration 1)
-2026-05-05 09:38:23.625 - backend.aggregator.core.coordinator - INFO - Validator iteration 33 - batch validating 1 submissions: ['c4e0cff3-864a-4369-b923-c566bf2591af']
-2026-05-05 09:38:35.643 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
-2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:38:35.643 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 1)
-2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 2)
-2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:38:35.643 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-05-05 09:38:35.643 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 2 total chunks
-2026-05-05 09:38:35.768 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-05-05 09:38:35.768 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-05-05 09:38:37.629 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 2/5 candidates accepted
-2026-05-05 09:38:47.097 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission fd6f9a4b-8e0a-45cb-b816-0ac7a0b2b575 (iteration 2)
-2026-05-05 09:38:47.707 - backend.aggregator.core.coordinator - INFO - Validator iteration 46 - batch validating 1 submissions: ['fd6f9a4b-8e0a-45cb-b816-0ac7a0b2b575']
-2026-05-05 09:38:55.508 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
-2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:38:55.508 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 2)
-2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 3)
-2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:38:55.508 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-05-05 09:38:55.508 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 2 total chunks
-2026-05-05 09:38:55.625 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-05-05 09:38:55.625 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
-2026-05-05 09:38:55.625 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 3/5 candidates accepted
-2026-05-05 09:39:05.825 - backend.shared.json_parser - ERROR - JSON TRUNCATION DETECTED: Model hit max_tokens during generation. Response has 1 unclosed braces, in_string=True. Response length: 743 chars. Last completed property at char 525: ...'obabilistic certificates for admissible lossiness?",\n  "reasoning": "This candidate is substantively'...
-2026-05-05 09:39:05.825 - backend.shared.json_parser - ERROR - JSON TRUNCATION DETECTED: Incomplete JSON structure. open_braces=1, open_brackets=0, in_string=True. Response length: 743 chars. Model hit max_tokens during generation.
-2026-05-05 09:39:05.825 - backend.shared.json_parser - ERROR - parse_json: JSON response truncated at max_tokens: incomplete structure with 1 unclosed braces, 0 unclosed brackets, in_string=True. Response length: 743 chars. Model needs to generate more concise output that fits within token limits.
-2026-05-05 09:39:05.825 - backend.aggregator.agents.submitter - INFO - Submitter 3: Initial JSON parse failed, attempting conversational retry
-2026-05-05 09:39:32.192 - backend.shared.lean4_client - INFO - Updated workspace lean-toolchain: 'leanprover/lean4:stable' -> 'leanprover/lean4:v4.30.0-rc2'
-2026-05-05 09:39:32.192 - backend.shared.lean4_client - INFO - Aligned workspace lean-toolchain with Mathlib; re-running lake update.
-2026-05-05 09:39:49.573 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 9c50c080-d45f-4b57-bbd5-759ca83d9313 (iteration 3)
-2026-05-05 09:39:49.622 - backend.aggregator.core.coordinator - INFO - Validator iteration 101 - batch validating 1 submissions: ['9c50c080-d45f-4b57-bbd5-759ca83d9313']
-2026-05-05 09:39:59.057 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
-2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:39:59.057 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 3)
-2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 4)
-2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:39:59.057 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-05-05 09:39:59.057 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 1 total chunks
-2026-05-05 09:39:59.140 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-05-05 09:39:59.140 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-05-05 09:39:59.657 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 4/5 candidates accepted
-2026-05-05 09:40:15.356 - backend.aggregator.agents.submitter - INFO - Submitter 3: First retry succeeded!
-2026-05-05 09:40:15.356 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 918a44e9-acb1-4680-9c48-01dbe53780d1 (iteration 2)
-2026-05-05 09:40:16.123 - backend.aggregator.core.coordinator - INFO - Validator iteration 119 - batch validating 1 submissions: ['918a44e9-acb1-4680-9c48-01dbe53780d1']
-2026-05-05 09:40:26.339 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
-2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:40:26.354 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 2)
-2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 5)
-2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:40:26.354 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-05-05 09:40:26.355 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 3 total chunks
-2026-05-05 09:40:26.439 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-05-05 09:40:26.439 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
-2026-05-05 09:40:27.678 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: 5/5 candidates accepted
-2026-05-05 09:40:27.679 - backend.autonomous.core.autonomous_coordinator - INFO - TopicExploration: Target of 5 candidates reached
-2026-05-05 09:40:27.679 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
-2026-05-05 09:40:27.679 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
-2026-05-05 09:40:27.691 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
-2026-05-05 09:40:27.694 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
-2026-05-05 09:40:27.694 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 121
-2026-05-05 09:40:27.694 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 121 iterations - is_running=False
-2026-05-05 09:40:27.695 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
-2026-05-05 09:40:27.696 - backend.autonomous.core.autonomous_coordinator - INFO - Topic exploration complete: 5 candidates accepted
-2026-05-05 09:40:27.696 - backend.autonomous.core.autonomous_coordinator - INFO - Exploration: Restored shared_training_memory state
-2026-05-05 09:40:27.696 - backend.autonomous.core.autonomous_coordinator - INFO - Topic selection attempt 1
-2026-05-05 09:40:27.696 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generating topic selection with model x-ai/grok-4.3 (prompt=2689t, task_id=agg_sub1_000)
-2026-05-05 09:40:56.939 - backend.autonomous.agents.topic_selector - INFO - TopicSelector: Generated submission - action=new_topic
-2026-05-05 09:40:56.939 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Validating topic selection with model x-ai/grok-4.1-fast (prompt=1406t, task_id=agg_val_000)
-2026-05-05 09:41:04.810 - backend.autonomous.agents.topic_validator - INFO - TopicValidator: Decision=accept
-2026-05-05 09:41:04.828 - backend.autonomous.memory.brainstorm_memory - INFO - Created new brainstorm: topic_001
-2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - Created new brainstorm: topic_001
-2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - No papers available for pre-brainstorm reference selection
-2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - Selected 0 reference papers for brainstorm
-2026-05-05 09:41:04.845 - backend.shared.api_client_manager - INFO - Model tracking callback set for Tier 3
-2026-05-05 09:41:04.845 - backend.autonomous.core.autonomous_coordinator - INFO - Per-paper model tracking enabled for brainstorm topic_001
-2026-05-05 09:41:04.845 - backend.aggregator.memory.shared_training - INFO - Reloaded 0 insights from C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\auto_sessions\explore_the_most_impactful_ways_to_use_volterra_st_2026-05-05_09-37\brainstorms\brainstorm_topic_001.txt (submission count: 0)
-2026-05-05 09:41:04.855 - backend.autonomous.core.autonomous_coordinator - INFO - Reloaded 0 existing submissions from brainstorm database
-2026-05-05 09:41:04.855 - backend.aggregator.core.coordinator - INFO - Initializing coordinator...
-2026-05-05 09:41:04.855 - backend.aggregator.core.context_allocator - INFO - Context windows updated - Submitter: 1000000, Validator: 2000000
-2026-05-05 09:41:04.856 - backend.aggregator.core.coordinator - INFO - Multi-model mode: 3 submitters with models ['x-ai/grok-4.3', 'moonshotai/kimi-k2.6', 'x-ai/grok-4.3'] run in parallel, validator (x-ai/grok-4.1-fast) runs independently.
-2026-05-05 09:41:05.527 - backend.aggregator.core.coordinator - INFO - Currently loaded models: ['text-embedding-nomic-embed-text-v1.5']
-2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Context window configuration:
-  - Submitter 1: 1000000 tokens (model: x-ai/grok-4.3)
-  - Submitter 2: 262000 tokens (model: moonshotai/kimi-k2.6)
-  - Submitter 3: 1000000 tokens (model: x-ai/grok-4.3)
-  - Validator: 2000000 tokens (model: x-ai/grok-4.1-fast)
-2026-05-05 09:41:05.528 - backend.aggregator.memory.shared_training - INFO - Loaded 0 existing insights from shared training (submission count: 0)
-2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Skipping stats load (autonomous mode - starting fresh)
-2026-05-05 09:41:05.528 - backend.aggregator.memory.event_log - INFO - Loaded 5 events from event log
-2026-05-05 09:41:05.528 - backend.aggregator.memory.local_training - INFO - Loaded 0 rejections for submitter 1
-2026-05-05 09:41:05.528 - backend.aggregator.agents.submitter - INFO - Submitter 1 initialized with model x-ai/grok-4.3
-2026-05-05 09:41:05.528 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_1': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Created Submitter 1: model=x-ai/grok-4.3, provider=openrouter, context=1000000
-2026-05-05 09:41:05.528 - backend.aggregator.memory.local_training - INFO - Loaded 0 rejections for submitter 2
-2026-05-05 09:41:05.528 - backend.aggregator.agents.submitter - INFO - Submitter 2 initialized with model moonshotai/kimi-k2.6
-2026-05-05 09:41:05.528 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_2': provider=openrouter, model=moonshotai/kimi-k2.6
-2026-05-05 09:41:05.528 - backend.aggregator.core.coordinator - INFO - Created Submitter 2: model=moonshotai/kimi-k2.6, provider=openrouter, context=262000
-2026-05-05 09:41:05.538 - backend.aggregator.memory.local_training - INFO - Loaded 0 rejections for submitter 3
-2026-05-05 09:41:05.539 - backend.aggregator.agents.submitter - INFO - Submitter 3 initialized with model x-ai/grok-4.3
-2026-05-05 09:41:05.539 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_submitter_3': provider=openrouter, model=x-ai/grok-4.3
-2026-05-05 09:41:05.539 - backend.aggregator.core.coordinator - INFO - Created Submitter 3: model=x-ai/grok-4.3, provider=openrouter, context=1000000
-2026-05-05 09:41:05.539 - backend.aggregator.agents.validator - INFO - Validator initialized with model x-ai/grok-4.1-fast
-2026-05-05 09:41:05.539 - backend.shared.api_client_manager - INFO - Configured role 'aggregator_validator': provider=openrouter, model=x-ai/grok-4.1-fast
-2026-05-05 09:41:05.539 - backend.aggregator.core.coordinator - INFO - Created Validator: model=x-ai/grok-4.1-fast, provider=openrouter
-2026-05-05 09:41:05.539 - backend.aggregator.core.coordinator - INFO - Coordinator initialized successfully with 3 submitters
-2026-05-05 09:41:05.540 - backend.aggregator.core.coordinator - INFO - Starting coordinator...
-2026-05-05 09:41:05.540 - backend.aggregator.core.coordinator - INFO - Starting multi-model workflow (parallel submitters)
-2026-05-05 09:41:05.540 - backend.aggregator.agents.submitter - INFO - Submitter 1 started
-2026-05-05 09:41:05.541 - backend.aggregator.agents.submitter - INFO - Submitter 2 started
-2026-05-05 09:41:05.541 - backend.aggregator.agents.submitter - INFO - Submitter 3 started
-2026-05-05 09:41:05.541 - backend.aggregator.core.coordinator - INFO - Coordinator started successfully
-2026-05-05 09:41:05.541 - backend.autonomous.core.autonomous_coordinator - INFO - Aggregator started for brainstorm topic_001
-2026-05-05 09:41:05.541 - backend.autonomous.core.autonomous_coordinator - INFO - Starting fresh brainstorm with 0 acceptances
-2026-05-05 09:41:05.541 - backend.aggregator.agents.submitter - INFO - Submitter 1 run loop started - will run continuously until stopped
-2026-05-05 09:41:05.545 - backend.aggregator.agents.submitter - INFO - Submitter 2 run loop started - will run continuously until stopped
-2026-05-05 09:41:05.545 - backend.aggregator.agents.submitter - INFO - Submitter 3 run loop started - will run continuously until stopped
-2026-05-05 09:41:05.555 - backend.aggregator.core.coordinator - INFO - Validator loop started - will run continuously until stopped (batch mode: up to 3)
-2026-05-05 09:41:33.088 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission cfd4829a-3a5f-4ea2-8dfb-7dfcc0c5d377 (iteration 1)
-2026-05-05 09:41:33.570 - backend.aggregator.core.coordinator - INFO - Validator iteration 29 - batch validating 1 submissions: ['cfd4829a-3a5f-4ea2-8dfb-7dfcc0c5d377']
-2026-05-05 09:41:41.931 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #1
-2026-05-05 09:41:41.936 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:41:41.936 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 1)
-2026-05-05 09:41:41.937 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 1)
-2026-05-05 09:41:41.938 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:41:41.938 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:41:41.938 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-05-05 09:41:41.938 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 13 total chunks
-2026-05-05 09:41:42.205 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-05-05 09:41:42.205 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
-2026-05-05 09:42:00.104 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission eb653b63-2e14-42df-87c8-971f683d4b54 (iteration 1)
-2026-05-05 09:42:00.952 - backend.aggregator.core.coordinator - INFO - Validator iteration 49 - batch validating 1 submissions: ['eb653b63-2e14-42df-87c8-971f683d4b54']
-2026-05-05 09:42:25.104 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #2
-2026-05-05 09:42:25.104 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:42:25.120 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 1)
-2026-05-05 09:42:25.121 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 2)
-2026-05-05 09:42:25.122 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:42:25.122 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:42:25.122 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-05-05 09:42:25.124 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 6 total chunks
-2026-05-05 09:42:25.304 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-05-05 09:42:25.304 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-05-05 09:42:46.150 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 1752a022-ebc0-44e7-854c-77c34bcc134f (iteration 2)
-2026-05-05 09:42:46.161 - backend.aggregator.core.coordinator - INFO - Validator iteration 71 - batch validating 1 submissions: ['1752a022-ebc0-44e7-854c-77c34bcc134f']
-2026-05-05 09:43:15.187 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission rejected (consecutive: 1)
-2026-05-05 09:43:15.187 - backend.aggregator.core.coordinator - INFO - Rejected submission from submitter 1 (total: 1)
-2026-05-05 09:43:41.573 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission 4ce1ad0e-18a7-4855-a408-ad71e44a2bad (iteration 2)
-2026-05-05 09:43:42.251 - backend.aggregator.core.coordinator - INFO - Validator iteration 99 - batch validating 1 submissions: ['4ce1ad0e-18a7-4855-a408-ad71e44a2bad']
-2026-05-05 09:43:59.534 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #3
-2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:43:59.534 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 2)
-2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 3)
-2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:43:59.534 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=768
-2026-05-05 09:43:59.550 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_768: 5 total chunks
-2026-05-05 09:43:59.699 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_768
-2026-05-05 09:43:59.699 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=768
-2026-05-05 09:44:28.808 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 15b0c73a-a6c3-40b4-9ea5-dfa7b351ba61 (iteration 3)
-2026-05-05 09:44:29.665 - backend.aggregator.core.coordinator - INFO - Validator iteration 130 - batch validating 1 submissions: ['15b0c73a-a6c3-40b4-9ea5-dfa7b351ba61']
-2026-05-05 09:44:48.360 - backend.aggregator.agents.submitter - INFO - Submitter 3 generated submission f5754b90-663f-4778-a822-927137536d11 (iteration 3)
-2026-05-05 09:44:57.829 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #4
-2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:44:57.829 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 2)
-2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 4)
-2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:44:57.829 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=1024
-2026-05-05 09:44:57.829 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_1024: 3 total chunks
-2026-05-05 09:44:57.845 - backend.aggregator.core.coordinator - INFO - Validator iteration 131 - batch validating 1 submissions: ['f5754b90-663f-4778-a822-927137536d11']
-2026-05-05 09:44:57.948 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_1024
-2026-05-05 09:44:57.948 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=1024
-2026-05-05 09:45:26.368 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #5
-2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:45:26.368 - backend.aggregator.agents.submitter - INFO - Submitter 3: Submission accepted (total: 3)
-2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 3 (total: 5)
-2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:45:26.368 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=256
-2026-05-05 09:45:26.368 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_256: 8 total chunks
-2026-05-05 09:45:26.512 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_256
-2026-05-05 09:45:26.512 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=256
-2026-05-05 09:45:57.396 - backend.aggregator.agents.submitter - INFO - Submitter 1 generated submission 9863bbde-134c-4777-b6d7-4fdc20b73076 (iteration 4)
-2026-05-05 09:45:57.554 - backend.aggregator.core.coordinator - INFO - Validator iteration 163 - batch validating 1 submissions: ['9863bbde-134c-4777-b6d7-4fdc20b73076']
-2026-05-05 09:46:17.543 - backend.aggregator.memory.shared_training - INFO - Triggering immediate re-chunking callback for acceptance #6
-2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Launched background re-chunking task (validator continues processing)
-2026-05-05 09:46:17.543 - backend.aggregator.agents.submitter - INFO - Submitter 1: Submission accepted (total: 3)
-2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Accepted submission from submitter 1 (total: 6)
-2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Background incremental re-chunking started...
-2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Processing 1 new submissions
-2026-05-05 09:46:17.543 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking: Using chunk_size=512
-2026-05-05 09:46:17.543 - backend.aggregator.ingestion.pipeline - INFO - Ingested rag_shared_training_update_512: 8 total chunks
-2026-05-05 09:46:17.694 - backend.aggregator.core.rag_manager - INFO - Added text: rag_shared_training_update_512
-2026-05-05 09:46:17.694 - backend.aggregator.core.coordinator - INFO - Incremental re-chunking COMPLETE - 1 submissions added, chunk_size=512
-2026-05-05 09:46:33.252 - backend.api.routes.autonomous - INFO - Manual override: Forcing paper writing for brainstorm topic_001
-2026-05-05 09:46:33.252 - backend.autonomous.core.autonomous_coordinator - INFO - MANUAL OVERRIDE: Forcing paper writing for brainstorm topic_001
-2026-05-05 09:46:33.252 - backend.aggregator.core.coordinator - INFO - Stopping coordinator...
-2026-05-05 09:46:33.252 - backend.aggregator.agents.submitter - INFO - Submitter 1 stopped
-2026-05-05 09:46:33.252 - backend.aggregator.agents.submitter - INFO - Submitter 2 stopped
-2026-05-05 09:46:33.264 - backend.aggregator.agents.submitter - INFO - Submitter 3 stopped
-2026-05-05 09:46:33.264 - backend.aggregator.core.coordinator - INFO - Validator loop cancelled at iteration 179
-2026-05-05 09:46:33.264 - backend.aggregator.core.coordinator - WARNING - Validator loop EXITED after 179 iterations - is_running=False
-2026-05-05 09:46:33.264 - backend.aggregator.core.coordinator - INFO - Coordinator stopped
-2026-05-05 09:46:33.264 - backend.autonomous.core.autonomous_coordinator - INFO - Brainstorm aggregator stopped by manual override
-2026-05-05 09:46:34.169 - backend.autonomous.core.autonomous_coordinator - INFO - Manual override detected - transitioning to paper writing
-2026-05-05 09:47:50.131 - backend.autonomous.agents.lemma_search_agent - INFO - Built Mathlib declaration index with 169436 entries
-2026-05-05 09:47:53.453 - backend.shared.lean4_client - WARNING - Lean 4 LSP unhealthy; falling back to subprocess mode: startup failed:
-2026-05-05 09:47:53.469 - backend.shared.lean4_client - INFO - Lean 4 LSP reader exited after idle shutdown
-2026-05-05 09:50:57.464 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
-2026-05-05 09:55:59.235 - backend.shared.lean4_client - WARNING - Lean 4 workspace infrastructure error detected; invalidating workspace cache and refetching Mathlib artifacts. Diagnostic: LEAN 4 WORKSPACE ERROR: Mathlib cache/workspace repair failed. This is an infrastructure problem, not a proof error. Lean reported missing or invalid compiled Mathlib artifacts. Original diagnostic: MOTOProofCheck_170b6342efa846cf8f8beb216ddbccca.lean:1:0: error: object file 'C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace\.lake\packages\mathlib\.lake\build\lib\lean\Mathlib\Analysis\SpecialFunctions\Integrals.olean' of module Mathlib.Analysis.SpecialFunctions.Integrals does not exist
-2026-05-05 09:57:32.423 - backend.shared.lean4_client - INFO - Removed stale .lake directory at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace\.lake
-2026-05-05 09:57:32.439 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
-2026-05-05 09:57:32.870 - backend.shared.lm_studio_client - WARNING - 'lms ps' timed out after 10s
-2026-05-05 09:57:32.906 - backend.shared.lean4_client - INFO - Bootstrapping Lean 4 workspace at C:\Users\phwhi\Desktop\MOTO-Autonomous-ASI-dev-v1.0.7\backend\data\lean4_workspace
-2026-05-05 09:57:36.296 - backend.shared.lean4_client - WARNING - Lean 4 workspace update failed: error: compiled configuration is invalid; run with '-R' to reconfigure
-
-
-P
-9:37:42 AM
-Proof framing enabled for this research run
-◉
-9:37:42 AM
-Topic exploration started (target: 5 candidates)
-✓
-9:38:13 AM
-Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 1)
-◈
-9:38:13 AM
-Exploration candidate 1/5 accepted:
-✓
-9:38:35 AM
-Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 2)
-◈
-9:38:37 AM
-Exploration candidate 2/5 accepted:
-✓
-9:38:55 AM
-Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 3)
-◈
-9:38:55 AM
-Exploration candidate 3/5 accepted:
-✓
-9:39:59 AM
-Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 4)
-◈
-9:39:59 AM
-Exploration candidate 4/5 accepted:
-✓
-9:40:26 AM
-Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 5)
-◈
-9:40:27 AM
-Exploration candidate 5/5 accepted:
-✓
-9:40:27 AM
-Topic exploration complete: 5 candidates collected from 5 attempts
-»
-9:41:04 AM
-Topic selected: How can the resolvent kernel and successive approximation theory for Volterra integral equations of the second kind be generalized to families of operators with time- or state-dependent coupling parameters, yielding explicit a-priori bounds on the deviation between solutions of the fully coupled system and those of its partly or fully decoupled truncations, thereby furnishing rigorous guarantees for controlled lossiness in variably-coupled computational models?
-✓
-9:41:41 AM
-Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 1)
-✓
-9:42:25 AM
-Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 2)
-✗
-9:43:15 AM
-Submitter 1 [grok-4.3]: ✗ REJECTED (total: 1)
-✓
-9:43:59 AM
-Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 3)
-✓
-9:44:57 AM
-Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 4)
-✓
-9:45:26 AM
-Submitter 3 [grok-4.3]: ✓ ACCEPTED (total: 5)
-✓
-9:46:17 AM
-Submitter 1 [grok-4.3]: ✓ ACCEPTED (total: 6)
-▶
-9:46:33 AM
-Manual override: Forcing paper writing for topic_001 (6 submissions)
-◌
-9:46:34 AM
-Proof check started for brainstorm topic_001
-#
-9:47:18 AM
-Proof check found 4 theorem candidate(s)
->
-9:48:19 AM
-Proof attempt 1 started: Let V(ε) be the one-parameter family of Volterra operators (V(ε)x)(t) := ∫_0^t K(t,s; ε λ(t,s)) x(s) ds for ε ∈ [0,1]. Let x(ε) solve x = f + V(ε)x in C([0,T];X). Then the deviation δ = x(1) − x(0) admits the representation δ(t) = ∫_0^1 R_ε (∂V/∂ε(ε) x(ε))(t) dε, and under the uniform bound ||K|| ≤ M and Lipschitz constant L of K w.r.t. its coupling argument, ||δ(t)|| ≤ L ||λ||_∞ ||f|| (t exp(M t) − (exp(M t)−1)/M).
->
-9:49:01 AM
-Proof attempt 1 started: Equip C([0,T];X) with the weighted norm |||x|||_\alpha := sup_t ||x(t)|| e^{-\alpha t}. Under linear growth and Lipschitz conditions on the kernel with constants M and L, the nonlinear Volterra map x ↦ f + V(x) is a contraction of ratio L/\alpha whenever \alpha > L. Consequently there exists a unique global solution satisfying ||x(t)|| ≤ C_\alpha exp(\alpha t). For a decoupled truncation V_0 the deviation δ satisfies the explicit weighted-norm bound |||δ|||_\alpha ≤ (ε_∞ / ((1 − L/\alpha) \alpha)) |||x_0|||_\alpha, which optimizes the exponential growth rate over admissible \alpha.
->
-9:49:26 AM
-Proof attempt 1 started: Let x and x_0 be the solutions corresponding to coupling functions λ and λ_0 ≡ 0 on selected blocks. Using the Neumann series expansions x = ∑ V_λ^n f and x_0 = ∑ V_0^n f, the deviation admits the telescoping representation δ = ∑_{n=1}^∞ (V_λ^n − V_0^n) f. Under the Lipschitz assumption on K, ||V_λ^n − V_0^n|| ≤ n M^{n−1} ε with ε ≤ L T ||λ||_∞, yielding the explicit bound ||δ(t)|| ≤ (ε t / (1 − M t)^2) exp(M t) ||f||_∞ for t < 1/M. The same telescoping argument produces a strictly sharper estimate than the crude resolvent bound whenever the support of λ − λ_0 has small measure.
->
-9:49:41 AM
-Proof attempt 1 started: For the block-structured Volterra operator T_λ = T_d + ΔT with measurable coupling λ : [0,T]×[0,T] → [0,1], the deviation δ = x − x_0 between the fully coupled and decoupled solutions satisfies the inhomogeneous Volterra equation δ = T_λ δ + ΔT x_0. The resolvent representation then gives the explicit integral bound ||δ(t)|| ≤ C ∫_0^t ε(s) exp(M t) ds, where ε(s) = sup_{u≤s} |λ(s,u)| · M_c(s) measures the effective coupling strength and C depends only on M and ||f||. The same bound continues locally for state-dependent λ(t,s,x(s)) as long as the solution remains inside a ball where the local Lipschitz constant is controlled.
-⚠
-9:55:51 AM
-Proof attempt 1 failed: MOTOProofCheck_4c04f51444d44489bd5de26445f30c60.lean:11:8: error: No goals to be solved MOTOProofCheck_4c04f51444d44489bd5de26445f30c60.lean:17:10: error(lean.unknownIdentifier): Unknown identifier `deriv_sub` MOTOProofCheck_4c04f51444d44489bd5de26445f30c60.lean:27:25: error(lean.invalidField): Invalid field `monotoneOn_of_deriv_nonneg`: The environment does not contain `Function.monotoneOn_of_deriv_nonneg`, so it is not possible to project the field `monotoneOn_of_deriv_nonneg` from an expressi...
->
-9:55:51 AM
-Proof attempt 2 started: Let V(ε) be the one-parameter family of Volterra operators (V(ε)x)(t) := ∫_0^t K(t,s; ε λ(t,s)) x(s) ds for ε ∈ [0,1]. Let x(ε) solve x = f + V(ε)x in C([0,T];X). Then the deviation δ = x(1) − x(0) admits the representation δ(t) = ∫_0^1 R_ε (∂V/∂ε(ε) x(ε))(t) dε, and under the uniform bound ||K|| ≤ M and Lipschitz constant L of K w.r.t. its coupling argument, ||δ(t)|| ≤ L ||λ||_∞ ||f|| (t exp(M t) − (exp(M t)−1)/M).
-⚠
-9:57:36 AM
-Proof attempt 2 failed: LEAN 4 WORKSPACE ERROR: Mathlib cache/workspace repair failed. This is an infrastructure problem, not a proof error. Lean reported missing or invalid compiled Mathlib artifacts. Original diagnostic: error: compiled configuration is invalid; run with '-R' to reconfigure
\ No newline at end of file
diff --git a/tests/test_lean4_client.py b/tests/test_lean4_client.py
index d5b97ac..a17d106 100644
--- a/tests/test_lean4_client.py
+++ b/tests/test_lean4_client.py
@@ -27,7 +27,7 @@ async def test_cache_fetch_retries_after_removing_failed_ltar_archive(self) -> N
             client = Lean4Client(lean_path=str(root / "lean.exe"), workspace_dir=str(workspace))
             calls: list[list[str]] = []
 
-            async def fake_run_process(args: list[str], *, cwd: Path, timeout: int) -> tuple[int, str, str]:
+            async def fake_run_process(args: list[str], *, cwd: Path, timeout: int | None = None) -> tuple[int, str, str]:
                 calls.append(args)
                 if args[1:] == ["update"]:
                     return 0, "updated", ""
@@ -49,6 +49,7 @@ async def fake_run_process(args: list[str], *, cwd: Path, timeout: int) -> tuple
                     ["update"],
                     ["exe", "cache", "get"],
                     ["exe", "cache", "get"],
+                    ["env", str(root / "lean.exe"), "MOTOProofWorkspace.lean"],
                 ],
             )
 
@@ -63,7 +64,7 @@ async def test_workspace_bootstrap_is_serialized(self) -> None:
             client = Lean4Client(lean_path=str(root / "lean.exe"), workspace_dir=str(workspace))
             calls: list[list[str]] = []
 
-            async def fake_run_process(args: list[str], *, cwd: Path, timeout: int) -> tuple[int, str, str]:
+            async def fake_run_process(args: list[str], *, cwd: Path, timeout: int | None = None) -> tuple[int, str, str]:
                 calls.append(args)
                 await asyncio.sleep(0.01)
                 return 0, "ok", ""
@@ -78,6 +79,7 @@ async def fake_run_process(args: list[str], *, cwd: Path, timeout: int) -> tuple
                 [
                     ["update"],
                     ["exe", "cache", "get"],
+                    ["env", str(root / "lean.exe"), "MOTOProofWorkspace.lean"],
                 ],
             )
 
diff --git a/tests/test_leanoj_coordinator.py b/tests/test_leanoj_coordinator.py
new file mode 100644
index 0000000..25ced91
--- /dev/null
+++ b/tests/test_leanoj_coordinator.py
@@ -0,0 +1,2255 @@
+import asyncio
+import unittest
+import tempfile
+from types import SimpleNamespace
+
+from backend.leanoj.core import leanoj_context as leanoj_context_module
+from backend.leanoj.core import leanoj_coordinator as leanoj_module
+from backend.leanoj.core.leanoj_context import LeanOJContextAllocation, leanoj_context_manager
+from backend.leanoj.core.leanoj_coordinator import LeanOJConfigurationError, LeanOJCoordinator
+from backend.leanoj.prompts import (
+    LEANOJ_FORMALIZATION_GUARDRAILS,
+    build_final_solution_review_prompt,
+    build_final_solver_prompt,
+)
+from backend.shared.boost_manager import BoostManager
+from backend.shared.config import system_config
+from backend.shared.models import DocumentChunk, LeanOJRoleConfig, LeanOJStartRequest, ProofRecord
+
+
+def _role() -> LeanOJRoleConfig:  # Shared fixture: role config pinned to the placeholder id "test-model".
+    return LeanOJRoleConfig(model_id="test-model")
+
+
+def _request() -> LeanOJStartRequest:  # Shared fixture: start request whose goal is the trivial `1 = 1`.
+    return LeanOJStartRequest(
+        user_prompt="Prove one equals one.",
+        lean_template="import Mathlib\n\nexample : 1 = 1 := by\n  sorry",  # proof body is a `sorry` placeholder
+        topic_generator=_role(),  # every role below reuses the same placeholder config
+        topic_validator=_role(),
+        brainstorm_submitters=[_role()],  # exactly one submitter; tests override this when they need more
+        brainstorm_validator=_role(),
+        path_decider=_role(),
+        final_solver=_role(),
+    )
+
+
+class LeanOJCoordinatorTests(unittest.IsolatedAsyncioTestCase):
+    async def _initialized_coordinator(self) -> LeanOJCoordinator:  # Helper: coordinator initialized from _request() with stubs installed.
+        coordinator = LeanOJCoordinator()
+        await coordinator.initialize(_request())
+
+        async def noop(*_args, **_kwargs):  # accepts any call and returns None
+            return None
+
+        coordinator._persist_state = noop  # type: ignore[method-assign]
+        coordinator._broadcast = noop  # type: ignore[method-assign]
+
+        async def fake_register(*_args, **_kwargs):  # returns a canned ProofRecord regardless of arguments
+            return ProofRecord(
+                proof_id="proof_leanoj_test",  # tests assert this id ends up in final_proof_id
+                theorem_statement="LeanOJ theorem",
+                source_type="leanoj_final",
+                source_id=coordinator.get_state().session_id,
+                lean_code="import Mathlib\n\nexample : 1 = 1 := by\n  rfl",
+                novel=True,
+                novelty_tier="mathematical_discovery",  # tests assert this tier ends up in final_novelty_tier
+                novelty_reasoning="test novelty",
+            )
+
+        coordinator._register_verified_leanoj_proof = fake_register  # type: ignore[method-assign]
+
+        async def fake_review(*_args, **_kwargs):  # always-accepting stub; tuple is (solved, feedback, lean_feedback)
+            return True, "Final review accepted.", "Lean 4 accepted with no diagnostics."
+
+        coordinator._review_final_solution_completion = fake_review  # type: ignore[method-assign]
+        return coordinator
+
+    def test_final_solver_prompt_has_no_phase_transition_contract(self) -> None:  # Final-solver prompt must not mention brainstorming.
+        prompt = build_final_solver_prompt(
+            "Prove one equals one.",
+            "import Mathlib\n\nexample : 1 = 1 := by\n  sorry",
+            "import Mathlib\n\nexample : 1 = 1 := by\n  sorry",
+            {"version": 1},
+            accepted_ideas=[],
+            verified_subproofs=[],
+            partial_proofs=[],
+            failed_feedback=[  # feedback deliberately carries brainstorm wording that must not reach the prompt
+                {
+                    "request": "final Proof Solver proof cycle",
+                    "error_summary": "failed 30 times and requested need_more_brainstorming",
+                }
+            ],
+            final_attempts=[
+                {
+                    "request": "final attempt",
+                    "error_summary": "prior final attempt failed",
+                }
+            ],
+            context_blocks={},
+        )
+
+        self.assertNotIn("stuck_needs_brainstorm", prompt)
+        self.assertNotIn("need_more_brainstorming", prompt)
+        self.assertNotIn("failed 30", prompt)  # the brainstorm-related feedback entry is absent from the prompt
+        self.assertNotIn("brainstorm", prompt.lower())  # case-insensitive catch-all
+        self.assertIn("You must choose exactly one action: edit_proof.", prompt)
+        self.assertIn(LEANOJ_FORMALIZATION_GUARDRAILS, prompt)  # guardrail text is embedded verbatim
+        self.assertIn("truncated natural subtraction", prompt)
+
+    def test_final_review_prompt_requires_semantic_cross_check(self) -> None:  # Review prompt must say Lean acceptance alone is insufficient.
+        prompt = build_final_solution_review_prompt(
+            "Solve the informal olympiad problem.",
+            "def answer (n : Nat) : Nat := sorry\n\ntheorem solution : True := by\n  sorry",  # template with placeholders
+            "def answer (n : Nat) : Nat := 0\n\ntheorem solution : True := by\n  trivial",  # candidate code with them filled in
+            "Lean should accept.",
+            "Lean 4 accepted with no diagnostics.",
+        )
+
+        self.assertIn(LEANOJ_FORMALIZATION_GUARDRAILS, prompt)  # guardrail text is embedded verbatim
+        self.assertIn("Lean acceptance is necessary but not sufficient", prompt)
+        self.assertIn("does not automatically prove the user's informal problem statement", prompt)
+
+    async def test_final_loop_retries_until_lean_verifies(self) -> None:  # A failed Lean check is followed by a second, passing attempt.
+        request = _request()
+        old_data_dir = system_config.data_dir  # saved so the finally block can restore the global config
+
+        responses = [  # handed out in order by fake_call_json via pop(0)
+            {"lean_code": "import Mathlib\n\nexample : 1 = 1 := by\n  simp", "reasoning": "first try"},
+            {"lean_code": "import Mathlib\n\nexample : 1 = 1 := by\n  rfl", "reasoning": "fix"},
+        ]
+
+        async def fake_call_json(_config, task_prefix, *_args, **_kwargs):  # stand-in for coordinator._call_json
+            if task_prefix == "leanoj_master_proof_edit_val":  # the edit validator must never be consulted here
+                raise AssertionError("Tiny placeholder replacement should not require shortening validation")
+            if task_prefix == "leanoj_final_review":
+                return {"solved": True, "reasoning": "final answer complete"}
+            return responses.pop(0)
+
+        class FakeLean:  # fails the first check_proof call and passes every later one
+            def __init__(self) -> None:
+                self.calls = 0
+
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                self.calls += 1
+                if self.calls == 1:
+                    return SimpleNamespace(success=False, error_output="unsolved goals")
+                return SimpleNamespace(success=True, error_output="")
+
+        fake_lean = FakeLean()
+        old_get_lean4_client = leanoj_module.get_lean4_client  # saved so the module-level factory can be restored
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: fake_lean  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(coordinator.get_state().phase, "verified")
+                self.assertEqual(coordinator.get_state().final_attempt_count, 2)  # one failed attempt plus one passing
+                self.assertIn("rfl", coordinator.get_state().final_solution)  # the second response is the stored solution
+                self.assertEqual(coordinator.get_state().final_proof_id, "proof_leanoj_test")
+                self.assertEqual(coordinator.get_state().final_novelty_tier, "mathematical_discovery")
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_path_decision_replaces_removed_proof_storm_with_brainstorming(self) -> None:  # Legacy path value is mapped to brainstorming.
+        request = _request()
+        coordinator = await self._initialized_coordinator()
+        coordinator._accepted_ideas.append("Useful accepted idea.")
+
+        async def fake_context_blocks(*_args, **_kwargs):  # no context blocks
+            return {}
+
+        async def fake_call_json(*_args, **_kwargs):  # model answers with the legacy "need_proof_storm" path
+            return {"path": "need_proof_storm", "reasoning": "legacy path"}
+
+        async def fake_validate(*_args, **_kwargs):  # returns (True, "") for any decision
+            return True, ""
+
+        coordinator._build_context_blocks = fake_context_blocks  # type: ignore[method-assign]
+        coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+        coordinator._validate_path_decision = fake_validate  # type: ignore[method-assign]
+
+        decision = await coordinator._path_decision_phase(request)
+
+        self.assertEqual(decision, "need_more_brainstorming")
+        self.assertNotIn("need_proof_storm", leanoj_module._LEANOJ_PATH_OPTIONS)  # legacy value is not a listed option
+
+    async def test_recursive_brainstorm_starts_proof_memory_without_topic_prepass(self) -> None:  # Recursive phase makes one brainstorm call.
+        request = _request().model_copy(  # same fixture request, but with three distinct submitters
+            update={
+                "brainstorm_submitters": [
+                    LeanOJRoleConfig(model_id="submitter-1"),
+                    LeanOJRoleConfig(model_id="submitter-2"),
+                    LeanOJRoleConfig(model_id="submitter-3"),
+                ],
+            }
+        )
+        coordinator = LeanOJCoordinator()
+        await coordinator.initialize(request)
+
+        async def noop(*_args, **_kwargs):
+            return None
+
+        brainstorm_calls: list[dict[str, object]] = []  # keyword arguments of each intercepted call
+        async def fake_brainstorm_until_path_check(*_args, **_kwargs):
+            brainstorm_calls.append(dict(_kwargs))  # copy the kwargs so the assertions below can inspect them
+            return None
+
+        coordinator._persist_state = noop  # type: ignore[method-assign]
+        coordinator._broadcast = noop  # type: ignore[method-assign]
+        coordinator._brainstorm_until_path_check = fake_brainstorm_until_path_check  # type: ignore[method-assign]
+
+        await coordinator._recursive_brainstorm_phase(request)
+
+        self.assertEqual(len(brainstorm_calls), 1)  # exactly one brainstorm call
+        self.assertEqual(brainstorm_calls[0]["phase_key"], "recursive_brainstorm")
+        self.assertNotIn("_".join(["recursive", "topics"]), coordinator.get_status())  # joined value is "recursive_topics"
+
+    async def test_topic_dequeue_respects_remaining_capacity_without_dropping(self) -> None:  # max_count=1 takes one topic and leaves the rest.
+        coordinator = LeanOJCoordinator()
+        topic_queue: asyncio.Queue[tuple[int, str]] = asyncio.Queue()
+        await topic_queue.put((1, "topic one"))
+        await topic_queue.put((2, "topic two"))
+        await topic_queue.put((3, "topic three"))
+
+        batch = await coordinator._dequeue_topic_batch(topic_queue, max_count=1)  # type: ignore[attr-defined]
+
+        self.assertEqual(batch, [(1, "topic one")])  # only the first queued topic is returned
+        self.assertEqual(topic_queue.qsize(), 2)  # the other two are still queued
+
+    async def test_brainstorm_queue_global_pause_uses_shared_threshold(self) -> None:  # Reaching the global threshold pauses every submitter.
+        old_global_threshold = system_config.queue_overflow_threshold  # saved so finally can restore the global config
+        old_submitter_threshold = system_config.per_submitter_queue_threshold
+        try:
+            system_config.queue_overflow_threshold = 3  # equals the number of items queued below
+            system_config.per_submitter_queue_threshold = 2  # each submitter queues only one item, below this value
+            queue = leanoj_module._LeanOJBrainstormSubmissionQueue(submitter_count=3)  # type: ignore[attr-defined]
+
+            await queue.put((1, "submission one", {}))  # one item from each of the three submitters
+            await queue.put((2, "submission two", {}))
+            await queue.put((3, "submission three", {}))
+
+            self.assertTrue(queue.should_pause_submitter(1))
+            self.assertTrue(queue.should_pause_submitter(2))
+            self.assertTrue(queue.should_pause_submitter(3))
+            transitions = queue.refresh_pause_transitions()
+            self.assertTrue(transitions["global_paused"])
+            self.assertTrue(transitions["global_changed"])
+        finally:
+            system_config.queue_overflow_threshold = old_global_threshold
+            system_config.per_submitter_queue_threshold = old_submitter_threshold
+
+    async def test_brainstorm_queue_pauses_only_overrepresented_submitter(self) -> None:  # Only the submitter over its own threshold pauses.
+        old_global_threshold = system_config.queue_overflow_threshold  # saved so finally can restore the global config
+        old_submitter_threshold = system_config.per_submitter_queue_threshold
+        try:
+            system_config.queue_overflow_threshold = 10  # well above the three items queued below
+            system_config.per_submitter_queue_threshold = 2
+            queue = leanoj_module._LeanOJBrainstormSubmissionQueue(submitter_count=3)  # type: ignore[attr-defined]
+
+            await queue.put((1, "submission one", {}))  # all three items come from submitter 1
+            await queue.put((1, "submission two", {}))
+            await queue.put((1, "submission three", {}))
+
+            self.assertTrue(queue.should_pause_submitter(1))
+            self.assertFalse(queue.should_pause_submitter(2))
+            self.assertFalse(queue.should_pause_submitter(3))
+            transitions = queue.refresh_pause_transitions()
+            self.assertFalse(transitions["global_paused"])
+            self.assertEqual(transitions["submitters_paused"], {1})  # a set of submitter ids
+        finally:
+            system_config.queue_overflow_threshold = old_global_threshold
+            system_config.per_submitter_queue_threshold = old_submitter_threshold
+
+    async def test_brainstorm_queue_skips_per_submitter_pause_for_single_submitter(self) -> None:  # A lone submitter is never paused per-submitter.
+        old_global_threshold = system_config.queue_overflow_threshold  # saved so finally can restore the global config
+        old_submitter_threshold = system_config.per_submitter_queue_threshold
+        try:
+            system_config.queue_overflow_threshold = 10  # well above the three items queued below
+            system_config.per_submitter_queue_threshold = 2  # exceeded by the three items queued below
+            queue = leanoj_module._LeanOJBrainstormSubmissionQueue(submitter_count=1)  # type: ignore[attr-defined]
+
+            await queue.put((1, "submission one", {}))
+            await queue.put((1, "submission two", {}))
+            await queue.put((1, "submission three", {}))
+
+            self.assertFalse(queue.should_pause_submitter(1))  # not paused despite three pending items
+            transitions = queue.refresh_pause_transitions()
+            self.assertFalse(transitions["global_paused"])
+            self.assertEqual(transitions["submitters_paused"], set())
+        finally:
+            system_config.queue_overflow_threshold = old_global_threshold
+            system_config.per_submitter_queue_threshold = old_submitter_threshold
+
+    async def test_brainstorm_dequeue_updates_submitter_pending_counts(self) -> None:  # Dequeuing lowers per-submitter counts and lifts the pause.
+        old_global_threshold = system_config.queue_overflow_threshold  # saved so finally can restore the global config
+        old_submitter_threshold = system_config.per_submitter_queue_threshold
+        try:
+            system_config.queue_overflow_threshold = 10
+            system_config.per_submitter_queue_threshold = 1
+            coordinator = LeanOJCoordinator()
+            queue = leanoj_module._LeanOJBrainstormSubmissionQueue(submitter_count=2)  # type: ignore[attr-defined]
+
+            await queue.put((1, "submission one", {}))  # two items from submitter 1, then one from submitter 2
+            await queue.put((1, "submission two", {}))
+            await queue.put((2, "submission three", {}))
+
+            self.assertTrue(queue.should_pause_submitter(1))  # paused before anything is dequeued
+            batch = await coordinator._dequeue_brainstorm_batch(queue, max_count=2)  # type: ignore[attr-defined]
+
+            self.assertEqual(  # the two oldest items come back in insertion order
+                batch,
+                [
+                    (1, "submission one", {}),
+                    (1, "submission two", {}),
+                ],
+            )
+            self.assertEqual(queue.count_for_submitter(1), 0)
+            self.assertEqual(queue.count_for_submitter(2), 1)
+            self.assertFalse(queue.should_pause_submitter(1))  # pause no longer applies after the dequeue
+            self.assertEqual(queue.qsize(), 1)
+        finally:
+            system_config.queue_overflow_threshold = old_global_threshold
+            system_config.per_submitter_queue_threshold = old_submitter_threshold
+
+    async def test_accepted_brainstorm_proof_records_verified_subproof_context(self) -> None:  # An accepted brainstorm proof becomes a verified subproof.
+        request = _request()
+        coordinator = await self._initialized_coordinator()
+
+        await coordinator._record_accepted_brainstorm_proof(
+            request,
+            1,
+            {
+                "brainstorm_lean_proof": {
+                    "theorem_statement": "True is true.",
+                    "theorem_name": "brainstorm_true",
+                    "formal_sketch": "Proof fragment from brainstorm.",
+                    "lean_code": "import Mathlib\n\ntheorem brainstorm_true : True := by trivial",
+                    "attempt_count": 2,  # asserted below to surface as attempts_used
+                }
+            },
+        )
+
+        self.assertEqual(len(coordinator.get_state().verified_subproofs), 1)  # exactly one subproof was recorded
+        proof = coordinator.get_state().verified_subproofs[0]
+        self.assertTrue(proof.verified)
+        self.assertEqual(proof.attempts_used, 2)
+        self.assertIn("brainstorm_true", proof.lean_code)
+
+    async def test_final_loop_edits_master_proof_before_lean_verification(self) -> None:  # Two chained edits end in one verified attempt.
+        request = _request()
+        old_data_dir = system_config.data_dir  # saved so the finally block can restore the global config
+
+        responses = [  # handed out in order by fake_call_json via pop(0)
+            {
+                "action": "edit_proof",
+                "needs_more_time": True,  # first edit: sorry -> simp
+                "operation": "replace",
+                "old_string": "sorry",
+                "new_string": "simp",
+                "reasoning": "First close the obvious placeholder, but keep editing time.",
+            },
+            {
+                "action": "edit_proof",
+                "needs_more_time": False,  # second edit: simp -> rfl
+                "operation": "replace",
+                "old_string": "simp",
+                "new_string": "rfl",
+                "reasoning": "Use the final proof term and verify now.",
+            },
+        ]
+
+        async def fake_call_json(_config, task_prefix, *_args, **_kwargs):  # stand-in for coordinator._call_json
+            if task_prefix == "leanoj_final_review":
+                return {"solved": True, "reasoning": "final answer complete"}
+            return responses.pop(0)
+
+        class FakeLean:  # always succeeds; counts calls and remembers the last code it was given
+            def __init__(self) -> None:
+                self.calls = 0
+                self.seen_code = ""
+
+            async def check_proof(self, code: str, timeout: int = 120, **_kwargs):
+                self.calls += 1
+                self.seen_code = code
+                return SimpleNamespace(success=True, error_output="")
+
+        fake_lean = FakeLean()
+        old_get_lean4_client = leanoj_module.get_lean4_client  # saved so the module-level factory can be restored
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: fake_lean  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(fake_lean.calls, 2)  # check_proof ran exactly twice
+                self.assertIn("rfl", fake_lean.seen_code)  # the last checked code carries the second edit
+                self.assertNotIn("simp", fake_lean.seen_code)
+                self.assertEqual(coordinator.get_state().phase, "verified")
+                self.assertEqual(coordinator.get_state().final_attempt_count, 1)  # both edits count as one attempt
+                self.assertEqual(coordinator.get_state().master_proof_version, 3)
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_final_loop_continues_when_final_review_rejects_lean_pass(self) -> None:  # A rejecting review overrides Lean success.
+        request = _request()
+        request.final_attempts_per_cycle = 1
+        old_data_dir = system_config.data_dir  # saved so the finally block can restore the global config
+
+        async def fake_call_json(*_args, **_kwargs):  # always proposes the same sorry -> rfl edit
+            return {
+                "action": "edit_proof",
+                "needs_more_time": False,
+                "operation": "replace",
+                "old_string": "sorry",
+                "new_string": "rfl",
+                "reasoning": "Lean should accept this equality proof.",
+            }
+
+        class FakeLean:  # always reports success, with a non-empty diagnostic_output
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                return SimpleNamespace(
+                    success=True,
+                    error_output="",
+                    diagnostic_output="Lean 4 accepted with an informational diagnostic.",
+                    goal_states="",
+                    raw_stderr="",
+                )
+
+        old_get_lean4_client = leanoj_module.get_lean4_client  # saved so the module-level factory can be restored
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+
+                async def reject_review(*_args, **_kwargs):  # replaces the accepting stub set by the helper
+                    return (
+                        False,
+                        "The Lean proof checks, but it does not answer the actual problem prompt.",
+                        "Lean 4 accepted with an informational diagnostic.",
+                    )
+
+                coordinator._review_final_solution_completion = reject_review  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(coordinator.get_state().phase, "path_decision")  # not "verified"
+                self.assertFalse(coordinator.get_state().final_solution)  # no solution was stored
+                self.assertIn("FINAL SOLUTION REVIEW REJECTED", coordinator._final_attempts[-1]["error_summary"])  # type: ignore[attr-defined]
+                self.assertIn("informational diagnostic", coordinator._final_attempts[-1]["lean_feedback"])  # type: ignore[attr-defined]
+                self.assertTrue(
+                    any(
+                        "actual problem prompt" in feedback.get("error_summary", "")
+                        for feedback in coordinator._failed_feedback  # type: ignore[attr-defined]
+                    )
+                )
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_final_solution_review_prompt_includes_problem_template_code_and_lean_feedback(self) -> None:
+        request = _request()  # Purpose: exercise the real review method and inspect the prompt it sends.
+        coordinator = LeanOJCoordinator()  # used without calling initialize()
+        captured_prompt = ""
+
+        async def fake_call_json(_config, task_prefix, role_id, prompt, **_kwargs):  # captures the prompt and checks routing
+            nonlocal captured_prompt
+            captured_prompt = prompt
+            self.assertEqual(task_prefix, "leanoj_final_review")
+            self.assertEqual(role_id, "leanoj_final_solver")
+            return {
+                "solved": False,
+                "continuation_feedback": "Give an explicit answer instead of a circular maximum.",
+                "reasoning": "The formal code is evasive.",
+            }
+
+        coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+        solved, feedback, lean_feedback = await LeanOJCoordinator._review_final_solution_completion(  # called through the class
+            coordinator,
+            request,
+            lean_code="import Mathlib\n\nexample : 1 = 1 := by\n  rfl",
+            final_solver_reasoning="This should close the template.",
+            lean_result=SimpleNamespace(
+                success=True,
+                error_output="",
+                diagnostic_output="Lean 4 accepted with a useful warning.",
+                goal_states="",
+                raw_stderr="",
+            ),
+        )
+
+        self.assertFalse(solved)
+        self.assertIn("explicit answer", feedback)  # text from the stub's continuation_feedback
+        self.assertIn("useful warning", lean_feedback)  # text from lean_result.diagnostic_output
+        self.assertIn(request.user_prompt, captured_prompt)
+        self.assertIn(request.lean_template, captured_prompt)
+        self.assertIn("example : 1 = 1", captured_prompt)
+        self.assertIn("Lean 4 accepted with a useful warning.", captured_prompt)
+        self.assertIn("maximum/supremum over the same feasible set", captured_prompt)
+
+    async def test_final_review_can_reject_evasive_lean_accepted_answer(self) -> None:  # Review rejection blocks a Lean-accepted answer.
+        request = _request()
+        request.lean_template = (  # template asks for `answer` and a proof that it is the greatest element of S n
+            "import Mathlib.Data.Finset.Card\n"
+            "import Mathlib.Order.Bounds.Defs\n\n"
+            "def answer (n : ℕ) : ℕ := sorry\n\n"
+            "def S (n : ℕ) : Set ℕ := { a : ℕ | a = 0 }\n\n"
+            "theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := sorry"
+        )
+        request.final_attempts_per_cycle = 1
+        old_data_dir = system_config.data_dir  # saved so the finally block can restore the global config
+        evasive_code = (  # defines `answer` as the max of a `candidates` finset
+            "import Mathlib.Data.Finset.Card\n"
+            "import Mathlib.Order.Bounds.Defs\n"
+            "import Mathlib\n\n"
+            "noncomputable def candidates (n : ℕ) : Finset ℕ := {0}\n"
+            "noncomputable def answer (n : ℕ) : ℕ := (candidates n).max' (by simp [candidates])\n\n"
+            "def S (n : ℕ) : Set ℕ := { a : ℕ | a = 0 }\n\n"
+            "theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := by\n"
+            "  exact ⟨by simp [S, answer, candidates], by intro y hy; simp [S, answer, candidates] at hy ⊢⟩"
+        )
+
+        async def fake_call_json(*_args, **_kwargs):  # always returns the evasive code as the solver's answer
+            return {"lean_code": evasive_code, "reasoning": "Lean accepts this maximum-based construction."}
+
+        class FakeLean:  # always reports success with empty diagnostics
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                return SimpleNamespace(success=True, error_output="", diagnostic_output="", goal_states="", raw_stderr="")
+
+        old_get_lean4_client = leanoj_module.get_lean4_client  # saved so the module-level factory can be restored
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+
+                async def reject_evasive_review(*_args, lean_code: str, **_kwargs):  # requires lean_code as a keyword argument
+                    self.assertIn("candidates", lean_code)  # the review receives the evasive code
+                    return False, "This defines `answer` by searching candidates instead of giving the requested formula.", ""
+
+                coordinator._review_final_solution_completion = reject_evasive_review  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(coordinator.get_state().phase, "path_decision")  # not "verified"
+                self.assertFalse(coordinator.get_state().final_solution)  # no solution was stored
+                self.assertIn("searching candidates", coordinator._final_attempts[-1]["error_summary"])  # type: ignore[attr-defined]
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_final_loop_rejects_duplicate_master_proof_old_string(self) -> None:  # An old_string matching twice is refused before Lean runs.
+        request = _request()
+        request.lean_template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry\n\nexample : 2 = 2 := by\n  sorry"  # two `sorry`
+        request.final_attempts_per_cycle = 1
+        old_data_dir = system_config.data_dir  # saved so the finally block can restore the global config
+
+        async def fake_call_json(*_args, **_kwargs):  # proposes replacing "sorry", which occurs twice in the template
+            return {
+                "action": "edit_proof",
+                "needs_more_time": False,
+                "operation": "replace",
+                "old_string": "sorry",
+                "new_string": "rfl",
+                "reasoning": "Ambiguous edit.",
+            }
+
+        class FakeLean:  # would succeed if called; the call counter is asserted to stay at zero
+            def __init__(self) -> None:
+                self.calls = 0
+
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                self.calls += 1
+                return SimpleNamespace(success=True, error_output="")
+
+        fake_lean = FakeLean()
+        old_get_lean4_client = leanoj_module.get_lean4_client  # saved so the module-level factory can be restored
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: fake_lean  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(fake_lean.calls, 0)  # Lean was never invoked
+                self.assertEqual(coordinator.get_state().final_attempt_count, 1)  # the refused edit still counts as an attempt
+                self.assertIn("appears 2 times", coordinator._final_attempts[-1]["error_summary"])  # type: ignore[attr-defined]
+                self.assertEqual(coordinator.get_state().phase, "path_decision")
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_final_loop_rejects_nonprogressive_shortening_before_write(self) -> None:  # A validator-rejected shortening is never written.
+        request = _request()
+        request.lean_template = (  # template already holds a proved helper that the proposed edit would delete
+            "import Mathlib\n\n"
+            "theorem helper : True := by\n"
+            "  trivial\n\n"
+            "example : True := by\n"
+            "  exact helper"
+        )
+        request.final_attempts_per_cycle = 1
+        old_data_dir = system_config.data_dir  # saved so the finally block can restore the global config
+        events: list[tuple[str, dict]] = []  # (event name, payload) pairs recorded by capture_broadcast
+
+        async def fake_call_json(_config, task_prefix, role_id, _prompt, **_kwargs):  # answers as validator or solver by task_prefix
+            if task_prefix == "leanoj_master_proof_edit_val":  # validator call: reject the edit
+                self.assertEqual(role_id, "leanoj_master_proof_edit_validator")
+                return {
+                    "decision": "reject",
+                    "reasoning": "The edit deletes the proved helper and returns to a placeholder.",
+                    "feedback_to_submitter": "Restore theorem helper or replace it with an equivalent proof before shortening.",
+                }
+            return {  # any other call: propose a full rewrite that is shorter than the template
+                "action": "edit_proof",
+                "needs_more_time": False,
+                "operation": "full_content",
+                "new_string": "import Mathlib\n\nexample : True := by\n  sorry",
+                "reasoning": "Shorten the file by restarting from the goal.",
+            }
+
+        class FakeLean:  # raises if check_proof is ever called
+            def __init__(self) -> None:
+                self.calls = 0
+
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                self.calls += 1
+                raise AssertionError("Lean should not run after validator rejects the shortening edit")
+
+        fake_lean = FakeLean()
+        old_get_lean4_client = leanoj_module.get_lean4_client  # saved so the module-level factory can be restored
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+
+                async def capture_broadcast(event: str, data: dict | None = None):  # replaces the helper's no-op broadcast
+                    events.append((event, data or {}))
+
+                coordinator._broadcast = capture_broadcast  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: fake_lean  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(fake_lean.calls, 0)  # Lean was never invoked
+                self.assertEqual(await coordinator._read_master_proof(), request.lean_template.strip())  # type: ignore[attr-defined]
+                self.assertEqual(coordinator.get_state().final_attempt_count, 1)  # the rejected edit still counts as an attempt
+                self.assertEqual(coordinator.get_state().phase, "path_decision")
+                self.assertIn("Restore theorem helper", coordinator._final_attempts[-1]["error_summary"])  # type: ignore[attr-defined]
+                self.assertTrue(
+                    any(
+                        "Restore theorem helper" in feedback.get("error_summary", "")
+                        for feedback in coordinator._failed_feedback  # type: ignore[attr-defined]
+                    )
+                )
+                self.assertIn("leanoj_master_proof_edit_rejected", [event for event, _data in events])  # rejection was broadcast
+                edits = await coordinator.get_master_proof_edit_summaries(limit=1)
+                self.assertFalse(edits["edits"][0]["accepted"])  # the edit summary records the rejection
+                self.assertIn("Restore theorem helper", edits["edits"][0]["validator_feedback"])
+                self.assertGreater(edits["edits"][0]["shortening_metrics"]["line_delta_removed"], 0)
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_final_loop_allows_validator_accepted_shortening(self) -> None:  # A shortening edit the validator accepts must be sent to Lean and end as the stored, verified master proof.
+        request = _request()
+        request.lean_template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        old_data_dir = system_config.data_dir  # saved so the finally block can restore the shared config
+
+        shortened_code = "import Mathlib\n\nexample : 1 = 1 := by\n  rfl"  # the full-content replacement the fake solver proposes
+
+        async def fake_call_json(_config, task_prefix, role_id, _prompt, **_kwargs):  # stand-in for coordinator._call_json
+            if task_prefix == "leanoj_master_proof_edit_val":  # validator call: always accept
+                self.assertEqual(role_id, "leanoj_master_proof_edit_validator")
+                return {
+                    "decision": "accept",
+                    "reasoning": "The shorter proof removes only redundant helper scaffolding and keeps the solved template.",
+                    "feedback_to_submitter": "",
+                }
+            return {  # any other call: propose replacing the whole file with shortened_code
+                "action": "edit_proof",
+                "needs_more_time": False,
+                "operation": "full_content",
+                "new_string": shortened_code,
+                "reasoning": "Replace the verbose draft with the direct final proof.",
+            }
+
+        class FakeLean:  # Lean client double: counts calls, remembers the last code, always reports success
+            def __init__(self) -> None:
+                self.calls = 0
+                self.seen_code = ""
+
+            async def check_proof(self, code: str, timeout: int = 120, **_kwargs):
+                self.calls += 1
+                self.seen_code = code
+                return SimpleNamespace(success=True, error_output="", diagnostic_output="", goal_states="", raw_stderr="")
+
+        fake_lean = FakeLean()
+        old_get_lean4_client = leanoj_module.get_lean4_client  # original factory, restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                await coordinator._write_master_proof(  # type: ignore[attr-defined]
+                    "import Mathlib\n\n"
+                    "theorem helper : 1 = 1 := by\n"
+                    "  rfl\n\n"
+                    "example : 1 = 1 := by\n"
+                    "  exact helper",
+                    summary="verbose seed",
+                )
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: fake_lean  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(fake_lean.calls, 1)  # exactly one Lean check
+                self.assertEqual(fake_lean.seen_code, shortened_code)  # Lean saw the shortened file, not the verbose seed
+                self.assertEqual(coordinator.get_state().phase, "verified")
+                self.assertEqual(await coordinator._read_master_proof(), shortened_code)  # type: ignore[attr-defined]
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_final_loop_rejects_phase_transition_action_as_invalid_edit(self) -> None:  # A "phase_transition" action in the final loop must count as an invalid attempt and never reach Lean.
+        request = _request()
+        request.final_attempts_per_cycle = 3  # the assertions below expect exactly three attempts
+        old_data_dir = system_config.data_dir  # restored in finally
+        call_count = 0
+
+        async def fake_call_json(*_args, **_kwargs):  # stand-in for coordinator._call_json: always returns the invalid action
+            nonlocal call_count
+            call_count += 1
+            return {
+                "action": "phase_transition",
+                "reasoning": "Trying to leave final mode should be rejected.",
+            }
+
+        class FakeLean:  # Lean client double that fails the test if it is ever invoked
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                raise AssertionError("Lean should not be called for an invalid final solver action")
+
+        old_get_lean4_client = leanoj_module.get_lean4_client  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(coordinator.get_state().phase, "path_decision")
+                self.assertEqual(coordinator.get_state().current_path_decision, "need_more_brainstorming")
+                self.assertEqual(call_count, 3)  # one model call per allowed attempt
+                self.assertEqual(coordinator.get_state().final_attempt_count, 3)
+                self.assertIn("Invalid final solver action", coordinator._final_attempts[-1]["error_summary"])  # type: ignore[attr-defined]
+                self.assertNotIn("brainstorm", coordinator._final_attempts[-1]["error_summary"].lower())  # type: ignore[attr-defined]
+                self.assertFalse(coordinator.get_state().master_proof_last_stuck_reason)  # no stuck reason is recorded for invalid actions
+                self.assertEqual(await coordinator._read_master_proof(), request.lean_template.strip())  # type: ignore[attr-defined]
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_skip_brainstorm_enters_final_loop_without_path_decision(self) -> None:  # With the skip flag set, _run_workflow must call the final loop once and never call path decision.
+        request = _request()
+        coordinator = await self._initialized_coordinator()
+        coordinator._state.phase = "recursive_brainstorm"  # type: ignore[attr-defined]
+        coordinator._state.skip_brainstorm_requested = True  # type: ignore[attr-defined]
+        final_loop_calls = 0
+
+        async def fake_final_proof_loop(_request):  # counts invocations and marks the run verified
+            nonlocal final_loop_calls
+            final_loop_calls += 1
+            coordinator._state.phase = "verified"  # type: ignore[attr-defined]
+
+        async def fail_path_decision(_request):  # tripwire: fails the test if path decision runs
+            raise AssertionError("Path decision should not run after brainstorm skip")
+
+        coordinator._final_proof_loop = fake_final_proof_loop  # type: ignore[method-assign]
+        coordinator._path_decision_phase = fail_path_decision  # type: ignore[method-assign]
+
+        await coordinator._run_workflow(request)  # type: ignore[attr-defined]
+
+        self.assertEqual(final_loop_calls, 1)
+        self.assertFalse(coordinator.get_state().skip_brainstorm_requested)  # the skip flag is cleared after use
+        self.assertEqual(coordinator.get_state().current_path_decision, "solve_final_now")
+        self.assertEqual(coordinator.get_state().phase, "verified")
+
+    async def test_forced_final_phase_runs_before_next_path_decision(self) -> None:  # When brainstorm hands off with user_forced_final_cycle set, the final loop must run before any path decision.
+        request = _request()
+        coordinator = await self._initialized_coordinator()
+        coordinator._state.phase = "recursive_brainstorm"  # type: ignore[attr-defined]
+        final_loop_calls = 0
+
+        async def fake_recursive_brainstorm(_request):  # moves the state to a forced final cycle
+            coordinator._state.phase = "final_proof_loop"  # type: ignore[attr-defined]
+            coordinator._state.user_forced_final_cycle = True  # type: ignore[attr-defined]
+
+        async def fake_final_proof_loop(_request):  # counts invocations, clears the forced flag, marks the run verified
+            nonlocal final_loop_calls
+            final_loop_calls += 1
+            coordinator._state.user_forced_final_cycle = False  # type: ignore[attr-defined]
+            coordinator._state.phase = "verified"  # type: ignore[attr-defined]
+
+        async def fail_path_decision(_request):  # tripwire: fails the test if path decision runs
+            raise AssertionError("Path decision should not run while forced final cycle is active")
+
+        coordinator._recursive_brainstorm_phase = fake_recursive_brainstorm  # type: ignore[method-assign]
+        coordinator._final_proof_loop = fake_final_proof_loop  # type: ignore[method-assign]
+        coordinator._path_decision_phase = fail_path_decision  # type: ignore[method-assign]
+
+        await coordinator._run_workflow(request)  # type: ignore[attr-defined]
+
+        self.assertEqual(final_loop_calls, 1)
+        self.assertEqual(coordinator.get_state().phase, "verified")
+
+    async def test_forced_final_cycle_uses_all_attempts_before_path(self) -> None:  # A forced final cycle must use all 3 attempts, then clear the forced flag and fall back to path_decision.
+        request = _request().model_copy(update={"final_attempts_per_cycle": 3})
+        coordinator = await self._initialized_coordinator()  # NOTE(review): unlike the sibling invalid-action test, data_dir is not redirected to a temp dir and the Lean client is not stubbed here - confirm _initialized_coordinator isolates storage
+        coordinator._state.user_forced_final_cycle = True  # type: ignore[attr-defined]
+        call_count = 0
+
+        async def fake_call_json(*_args, **_kwargs):  # stand-in for coordinator._call_json: always returns an invalid action
+            nonlocal call_count
+            call_count += 1
+            return {
+                "action": "phase_transition",
+                "reasoning": f"invalid action {call_count}",
+            }
+
+        coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+
+        await coordinator._final_proof_loop(request)
+
+        self.assertEqual(call_count, 3)  # one model call per allowed attempt
+        self.assertEqual(coordinator.get_state().final_attempt_count, 3)
+        self.assertFalse(coordinator.get_state().user_forced_final_cycle)  # forced flag is cleared once the cycle ends
+        self.assertEqual(coordinator.get_state().phase, "path_decision")
+        self.assertEqual(coordinator.get_state().current_path_decision, "need_more_brainstorming")
+
+    async def test_recursive_brainstorm_targets_current_working_proof_attempt(self) -> None:  # After a stuck final attempt, the brainstorm prompt must target repairing the current master proof, not the original topic.
+        request = _request()
+        old_data_dir = system_config.data_dir  # restored in finally
+        old_allocate = leanoj_module.leanoj_context_manager.allocate_context  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._state.phase = "recursive_brainstorm"  # type: ignore[attr-defined]
+                coordinator._state.selected_topic = "Original broad equality topic"  # must NOT appear as the active topic in the prompt
+                await coordinator._write_master_proof(  # type: ignore[attr-defined]
+                    "import Mathlib\n\nexample : 1 = 1 := by\n  have h : 1 = 1 := by\n    sorry",
+                    summary="latest draft",
+                )
+                coordinator._final_attempts.append(  # type: ignore[attr-defined]
+                    {
+                        "request": "final Proof Solver solution",
+                        "error_summary": "unsolved goals at h",
+                        "lean_code": "bad final",
+                    }
+                )
+                await coordinator._set_current_working_proof_attempt(  # type: ignore[attr-defined]
+                    trigger="final_solver_stuck",
+                    requested_path="need_more_brainstorming",
+                    stuck_reason="Need a way to close h.",
+                )
+
+                async def fake_allocate_context(**kwargs):  # replaces allocate_context: renders the packet's master proof and recent attempts into one block
+                    packet = kwargs.get("current_working_proof_attempt") or {}
+                    return LeanOJContextAllocation(
+                        current_working_proof_attempt=(
+                            "CURRENT WORKING PROOF ATTEMPT\n"
+                            f"{packet.get('master_proof', '')}\n"
+                            f"{packet.get('recent_final_attempts', '')}"
+                        )
+                    )
+
+                prompts = []  # prompts captured from the stubbed model call
+
+                async def fake_call_json(_config, _task_prefix, _role_id, prompt, **_kwargs):  # records the prompt and sets the stop event
+                    prompts.append(prompt)
+                    coordinator._stop_event.set()  # type: ignore[attr-defined]
+                    return {"submission": "Use rfl to close the local equality.", "reasoning": "direct repair"}
+
+                leanoj_module.leanoj_context_manager.allocate_context = fake_allocate_context  # type: ignore[assignment]
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                queue = leanoj_module._LeanOJBrainstormSubmissionQueue(submitter_count=1)  # type: ignore[attr-defined]
+
+                await coordinator._brainstorm_submitter_loop(request, 1, request.brainstorm_submitters[0], queue)  # type: ignore[attr-defined]
+
+                self.assertTrue(prompts)  # at least one model call happened
+                prompt = prompts[0]
+                self.assertIn("ACTIVE TOPIC:\nRepair and complete the current Proof Solver master proof attempt", prompt)
+                self.assertNotIn("ACTIVE TOPIC:\nOriginal broad equality topic", prompt)
+                self.assertIn("CURRENT WORKING PROOF ATTEMPT", prompt)
+                self.assertIn("have h : 1 = 1", prompt)  # text from the seeded master proof
+                self.assertIn("unsolved goals at h", prompt)  # error summary from the recorded final attempt
+            finally:
+                leanoj_module.leanoj_context_manager.allocate_context = old_allocate  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_master_proof_direct_context_overflow_raises(self) -> None:  # Building the direct context for an oversized master proof must raise LeanOJConfigurationError.
+        request = _request()
+        request.final_solver.context_window = 28000
+        request.final_solver.max_output_tokens = 25000  # presumably leaves too little input room for the proof below - TODO confirm against the budget calculation
+        coordinator = await self._initialized_coordinator()
+        large_proof = "\n".join(  # about 1800 filler definitions with the goal placed between the two runs
+            [
+                "import Mathlib",
+                "",
+                *[f"def filler_{index} : Nat := {index}" for index in range(1, 900)],
+                "example : 1 = 1 := by",
+                "  sorry",
+                *[f"def tail_filler_{index} : Nat := {index}" for index in range(900, 1800)],
+            ]
+        )
+
+        with self.assertRaisesRegex(LeanOJConfigurationError, "MANDATORY DIRECT CONTEXT OVERFLOW"):
+            coordinator._build_master_proof_direct_context(  # type: ignore[attr-defined]
+                large_proof,
+                request,
+                context_blocks={},
+            )
+
+    async def test_master_proof_draft_and_edit_summaries_are_read_on_demand(self) -> None:  # After one write and one logged edit, the draft and edit-summary getters must return that content.
+        old_data_dir = system_config.data_dir  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                await coordinator._write_master_proof(  # type: ignore[attr-defined]
+                    "import Mathlib\n\nexample : 1 = 1 := by\n  rfl",
+                    summary="draft ready",
+                )
+                await coordinator._append_master_proof_edit(  # type: ignore[attr-defined]
+                    {
+                        "action": "edit_proof",
+                        "operation": "replace",
+                        "old_string": "sorry",
+                        "new_string": "rfl",
+                        "reasoning": "Closed the proof.",
+                        "accepted": True,
+                    }
+                )
+
+                draft = await coordinator.get_master_proof_draft()
+                edits = await coordinator.get_master_proof_edit_summaries(limit=1)
+
+                self.assertTrue(draft["exists"])
+                self.assertIn("rfl", draft["content"])
+                self.assertEqual(draft["metadata"]["version"], 1)  # a single write is expected to report version 1
+                self.assertEqual(edits["total_edits"], 1)
+                self.assertEqual(len(edits["edits"]), 1)
+                self.assertEqual(edits["edits"][0]["new_string_preview"], "rfl")
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_master_proof_edit_log_compacts_to_snapshot(self) -> None:  # With the compaction limits lowered, appending 5 edits must shrink the log and write a snapshot file.
+        old_data_dir = system_config.data_dir  # restored in finally
+        old_limit = leanoj_module._MASTER_PROOF_EDIT_LOG_COMPACT_RECORD_LIMIT
+        old_keep = leanoj_module._MASTER_PROOF_EDIT_LOG_RECENT_RECORDS_TO_KEEP
+        leanoj_module._MASTER_PROOF_EDIT_LOG_COMPACT_RECORD_LIMIT = 3  # NOTE(review): patched before the try block, so a failure creating the temp dir would leave the module constants modified
+        leanoj_module._MASTER_PROOF_EDIT_LOG_RECENT_RECORDS_TO_KEEP = 2
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                await coordinator._write_master_proof("import Mathlib", summary="seed")  # type: ignore[attr-defined]
+                for index in range(5):  # more appends than the patched record limit of 3
+                    await coordinator._append_master_proof_edit(  # type: ignore[attr-defined]
+                        {
+                            "action": "edit_proof",
+                            "operation": "insert_after",
+                            "old_string": "import Mathlib",
+                            "new_string": f"def helper_{index} : Nat := {index}",
+                            "reasoning": f"edit {index}",
+                            "accepted": True,
+                        }
+                    )
+
+                records = coordinator._read_master_proof_edit_records()  # type: ignore[attr-defined]
+                snapshot_path = coordinator._master_proof_snapshot_log_path()  # type: ignore[attr-defined]
+
+                self.assertLessEqual(len(records), 3)  # log stays within the patched limit
+                self.assertTrue(snapshot_path.exists())
+                self.assertIn("master_proof_edit_log_compaction", snapshot_path.read_text(encoding="utf-8"))
+            finally:
+                leanoj_module._MASTER_PROOF_EDIT_LOG_COMPACT_RECORD_LIMIT = old_limit
+                leanoj_module._MASTER_PROOF_EDIT_LOG_RECENT_RECORDS_TO_KEEP = old_keep
+                system_config.data_dir = old_data_dir
+
+    async def test_master_proof_progress_watchdog_returns_to_brainstorming(self) -> None:  # Repeated "needs_more_time" edits at the same anchor must send the run back to recursive_brainstorm.
+        request = _request()
+        request.final_attempts_per_cycle = 3
+        old_data_dir = system_config.data_dir  # restored in finally
+        old_limit = leanoj_module._MASTER_PROOF_NO_PROGRESS_LIMIT
+        leanoj_module._MASTER_PROOF_NO_PROGRESS_LIMIT = 2  # NOTE(review): patched before the try block, so a failure creating the temp dir would leave the module constant modified
+        call_count = 0
+
+        async def fake_call_json(*_args, **_kwargs):  # stand-in for coordinator._call_json: keeps inserting after the same "import Mathlib" anchor
+            nonlocal call_count
+            call_count += 1
+            return {
+                "action": "edit_proof",
+                "needs_more_time": True,
+                "operation": "insert_after",
+                "old_string": "import Mathlib",
+                "new_string": f"def repeated_region_{call_count} : Nat := {call_count}",
+                "reasoning": "Keep expanding the same import anchor.",
+            }
+
+        class FakeLean:  # Lean client double that always reports success
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                return SimpleNamespace(success=True, error_output="")
+
+        old_get_lean4_client = leanoj_module.get_lean4_client  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(coordinator.get_state().phase, "recursive_brainstorm")
+                self.assertEqual(coordinator.get_state().current_path_decision, "need_more_brainstorming")
+                self.assertEqual(coordinator.get_state().final_attempt_count, 1)
+                self.assertIn("same proof region", coordinator.get_state().master_proof_last_stuck_reason)
+                self.assertGreaterEqual(call_count, 1)  # NOTE(review): weak bound - only proves the model was called at least once
+            finally:
+                leanoj_module._MASTER_PROOF_NO_PROGRESS_LIMIT = old_limit
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_leanoj_master_proof_routes_return_draft_and_edits(self) -> None:  # The route-module functions must return the draft and edit log of the coordinator bound to the module.
+        from backend.api.routes import leanoj as leanoj_route_module
+
+        old_data_dir = system_config.data_dir  # restored in finally
+        old_route_coordinator = leanoj_route_module.leanoj_coordinator  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                await coordinator._write_master_proof("import Mathlib\n\nexample : True := by\n  trivial", summary="api")  # type: ignore[attr-defined]
+                await coordinator._append_master_proof_edit(  # type: ignore[attr-defined]
+                    {
+                        "action": "edit_proof",
+                        "operation": "full_content",
+                        "new_string": "import Mathlib\n\nexample : True := by\n  trivial",
+                        "reasoning": "API route test.",
+                        "accepted": True,
+                    }
+                )
+                leanoj_route_module.leanoj_coordinator = coordinator  # swap the module-level coordinator for the test instance
+
+                draft = await leanoj_route_module.get_leanoj_master_proof()  # route functions are awaited directly, without an HTTP client
+                edits = await leanoj_route_module.get_leanoj_master_proof_edits(limit=5)
+
+                self.assertTrue(draft["exists"])
+                self.assertIn("trivial", draft["content"])
+                self.assertEqual(edits["total_edits"], 1)
+            finally:
+                leanoj_route_module.leanoj_coordinator = old_route_coordinator
+                system_config.data_dir = old_data_dir
+
+    async def test_leanoj_library_exposes_shared_proof_tiers(self) -> None:  # _extract_leanoj_proofs must carry proof ids and novelty tiers through for the final proof and its subproof.
+        from backend.api.routes import leanoj as leanoj_route_module
+
+        payload = {  # session payload with one final proof and one verified subproof
+            "session_id": "leanoj_session",
+            "user_prompt": "Prove one equals one.",
+            "selected_topic": "Equality",
+            "phase": "verified",
+            "final_solution": "import Mathlib\n\nexample : 1 = 1 := by\n  rfl",
+            "final_proof_id": "proof_final",
+            "final_novel": True,
+            "final_novelty_tier": "mathematical_discovery",
+            "final_novelty_reasoning": "Final proof is novel in context.",
+            "verified_subproofs": [
+                {
+                    "subproof_id": "subproof_1",
+                    "request": "Show reflexivity.",
+                    "verified": True,
+                    "lean_code": "import Mathlib\n\nexample : 1 = 1 := by\n  rfl",
+                    "proof_id": "proof_sub",
+                    "novel": True,
+                    "novelty_tier": "novel_formulation",
+                    "novelty_reasoning": "Subproof formalization is useful.",
+                }
+            ],
+        }
+
+        proofs = leanoj_route_module._extract_leanoj_proofs(payload)
+
+        final = next(proof for proof in proofs if proof["proof_kind"] == "final")  # raises StopIteration if no final entry was produced
+        subproof = next(proof for proof in proofs if proof["proof_kind"] == "subproof")
+        self.assertEqual(final["shared_proof_id"], "proof_final")
+        self.assertEqual(final["novelty_tier"], "mathematical_discovery")
+        self.assertEqual(subproof["shared_proof_id"], "proof_sub")
+        self.assertEqual(subproof["novelty_tier"], "novel_formulation")
+
+    async def test_skip_brainstorm_sets_state_flag(self) -> None:  # skip_brainstorm() must set state.skip_brainstorm_requested.
+        old_data_dir = system_config.data_dir  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+
+                await coordinator.skip_brainstorm()
+
+                self.assertTrue(coordinator.get_state().skip_brainstorm_requested)
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_skip_brainstorm_is_consumed_once(self) -> None:  # A pending skip request must be cleared by _brainstorm_until_path_check.
+        old_data_dir = system_config.data_dir  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                await coordinator.skip_brainstorm()
+
+                await coordinator._brainstorm_until_path_check(  # type: ignore[attr-defined]
+                    _request(),
+                    max_accepts=1,
+                    sufficiency_interval=1,
+                    force_after_max=True,
+                )
+
+                self.assertFalse(coordinator.get_state().skip_brainstorm_requested)  # flag is cleared after the call
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_force_brainstorm_resets_recursive_acceptance_window(self) -> None:  # Consuming a forced brainstorm must restart the acceptance window at the current event count.
+        coordinator = await self._initialized_coordinator()
+        state = coordinator.get_state()  # the assertions below rely on this being the live state object, not a copy
+        state.phase = "final_proof_loop"
+        state.active_brainstorm_phase = "recursive_brainstorm"
+        state.active_brainstorm_start_count = 10  # stale window start that should be replaced
+        state.brainstorm_acceptance_events = 14  # current event count; expected to become the new window start
+
+        await coordinator.force_brainstorm()
+        consumed = await coordinator._consume_force_brainstorm()  # type: ignore[attr-defined]
+
+        self.assertTrue(consumed)
+        self.assertEqual(state.phase, "recursive_brainstorm")
+        self.assertEqual(state.active_brainstorm_phase, "")
+        self.assertEqual(state.active_brainstorm_start_count, 14)
+        self.assertEqual(
+            coordinator._get_brainstorm_acceptance_start("recursive_brainstorm"),  # type: ignore[attr-defined]
+            14,
+        )
+
+    async def test_skip_brainstorm_prevents_recursive_brainstorm_start(self) -> None:  # With a pending skip, _recursive_brainstorm_phase must go straight to a forced final cycle without brainstorming.
+        coordinator = await self._initialized_coordinator()
+        coordinator._state.phase = "path_decision"  # type: ignore[attr-defined]
+        coordinator._state.skip_brainstorm_requested = True  # type: ignore[attr-defined]
+
+        async def fail_brainstorm_until_path_check(*_args, **_kwargs):  # tripwire: fails the test if brainstorming starts
+            raise AssertionError("Recursive brainstorm should not start after skip brainstorm")
+
+        coordinator._brainstorm_until_path_check = fail_brainstorm_until_path_check  # type: ignore[method-assign]
+
+        await coordinator._recursive_brainstorm_phase(_request())  # type: ignore[attr-defined]
+
+        self.assertFalse(coordinator.get_state().skip_brainstorm_requested)  # skip flag is cleared
+        self.assertTrue(coordinator.get_state().user_forced_final_cycle)  # skip turns into a forced final cycle
+        self.assertEqual(coordinator.get_state().phase, "final_proof_loop")
+        self.assertEqual(coordinator.get_state().current_path_decision, "solve_final_now")
+
+    async def test_path_decision_uses_final_solver_actor_when_final_path_available(self) -> None:  # The path decision must be made with the final_solver model and role, not the path_decider config.
+        coordinator = await self._initialized_coordinator()
+        request = _request().model_copy(
+            update={
+                "path_decider": LeanOJRoleConfig(model_id="legacy-path-model"),
+                "final_solver": LeanOJRoleConfig(model_id="final-model"),
+            }
+        )
+        calls = []  # one record per stubbed model call, in call order
+        context_models = []  # model ids passed to the context builder, in call order
+
+        async def fake_build_context_blocks(_request, config, **_kwargs):  # records which model the context was built for
+            context_models.append(config.model_id)
+            return {}
+
+        async def fake_call_json(config, task_prefix, role_id, _prompt, **_kwargs):  # stand-in for coordinator._call_json
+            calls.append({"model_id": config.model_id, "task_prefix": task_prefix, "role_id": role_id})
+            if task_prefix == "leanoj_path":  # the path-decision call itself
+                return {"path": "solve_final_now", "reasoning": "ready for final proof"}
+            if role_id == "leanoj_path_validator":  # validator call: accept the decision
+                return {"decision": "accept", "reasoning": "valid", "summary": ""}
+            return {}
+
+        coordinator._build_context_blocks = fake_build_context_blocks  # type: ignore[method-assign]
+        coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+
+        decision = await coordinator._path_decision_phase(request)  # type: ignore[attr-defined]
+
+        self.assertEqual(decision, "solve_final_now")
+        self.assertEqual(calls[0]["model_id"], "final-model")  # first model call used the final solver's model
+        self.assertEqual(calls[0]["role_id"], "leanoj_final_solver")
+        self.assertEqual(context_models[0], "final-model")  # context was built for the same model
+
+    def test_path_decision_actor_falls_back_to_topic_generator_without_final_option(self) -> None:  # When only "need_more_brainstorming" is a valid path, the actor must be the topic generator.
+        request = _request().model_copy(
+            update={
+                "topic_generator": LeanOJRoleConfig(model_id="topic-model"),
+                "final_solver": LeanOJRoleConfig(model_id="final-model"),
+            }
+        )
+
+        actor, role_id = LeanOJCoordinator._path_decision_actor(  # type: ignore[attr-defined]
+            request,
+            valid_paths=("need_more_brainstorming",),
+        )
+
+        self.assertEqual(actor.model_id, "topic-model")
+        self.assertEqual(role_id, "leanoj_topic_generator")
+
+    def test_leanoj_path_boost_category_is_absorbed_into_final_solver(self) -> None:  # BoostManager must map "leanoj_path" task ids and categories to "leanoj_final".
+        manager = BoostManager()
+
+        self.assertEqual(manager._extract_role_prefix("leanoj_path_003"), "leanoj_final")  # numbered task id
+        self.assertEqual(manager._canonical_category("leanoj_path"), "leanoj_final")  # bare category name
+
+    async def test_final_loop_retries_after_malformed_model_output(self) -> None:  # A ValueError from the first solver call must be counted as an attempt and followed by a successful retry.
+        request = _request()
+        old_data_dir = system_config.data_dir  # restored in finally
+
+        calls = 0  # counts solver calls only; review calls return before the increment
+
+        async def fake_call_json(_config, task_prefix, *_args, **_kwargs):  # stand-in for coordinator._call_json
+            nonlocal calls
+            if task_prefix == "leanoj_final_review":  # final review: report the proof as solved
+                return {"solved": True, "reasoning": "final answer complete"}
+            calls += 1
+            if calls == 1:  # first solver call simulates malformed model output
+                raise ValueError("No JSON found in response")
+            return {"lean_code": "import Mathlib\n\nexample : 1 = 1 := by\n  rfl", "reasoning": "retry"}
+
+        class FakeLean:  # Lean client double that always reports success
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                return SimpleNamespace(success=True, error_output="")
+
+        old_get_lean4_client = leanoj_module.get_lean4_client  # restored in finally
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir  # point data_dir at a throwaway directory for this test
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                self.assertEqual(coordinator.get_state().phase, "verified")
+                self.assertEqual(coordinator.get_state().final_attempt_count, 2)  # the failed call and the retry both count
+                self.assertEqual(calls, 2)
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_placeholder_scaffold_is_saved_as_partial_not_verified(self) -> None:
+        request = _request()
+        old_data_dir = system_config.data_dir
+        # FakeLean fails the strict check and succeeds only when allow_placeholders is true.
+        class FakeLean:
+            async def check_proof(self, _code: str, timeout: int = 120, *, allow_placeholders: bool = False):
+                if not allow_placeholders:
+                    return SimpleNamespace(success=False, error_output="placeholders were not allowed")
+                return SimpleNamespace(success=True, error_output="", goal_states="", raw_stderr="")
+
+        old_get_lean4_client = leanoj_module.get_lean4_client
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = await self._initialized_coordinator()
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                result = await coordinator._check_proof_and_capture_partial(  # type: ignore[attr-defined]
+                    request,
+                    "import Mathlib\n\nexample : 1 = 1 := by\n  sorry",
+                    target="final",
+                    attempt_number=1,
+                    proof_request="final Proof Solver solution",
+                    reasoning="scaffold",
+                )
+                # Expected: reported as a failure, yet recorded exactly once as a partial proof.
+                self.assertFalse(result.success)
+                self.assertIn("PARTIAL PROOF SAVED", result.error_output)
+                partials = coordinator.get_status()["partial_proofs"]
+                self.assertEqual(len(partials), 1)
+                self.assertEqual(partials[0]["placeholder_tokens"], ["sorry"])
+                self.assertFalse(coordinator.get_state().final_solution)  # no final solution was stored
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_unrelated_final_placeholder_scaffold_is_not_saved(self) -> None:
+        request = _request()
+        old_data_dir = system_config.data_dir
+        # FakeLean accepts every input, so the failure asserted below cannot come from the Lean stub.
+        class FakeLean:
+            async def check_proof(self, _code: str, timeout: int = 120, *, allow_placeholders: bool = False):
+                return SimpleNamespace(success=True, error_output="", goal_states="", raw_stderr="")
+
+        old_get_lean4_client = leanoj_module.get_lean4_client
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = await self._initialized_coordinator()
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                result = await coordinator._check_proof_and_capture_partial(  # type: ignore[attr-defined]
+                    request,
+                    "import Mathlib\n\ntheorem unrelated : True := by\n  sorry",
+                    target="final",
+                    attempt_number=1,
+                    proof_request="final Proof Solver solution",
+                    reasoning="bad scaffold",
+                )
+                # Expected: a template-mismatch failure and no stored partial proof.
+                self.assertFalse(result.success)
+                self.assertIn("PROOF SOLVER TEMPLATE MISMATCH", result.error_output)
+                self.assertEqual(coordinator.get_status()["partial_proofs"], [])
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_restore_loads_partial_proof_database_records(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = await self._initialized_coordinator()
+                record = {
+                    "session_id": coordinator.get_state().session_id,
+                    "attempt": 7,
+                    "target": "final",
+                    "request": "final Proof Solver solution",
+                    "placeholder_tokens": ["sorry"],
+                    "lean_code": "import Mathlib\n\nexample : 1 = 1 := by\n  sorry",
+                }
+                await coordinator._append_partial_proof_database(record)  # type: ignore[attr-defined]
+                # The payload itself carries no partial proofs; the record exists only via the append above.
+                payload = coordinator.get_status()
+                payload["request"] = _request().model_dump(mode="json")
+                payload["partial_proofs"] = []
+
+                restored = LeanOJCoordinator()
+                restored._restore_from_payload(payload)  # type: ignore[attr-defined]
+                # Expected: the restored coordinator reports exactly the appended record (attempt 7).
+                partials = restored.get_status()["partial_proofs"]
+                self.assertEqual(len(partials), 1)
+                self.assertEqual(partials[0]["attempt"], 7)
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_brainstorm_submitters_run_in_parallel_and_batch_validate(self) -> None:
+        request = _request()
+        request.brainstorm_submitters = [_role(), _role(), _role()]
+        coordinator = await self._initialized_coordinator()
+        # never_finish is never set in this test, so a fake call that awaits it never returns a value.
+        never_finish = leanoj_module.asyncio.Event()
+        submitter_calls: list[str] = []
+        validator_prompts: list[str] = []
+        per_submitter_counts: dict[str, int] = {}
+
+        async def fake_call_json(_config, _task_prefix, role_id, prompt, **_kwargs):
+            if role_id.startswith("leanoj_brainstorm_submitter_"):
+                submitter_calls.append(role_id)
+                per_submitter_counts[role_id] = per_submitter_counts.get(role_id, 0) + 1
+                if role_id == "leanoj_brainstorm_submitter_2" or per_submitter_counts[role_id] > 1:
+                    await never_finish.wait()  # submitter 2, and any repeat call, hangs here
+                return {"submission": f"{role_id} useful idea"}
+            # Validator: accept everything, one decision per "SUBMISSION " marker found in the prompt.
+            if role_id == "leanoj_brainstorm_validator":
+                validator_prompts.append(prompt)
+                batch_size = prompt.count("SUBMISSION ")
+                if batch_size:
+                    return {
+                        "decisions": [
+                            {
+                                "submission_number": index,
+                                "decision": "accept",
+                                "reasoning": "useful",
+                                "summary": "accepted",
+                            }
+                            for index in range(1, batch_size + 1)
+                        ]
+                    }
+                return {"decision": "accept", "reasoning": "useful", "summary": "accepted"}
+            # Fallback reply for every other role id.
+            return {"enough": False}
+
+        coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+        # wait_for raises if the call does not return within 2 seconds despite the hung submitters.
+        await leanoj_module.asyncio.wait_for(
+            coordinator._brainstorm_until_path_check(  # type: ignore[attr-defined]
+                request,
+                max_accepts=2,
+                sufficiency_interval=10,
+                force_after_max=True,
+            ),
+            timeout=2,
+        )
+        # Expected: submitter 2 was called, two ideas accepted, one validator prompt held two submissions.
+        self.assertIn("leanoj_brainstorm_submitter_2", submitter_calls)
+        self.assertEqual(coordinator.get_state().accepted_brainstorm_count, 2)
+        self.assertTrue(any("SUBMISSION 1:" in prompt and "SUBMISSION 2:" in prompt for prompt in validator_prompts))
+
+    def test_template_mismatch_rejects_unrelated_compiling_code(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        unrelated = "import Mathlib\n\ntheorem unrelated : True := by\n  trivial"
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, unrelated)
+
+        self.assertIn("PROOF SOLVER TEMPLATE MISMATCH", error)
+
+    def test_template_match_accepts_filled_hole(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        solved = "import Mathlib\n\nexample : 1 = 1 := by\n  rfl"
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, solved)
+
+        self.assertEqual(error, "")
+
+    def test_template_match_allows_answer_and_theorem_hole_replacement(self) -> None:
+        template = (
+            "import Mathlib.Data.Finset.Card\n"
+            "import Mathlib.Order.Bounds.Defs\n\n"
+            "def answer (n : ℕ) : ℕ := sorry\n\n"
+            "def S (n : ℕ) : Set ℕ := { a : ℕ | a = 0 }\n\n"
+            "theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := sorry"
+        )
+        solved = (
+            "import Mathlib.Data.Finset.Card\n"
+            "import Mathlib.Order.Bounds.Defs\n"
+            "import Mathlib\n\n"
+            "open Classical\n\n"
+            "noncomputable def answer (n : ℕ) : ℕ := sSup (S n)\n\n"
+            "def S (n : ℕ) : Set ℕ := { a : ℕ | a = 0 }\n\n"
+            "theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := by\n"
+            "  sorry"
+        )
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, solved)
+
+        self.assertEqual(error, "")
+
+    def test_template_match_allows_open_classical_in_noncomputable_hole(self) -> None:
+        template = "import Mathlib\n\ndef answer (n : ℕ) : ℕ := sorry"
+        solved = "import Mathlib\n\nopen Classical in\nnoncomputable def answer (n : ℕ) : ℕ := sSup ({0} : Set ℕ)"
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, solved)
+
+        self.assertEqual(error, "")
+
+    def test_template_mismatch_rejects_changed_fixed_definition(self) -> None:
+        template = (
+            "import Mathlib\n\n"
+            "def answer (n : ℕ) : ℕ := sorry\n\n"
+            "def S (n : ℕ) : Set ℕ := { a : ℕ | a = 0 }\n\n"
+            "theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := sorry"
+        )
+        changed = (
+            "import Mathlib\n\n"
+            "def answer (n : ℕ) : ℕ := 0\n\n"
+            "def S (n : ℕ) : Set ℕ := { a : ℕ | True }\n\n"
+            "theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := by\n"
+            "  sorry"
+        )
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, changed)
+
+        self.assertIn("PROOF SOLVER TEMPLATE MISMATCH", error)
+
+    def test_template_mismatch_rejects_changed_fixed_instance(self) -> None:
+        template = (
+            "import Mathlib\n\n"
+            "instance : Inhabited ℕ := ⟨0⟩\n\n"
+            "example : 1 = 1 := by\n  sorry"
+        )
+        changed = (
+            "import Mathlib\n\n"
+            "instance : Inhabited ℕ := ⟨1⟩\n\n"
+            "example : 1 = 1 := by\n  rfl"
+        )
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, changed)
+
+        self.assertIn("PROOF SOLVER TEMPLATE MISMATCH", error)
+
+    def test_template_mismatch_rejects_changed_theorem_target(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        changed = "import Mathlib\n\nexample : True := by\n  trivial"
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, changed)
+
+        self.assertIn("PROOF SOLVER TEMPLATE MISMATCH", error)
+
+    def test_template_mismatch_rejects_import_only_in_comment(self) -> None:
+        template = "import Mathlib.Data.Finset.Card\n\nexample : 1 = 1 := by\n  sorry"
+        changed = "-- import Mathlib.Data.Finset.Card\nimport Mathlib\n\nexample : 1 = 1 := by\n  rfl"
+        error = LeanOJCoordinator._validate_final_solution_matches_template(template, changed)
+
+        self.assertIn("PROOF SOLVER TEMPLATE MISMATCH", error)
+
+    def test_integrity_rejects_new_axiom_device(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        fake_solution = (
+            "import Mathlib\n\n"
+            "axiom fakeGoal : 1 = 1\n\n"
+            "example : 1 = 1 := by\n"
+            "  exact fakeGoal"
+        )
+        error = LeanOJCoordinator._validate_final_solution_integrity(template, fake_solution)
+
+        self.assertIn("PROOF SOLVER FORBIDDEN PROOF DEVICE", error)
+
+    def test_integrity_rejects_new_attributed_axiom_device(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        fake_solution = (
+            "import Mathlib\n\n"
+            "@[simp] axiom fakeGoal : 1 = 1\n\n"
+            "example : 1 = 1 := by\n"
+            "  exact fakeGoal"
+        )
+        error = LeanOJCoordinator._validate_final_solution_integrity(template, fake_solution)
+
+        self.assertIn("PROOF SOLVER FORBIDDEN PROOF DEVICE", error)
+
+    def test_integrity_rejects_new_escaped_axiom_device(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        fake_solution = (
+            "import Mathlib\n\n"
+            "axiom «fake goal» : 1 = 1\n\n"
+            "example : 1 = 1 := by\n"
+            "  exact «fake goal»"
+        )
+        error = LeanOJCoordinator._validate_final_solution_integrity(template, fake_solution)
+
+        self.assertIn("PROOF SOLVER FORBIDDEN PROOF DEVICE", error)
+
+    def test_integrity_rejects_parenthesized_constant_device(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        fake_solution = (
+            "import Mathlib\n\n"
+            "constant (fakeGoal : 1 = 1)\n\n"
+            "example : 1 = 1 := by\n"
+            "  exact fakeGoal"
+        )
+        error = LeanOJCoordinator._validate_final_solution_integrity(template, fake_solution)
+
+        self.assertIn("PROOF SOLVER FORBIDDEN PROOF DEVICE", error)
+
+    def test_integrity_allows_template_existing_constant(self) -> None:
+        template = "import Mathlib\n\nconstant h : 1 = 1\n\nexample : 1 = 1 := by\n  sorry"
+        solved = "import Mathlib\n\nconstant h : 1 = 1\n\nexample : 1 = 1 := by\n  exact h"
+        error = LeanOJCoordinator._validate_final_solution_integrity(template, solved)
+
+        self.assertEqual(error, "")
+
+    def test_subproof_integrity_rejects_new_axiom_device(self) -> None:
+        template = "import Mathlib\n\nexample : 1 = 1 := by\n  sorry"
+        fake_subproof = "import Mathlib\n\naxiom fakeLemma : 1 = 1\n\ntheorem helper : 1 = 1 := fakeLemma"
+        error = LeanOJCoordinator._validate_no_new_declaration_devices(
+            template,
+            fake_subproof,
+            target="subproof",
+        )
+
+        self.assertIn("PROOF SOLVER FORBIDDEN PROOF DEVICE", error)
+
+    async def test_initialize_rejects_missing_role_model(self) -> None:
+        request = _request()
+        request.final_solver.model_id = ""
+        coordinator = LeanOJCoordinator()
+
+        with self.assertRaisesRegex(ValueError, "final_solver"):
+            await coordinator.initialize(request)
+
+    async def test_call_json_missing_model_is_non_retryable_configuration_error(self) -> None:
+        coordinator = await self._initialized_coordinator()
+
+        with self.assertRaises(LeanOJConfigurationError):
+            await coordinator._call_json(  # type: ignore[attr-defined]
+                LeanOJRoleConfig(model_id=""),
+                "leanoj_final",
+                "leanoj_final_solver",
+                "{}",
+            )
+
+    async def test_call_json_keeps_retrying_malformed_json_until_success(self) -> None:
+        coordinator = await self._initialized_coordinator()
+        old_generate_completion = leanoj_module.api_client_manager.generate_completion
+        old_sleep = leanoj_module.asyncio.sleep
+        calls = 0
+        prompts: list[str] = []
+        # The first four completions return truncated JSON; the fifth returns a complete object.
+        async def fake_generate_completion(**kwargs):
+            nonlocal calls
+            calls += 1
+            prompts.append(kwargs["messages"][0]["content"])  # keep each prompt for inspection below
+            if calls < 5:
+                return {"choices": [{"message": {"content": '{"decisions": ['}}]}
+            return {"choices": [{"message": {"content": '{"decision": "accept", "reasoning": "ok"}'}}]}
+
+        async def noop_sleep(*_args, **_kwargs):
+            return None
+        # NOTE(review): leanoj_module.asyncio is presumably the shared asyncio module, so the sleep
+        leanoj_module.api_client_manager.generate_completion = fake_generate_completion  # type: ignore[assignment]
+        leanoj_module.asyncio.sleep = noop_sleep  # type: ignore[assignment]
+        try:  # patch above would then be process-wide until the finally block restores it — confirm
+            result = await coordinator._call_json(  # type: ignore[attr-defined]
+                LeanOJRoleConfig(model_id="test-model"),
+                "leanoj_brainstorm_val",
+                "leanoj_brainstorm_validator",
+                "Return the requested JSON.",
+            )
+        finally:
+            leanoj_module.api_client_manager.generate_completion = old_generate_completion  # type: ignore[assignment]
+            leanoj_module.asyncio.sleep = old_sleep  # type: ignore[assignment]
+        # Expected: five calls, a later prompt flagging the bad JSON, and recorded validator feedback.
+        self.assertEqual(result["decision"], "accept")
+        self.assertEqual(calls, 5)
+        self.assertTrue(any("INVALID_OR_TRUNCATED_JSON" in prompt for prompt in prompts[1:]))
+        self.assertTrue(
+            any(
+                feedback.get("role_id") == "leanoj_brainstorm_validator"
+                for feedback in coordinator.get_status()["failed_feedback"]
+            )
+        )
+
+    async def test_error_resume_prefers_existing_master_proof_loop(self) -> None:
+        coordinator = await self._initialized_coordinator()
+        state = coordinator.get_state()
+        state.phase = "error"
+        state.last_active_phase = "recursive_brainstorm"
+        state.master_proof_initialized = True
+        state.master_proof_version = 2
+
+        self.assertEqual(coordinator._infer_resume_phase(), "final_proof_loop")  # type: ignore[attr-defined]
+
+    async def test_stop_handles_main_task_cleared_during_timeout(self) -> None:
+        coordinator = LeanOJCoordinator()
+        # Stub the persist/broadcast hooks; only stop()'s handling of the main task is under test.
+        async def noop(*_args, **_kwargs):
+            return None
+
+        coordinator._persist_state = noop  # type: ignore[method-assign]
+        coordinator._broadcast = noop  # type: ignore[method-assign]
+        task = leanoj_module.asyncio.create_task(leanoj_module.asyncio.sleep(60))
+        coordinator._main_task = task  # type: ignore[attr-defined]
+
+        original_wait_for = leanoj_module.asyncio.wait_for
+        # Clears _main_task and then raises TimeoutError, mimicking the slot being reset mid-wait.
+        async def fake_wait_for(*_args, **_kwargs):
+            coordinator._main_task = None  # type: ignore[attr-defined]
+            raise leanoj_module.asyncio.TimeoutError
+
+        leanoj_module.asyncio.wait_for = fake_wait_for  # type: ignore[assignment]
+        try:
+            await coordinator.stop()
+        finally:
+            leanoj_module.asyncio.wait_for = original_wait_for  # type: ignore[assignment]
+            if not task.done():
+                task.cancel()
+                await leanoj_module.asyncio.gather(task, return_exceptions=True)
+        # NOTE(review): the cleanup above cancels the task itself, so cancelled() holds even if stop() did not.
+        self.assertTrue(task.cancelled())
+        self.assertIsNone(coordinator._main_task)  # type: ignore[attr-defined]
+
+    async def test_restore_latest_session_recovers_request_and_progress(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = LeanOJCoordinator()
+                await coordinator.initialize(_request())
+                coordinator._state.phase = "final_proof_loop"
+                coordinator._state.selected_topic = "algebraic simplification"
+                coordinator._state.final_attempt_count = 3
+                coordinator._accepted_ideas.append("Use rfl after normalization.")
+                coordinator._validated_topics.append("Template theorem shape")
+                coordinator._final_attempts.append(
+                    {
+                        "request": "final Proof Solver solution",
+                        "error_summary": "unknown tactic",
+                        "lean_code": "bad",
+                    }
+                )
+                await coordinator._persist_state()  # type: ignore[attr-defined]
+                # A fresh coordinator restores with auto_resume disabled and must report the state above.
+                restored = LeanOJCoordinator()
+                self.assertTrue(await restored.restore_latest_session(auto_resume=False))
+                # Expected: phase and progress are back, is_running is False, and resume is offered.
+                self.assertEqual(restored.get_state().phase, "final_proof_loop")
+                self.assertFalse(restored.get_state().is_running)
+                self.assertEqual(restored.get_state().final_attempt_count, 3)
+                self.assertEqual(restored.get_status()["accepted_ideas"], ["Use rfl after normalization."])
+                self.assertEqual(restored.get_status()["validated_topics"], ["Template theorem shape"])
+                self.assertTrue(restored.get_status()["resume_available"])
+                self.assertIsNotNone(restored._request)  # type: ignore[attr-defined]
+                self.assertEqual(restored._request.lean_template, _request().lean_template)  # type: ignore[attr-defined]
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_restore_latest_session_auto_resume_starts_interrupted_run(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = LeanOJCoordinator()
+                await coordinator.initialize(_request())
+                coordinator._state.phase = "path_decision"
+                await coordinator._persist_state()  # type: ignore[attr-defined]
+                # Restore into a second coordinator whose background start is replaced by a recorder.
+                restored = LeanOJCoordinator()
+                called = []
+
+                def fake_start_in_background() -> bool:
+                    called.append(True)
+                    return True
+
+                restored.start_in_background = fake_start_in_background  # type: ignore[method-assign]
+                # Expected: auto_resume=True calls start_in_background exactly once.
+                self.assertTrue(await restored.restore_latest_session(auto_resume=True))
+                self.assertEqual(called, [True])
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_leanoj_context_allocation_direct_first(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                allocation = await leanoj_context_manager.allocate_context(
+                    session_id="session_direct",
+                    mode="final_solver",
+                    user_prompt="Prove one equals one.",
+                    lean_template="example : 1 = 1 := by\n  sorry",
+                    task_request="Solve the final proof.",
+                    context_window=131072,
+                    max_output_tokens=25000,
+                    accepted_ideas=["Use rfl after normalization."],
+                    verified_subproofs=[],
+                    partial_proofs=[],
+                    failed_subproofs=[],
+                    final_attempts=[],
+                )
+                # Expected: the idea sits in the direct context and no RAG evidence is returned.
+                self.assertIn("Use rfl after normalization.", allocation.direct_proof_context)
+                self.assertEqual(allocation.rag_evidence_context, "")
+                self.assertTrue(allocation.direct_sources)
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_leanoj_context_rag_fallback_is_scoped(self) -> None:
+        captured = {}
+
+        async def fake_ensure(_source_name: str, _text: str) -> None:
+            return None
+
+        async def fake_retrieve(**kwargs):
+            captured.update(kwargs)
+            return SimpleNamespace(text="retrieved scoped LeanOJ evidence")
+
+        old_ensure = leanoj_context_manager._ensure_source_indexed
+        old_retrieve = leanoj_context_module.rag_manager.retrieve
+        try:
+            leanoj_context_manager._ensure_source_indexed = fake_ensure  # type: ignore[method-assign]
+            leanoj_context_module.rag_manager.retrieve = fake_retrieve  # type: ignore[assignment]
+
+            allocation = await leanoj_context_manager.allocate_context(
+                session_id="session_rag",
+                mode="brainstorm",
+                user_prompt="Prove a theorem.",
+                lean_template="example : True := by\n  sorry",
+                task_request="Brainstorm proof ideas.",
+                context_window=10000,
+                max_output_tokens=1000,
+                accepted_ideas=["large idea " * 4000],
+                verified_subproofs=[],
+                partial_proofs=[],
+                failed_subproofs=[],
+                final_attempts=[],
+            )
+
+            self.assertEqual(allocation.rag_evidence_context, "retrieved scoped LeanOJ evidence")
+            self.assertEqual(captured["include_source_prefixes"], ["leanoj_session_rag_"])
+            self.assertIn("leanoj_session_rag_accepted_ideas", captured["include_sources"])
+            self.assertEqual(captured["exclude_sources"], None)
+        finally:
+            leanoj_context_manager._ensure_source_indexed = old_ensure  # type: ignore[method-assign]
+            leanoj_context_module.rag_manager.retrieve = old_retrieve  # type: ignore[assignment]
+
+    async def test_historical_final_cycle_packets_are_rag_only(self) -> None:
+        captured = {}
+        # Stubs: indexing becomes a no-op and retrieve() records the keyword arguments it receives.
+        async def fake_ensure(_source_name: str, _text: str) -> None:
+            return None
+
+        async def fake_retrieve(**kwargs):
+            captured.update(kwargs)
+            return SimpleNamespace(text="historical final-cycle packet evidence")
+
+        old_ensure = leanoj_context_manager._ensure_source_indexed
+        old_retrieve = leanoj_context_module.rag_manager.retrieve
+        try:
+            leanoj_context_manager._ensure_source_indexed = fake_ensure  # type: ignore[method-assign]
+            leanoj_context_module.rag_manager.retrieve = fake_retrieve  # type: ignore[assignment]
+
+            allocation = await leanoj_context_manager.allocate_context(
+                session_id="session_packets",
+                mode="brainstorm",
+                user_prompt="Prove a theorem.",
+                lean_template="example : True := by\n  sorry",
+                task_request="Generate brainstorm proof context.",
+                context_window=131072,
+                max_output_tokens=25000,
+                accepted_ideas=[],
+                verified_subproofs=[],
+                partial_proofs=[],
+                failed_subproofs=[],
+                final_attempts=[],
+                final_cycle_packets=[
+                    {
+                        "cycle_start_attempt": 1,
+                        "cycle_end_attempt": 30,
+                        "failed_attempt_count": 30,
+                        "attempts": [{"request": "final", "error_summary": "failed", "lean_code": "bad"}],
+                    }
+                ],
+            )
+            # Expected: the packet is absent from the direct context and arrives via the retrieval stub.
+            self.assertNotIn("FINAL-CYCLE PACKET", allocation.direct_proof_context)
+            self.assertEqual(allocation.rag_evidence_context, "historical final-cycle packet evidence")
+            self.assertIn("leanoj_session_packets_final_cycle_packets", captured["include_sources"])
+        finally:
+            leanoj_context_manager._ensure_source_indexed = old_ensure  # type: ignore[method-assign]
+            leanoj_context_module.rag_manager.retrieve = old_retrieve  # type: ignore[assignment]
+
+    async def test_context_allocation_raises_when_useful_memory_would_drop(self) -> None:
+        with self.assertRaisesRegex(
+            RuntimeError,
+            "mandatory context overflow|could not preserve useful proof memory",
+        ):
+            await leanoj_context_manager.allocate_context(
+                session_id="session_tiny",
+                mode="brainstorm",
+                user_prompt="user " * 2000,
+                lean_template="template " * 2000,
+                task_request="task " * 2000,
+                context_window=2500,
+                max_output_tokens=1000,
+                accepted_ideas=["large idea " * 100],
+                verified_subproofs=[],
+                partial_proofs=[],
+                failed_subproofs=[],
+                final_attempts=[],
+            )
+
+    async def test_ensure_source_indexed_removes_stale_source_before_add(self) -> None:
+        calls = []
+
+        async def fake_remove(source_name: str) -> None:
+            calls.append(("remove", source_name))
+
+        async def fake_add(_text: str, source_name: str, **_kwargs) -> None:
+            calls.append(("add", source_name))
+
+        old_remove = leanoj_context_module.rag_manager.remove_document
+        old_add = leanoj_context_module.rag_manager.add_text
+        try:
+            leanoj_context_module.rag_manager.remove_document = fake_remove  # type: ignore[assignment]
+            leanoj_context_module.rag_manager.add_text = fake_add  # type: ignore[assignment]
+            leanoj_context_manager._indexed_hashes.pop("leanoj_stale_source", None)
+
+            await leanoj_context_manager._ensure_source_indexed("leanoj_stale_source", "proof memory")
+
+            self.assertEqual(calls[0], ("remove", "leanoj_stale_source"))
+            self.assertEqual(calls[1], ("add", "leanoj_stale_source"))
+        finally:
+            leanoj_context_module.rag_manager.remove_document = old_remove  # type: ignore[assignment]
+            leanoj_context_module.rag_manager.add_text = old_add  # type: ignore[assignment]
+
+    async def test_current_final_cycle_packet_persists_until_phase_clear(self) -> None:
+        coordinator = await self._initialized_coordinator()
+        request = _request()
+        packet = {
+            "cycle_start_attempt": 1,
+            "cycle_end_attempt": 30,
+            "failed_attempt_count": 30,
+            "attempts": [{"request": "final", "error_summary": "failed", "lean_code": "bad"}],
+        }
+        coordinator._current_final_cycle_packet = packet  # type: ignore[attr-defined]
+        # The stub echoes a marker string only when a truthy current_final_cycle_packet kwarg arrives.
+        async def fake_allocate_context(**kwargs):
+            return LeanOJContextAllocation(
+                current_final_cycle_packet="CURRENT FINAL-CYCLE FAILURE PACKET"
+                if kwargs.get("current_final_cycle_packet")
+                else ""
+            )
+
+        old_allocate = leanoj_module.leanoj_context_manager.allocate_context
+        try:
+            leanoj_module.leanoj_context_manager.allocate_context = fake_allocate_context  # type: ignore[assignment]
+            # Build context twice with the packet set, clear it, then build once more.
+            first = await coordinator._build_context_blocks(  # type: ignore[attr-defined]
+                request,
+                request.topic_generator,
+                mode="brainstorm",
+                task_request="Generate brainstorm proof context.",
+                include_current_final_cycle_packet=True,
+            )
+            second = await coordinator._build_context_blocks(  # type: ignore[attr-defined]
+                request,
+                request.topic_generator,
+                mode="brainstorm",
+                task_request="Generate brainstorm proof context.",
+                include_current_final_cycle_packet=True,
+            )
+            coordinator._clear_current_final_cycle_packet()  # type: ignore[attr-defined]
+            third = await coordinator._build_context_blocks(  # type: ignore[attr-defined]
+                request,
+                request.topic_generator,
+                mode="brainstorm",
+                task_request="Generate brainstorm proof context.",
+                include_current_final_cycle_packet=True,
+            )
+            # Expected: the packet is present in both builds before the clear and absent after it.
+            self.assertIn("CURRENT FINAL-CYCLE FAILURE PACKET", first["current_final_cycle_packet"])
+            self.assertIn("CURRENT FINAL-CYCLE FAILURE PACKET", second["current_final_cycle_packet"])
+            self.assertEqual(third["current_final_cycle_packet"], "")
+        finally:
+            leanoj_module.leanoj_context_manager.allocate_context = old_allocate  # type: ignore[assignment]
+
+    async def test_final_solver_context_does_not_duplicate_working_proof_packet(self) -> None:
+        coordinator = await self._initialized_coordinator()
+        request = _request()
+        await coordinator._write_master_proof(  # type: ignore[attr-defined]
+            "import Mathlib\n\nexample : 1 = 1 := by\n  rfl",
+            summary="final solver draft",
+        )
+        await coordinator._set_current_working_proof_attempt(  # type: ignore[attr-defined]
+            trigger="final_attempt_cycle_exhausted",
+            requested_path="need_more_brainstorming",
+            stuck_reason="Need more context.",
+        )
+
+        blocks = await coordinator._build_context_blocks(  # type: ignore[attr-defined]
+            request,
+            request.final_solver,
+            mode="final_solver",
+            task_request="Edit final proof.",
+            include_current_final_cycle_packet=True,
+        )
+
+        self.assertEqual(blocks["current_working_proof_attempt"], "")
+        self.assertNotIn("CURRENT WORKING PROOF ATTEMPT", "\n".join(blocks.values()))
+
+    def test_final_cycle_packet_formats_partial_proofs(self) -> None:
+        packet = {
+            "cycle_start_attempt": 1,
+            "cycle_end_attempt": 2,
+            "failed_attempt_count": 2,
+            "attempts": [{"request": "final", "error_summary": "failed", "lean_code": "bad"}],
+            "partial_proofs": [
+                {
+                    "request": "final Proof Solver solution",
+                    "target": "final",
+                    "attempt": 2,
+                    "placeholder_tokens": ["sorry"],
+                    "summary": "Lean accepted the scaffold.",
+                    "lean_code": "example : True := by\n  sorry",
+                }
+            ],
+        }
+
+        formatted = leanoj_context_module.LeanOJContextManager._format_final_cycle_packet(packet)
+
+        self.assertIn("Partial final scaffolds captured during this cycle", formatted)
+        self.assertIn("Lean accepted the scaffold", formatted)
+        self.assertIn("example : True", formatted)
+
+    async def test_initial_brainstorm_exit_prune_can_delete_accepted_idea_without_extending_phase(self) -> None:
+        coordinator = await self._initialized_coordinator()
+        request = _request()
+
+        async def fake_call_json(_config, _task_prefix, role_id, prompt, **_kwargs):
+            if role_id.startswith("leanoj_brainstorm_submitter"):
+                return {"submission": "Redundant idea to prune.", "reasoning": "seed"}
+            if role_id == "leanoj_brainstorm_prune_reviewer_1":
+                return {
+                    "action": "delete",
+                    "idea_index": 1,
+                    "new_content": "",
+                    "reasoning": "It is redundant after review.",
+                }
+            if role_id == "leanoj_brainstorm_validator" and "PROPOSED OPERATION:" in prompt:
+                return {"decision": "accept", "reasoning": "Deletion is safe."}
+            if role_id == "leanoj_brainstorm_validator" and "SUBMISSIONS TO VALIDATE:" in prompt:
+                submission_count = prompt.count("SUBMISSION ")
+                return {
+                    "decisions": [
+                        {
+                            "submission_number": index,
+                            "decision": "accept",
+                            "reasoning": "Accept seed.",
+                            "summary": "accepted",
+                        }
+                        for index in range(1, submission_count + 1)
+                    ]
+                }
+            if role_id == "leanoj_brainstorm_validator":
+                return {"decision": "accept", "reasoning": "Accept seed.", "summary": "accepted"}
+            raise AssertionError(f"Unexpected role {role_id}")
+
+        coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+
+        await coordinator._brainstorm_until_path_check(  # type: ignore[attr-defined]
+            request,
+            phase_key="initial_brainstorm",
+            max_accepts=1,
+            sufficiency_interval=10,
+            force_after_max=True,
+        )
+
+        self.assertEqual(coordinator._accepted_ideas, [])  # type: ignore[attr-defined]
+        self.assertEqual(coordinator.get_state().brainstorm_acceptance_events, 1)
+        self.assertEqual(coordinator.get_state().accepted_brainstorm_count, 0)
+        self.assertEqual(coordinator.get_state().brainstorm_prune_reviews_performed, 1)
+        self.assertEqual(coordinator.get_state().brainstorm_prune_operations_applied, 1)
+
+    async def test_recursive_brainstorm_prune_rejection_leaves_ideas_unchanged(self) -> None:
+        coordinator = await self._initialized_coordinator()
+        request = _request()
+        coordinator._accepted_ideas = ["Useful exact idea"]  # type: ignore[attr-defined]
+        coordinator._accepted_idea_records = [  # type: ignore[attr-defined]
+            {
+                "content": "Useful exact idea",
+                "submitter_index": 1,
+                "phase": "recursive_brainstorm",
+                "acceptance_event": 1,
+            }
+        ]
+        coordinator.get_state().brainstorm_acceptance_events = 1
+
+        async def fake_call_json(_config, _task_prefix, role_id, prompt, **_kwargs):
+            if role_id == "leanoj_brainstorm_prune_reviewer_1":
+                return {
+                    "action": "edit",
+                    "idea_index": 1,
+                    "new_content": "Risky replacement",
+                    "reasoning": "Maybe shorter.",
+                }
+            if role_id == "leanoj_brainstorm_validator":
+                self.assertIn("PROPOSED OPERATION:", prompt)
+                return {"decision": "reject", "reasoning": "Original still has unique value."}
+            raise AssertionError(f"Unexpected role {role_id}")
+
+        coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+
+        await coordinator._perform_brainstorm_prune_review(  # type: ignore[attr-defined]
+            request,
+            "recursive_brainstorm",
+            reason="test recursive review",
+        )
+
+        self.assertEqual(coordinator._accepted_ideas, ["Useful exact idea"])  # type: ignore[attr-defined]
+        self.assertEqual(coordinator.get_state().brainstorm_prune_operations_applied, 0)
+
+    async def test_clear_all_removes_only_registered_leanoj_rag_sources(self) -> None:
+        removed = []
+        old_data_dir = system_config.data_dir
+
+        async def fake_remove(source_name: str) -> None:
+            removed.append(source_name)
+
+        old_remove = leanoj_context_module.rag_manager.remove_document
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                leanoj_context_module.rag_manager.remove_document = fake_remove  # type: ignore[assignment]
+                leanoj_context_manager._indexed_hashes["leanoj_registered_accepted_ideas"] = "hash"
+
+                await leanoj_context_manager.clear_all()
+
+                self.assertEqual(removed, ["leanoj_registered_accepted_ideas"])
+            finally:
+                system_config.data_dir = old_data_dir
+                leanoj_context_module.rag_manager.remove_document = old_remove  # type: ignore[assignment]
+                leanoj_context_manager._indexed_hashes.pop("leanoj_registered_accepted_ideas", None)
+
+    def test_rag_source_scope_filter_limits_chunks_to_leanoj_session(self) -> None:
+        chunks = [
+            DocumentChunk(
+                chunk_id="1",
+                text="LeanOJ proof memory",
+                source_file="leanoj_session_a_accepted_ideas",
+                position=0,
+                chunk_size=512,
+            ),
+            DocumentChunk(
+                chunk_id="2",
+                text="compiler paper memory",
+                source_file="compiler_paper.txt",
+                position=0,
+                chunk_size=512,
+            ),
+        ]
+
+        scoped = leanoj_context_module.rag_manager._filter_chunks_by_source_scope(
+            chunks,
+            include_source_prefixes=["leanoj_session_a_"],
+        )
+
+        self.assertEqual([chunk.source_file for chunk in scoped], ["leanoj_session_a_accepted_ideas"])
+
+    async def test_final_cycle_packet_contains_exact_cycle_attempts(self) -> None:
+        request = _request()
+        request.final_attempts_per_cycle = 30
+        old_data_dir = system_config.data_dir
+
+        async def fake_call_json(*_args, **_kwargs):
+            return {"lean_code": "import Mathlib\n\nexample : 1 = 1 := by\n  simp", "reasoning": "try"}
+
+        class FakeLean:
+            async def check_proof(self, _code: str, timeout: int = 120, **_kwargs):
+                return SimpleNamespace(success=False, error_output="unsolved goals")
+
+        old_get_lean4_client = leanoj_module.get_lean4_client
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = await self._initialized_coordinator()
+                coordinator._call_json = fake_call_json  # type: ignore[method-assign]
+                leanoj_module.get_lean4_client = lambda: FakeLean()  # type: ignore[assignment]
+
+                await coordinator._final_proof_loop(request)
+
+                packet = coordinator.get_status()["current_final_cycle_packet"]
+                self.assertEqual(packet["failed_attempt_count"], 30)
+                self.assertEqual(packet["cycle_start_attempt"], 1)
+                self.assertEqual(packet["cycle_end_attempt"], 30)
+                self.assertEqual(len(packet["attempts"]), 30)
+            finally:
+                leanoj_module.get_lean4_client = old_get_lean4_client  # type: ignore[assignment]
+                system_config.data_dir = old_data_dir
+
+    async def test_restore_reloads_full_final_attempt_artifacts(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = LeanOJCoordinator()
+                await coordinator.initialize(_request())
+                coordinator._state.phase = "final_proof_loop"
+                coordinator._state.final_attempt_count = 25
+                for index in range(25):
+                    coordinator._final_attempts.append(
+                        {
+                            "request": "final Proof Solver solution",
+                            "error_summary": f"error {index}",
+                            "lean_code": f"bad {index}",
+                        }
+                    )
+                await coordinator._persist_state()  # type: ignore[attr-defined]
+
+                restored = LeanOJCoordinator()
+                self.assertTrue(await restored.restore_latest_session(auto_resume=False))
+
+                self.assertEqual(len(restored._final_attempts), 25)  # type: ignore[attr-defined]
+                self.assertEqual(restored._final_attempts[0]["error_summary"], "error 0")  # type: ignore[attr-defined]
+                self.assertEqual(len(restored.get_status()["final_attempts"]), 20)
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_leanoj_artifact_sync_rewrites_same_length_edits(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                session_id = "same_length_edit"
+                leanoj_context_manager._clear_sync_counts(session_id)  # type: ignore[attr-defined]
+                await leanoj_context_manager.write_session_artifacts(
+                    session_id=session_id,
+                    accepted_ideas=["old idea"],
+                    verified_subproofs=[],
+                    partial_proofs=[],
+                    failed_subproofs=[],
+                    final_attempts=[],
+                    final_cycle_packets=[],
+                )
+                await leanoj_context_manager.write_session_artifacts(
+                    session_id=session_id,
+                    accepted_ideas=["new idea"],
+                    verified_subproofs=[],
+                    partial_proofs=[],
+                    failed_subproofs=[],
+                    final_attempts=[],
+                    final_cycle_packets=[],
+                )
+
+                artifacts = leanoj_context_manager.load_session_artifacts(session_id)
+                self.assertEqual(artifacts["accepted_ideas"], ["new idea"])
+            finally:
+                leanoj_context_manager._clear_sync_counts("same_length_edit")  # type: ignore[attr-defined]
+                system_config.data_dir = old_data_dir
+
+    async def test_restore_reloads_master_proof_metadata_and_content(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = LeanOJCoordinator()
+                await coordinator.initialize(_request())
+                coordinator._state.phase = "final_proof_loop"  # type: ignore[attr-defined]
+                await coordinator._write_master_proof(  # type: ignore[attr-defined]
+                    "import Mathlib\n\nexample : 1 = 1 := by\n  rfl",
+                    summary="resume test master proof",
+                )
+                await coordinator._persist_state()  # type: ignore[attr-defined]
+
+                restored = LeanOJCoordinator()
+                self.assertTrue(await restored.restore_latest_session(auto_resume=False))
+
+                self.assertTrue(restored.get_state().master_proof_initialized)
+                self.assertEqual(restored.get_state().master_proof_line_count, 4)
+                self.assertIn("rfl", await restored._read_master_proof())  # type: ignore[attr-defined]
+                self.assertEqual(restored._infer_resume_phase(), "final_proof_loop")  # type: ignore[attr-defined]
+            finally:
+                system_config.data_dir = old_data_dir
+
+    async def test_clear_removes_leanoj_artifact_store(self) -> None:
+        old_data_dir = system_config.data_dir
+        with tempfile.TemporaryDirectory() as tmpdir:
+            try:
+                system_config.data_dir = tmpdir
+                coordinator = LeanOJCoordinator()
+                await coordinator.initialize(_request())
+                coordinator._accepted_ideas.append("persisted idea")
+                await coordinator._persist_state()  # type: ignore[attr-defined]
+
+                self.assertTrue(leanoj_context_manager.artifacts_base_dir().exists())
+
+                await coordinator.clear()
+
+                self.assertFalse(leanoj_context_manager.artifacts_base_dir().exists())
+                self.assertEqual(coordinator.get_status()["accepted_ideas"], [])
+            finally:
+                system_config.data_dir = old_data_dir
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/test_wolfram_tool_loop.py b/tests/test_wolfram_tool_loop.py
index e253cc9..47d6495 100644
--- a/tests/test_wolfram_tool_loop.py
+++ b/tests/test_wolfram_tool_loop.py
@@ -65,7 +65,7 @@ async def fake_generate_completion(**kwargs):
 
         self.assertEqual(content, '{"needs_construction": false}')
         self.assertEqual(fake_client.queries, ["2+2"])
-        self.assertEqual(wolfram_calls[0]["query"], "2+2")
+        self.assertEqual(wolfram_calls[0]["query"], "[redacted]")
         self.assertIsNotNone(calls[0]["tools"])
         self.assertEqual(calls[1]["messages"][-1]["role"], "tool")
         self.assertEqual(broadcasts[0][0], "compiler_wolfram_call")

From b71d66c74d164acaf317d68794f516d27fe05ad6 Mon Sep 17 00:00:00 2001
From: Pat <pat@local>
Date: Sun, 17 May 2026 22:38:09 -0500
Subject: [PATCH 32/32] MOTO v1.0.8

---
 .gitignore                                    |   6 +
 HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md        | 400 ------------------
 LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md       |  25 --
 LEANOJ_PROBLEM_11_PROMPT.md                   |  34 --
 README.md                                     |  18 +-
 backend/aggregator/core/coordinator.py        |  40 +-
 backend/aggregator/core/rag_manager.py        |  48 ++-
 backend/aggregator/ingestion/pipeline.py      |  39 +-
 backend/autonomous/memory/paper_library.py    | 274 ++++++++----
 backend/compiler/core/compiler_rag_manager.py |   6 +-
 backend/shared/log_redaction.py               |   8 +
 frontend/src/components/LatexRenderer.jsx     |  95 +++--
 moto-update-manifest.json                     |   2 +-
 moto_launcher.py                              |  56 ++-
 moto_updater.py                               |  75 +++-
 package-lock.json                             |   4 +-
 tests/test_codeql_path_hardening.py           | 136 ++++++
 tests/test_moto_launcher.py                   |  54 +++
 tests/test_moto_updater.py                    |  66 +++
 19 files changed, 721 insertions(+), 665 deletions(-)
 delete mode 100644 HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md
 delete mode 100644 LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md
 delete mode 100644 LEANOJ_PROBLEM_11_PROMPT.md
 create mode 100644 tests/test_codeql_path_hardening.py

diff --git a/.gitignore b/.gitignore
index cc9881a..5a6207c 100644
--- a/.gitignore
+++ b/.gitignore
@@ -21,6 +21,7 @@ wheels/
 *.egg
 MANIFEST
 venv/
+.venv/
 ENV/
 env/
 
@@ -128,3 +129,8 @@ randomlog.txt
 randomlog*.txt
 leanoj_master_proof_*.lean.txt
 commits_pending.txt
+
+# Private/local planning notes that should not be published
+HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md
+LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md
+LEANOJ_PROBLEM_11_PROMPT.md
diff --git a/HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md b/HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md
deleted file mode 100644
index ba9a15b..0000000
--- a/HARDOJ_AWS_COMPUTE_DONATION_OUTLINE.md
+++ /dev/null
@@ -1,400 +0,0 @@
-# HardOJ AWS Outline: User-Donated Lean Verification and Karma
-
-## Purpose
-
-HardOJ is an advanced Lean proof challenge platform where users can submit theorem templates, vote on templates, solve templates, and optionally donate their own compute to verify Lean proofs safely.
-
-The core product goal is to create a public problem marketplace for hard formalization targets, including advanced theorem templates such as unsolved Lean 100-style problems, while keeping verification trustworthy, reproducible, and resistant to compute abuse.
-
-## Core User Flows
-
-### Template Submission
-
-Users can submit Lean theorem templates as public challenge problems.
-
-A template includes:
-
-- A title and informal mathematical statement
-- The Lean theorem statement
-- Required imports
-- A pinned Lean version and Mathlib revision
-- Optional explanatory notes, references, and difficulty tags
-- Optional helper lemmas or staged subproblem templates
-- A starter file ending in `sorry`
-
-Example template shape:
-
-```lean
-import Mathlib
-
-/-!
-Informal statement:
-This section explains the intended mathematical theorem.
-
-Rules:
-- The final proof must not use `axiom`, `constant`, `opaque`, or unrelated imported shortcuts.
-- The theorem statement must remain unchanged.
-- The proof must compile under the pinned Lean and Mathlib versions.
--/
-
-theorem hardoj_target_theorem
-    (/* variables */)
-    (/* hypotheses */) :
-    /* formal claim */ := by
-  sorry
-```
-
-Before a submitted template becomes public, HardOJ validates that:
-
-- The Lean file parses and typechecks with `sorry` allowed
-- Imports are on the allowlist or approved by moderation
-- The theorem statement is not empty, trivial, or already solved in the submitted file
-- The template does not introduce fake proof devices such as `axiom`, `constant`, `opaque`, or unsafe escape hatches
-- The informal statement reasonably matches the formal Lean target
-
-### Template Voting
-
-Users can upvote or downvote templates.
-
-Voting is used to surface important, interesting, difficult, and well-scoped theorem challenges. A template's visible score works like Reddit-style post score: upvotes increase the score, downvotes decrease it, and ranking can use time decay, controversy, and anti-abuse filtering.
-
-Templates with high scores become more valuable to solve because successful solvers receive karma based on the template's current score.
-
-### Proof Submission
-
-Users submit a completed Lean proof for a public template.
-
-A proof submission includes:
-
-- The unchanged template theorem statement
-- The user's proof replacing `sorry`
-- A proof hash
-- The Lean and Mathlib version used
-- Local verifier logs if available
-- Optional explanation of the proof strategy
-
-HardOJ accepts the solution only if the proof compiles in the pinned environment and passes integrity checks.
-
-### Karma Rewards
-
-Karma works like Reddit-style karma for platform reputation.
-
-Users gain karma when other users upvote their submitted templates, comments, explanations, and accepted solutions. Users lose karma from downvotes, subject to anti-abuse controls.
-
-Special HardOJ rule:
-
-- If a user solves a template, the solver receives solution karma equal to the template's current positive score at the time the solution is accepted.
-- If someone else solves a user's template, the template creator receives a creator bonus equal to 25% of that same positive score snapshot.
-
-Example:
-
-- A template has score `87`
-- A user submits the first accepted proof
-- The solver receives `87` solution karma
-- The template creator receives `21.75` creator-bonus karma, rounded according to the platform's configured karma precision
-
-If a template has a score below zero, the solution reward should floor at zero unless the platform later chooses to allow negative challenge rewards.
-
-## Compute Donation Model
-
-HardOJ should start with a safe model: users donate compute to verify their own submissions locally. Public volunteer verification can be added later with stronger controls.
-
-### Local User-Owned Verification
-
-The user runs a HardOJ verifier agent on their own machine.
-
-The verifier:
-
-1. Downloads the selected template package
-2. Uses the pinned Lean and Mathlib versions
-3. Inserts the user's submitted proof
-4. Runs Lean in a sandbox
-5. Returns verification metadata to HardOJ
-
-Returned metadata includes:
-
-- Template ID
-- Submission ID
-- Proof hash
-- Lean version
-- Mathlib revision
-- Success or failure
-- Lean errors if verification fails
-- Runtime, memory use, and timeout status
-
-Local verification helps users avoid wasting server resources and gives fast feedback. However, local verification alone should not be the sole source of official acceptance because a malicious client can fake success.
-
-### Official Acceptance
-
-For official karma, leaderboard placement, and "solved" status, HardOJ should use one of these trust paths:
-
-1. **Trusted AWS verification**: HardOJ re-verifies the final proof on AWS before accepting it.
-2. **Volunteer quorum plus spot check**: Multiple independent volunteer verifiers return matching success for the same proof hash, with HardOJ spot-checking high-value solves.
-3. **Attested verifier later**: Use stronger attestation if a reliable cross-platform proof-verifier attestation path becomes available.
-
-The recommended MVP is local pre-verification plus AWS official verification.
-
-## Anti-Exploitation Rules for Donated Compute
-
-User-donated compute must not become a free arbitrary job runner.
-
-Every donated verification job must be constrained:
-
-- Verify only a specific HardOJ template ID
-- Use only the pinned Lean and Mathlib revision
-- Use an immutable template package
-- Use a proof file whose hash is known before execution
-- Disable network access during Lean execution
-- Run in a container, VM, or OS sandbox
-- Enforce wall-time, CPU, RAM, process, and file-size limits
-- Use a read-only project root and a temporary write directory
-- Reject unauthorized imports or local file access
-- Never expose user secrets, API keys, cookies, or filesystem paths to the sandbox
-- Allow the user to cancel jobs at any time
-
-For MVP, donated compute should verify only the user's own proofs. Public volunteer verification should be opt-in and off by default.
-
-## AWS Architecture
-
-### Frontend
-
-Use one of:
-
-- S3 + CloudFront for a static web frontend
-- AWS Amplify for managed frontend deployment
-- A separate web app stack if HardOJ shares infrastructure with another website
-
-Frontend responsibilities:
-
-- Browse templates
-- Submit templates
-- Vote on templates
-- Submit proofs
-- Show verification status
-- Show karma, leaderboards, and user profiles
-- Connect to the local verifier agent when installed
-
-### API Layer
-
-Use API Gateway or an Application Load Balancer in front of backend services.
-
-Backend services can run on:
-
-- ECS Fargate for containerized API services
-- EKS if Kubernetes is already used
-- Lambda for small event-driven tasks
-
-Primary backend responsibilities:
-
-- Authentication and user sessions
-- Template submission and moderation
-- Voting and karma accounting
-- Proof submission lifecycle
-- Verification queue management
-- Leaderboards and notifications
-
-### Database
-
-Use PostgreSQL on Amazon RDS for relational data.
-
-Recommended tables:
-
-- `users`
-- `templates`
-- `template_versions`
-- `template_votes`
-- `proof_submissions`
-- `verification_jobs`
-- `verification_results`
-- `karma_events`
-- `comments`
-- `comment_votes`
-- `moderation_events`
-
-Use immutable event rows for karma changes so reputation can be audited and recomputed.
-
-### Object Storage
-
-Use S3 for immutable artifacts:
-
-- Template packages
-- Lean source files
-- Submitted proofs
-- Verification logs
-- Generated problem bundles
-- Public downloadable archives
-
-Every stored artifact should include a content hash.
-
-### Verification Queue
-
-Use SQS for verification jobs.
-
-Job payload:
-
-- Job ID
-- Template ID
-- Template version hash
-- Proof submission ID
-- Proof hash
-- Lean toolchain version
-- Mathlib revision
-- Resource limits
-
-AWS official verifiers and optional volunteer verifiers both consume jobs, but they should use different queues and trust levels.
-
-### Official AWS Verifier Workers
-
-Run official verifier workers on ECS Fargate, AWS Batch, or EC2 autoscaling groups.
-
-Each verifier worker:
-
-- Pulls one job from SQS
-- Downloads immutable artifacts from S3
-- Builds or reuses the pinned Lean environment
-- Runs Lean in a locked sandbox
-- Uploads logs and result metadata
-- Writes the result to the backend
-
-For hard theorem templates, AWS Batch or EC2 workers may be more practical than Lambda because Lean and Mathlib verification can be CPU-heavy and long-running.
-
-## Local Verifier Agent
-
-The local verifier agent is a small desktop service or CLI installed by the user.
-
-Responsibilities:
-
-- Authenticate with HardOJ
-- Receive only user-approved jobs
-- Download immutable template packages
-- Run Lean in a sandbox
-- Stream local logs to the browser
-- Submit signed result metadata
-
-The browser can connect to the local verifier through:
-
-- `localhost` HTTP/WebSocket with a one-time pairing token
-- A CLI command that verifies a downloaded package
-- A desktop app wrapper
-
-The local verifier should never accept remote arbitrary commands. It should expose only a narrow API:
-
-- `GET /status`
-- `POST /verify-template-proof`
-- `POST /cancel-job`
-
-## Template Ranking
-
-Template ranking can use Reddit-style concepts:
-
-- Net score: upvotes minus downvotes
-- Hot ranking: score adjusted by age
-- Top ranking: highest score over a time window
-- New ranking: recent submissions
-- Controversial ranking: high activity with mixed votes
-
-HardOJ-specific ranking signals:
-
-- Number of failed serious attempts
-- Whether the template has a verified solution
-- Difficulty tag
-- Formalization quality score
-- Moderator approval level
-- Number of staged helper templates
-
-## Karma System
-
-Karma should be event-sourced.
-
-Each karma change is stored as a `karma_event`:
-
-- User ID
-- Event type
-- Source object type
-- Source object ID
-- Delta
-- Timestamp
-- Reason
-
-Event types:
-
-- Template upvote received
-- Template downvote received
-- Comment upvote received
-- Comment downvote received
-- Solution accepted
-- Template solved creator bonus
-- Solution upvote received
-- Moderator adjustment
-- Abuse rollback
-
-Template solve reward:
-
-- On accepted solution, compute `reward = max(template_score_at_acceptance, 0)`
-- Compute `creator_bonus = reward * 0.25` for the template author when the solver is not the same user as the template author
-- Add a `solution_accepted` karma event for the solver
-- Add a `template_solved_creator_bonus` karma event for the template creator
-- Store the score snapshot used for the reward
-- Do not retroactively change the solver's reward or creator bonus if the template later gains or loses votes, unless the platform later adds a bounty mechanism
-
-This keeps rewards predictable and prevents old solves from constantly changing user karma.
-
-## Abuse Controls
-
-HardOJ needs anti-abuse protections because votes and karma create incentives.
-
-Recommended controls:
-
-- One vote per user per object
-- Rate limits on voting, posting, and proof submissions
-- New-account vote weighting or trust thresholds
-- Bot and sockpuppet detection
-- Vote-ring detection
-- Moderator review for high-value solve rewards
-- Karma rollback events for abuse
-- Shadow filtering for suspicious votes until reviewed
-- No unlimited verification retries on shared AWS compute
-
-## MVP Scope
-
-The first version should implement:
-
-- User accounts
-- Template submission
-- Template upvotes/downvotes
-- Reddit-style template score
-- Proof submission
-- Local user-owned verifier for pre-checking
-- AWS official verifier for accepted solves
-- Karma events
-- Solver receives karma equal to template score at acceptance
-- Template creator receives a 25% karma bonus when another user solves their template
-- Basic leaderboards
-
-Public donated verification for other users should wait until after the local verifier and AWS verifier are stable.
-
-## Later Extensions
-
-Possible future additions:
-
-- Volunteer verifier pool for public proofs
-- Quorum-based verification
-- Template bounties separate from karma
-- AI-generated Lean template proposals
-- AI semantic review for informal/formal theorem match
-- Staged theorem packs for major open formalization targets
-- Team solving
-- Private templates before publication
-- Proof explanation rewards
-- HardOJ API for external theorem-proving agents
-
-## Critical Invariants
-
-1. A template can be public only if it typechecks with `sorry` in the pinned Lean environment.
-2. A proof can be officially accepted only after trusted verification or an approved trust policy.
-3. User-donated compute must never run arbitrary unscoped jobs.
-4. Verification jobs must be sandboxed, resource-limited, and network-isolated.
-5. Karma must be auditable through immutable karma events.
-6. Solver karma from a template solve is based on the template score snapshot at acceptance.
-7. Template creator solve bonuses are 25% of the same acceptance-time score snapshot.
-8. Lean acceptance is necessary but not always semantically sufficient; high-value templates need informal/formal review.
diff --git a/LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md b/LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md
deleted file mode 100644
index 4e934bb..0000000
--- a/LEANOJ_MASTER_PROOF_WRITER_REMAINDER.md
+++ /dev/null
@@ -1,25 +0,0 @@
-# LeanOJ Master Proof Writer Remainder
-
-## Audit Result
-The master-proof edit loop, persistent `master_proof.lean`, edit history log, resume metadata, stuck-to-brainstorm signal, and focused coordinator tests are implemented.
-
-## Fixed After Audit
-### Mandatory Full Proof Direct Injection
-The final-solver prompt now directly injects the full `master_proof.lean` as mandatory context. The proof attempt is never truncated, summarized, windowed, or RAG-substituted. If the full master proof cannot fit alongside the other mandatory prompt context, LeanOJ raises a hard mandatory direct context overflow error and stops instead of continuing with partial proof context.
-
-Implemented:
-1. Full master proof direct injection.
-2. Hard overflow error when the mandatory full proof cannot fit.
-3. Token counting before prompt assembly.
-4. Test coverage for mandatory context overflow.
-
-## Completed Follow-Ups
-1. Added read-only API access for retrieving the current master proof draft on demand, without broadcasting it in normal status payloads.
-2. Added compact edit-history summaries for debugging.
-3. Added snapshot compaction for large `master_proof_edits.jsonl` logs.
-4. Added a conservative progress watchdog for repeated `needs_more_time: true` edits that do not make meaningful progress.
-5. Added focused coordinator/API route tests for the follow-up behavior.
-6. Added a UI viewer tab for the master proof draft and edit history.
-
-## Remaining Optional Follow-Ups
-- None currently known.
diff --git a/LEANOJ_PROBLEM_11_PROMPT.md b/LEANOJ_PROBLEM_11_PROMPT.md
deleted file mode 100644
index 73cea60..0000000
--- a/LEANOJ_PROBLEM_11_PROMPT.md
+++ /dev/null
@@ -1,34 +0,0 @@
-# LeanOJ Problem 11 Prompt
-
-Source: [LeanOJ Problem 11](https://leanoj.org/index.php?action=view_problem&id=11)
-
-# User Prompt
-
-Solve the LeanOJ problem "RMM 2023 Shortlist N1" completely in Lean 4.
-
-Problem statement:
-
-Let `n` be a positive integer. Let `S` be a set of ordered pairs `(x, y)` such that `1 <= x <= n` and `0 <= y <= n` in each pair, and there are no pairs `(a, b)` and `(c, d)` of different elements in `S` such that `a^2 + b^2` divides both `ac + bd` and `ad - bc`. In terms of `n`, determine the size of the largest possible set `S`.
-
-Your task is to replace every `sorry` in the LeanOJ template with a complete Lean 4 proof accepted by the LeanOJ checker. Preserve the imports, definitions, theorem statement, and overall template structure unless a change is strictly necessary for Lean 4 verification. Do not use `sorry`, `admit`, fake axioms, or placeholder proof devices.
-
-Mathlib version used by the checker: `v4.29.0`.
-
-The final answer must be a complete Lean 4 file suitable for direct LeanOJ submission.
-
-# LeanOJ Template
-
-```lean
-import Mathlib.Data.Finset.Card
-import Mathlib.Order.Bounds.Defs
-
-def answer (n : ℕ) : ℕ := sorry
-
-def S (n : ℕ) : Set ℕ := { a : ℕ | ∃ S : Finset (ℕ × ℕ), S.card = a ∧
-    (∀ p ∈ S, 1 ≤ p.1 ∧ p.1 ≤ n ∧ 0 ≤ p.2 ∧ p.2 ≤ n) ∧
-    (∀ u ∈ S, ∀ v ∈ S, u ≠ v → ¬(
-      (u.1 ^ 2 + u.2 ^ 2) ∣ (u.1 * v.1 + u.2 * v.2) ∧
-      (u.1 ^ 2 + u.2 ^ 2) ∣ (u.1 * v.2 - u.2 * v.1))) }
-
-theorem solution (n : ℕ) (hn : n > 0) : IsGreatest (S n) (answer n) := sorry
-```
diff --git a/README.md b/README.md
index a4aead6..3aa162d 100644
--- a/README.md
+++ b/README.md
@@ -3,8 +3,8 @@
 **Version: 1.0.8**
 
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
-[![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
-[![Node.js 16+](https://img.shields.io/badge/node-16+-green.svg)](https://nodejs.org/)
+[![Python 3.10+](https://img.shields.io/badge/python-3.10+-blue.svg)](https://www.python.org/downloads/)
+[![Node.js 20.19+](https://img.shields.io/badge/node-20.19+-green.svg)](https://nodejs.org/)
 
 **A breakthrough in AI automated theorem generation. An autonomous AI/ASI research system that generates novel and publication-worthy research papers — and the machine-checked theorem proving programming language Lean 4 proofs alongside them for definitive mathematical confirmation of correctness. This ASI is autonomously powered by Intrafere Research Group's new ASI discovery of [Top-P Exploration Through Structured Brainstorming & Validated Feedback](https://intrafere.com/structured-brainstorming-validated-feedback/). Top-P exploration assists in deciphering how we explore AI weights, a specific combination of reiterative brainstorming, validation, feedback, and pruning allows for superintelligence exploration and creative multi-model data extraction from nearly any combination of AI models. Additionally, MOTO has optional automated theorem generation capabilities that formalize candidate theorems and lemmas in Lean 4 (with optional Z3/SMT hinting and Mathlib lemma search) and only stores proofs that Lean 4 accepts as genuinely mathematically verified. Lean 4 automation means the user gets guaranteed verification of the mathematical results produced. This exact version of MOTO is customized to be useful for any discipline with an interest in creative and novel solution generation in S.T.E.M.: physicists, engineers, mathematicians, chemists, researchers, etc. This harness can also easily be modified for topics such as general academic research, chatbots, niche research, robotics, or anything requiring creative output and/or general autonomy. MOTO's novel brainstorming and rejection/validation stage allows autonomous long-term runtime without user intervention — if desired, research can be conducted for days or weeks without user input.**
 
@@ -59,9 +59,9 @@ MOTO (Multi-Output Token Orchestrator) is a high-risk high-reward (novelty seeki
 
 Before installation, you need:
 
-1. **Python 3.8+** - [Download here](https://www.python.org/downloads/)
+1. **Python 3.10+** - [Download here](https://www.python.org/downloads/)
    - ⚠️ **IMPORTANT**: Check "Add Python to PATH" during installation
-2. **Node.js 16+** - [Download here](https://nodejs.org/)
+2. **Node.js 20.19+** - [Download here](https://nodejs.org/)
 3. **LM Studio** (optional but HIGHLY recommended - otherwise your system will need to pay OpenRouter for RAG embedding calls, which is very slow compared to LM Studio's local embeddings) - [Download here](https://lmstudio.ai/)
    - If using OpenRouter, then download and load at least one model (e.g., DeepSeek, Llama, Qwen - older models and some models below 12 billion parameters may struggle; however, it is always worth a try!)
    - **Load the LM Studio RAG agent [optional but HIGHLY recommended for much faster outputs/answers]**: Load the embedding model `nomic-ai/nomic-embed-text-v1.5` in your LM Studio "Developer" tab (server tab) (search for "nomic-ai/nomic-embed-text-v1.5" to download it in the LM Studio downloads center). Please note: you may need to enable "Power User" or "Developer" to see this developer tab - this server will let you load the amount and capacity of simultaneous models that your PC will support. In this developer tab is where you load both your nomic-ai embedding agent and any optional local hosted agents you want to use in the program (e.g., GPT OSS 20b, DeepSeek 32B, etc.). **If you do not download LM Studio and enable the Nomic agent the system will run much slower and cost slightly more due to having to use the paid service OpenRouter for RAG calls.**
@@ -185,7 +185,7 @@ bash linux-ubuntu-launcher.sh
 
 ### Technology Stack
 
-- **Backend**: Python 3.8+, FastAPI, Uvicorn
+- **Backend**: Python 3.10+, FastAPI, Uvicorn
 - **Frontend**: React, Vite, Tailwind CSS
 - **AI**: LM Studio API, OpenRouter API
 - **RAG**: ChromaDB, Nomic Embeddings, or OpenRouter embeddings fallback if LM Studio is unavailable (not recommended - slower).
@@ -336,7 +336,7 @@ All configurable per role:
 
 #### Manual Installation (All Platforms)
 
-If you want the consumer launcher experience on Ubuntu 24.04, prefer `bash linux-ubuntu-launcher.sh` instead of the manual steps below. The manual flow remains the fallback path when you intentionally want full terminal-level control.
+If you want the consumer launcher experience on Ubuntu 24.04, prefer `bash linux-ubuntu-launcher.sh` instead of the manual steps below. The manual flow remains the fallback path when you intentionally want full terminal-level control. For normal desktop use, the launchers are preferred because they create the matching backend/frontend desktop API tokens automatically.
 
 ```bash
 # Clone the repository
@@ -359,13 +359,17 @@ mkdir -p backend/data/user_uploads
 mkdir -p backend/logs
 
 # Start the backend (in one terminal)
-python -m uvicorn backend.api.main:app --host 0.0.0.0 --port 8000
+export MOTO_DESKTOP_API_TOKEN="local-dev-token"
+python -m uvicorn backend.api.main:app --host 127.0.0.1 --port 8000
 
 # Start the frontend (in another terminal)
 cd frontend
+export VITE_MOTO_DESKTOP_API_TOKEN="local-dev-token"
 npm run dev
 ```
 
+On Windows PowerShell, replace the two `export ...` lines with `$env:MOTO_DESKTOP_API_TOKEN="local-dev-token"` (backend terminal) and `$env:VITE_MOTO_DESKTOP_API_TOKEN="local-dev-token"` (frontend terminal). Both values must match.
+
 Then open `http://localhost:5173` in your browser.
 
 ---
diff --git a/backend/aggregator/core/coordinator.py b/backend/aggregator/core/coordinator.py
index d192614..8d0130e 100644
--- a/backend/aggregator/core/coordinator.py
+++ b/backend/aggregator/core/coordinator.py
@@ -20,6 +20,7 @@
 from backend.shared.openrouter_client import FreeModelExhaustedError
 from backend.shared.free_model_manager import free_model_manager
 from backend.shared.path_safety import resolve_path_within_root, validate_single_path_component
+from backend.shared.log_redaction import redact_log_text
 from backend.aggregator.agents.submitter import SubmitterAgent
 from backend.aggregator.agents.validator import ValidatorAgent
 from backend.aggregator.core.queue_manager import queue_manager
@@ -38,32 +39,26 @@ def _resolve_uploaded_user_file(file_ref: str, *, allow_trusted_context_files: b
 
     uploads_root = Path(system_config.user_uploads_dir).resolve()
     data_root = Path(system_config.data_dir).resolve()
-    candidate = Path(raw_ref)
-
-    if candidate.is_absolute():
-        resolved_candidate = candidate.resolve()
-        try:
-            resolved_candidate.relative_to(uploads_root)
-            return resolved_candidate
-        except ValueError:
-            pass
-
-        if allow_trusted_context_files:
-            try:
-                resolved_candidate.relative_to(data_root)
-                return resolved_candidate
-            except ValueError:
-                pass
-
-        logger.warning("Rejected uploaded file path outside trusted context roots: %s", candidate.name)
-        return None
 
+    # Public uploads are logical filenames. An absolute path is accepted only if
+    # it resolves inside a trusted root, so a caller cannot use one to widen access.
     try:
+        if Path(raw_ref).is_absolute():
+            return resolve_path_within_root(uploads_root, raw_ref)
+
         safe_filename = validate_single_path_component(raw_ref, "uploaded filename")
         return resolve_path_within_root(uploads_root, safe_filename)
     except ValueError as exc:
-        logger.warning("Rejected unsafe uploaded file reference: %s", exc)
-        return None
+        upload_error = exc
+
+    if allow_trusted_context_files:
+        try:
+            return resolve_path_within_root(data_root, raw_ref)
+        except ValueError:
+            pass
+
+    logger.warning("Rejected unsafe uploaded file reference: %s", redact_log_text(upload_error, 240))
+    return None
 
 
 class Coordinator:
@@ -376,9 +371,10 @@ async def initialize(
                     is_user_file=True
                 )
                 # Also load content for potential direct injection (async to avoid blocking)
+                # codeql[py/path-injection]: path is resolved by _resolve_uploaded_user_file within uploads/data roots.
                 async with aiofiles.open(path, 'r', encoding='utf-8') as f:
                     user_files_content[path.name] = await f.read()
-                logger.info(f"Loaded user file: {path.name}")
+                logger.info("Loaded user file: %s", redact_log_text(path.name, 120))
         
         # Create submitter agents from configs (1-10 submitters with individual settings)
         self.submitters = []
diff --git a/backend/aggregator/core/rag_manager.py b/backend/aggregator/core/rag_manager.py
index 54305e2..676463d 100644
--- a/backend/aggregator/core/rag_manager.py
+++ b/backend/aggregator/core/rag_manager.py
@@ -19,6 +19,7 @@
 from backend.shared.api_client_manager import api_client_manager
 from backend.shared.rag_lock import rag_operation_lock
 from backend.shared.utils import count_tokens, compress_text
+from backend.shared.log_redaction import redact_log_text
 from backend.aggregator.ingestion.pipeline import ingestion_pipeline
 
 logger = logging.getLogger(__name__)
@@ -69,7 +70,8 @@ async def add_document(
         self,
         file_path: str,
         chunk_sizes: List[int] = None,
-        is_user_file: bool = False
+        is_user_file: bool = False,
+        trusted_roots: List[str | Path] | None = None,
     ) -> None:
         """
         Add a document to the RAG system.
@@ -80,11 +82,18 @@ async def add_document(
             is_user_file: Whether this is a user file (never evicted)
         """
         try:
+            if trusted_roots is None:
+                trusted_roots = [
+                    system_config.data_dir,
+                    system_config.user_uploads_dir,
+                ]
+
             # Ingest document
             chunks_by_size = await ingestion_pipeline.ingest_file(
                 file_path,
                 chunk_sizes,
-                is_user_file
+                is_user_file,
+                trusted_roots=trusted_roots,
             )
             
             # Add to ChromaDB and memory
@@ -106,10 +115,14 @@ async def add_document(
             # Enforce per-size chunk cap
             await self._enforce_chunk_cap()
             
-            logger.info(f"Added document: {file_path}")
+            logger.info("Added document: %s", redact_log_text(Path(file_path).name, 120))
             
         except Exception as e:
-            logger.error(f"Failed to add document {file_path}: {e}")
+            logger.error(
+                "Failed to add document %s: %s",
+                redact_log_text(Path(file_path).name, 120),
+                redact_log_text(e, 240),
+            )
             raise
     
     async def add_text(
@@ -155,10 +168,14 @@ async def add_text(
             # Enforce per-size chunk cap
             await self._enforce_chunk_cap()
             
-            logger.info(f"Added text: {source_name}")
+            logger.info("Added text: %s", redact_log_text(source_name, 120))
             
         except Exception as e:
-            logger.error(f"Failed to add text {source_name}: {e}")
+            logger.error(
+                "Failed to add text %s: %s",
+                redact_log_text(source_name, 120),
+                redact_log_text(e, 240),
+            )
             raise
     
     async def retrieve(
@@ -718,16 +735,27 @@ async def _evict_lru_document(self) -> None:
             return
         
         # Evict the oldest document
-        logger.info(f"LRU eviction: Removing oldest document '{oldest_doc}' (last accessed: {oldest_time})")
+        logger.info(
+            "LRU eviction: Removing oldest document '%s' (last accessed: %s)",
+            redact_log_text(oldest_doc, 120),
+            oldest_time,
+        )
         
         try:
             await self.remove_document(oldest_doc)
             # Remove from access tracking
             if oldest_doc in self.document_access_order:
                 del self.document_access_order[oldest_doc]
-            logger.info(f"LRU eviction complete: '{oldest_doc}' removed successfully")
+            logger.info(
+                "LRU eviction complete: '%s' removed successfully",
+                redact_log_text(oldest_doc, 120),
+            )
         except Exception as e:
-            logger.error(f"LRU eviction failed for '{oldest_doc}': {e}")
+            logger.error(
+                "LRU eviction failed for '%s': %s",
+                redact_log_text(oldest_doc, 120),
+                redact_log_text(e, 240),
+            )
     
     async def remove_document(self, source_name: str) -> None:
         """Remove a document from all collections."""
@@ -759,7 +787,7 @@ async def remove_document(self, source_name: str) -> None:
         if source_name in self.permanent_documents:
             self.permanent_documents.discard(source_name)
         
-        logger.info(f"Removed document: {source_name}")
+        logger.info("Removed document: %s", redact_log_text(source_name, 120))
     
     def clear_all_documents(self) -> None:
         """Clear all documents from RAG database (synchronous for cleanup).
diff --git a/backend/aggregator/ingestion/pipeline.py b/backend/aggregator/ingestion/pipeline.py
index a4d681a..dd4a568 100644
--- a/backend/aggregator/ingestion/pipeline.py
+++ b/backend/aggregator/ingestion/pipeline.py
@@ -8,6 +8,8 @@
 import logging
 
 from backend.shared.models import DocumentChunk
+from backend.shared.path_safety import resolve_path_within_root
+from backend.shared.log_redaction import redact_log_text
 from backend.aggregator.ingestion.normalizer import normalize_text
 from backend.aggregator.ingestion.chunker import chunker
 
@@ -21,7 +23,8 @@ async def ingest_file(
         self,
         file_path: str,
         chunk_sizes: List[int] = None,
-        is_user_file: bool = False
+        is_user_file: bool = False,
+        trusted_roots: List[str | Path] | None = None,
     ) -> Dict[int, List[DocumentChunk]]:
         """
         Ingest a file and return chunks at multiple sizes.
@@ -35,15 +38,26 @@ async def ingest_file(
             Dict mapping chunk_size -> list of DocumentChunks
         """
         try:
+            resolved_path = Path(file_path)
+            if trusted_roots:
+                for root in trusted_roots:
+                    try:
+                        resolved_path = resolve_path_within_root(Path(root), str(file_path))
+                        break
+                    except ValueError:
+                        continue
+                else:
+                    raise ValueError("File path is outside trusted ingestion roots")
+
             # Read file
-            async with aiofiles.open(file_path, 'r', encoding='utf-8') as f:
+            async with aiofiles.open(resolved_path, 'r', encoding='utf-8') as f:
                 text = await f.read()
             
             # Normalize text
             normalized_text = normalize_text(text)
             
             # Get file name
-            file_name = Path(file_path).name
+            file_name = resolved_path.name
             
             # Chunk at multiple sizes
             chunks_by_size = chunker.chunk_text(
@@ -53,12 +67,15 @@ async def ingest_file(
                 is_user_file
             )
             
-            logger.info(f"Ingested {file_name}: {sum(len(chunks) for chunks in chunks_by_size.values())} total chunks")
+            logger.info(
+                "Ingested trusted file into %s total chunks",
+                sum(len(chunks) for chunks in chunks_by_size.values()),
+            )
             
             return chunks_by_size
             
         except Exception as e:
-            logger.error(f"Failed to ingest file {file_path}: {e}")
+            logger.error("Failed to ingest trusted file: %s", redact_log_text(e, 240))
             raise
     
     async def ingest_text(
@@ -92,12 +109,20 @@ async def ingest_text(
                 is_user_file
             )
             
-            logger.info(f"Ingested {source_name}: {sum(len(chunks) for chunks in chunks_by_size.values())} total chunks")
+            logger.info(
+                "Ingested %s: %s total chunks",
+                redact_log_text(source_name, 120),
+                sum(len(chunks) for chunks in chunks_by_size.values()),
+            )
             
             return chunks_by_size
             
         except Exception as e:
-            logger.error(f"Failed to ingest text {source_name}: {e}")
+            logger.error(
+                "Failed to ingest text %s: %s",
+                redact_log_text(source_name, 120),
+                redact_log_text(e, 240),
+            )
             raise
 
 
diff --git a/backend/autonomous/memory/paper_library.py b/backend/autonomous/memory/paper_library.py
index 2a05597..c8b6bb1 100644
--- a/backend/autonomous/memory/paper_library.py
+++ b/backend/autonomous/memory/paper_library.py
@@ -18,6 +18,7 @@
     resolve_path_within_root,
     validate_single_path_component,
 )
+from backend.shared.log_redaction import redact_log_text
 
 logger = logging.getLogger(__name__)
 
@@ -46,7 +47,7 @@ def set_session_manager(self, session_manager) -> None:
             self._base_dir = session_manager.get_papers_dir()
             self._archive_dir = session_manager.get_papers_dir() / "archive"
             self._pruned_dir = session_manager.get_papers_dir() / "pruned"
-            logger.info(f"Paper library using session path: {self._base_dir}")
+            logger.info("Paper library using session path: %s", redact_log_text(self._base_dir, 240))
     
     async def initialize(self) -> None:
         """Initialize the paper library directories."""
@@ -59,19 +60,34 @@ async def initialize(self) -> None:
         self._base_dir.mkdir(parents=True, exist_ok=True)
         self._archive_dir.mkdir(parents=True, exist_ok=True)
         self._pruned_dir.mkdir(parents=True, exist_ok=True)
-        logger.info(f"Paper library initialized at {self._base_dir}")
+        logger.info("Paper library initialized at %s", redact_log_text(self._base_dir, 240))
     
     def _safe_paper_id(self, paper_id: str) -> str:
         """Validate paper_id as a single path component."""
         return validate_single_path_component(paper_id, "paper ID")
 
+    def _paper_path(self, root: Path, paper_id: str, suffix: str, *, prefix: str = "paper_") -> Path:
+        """Build a paper-related path inside a trusted library root."""
+        safe_id = self._safe_paper_id(paper_id)
+        return resolve_path_within_root(root, f"{prefix}{safe_id}{suffix}")
+
+    def _ensure_library_path(self, path: Path, label: str = "library path") -> Path:
+        """Verify an existing helper-built path is still under this library's roots."""
+        candidate = Path(path)
+        for root in (self._base_dir, self._archive_dir, self._pruned_dir):
+            try:
+                return resolve_path_within_root(root, str(candidate))
+            except ValueError:
+                continue
+        raise ValueError(f"{label} escapes paper library roots")
+
     def _get_paper_path(self, paper_id: str) -> Path:
         """Get path to paper file."""
-        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}.txt"
+        return self._paper_path(self._base_dir, paper_id, ".txt")
 
     def _get_pruned_paper_path(self, paper_id: str) -> Path:
         """Get path to a pruned paper file."""
-        return self._pruned_dir / f"pruned_paper_{self._safe_paper_id(paper_id)}.txt"
+        return self._paper_path(self._pruned_dir, paper_id, ".txt", prefix="pruned_paper_")
     
     def get_paper_path(self, paper_id: str) -> str:
         """
@@ -95,43 +111,55 @@ def get_outline_path(self, paper_id: str) -> str:
     
     def _get_abstract_path(self, paper_id: str) -> Path:
         """Get path to abstract file."""
-        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_abstract.txt"
+        return self._paper_path(self._base_dir, paper_id, "_abstract.txt")
 
     def _get_pruned_abstract_path(self, paper_id: str) -> Path:
         """Get path to pruned paper abstract file."""
-        return self._pruned_dir / f"pruned_paper_{self._safe_paper_id(paper_id)}_abstract.txt"
+        return self._paper_path(self._pruned_dir, paper_id, "_abstract.txt", prefix="pruned_paper_")
     
     def _get_source_brainstorm_path(self, paper_id: str) -> Path:
         """Get path to cached source brainstorm file."""
-        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_source_brainstorm.txt"
+        return self._paper_path(self._base_dir, paper_id, "_source_brainstorm.txt")
 
     def _get_pruned_source_brainstorm_path(self, paper_id: str) -> Path:
         """Get path to pruned cached source brainstorm file."""
-        return self._pruned_dir / f"pruned_paper_{self._safe_paper_id(paper_id)}_source_brainstorm.txt"
+        return self._paper_path(self._pruned_dir, paper_id, "_source_brainstorm.txt", prefix="pruned_paper_")
     
     def _get_outline_path(self, paper_id: str) -> Path:
         """Get path to paper outline file."""
-        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_outline.txt"
+        return self._paper_path(self._base_dir, paper_id, "_outline.txt")
 
     def _get_pruned_outline_path(self, paper_id: str) -> Path:
         """Get path to pruned paper outline file."""
-        return self._pruned_dir / f"pruned_paper_{self._safe_paper_id(paper_id)}_outline.txt"
+        return self._paper_path(self._pruned_dir, paper_id, "_outline.txt", prefix="pruned_paper_")
     
     def _get_metadata_path(self, paper_id: str) -> Path:
         """Get path to paper metadata JSON file."""
-        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_metadata.json"
+        return self._paper_path(self._base_dir, paper_id, "_metadata.json")
 
     def _get_pruned_metadata_path(self, paper_id: str) -> Path:
         """Get path to pruned paper metadata JSON file."""
-        return self._pruned_dir / f"pruned_paper_{self._safe_paper_id(paper_id)}_metadata.json"
+        return self._paper_path(self._pruned_dir, paper_id, "_metadata.json", prefix="pruned_paper_")
     
     def _get_rejections_path(self, paper_id: str) -> Path:
         """Get path to paper compiler rejections file."""
-        return self._base_dir / f"paper_{self._safe_paper_id(paper_id)}_last_10_rejections.txt"
+        return self._paper_path(self._base_dir, paper_id, "_last_10_rejections.txt")
 
     def _get_pruned_rejections_path(self, paper_id: str) -> Path:
         """Get path to pruned paper compiler rejections file."""
-        return self._pruned_dir / f"pruned_paper_{self._safe_paper_id(paper_id)}_last_10_rejections.txt"
+        return self._paper_path(self._pruned_dir, paper_id, "_last_10_rejections.txt", prefix="pruned_paper_")
+
+    def _get_archive_paper_path(self, paper_id: str) -> Path:
+        """Get path to a legacy archived paper file."""
+        return self._paper_path(self._archive_dir, paper_id, ".txt")
+
+    def _get_archive_outline_path(self, paper_id: str) -> Path:
+        """Get path to a legacy archived outline file."""
+        return self._paper_path(self._archive_dir, paper_id, "_outline.txt")
+
+    def _get_archive_metadata_path(self, paper_id: str) -> Path:
+        """Get path to a legacy archived metadata file."""
+        return self._paper_path(self._archive_dir, paper_id, "_metadata.json")
 
     # ========================================================================
     # HISTORY HELPERS
@@ -217,7 +245,11 @@ async def _get_history_user_prompt(self, session_id: str) -> str:
                 metadata.get("user_research_prompt"),
             )
         except Exception as e:
-            logger.warning(f"Failed to read history prompt for session {session_id}: {e}")
+            logger.warning(
+                "Failed to read history prompt for session %s: %s",
+                redact_log_text(session_id, 120),
+                redact_log_text(e, 240),
+            )
             return self._derive_history_prompt_from_session_id(session_id)
 
     @staticmethod
@@ -422,31 +454,58 @@ def _metadata_to_dict(metadata: PaperMetadata) -> Dict[str, Any]:
 
     async def _read_metadata_file(self, metadata_path: Path) -> Optional[PaperMetadata]:
         """Read a metadata file into PaperMetadata."""
+        try:
+            metadata_path = self._ensure_library_path(metadata_path, "metadata path")
+        except ValueError as exc:
+            logger.warning("Rejected unsafe metadata path: %s", exc)
+            return None
+
+        # codeql[py/path-injection]: metadata_path is constrained to this paper library's roots.
         if not metadata_path.exists():
             return None
         try:
+            # codeql[py/path-injection]: metadata_path is constrained to this paper library's roots.
             async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
                 content = await f.read()
             return PaperMetadata(**json.loads(content))
         except Exception as e:
-            logger.error(f"Failed to load paper metadata from {metadata_path}: {e}")
+            logger.error(
+                "Failed to load paper metadata from %s: %s",
+                redact_log_text(metadata_path, 240),
+                redact_log_text(e, 240),
+            )
             return None
 
     async def _save_metadata_to_path(self, metadata: PaperMetadata, metadata_path: Path) -> None:
         """Save paper metadata to a specific path."""
+        metadata_path = self._ensure_library_path(metadata_path, "metadata path")
+        # codeql[py/path-injection]: metadata_path is constrained to this paper library's roots.
         metadata_path.parent.mkdir(parents=True, exist_ok=True)
+        # codeql[py/path-injection]: metadata_path is constrained to this paper library's roots.
         async with aiofiles.open(metadata_path, 'w', encoding='utf-8') as f:
             await f.write(json.dumps(self._metadata_to_dict(metadata), indent=2, default=str))
 
     async def _read_text_file(self, path: Path) -> str:
         """Read a text file if it exists."""
+        try:
+            path = self._ensure_library_path(path, "text path")
+        except ValueError as exc:
+            logger.warning("Rejected unsafe text path: %s", exc)
+            return ""
+
+        # codeql[py/path-injection]: path is constrained to this paper library's roots.
         if not path.exists():
             return ""
         try:
+            # codeql[py/path-injection]: path is constrained to this paper library's roots.
             async with aiofiles.open(path, 'r', encoding='utf-8') as f:
                 return await f.read()
         except Exception as e:
-            logger.error(f"Failed to read {path}: {e}")
+            logger.error(
+                "Failed to read %s: %s",
+                redact_log_text(path, 240),
+                redact_log_text(e, 240),
+            )
             return ""
 
     def _pruned_note_for(self, metadata: PaperMetadata) -> str:
@@ -645,10 +704,10 @@ async def get_pruned_history_paper(self, session_id: str, paper_id: str) -> Opti
 
         # Legacy archives used the old paper_ prefix inside archive/.
         if metadata is None:
-            archive_metadata_path = scoped_library._archive_dir / f"paper_{scoped_library._safe_paper_id(paper_id)}_metadata.json"
+            archive_metadata_path = scoped_library._get_archive_metadata_path(paper_id)
             metadata = await scoped_library._read_metadata_file(archive_metadata_path)
-            content_path = scoped_library._archive_dir / f"paper_{scoped_library._safe_paper_id(paper_id)}.txt"
-            outline_path = scoped_library._archive_dir / f"paper_{scoped_library._safe_paper_id(paper_id)}_outline.txt"
+            content_path = scoped_library._get_archive_paper_path(paper_id)
+            outline_path = scoped_library._get_archive_outline_path(paper_id)
             if metadata:
                 is_legacy_archive = True
                 metadata.status = "archived"
@@ -845,7 +904,11 @@ async def _is_paper_complete(self, paper_id: str) -> bool:
             return True
             
         except Exception as e:
-            logger.error(f"Failed to validate paper {paper_id}: {e}")
+            logger.error(
+                "Failed to validate paper %s: %s",
+                redact_log_text(paper_id, 120),
+                redact_log_text(e, 240),
+            )
             return False
     
     # ========================================================================
@@ -909,19 +972,19 @@ async def save_paper(
             paper_path = self._get_paper_path(paper_id)
             async with aiofiles.open(paper_path, 'w', encoding='utf-8') as f:
                 await f.write(content)
-            logger.info(f"Paper saved: {paper_path}")
+            logger.info("Paper saved: %s", redact_log_text(paper_path, 240))
             
             # Save outline
             outline_path = self._get_outline_path(paper_id)
             async with aiofiles.open(outline_path, 'w', encoding='utf-8') as f:
                 await f.write(outline)
-            logger.info(f"Outline saved: {outline_path}")
+            logger.info("Outline saved: %s", redact_log_text(outline_path, 240))
             
             # Save abstract
             abstract_path = self._get_abstract_path(paper_id)
             async with aiofiles.open(abstract_path, 'w', encoding='utf-8') as f:
                 await f.write(abstract)
-            logger.info(f"Abstract saved: {abstract_path}")
+            logger.info("Abstract saved: %s", redact_log_text(abstract_path, 240))
             
             # Save source brainstorm cache
             source_path = self._get_source_brainstorm_path(paper_id)
@@ -937,7 +1000,13 @@ async def save_paper(
             await self._save_metadata(metadata)
             
             model_count = len(model_usage) if model_usage else 0
-            logger.info(f"Saved paper {paper_id}: '{title}' ({word_count} words, {model_count} models tracked)")
+            logger.info(
+                "Saved paper %s: '%s' (%s words, %s models tracked)",
+                redact_log_text(paper_id, 120),
+                redact_log_text(title, 240),
+                word_count,
+                model_count,
+            )
             return metadata
     
     async def get_paper_content(self, paper_id: str, *, strip_proofs: bool = False) -> str:
@@ -957,13 +1026,16 @@ async def get_paper_content(self, paper_id: str, *, strip_proofs: bool = False)
             return ""
 
         try:
-            async with aiofiles.open(paper_path, 'r', encoding='utf-8') as f:
-                content = await f.read()
+            content = await self._read_text_file(paper_path)
             if strip_proofs and content:
                 content = self.strip_verified_proofs_from_content(content)
             return content
         except Exception as e:
-            logger.error(f"Failed to read paper {paper_id}: {e}")
+            logger.error(
+                "Failed to read paper %s: %s",
+                redact_log_text(paper_id, 120),
+                redact_log_text(e, 240),
+            )
             return ""
 
     async def append_proofs_section(self, paper_id: str, proofs_data: Any) -> bool:
@@ -972,7 +1044,10 @@ async def append_proofs_section(self, paper_id: str, proofs_data: Any) -> bool:
             session_id, scoped_paper_id = paper_id.split(":", 1)
             papers_dir = self.get_history_papers_dir(session_id)
             if papers_dir is None:
-                logger.error(f"History paper directory not found for proof append: {paper_id}")
+                logger.error(
+                    "History paper directory not found for proof append: %s",
+                    redact_log_text(paper_id, 120),
+                )
                 return False
             scoped_library = self._build_scoped_library(papers_dir)
             return await scoped_library.append_proofs_section(scoped_paper_id, proofs_data)
@@ -980,7 +1055,7 @@ async def append_proofs_section(self, paper_id: str, proofs_data: Any) -> bool:
         async with self._lock:
             paper_path = self._get_paper_path(paper_id)
             if not paper_path.exists():
-                logger.error(f"Paper not found for proof append: {paper_id}")
+                logger.error("Paper not found for proof append: %s", redact_log_text(paper_id, 120))
                 return False
 
             proofs = proofs_data if isinstance(proofs_data, list) else [proofs_data]
@@ -995,85 +1070,54 @@ async def append_proofs_section(self, paper_id: str, proofs_data: Any) -> bool:
                     "this paper",
                 )
                 if updated_content == existing_content:
-                    logger.info("No new proof entries to append to paper %s", paper_id)
+                    logger.info("No new proof entries to append to paper %s", redact_log_text(paper_id, 120))
                     return True
 
                 async with aiofiles.open(paper_path, "w", encoding="utf-8") as handle:
                     await handle.write(updated_content)
 
-                logger.info("Appended %s proof(s) to paper %s", len(proofs), paper_id)
+                logger.info("Appended %s proof(s) to paper %s", len(proofs), redact_log_text(paper_id, 120))
                 return True
             except Exception as exc:
-                logger.error(f"Failed to append proofs to paper {paper_id}: {exc}")
+                logger.error(
+                    "Failed to append proofs to paper %s: %s",
+                    redact_log_text(paper_id, 120),
+                    redact_log_text(exc, 240),
+                )
                 return False
     
     async def get_abstract(self, paper_id: str) -> str:
         """Get paper abstract."""
         abstract_path = self._get_abstract_path(paper_id)
-        
-        if not abstract_path.exists():
-            return ""
-        
-        try:
-            async with aiofiles.open(abstract_path, 'r', encoding='utf-8') as f:
-                return await f.read()
-        except Exception as e:
-            logger.error(f"Failed to read abstract for {paper_id}: {e}")
-            return ""
+        return await self._read_text_file(abstract_path)
     
     async def get_outline(self, paper_id: str) -> str:
         """Get paper outline."""
         outline_path = self._get_outline_path(paper_id)
-        
-        if not outline_path.exists():
-            return ""
-        
-        try:
-            async with aiofiles.open(outline_path, 'r', encoding='utf-8') as f:
-                return await f.read()
-        except Exception as e:
-            logger.error(f"Failed to read outline for {paper_id}: {e}")
-            return ""
+        return await self._read_text_file(outline_path)
     
     async def get_source_brainstorm(self, paper_id: str) -> str:
         """Get cached source brainstorm content."""
         source_path = self._get_source_brainstorm_path(paper_id)
-        
-        if not source_path.exists():
-            return ""
-        
-        try:
-            async with aiofiles.open(source_path, 'r', encoding='utf-8') as f:
-                return await f.read()
-        except Exception as e:
-            logger.error(f"Failed to read source brainstorm for {paper_id}: {e}")
-            return ""
+        return await self._read_text_file(source_path)
     
     async def _save_metadata(self, metadata: PaperMetadata) -> None:
         """Save paper metadata to JSON file."""
         metadata_path = self._get_metadata_path(metadata.paper_id)
         
         try:
-            async with aiofiles.open(metadata_path, 'w', encoding='utf-8') as f:
-                await f.write(json.dumps(metadata.dict(), indent=2, default=str))
+            await self._save_metadata_to_path(metadata, metadata_path)
         except Exception as e:
-            logger.error(f"Failed to save metadata for {metadata.paper_id}: {e}")
+            logger.error(
+                "Failed to save metadata for %s: %s",
+                redact_log_text(metadata.paper_id, 120),
+                redact_log_text(e, 240),
+            )
     
     async def get_metadata(self, paper_id: str) -> Optional[PaperMetadata]:
         """Get paper metadata."""
         metadata_path = self._get_metadata_path(paper_id)
-        
-        if not metadata_path.exists():
-            return None
-        
-        try:
-            async with aiofiles.open(metadata_path, 'r', encoding='utf-8') as f:
-                content = await f.read()
-                data = json.loads(content)
-                return PaperMetadata(**data)
-        except Exception as e:
-            logger.error(f"Failed to load metadata for {paper_id}: {e}")
-            return None
+        return await self._read_metadata_file(metadata_path)
     
     async def get_all_papers(
         self,
@@ -1124,7 +1168,11 @@ async def get_all_papers(
                     
                     papers.append(metadata)
             except Exception as e:
-                logger.error(f"Failed to load paper metadata from {path}: {e}")
+                logger.error(
+                    "Failed to load paper metadata from %s: %s",
+                    redact_log_text(path, 240),
+                    redact_log_text(e, 240),
+                )
         
         # Sort by creation time (most recent first)
         papers.sort(key=lambda x: x.created_at, reverse=True)
@@ -1167,7 +1215,11 @@ async def get_most_recent_incomplete_paper(self) -> Optional[PaperMetadata]:
                         incomplete_papers.append(metadata)
                         logger.debug(f"Found incomplete paper: {metadata.paper_id}")
             except Exception as e:
-                logger.error(f"Failed to check paper completeness from {path}: {e}")
+                logger.error(
+                    "Failed to check paper completeness from %s: %s",
+                    redact_log_text(path, 240),
+                    redact_log_text(e, 240),
+                )
         
         if not incomplete_papers:
             return None
@@ -1203,11 +1255,13 @@ async def prune_paper(
         async with self._lock:
             try:
                 metadata = await self.get_metadata(paper_id)
+                pruned_metadata_path = self._get_pruned_metadata_path(paper_id)
                 if metadata is None:
-                    if self._get_pruned_metadata_path(paper_id).exists():
-                        logger.info(f"Paper {paper_id} is already pruned")
+                    # codeql[py/path-injection]: paper_id is validated by _get_pruned_metadata_path.
+                    if pruned_metadata_path.exists():
+                        logger.info("Paper %s is already pruned", redact_log_text(paper_id, 120))
                         return True
-                    logger.error(f"Cannot prune paper {paper_id}: metadata not found")
+                    logger.error("Cannot prune paper %s: metadata not found", redact_log_text(paper_id, 120))
                     return False
 
                 self._pruned_dir.mkdir(parents=True, exist_ok=True)
@@ -1218,7 +1272,10 @@ async def prune_paper(
                 metadata.pruned_reason = reason or "No pruning reason recorded."
                 metadata.pruned_by = pruned_by if pruned_by in {"system", "user", "legacy"} else "system"
 
-                paper_path = self._get_paper_path(paper_id)
+                paper_path = self._ensure_library_path(
+                    self._get_paper_path(paper_id),
+                    "paper path",
+                )
                 if paper_path.exists():
                     content = await self._read_text_file(paper_path)
                     clean_content = self._strip_existing_pruned_banner(content)
@@ -1228,7 +1285,11 @@ async def prune_paper(
                         pruned_by=metadata.pruned_by,
                         reason=metadata.pruned_reason,
                     ) + clean_content
-                    async with aiofiles.open(self._get_pruned_paper_path(paper_id), 'w', encoding='utf-8') as f:
+                    pruned_paper_path = self._ensure_library_path(
+                        self._get_pruned_paper_path(paper_id),
+                        "pruned paper path",
+                    )
+                    async with aiofiles.open(pruned_paper_path, 'w', encoding='utf-8') as f:
                         await f.write(pruned_content)
                     paper_path.unlink(missing_ok=True)
 
@@ -1241,17 +1302,27 @@ async def prune_paper(
 
                 for source, dest in files_to_move:
                     if source.exists():
+                        source = self._ensure_library_path(source, "paper source path")
+                        dest = self._ensure_library_path(dest, "pruned destination path")
                         dest.parent.mkdir(parents=True, exist_ok=True)
                         shutil.move(str(source), str(dest))
 
-                await self._save_metadata_to_path(metadata, self._get_pruned_metadata_path(paper_id))
-                self._get_metadata_path(paper_id).unlink(missing_ok=True)
+                await self._save_metadata_to_path(metadata, pruned_metadata_path)
+                metadata_path = self._ensure_library_path(
+                    self._get_metadata_path(paper_id),
+                    "metadata path",
+                )
+                metadata_path.unlink(missing_ok=True)
 
-                logger.info(f"Paper {paper_id} pruned successfully")
+                logger.info("Paper %s pruned successfully", redact_log_text(paper_id, 120))
                 return True
 
             except Exception as e:
-                logger.error(f"Failed to prune paper {paper_id}: {e}")
+                logger.error(
+                    "Failed to prune paper %s: %s",
+                    redact_log_text(paper_id, 120),
+                    redact_log_text(e, 240),
+                )
                 return False
 
     async def archive_paper(self, paper_id: str) -> bool:
@@ -1359,10 +1430,18 @@ async def delete_all_pruned_papers(self) -> int:
                         if path.is_file():
                             path.unlink()
                     # Leave the directory itself in place for future prunes.
-                logger.info(f"Deleted {deleted_count} pruned/archived paper records from {self._base_dir}")
+                logger.info(
+                    "Deleted %s pruned/archived paper records from %s",
+                    deleted_count,
+                    redact_log_text(self._base_dir, 240),
+                )
                 return deleted_count
             except Exception as e:
-                logger.error(f"Failed to delete pruned papers from {self._base_dir}: {e}")
+                logger.error(
+                    "Failed to delete pruned papers from %s: %s",
+                    redact_log_text(self._base_dir, 240),
+                    redact_log_text(e, 240),
+                )
                 return deleted_count
     
     async def delete_paper(self, paper_id: str) -> bool:
@@ -1426,14 +1505,21 @@ async def delete_paper(self, paper_id: str) -> bool:
                         logger.debug(f"Deleted from pruned papers: {path}")
                 
                 if deleted_any:
-                    logger.info(f"Paper {paper_id} deleted successfully")
+                    logger.info("Paper %s deleted successfully", redact_log_text(paper_id, 120))
                     return True
                 else:
-                    logger.warning(f"Paper {paper_id} not found in active or archive directories")
+                    logger.warning(
+                        "Paper %s not found in active or archive directories",
+                        redact_log_text(paper_id, 120),
+                    )
                     return False
                     
             except Exception as e:
-                logger.error(f"Failed to delete paper {paper_id}: {e}")
+                logger.error(
+                    "Failed to delete paper %s: %s",
+                    redact_log_text(paper_id, 120),
+                    redact_log_text(e, 240),
+                )
                 return False
 
 
diff --git a/backend/compiler/core/compiler_rag_manager.py b/backend/compiler/core/compiler_rag_manager.py
index c7b2532..da189c9 100644
--- a/backend/compiler/core/compiler_rag_manager.py
+++ b/backend/compiler/core/compiler_rag_manager.py
@@ -151,7 +151,11 @@ async def load_aggregator_database(self) -> None:
                     chunks_by_size = await ingestion_pipeline.ingest_file(
                         aggregator_file_path,
                         rag_config.submitter_chunk_intervals,  # All 4 configs
-                        is_user_file=True
+                        is_user_file=True,
+                        trusted_roots=[
+                            system_config.data_dir,
+                            system_config.user_uploads_dir,
+                        ],
                     )
                     
                     # Add all chunks while holding the lock
diff --git a/backend/shared/log_redaction.py b/backend/shared/log_redaction.py
index c5a24bc..06a797b 100644
--- a/backend/shared/log_redaction.py
+++ b/backend/shared/log_redaction.py
@@ -24,6 +24,14 @@ def redact_log_text(value: Any, max_chars: int | None = None) -> str:
             text,
         )
 
+    # Prevent log forging by keeping caller-controlled values on one line.
+    text = (
+        text
+        .replace("\r", "\\r")
+        .replace("\n", "\\n")
+        .replace("\t", "\\t")
+    )
+
     if max_chars is not None and max_chars >= 0 and len(text) > max_chars:
         return text[:max_chars] + "...[truncated]"
     return text
diff --git a/frontend/src/components/LatexRenderer.jsx b/frontend/src/components/LatexRenderer.jsx
index f746ac5..3589061 100644
--- a/frontend/src/components/LatexRenderer.jsx
+++ b/frontend/src/components/LatexRenderer.jsx
@@ -451,22 +451,11 @@ const replaceSectionCommand = (text, command, tag, endTag) => {
 const decodeHtmlEntities = (text) => {
   if (!text) return text;
   
-  // Use a textarea to decode HTML entities properly
+  // Decode exactly one entity layer. Repeated unescaping can turn literal
+  // escaped HTML into active markup before DOMPurify sees it.
   const textarea = document.createElement('textarea');
   textarea.innerHTML = text;
-  let decoded = textarea.textContent;
-  
-  // Also handle common named entities that might not be decoded
-  decoded = decoded
-    .replace(/&amp;/g, '&')
-    .replace(/&lt;/g, '<')
-    .replace(/&gt;/g, '>')
-    .replace(/&quot;/g, '"')
-    .replace(/&#39;/g, "'")
-    .replace(/&#x27;/g, "'")
-    .replace(/&apos;/g, "'");
-  
-  return decoded;
+  return textarea.textContent || '';
 };
 
 /**
@@ -475,8 +464,6 @@ const decodeHtmlEntities = (text) => {
 const cleanTikzContent = (content) => {
   return content.trim()
     .replace(/&lt;br\/&gt;/g, '\n')   // Fix HTML-encoded line breaks
-    .replace(/&amp;amp;/g, '&')       // Fix double-encoded ampersands
-    .replace(/&amp;/g, '&')           // Fix encoded ampersands
     .replace(/<br\s*\/?>/g, '\n');    // Fix actual HTML line breaks
 };
 
@@ -521,6 +508,59 @@ const renderKatexSafely = (latex, displayMode, originalMatch) => {
   }
 };
 
+const isEscapedAt = (text, index) => {
+  let backslashCount = 0;
+  for (let i = index - 1; i >= 0 && text[i] === '\\'; i--) {
+    backslashCount += 1;
+  }
+  return backslashCount % 2 === 1;
+};
+
+const isSingleDollarDelimiter = (text, index) => (
+  text[index] === '$'
+  && text[index - 1] !== '$'
+  && text[index + 1] !== '$'
+  && !isEscapedAt(text, index)
+);
+
+const renderInlineDollarMath = (text) => {
+  let output = '';
+  let segmentStart = 0;
+  let index = 0;
+
+  while (index < text.length) {
+    if (!isSingleDollarDelimiter(text, index)) {
+      index += 1;
+      continue;
+    }
+
+    const openIndex = index;
+    let closeIndex = -1;
+    for (let scan = openIndex + 1; scan < text.length; scan++) {
+      if (isSingleDollarDelimiter(text, scan)) {
+        closeIndex = scan;
+        break;
+      }
+    }
+
+    if (closeIndex === -1) {
+      break;
+    }
+
+    const latex = text.slice(openIndex + 1, closeIndex);
+    const match = text.slice(openIndex, closeIndex + 1);
+    output += text.slice(segmentStart, openIndex);
+    output += (latex.includes('<div') || latex.includes('class='))
+      ? match
+      : renderKatexSafely(latex, false, match);
+
+    index = closeIndex + 1;
+    segmentStart = index;
+  }
+
+  return output + text.slice(segmentStart);
+};
+
 /**
  * Process LaTeX theorem-like environments
  */
@@ -861,20 +901,15 @@ const renderLatexToHtml = (text) => {
     });
   });
   
-  // Inline math patterns: $...$ or \(...\)
-  const inlineMathPatterns = [
-    /(?<!\$)\$(?!\$)((?:[^$\\]|\\.|\\)+?)\$(?!\$)/g,
-    /\\\(([\s\S]*?)\\\)/g
-  ];
-  
-  inlineMathPatterns.forEach(pattern => {
-    result = result.replace(pattern, (match, latex) => {
-      // Skip if the content looks like it contains HTML
-      if (latex.includes('<div') || latex.includes('class=')) {
-        return match;
-      }
-      return renderKatexSafely(latex, false, match);
-    });
+  // Inline math: $...$ is scanned linearly to avoid regex backtracking on
+  // adversarial backslash-heavy strings. \( ... \) remains a simple delimiter.
+  result = renderInlineDollarMath(result);
+  result = result.replace(/\\\(([\s\S]*?)\\\)/g, (match, latex) => {
+    // Skip if the content looks like it contains HTML
+    if (latex.includes('<div') || latex.includes('class=')) {
+      return match;
+    }
+    return renderKatexSafely(latex, false, match);
   });
   
   // Step 12: Handle line breaks (AFTER KaTeX - \\ is valid inside math mode)
diff --git a/moto-update-manifest.json b/moto-update-manifest.json
index 8d635ee..ac11f8e 100644
--- a/moto-update-manifest.json
+++ b/moto-update-manifest.json
@@ -1,7 +1,7 @@
 {
   "manifest_version": 1,
   "version": "1.0.8",
-  "build_commit": "d352090d687bd3475acfee17f29f7f0cfb17264e",
+  "build_commit": "06298fc647e267117e7468bb019a4563275dde69",
   "update_channel": "main",
   "api_contract_version": "build5-v12"
 }
diff --git a/moto_launcher.py b/moto_launcher.py
index 53ad70d..ba18f5c 100644
--- a/moto_launcher.py
+++ b/moto_launcher.py
@@ -15,7 +15,7 @@
 import secrets
 import socket
 import shlex
-from shutil import rmtree, which
+from shutil import copyfileobj, rmtree, which
 import subprocess
 import sys
 import tarfile
@@ -130,6 +130,16 @@ def _path_is_within(root: Path, candidate: str | Path) -> bool:
     return True
 
 
+def _stored_keyring_namespace(record: dict | None) -> str | None:
+    """Read current launcher state while accepting legacy records."""
+    if not isinstance(record, dict):
+        return None
+    value = record.get("keyring_namespace")
+    if value is None:
+        value = record.get("secret_namespace")
+    return value if isinstance(value, str) and value.strip() else None
+
+
 def using_repo_local_venv() -> bool:
     return _path_is_within(SCRIPT_DIR / ".venv", get_python_command())
 
@@ -300,7 +310,7 @@ def resolve_instance_runtime() -> InstanceRuntime:
                     "instance_id": candidate_id,
                     "data_root": last_record.get("data_root") or None,
                     "log_root": last_record.get("log_root") or None,
-                    "secret_namespace": last_record.get("secret_namespace"),
+                    "keyring_namespace": _stored_keyring_namespace(last_record),
                     "storage_prefix": last_record.get("storage_prefix"),
                 }
             else:
@@ -371,10 +381,10 @@ def resolve_instance_runtime() -> InstanceRuntime:
     # instance_id unless explicitly overridden or reused from a record that
     # stored an explicit override.
     if is_default_instance:
-        secret_namespace = explicit_secret or (reused_record or {}).get("secret_namespace")
+        secret_namespace = explicit_secret or _stored_keyring_namespace(reused_record)
         storage_prefix = explicit_storage or (reused_record or {}).get("storage_prefix")
     else:
-        recorded_secret = (reused_record or {}).get("secret_namespace")
+        recorded_secret = _stored_keyring_namespace(reused_record)
         recorded_storage = (reused_record or {}).get("storage_prefix")
         secret_namespace = (
             explicit_secret
@@ -741,7 +751,7 @@ def prepare_runtime_and_environment() -> tuple[InstanceRuntime, str, str, dict[s
     else:
         if reused_from_record:
             cprint(
-                "Reusing previously launched instance runtime (same secret namespace, same data root).",
+                "Reusing previously launched instance runtime (same keyring namespace, same data root).",
                 GREEN,
             )
         else:
@@ -753,9 +763,9 @@ def prepare_runtime_and_environment() -> tuple[InstanceRuntime, str, str, dict[s
     cprint(f"Data root: {runtime.data_root}", WHITE)
     cprint(f"Log root: {runtime.log_root}", WHITE)
     if runtime.secret_namespace:
-        cprint(f"Secret namespace: {runtime.secret_namespace}", WHITE)
+        cprint("Keyring namespace: configured for this instance", WHITE)
     else:
-        cprint("Secret namespace: shared default store", WHITE)
+        cprint("Keyring namespace: shared default store", WHITE)
     print()
 
     env = os.environ.copy()
@@ -918,14 +928,38 @@ def _download_file(url: str, destination: Path) -> None:
 def _extract_archive(archive_path: Path, destination: Path) -> None:
     """Extract a zip or tarball into the destination directory."""
     destination.mkdir(parents=True, exist_ok=True)
+    destination_root = destination.resolve()
+
+    def ensure_member_target(member_name: str) -> None:
+        target = (destination_root / member_name).resolve()
+        try:
+            target.relative_to(destination_root)
+        except ValueError as exc:
+            raise RuntimeError(f"Archive member escapes destination: {member_name}") from exc
+
     archive_name = archive_path.name.lower()
     if archive_name.endswith(".zip"):
         with zipfile.ZipFile(archive_path) as archive:
+            for member in archive.infolist():
+                ensure_member_target(member.filename)
             archive.extractall(destination)
         return
     if archive_name.endswith(".tar.gz") or archive_name.endswith(".tgz"):
         with tarfile.open(archive_path, "r:gz") as archive:
-            archive.extractall(destination)
+            for member in archive.getmembers():
+                ensure_member_target(member.name)
+                target = (destination_root / member.name).resolve()
+                if member.isdir():
+                    target.mkdir(parents=True, exist_ok=True)
+                    continue
+                if not member.isfile():
+                    raise RuntimeError(f"Unsupported archive member type: {member.name}")
+                target.parent.mkdir(parents=True, exist_ok=True)
+                source = archive.extractfile(member)
+                if source is None:
+                    raise RuntimeError(f"Could not read archive member: {member.name}")
+                with source, target.open("wb") as output:
+                    copyfileobj(source, output)
         return
     raise RuntimeError(f"Unsupported archive format: {archive_path.name}")
 
@@ -1597,12 +1631,12 @@ def start_services(
         frontend_port=runtime.frontend_port,
         data_root=runtime.data_root,
         log_root=runtime.log_root,
-        secret_namespace=runtime.secret_namespace,
+        keyring_namespace=runtime.secret_namespace,
         storage_prefix=runtime.storage_prefix,
     )
 
     # Persist the active instance runtime so subsequent relaunches can reuse
-    # the same secret_namespace / data_root / storage_prefix. This includes
+    # the same keyring namespace / data root / storage prefix. This includes
     # "default" launches — previously those were skipped, which caused the
     # keyring namespace to flip between None and a freshly minted timestamp
     # whenever the default ports happened to be busy between runs, and
@@ -1620,7 +1654,7 @@ def start_services(
                 instance_id=runtime.instance_id,
                 data_root=runtime.data_root,
                 log_root=runtime.log_root,
-                secret_namespace=runtime.secret_namespace,
+                keyring_namespace=runtime.secret_namespace,
                 storage_prefix=runtime.storage_prefix,
             )
         except OSError as exc:
diff --git a/moto_updater.py b/moto_updater.py
index 5233b2b..a39a349 100644
--- a/moto_updater.py
+++ b/moto_updater.py
@@ -12,6 +12,7 @@
 import sys
 import tempfile
 import urllib.error
+from urllib.parse import urlparse
 import urllib.request
 import zipfile
 
@@ -126,6 +127,14 @@ def _write_json(path: Path, payload: dict) -> None:
     path.write_text(json.dumps(payload, indent=2), encoding="utf-8")
 
 
+def _record_keyring_namespace(record: dict) -> str | None:
+    """Read the current keyring namespace field, with legacy state fallback."""
+    value = record.get("keyring_namespace")
+    if value is None:
+        value = record.get("secret_namespace")
+    return value if isinstance(value, str) and value.strip() else None
+
+
 def _load_package_json() -> dict:
     payload = _read_json(PACKAGE_JSON_PATH)
     return payload if isinstance(payload, dict) else {}
@@ -166,21 +175,31 @@ def _normalize_repo_slug(url: str) -> str | None:
     if not raw:
         return None
 
-    cleaned = raw.rstrip("/")
-    for prefix in ("git+https://", "https://", "http://", "ssh://git@"):
-        if cleaned.startswith(prefix):
-            cleaned = cleaned[len(prefix):]
-            break
-
-    if cleaned.startswith("git@github.com:"):
-        cleaned = cleaned[len("git@github.com:") :]
-    elif cleaned.startswith("github.com/"):
-        cleaned = cleaned[len("github.com/") :]
-
-    cleaned = cleaned.removesuffix(".git")
-    parts = [part for part in cleaned.split("/") if part]
-    if len(parts) >= 2:
-        return f"{parts[-2]}/{parts[-1]}"
+    def slug_from_path(path: str) -> str | None:
+        cleaned_path = path.strip("/").removesuffix(".git")
+        parts = [part for part in cleaned_path.split("/") if part]
+        if len(parts) == 2 and all(parts):
+            return f"{parts[0]}/{parts[1]}"
+        return None
+
+    if raw.startswith("git@github.com:"):
+        return slug_from_path(raw[len("git@github.com:") :])
+
+    parsed_raw = raw
+    if parsed_raw.startswith("git+"):
+        parsed_raw = parsed_raw[len("git+") :]
+
+    parsed = urlparse(parsed_raw)
+    if parsed.scheme in {"http", "https"}:
+        if parsed.hostname != "github.com":
+            return None
+        return slug_from_path(parsed.path)
+
+    if parsed.scheme == "ssh":
+        if parsed.hostname != "github.com":
+            return None
+        return slug_from_path(parsed.path)
+
     return None
 
 
@@ -335,7 +354,11 @@ def cleanup_launcher_state() -> list[dict]:
         backend_pid = _coerce_int(instance.get("backend_window_pid"))
         frontend_pid = _coerce_int(instance.get("frontend_window_pid"))
         if _is_pid_running(backend_pid) or _is_pid_running(frontend_pid):
-            active_instances.append(instance)
+            normalized = dict(instance)
+            keyring_namespace = _record_keyring_namespace(normalized)
+            normalized.pop("secret_namespace", None)
+            normalized["keyring_namespace"] = keyring_namespace
+            active_instances.append(normalized)
 
     _save_launcher_state({"instances": active_instances})
     return active_instances
@@ -350,7 +373,7 @@ def register_active_instance(
     frontend_port: int,
     data_root: str,
     log_root: str,
-    secret_namespace: str | None,
+    keyring_namespace: str | None,
     storage_prefix: str | None,
 ) -> None:
     active_instances = cleanup_launcher_state()
@@ -363,7 +386,6 @@ def register_active_instance(
             "frontend_port": frontend_port,
             "data_root": data_root,
             "log_root": log_root,
-            "secret_namespace": secret_namespace,
             "storage_prefix": storage_prefix,
         }
     )
@@ -373,7 +395,7 @@ def register_active_instance(
 def load_last_instance_record() -> dict | None:
     """Return the most recently launched non-default instance record, or None.
 
-    Used to preserve a stable secret_namespace / data_root / storage_prefix across
+    Used to preserve a stable keyring namespace / data_root / storage_prefix across
     relaunches when the default ports are temporarily busy. Without this the
     launcher would mint a fresh timestamped instance_id on every relaunch, which
     changes the OS-keyring service name and makes the saved OpenRouter / Wolfram
@@ -385,6 +407,11 @@ def load_last_instance_record() -> dict | None:
     instance_id = payload.get("instance_id")
     if not isinstance(instance_id, str) or not instance_id.strip():
         return None
+    payload = dict(payload)
+    keyring_namespace = _record_keyring_namespace(payload)
+    payload.pop("secret_namespace", None)
+    if keyring_namespace:
+        payload["keyring_namespace"] = keyring_namespace
     return payload
 
 
@@ -393,7 +420,7 @@ def save_last_instance_record(
     instance_id: str,
     data_root: str,
     log_root: str,
-    secret_namespace: str | None,
+    keyring_namespace: str | None,
     storage_prefix: str | None,
 ) -> None:
     """Persist the last launched non-default instance so it can be reused on relaunch."""
@@ -403,7 +430,6 @@ def save_last_instance_record(
             "instance_id": instance_id,
             "data_root": data_root,
             "log_root": log_root,
-            "secret_namespace": secret_namespace,
             "storage_prefix": storage_prefix,
         },
     )
@@ -787,6 +813,13 @@ def _download_archive(manifest: BuildManifest, destination: Path) -> None:
 
 def _extract_archive(archive_path: Path, destination: Path) -> Path:
     with zipfile.ZipFile(archive_path) as archive:
+        destination_root = destination.resolve()
+        for member in archive.infolist():
+            target = (destination_root / member.filename).resolve()
+            try:
+                target.relative_to(destination_root)
+            except ValueError as exc:
+                raise RuntimeError(f"Archive member escapes destination: {member.filename}") from exc
         archive.extractall(destination)
 
     children = [child for child in destination.iterdir()]
diff --git a/package-lock.json b/package-lock.json
index 9bea5f7..c609edd 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "moto-math-variant",
-  "version": "1.0.6",
+  "version": "1.0.8",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "moto-math-variant",
-      "version": "1.0.6",
+      "version": "1.0.8",
       "license": "MIT"
     }
   }
diff --git a/tests/test_codeql_path_hardening.py b/tests/test_codeql_path_hardening.py
new file mode 100644
index 0000000..b211445
--- /dev/null
+++ b/tests/test_codeql_path_hardening.py
@@ -0,0 +1,136 @@
+import asyncio
+import json
+from pathlib import Path
+import tempfile
+import unittest
+from unittest import mock
+
+from backend.aggregator.core.coordinator import _resolve_uploaded_user_file
+from backend.aggregator.ingestion.pipeline import IngestionPipeline
+from backend.autonomous.memory.paper_library import PaperLibrary
+from backend.shared.config import system_config
+from backend.shared.models import PaperMetadata
+
+
+class IngestionPathHardeningTests(unittest.TestCase):  # ingest_file must honour trusted_roots
+    def test_ingest_file_rejects_paths_outside_trusted_roots(self) -> None:
+        async def run_case() -> None:  # ingest_file is awaited, so the case lives in a coroutine
+            with tempfile.TemporaryDirectory() as temp_dir:
+                root = Path(temp_dir)
+                trusted = root / "trusted"
+                outside = root / "outside.txt"  # sibling of trusted/, not underneath it
+                trusted.mkdir()
+                outside.write_text("outside", encoding="utf-8")
+
+                with self.assertRaises(ValueError):  # a file outside trusted_roots must be refused
+                    await IngestionPipeline().ingest_file(
+                        str(outside),
+                        chunk_sizes=[256],
+                        trusted_roots=[trusted],
+                    )
+
+        asyncio.run(run_case())  # drive the coroutine from the synchronous test method
+
+    def test_ingest_file_accepts_paths_inside_trusted_roots(self) -> None:
+        async def run_case() -> None:  # ingest_file is awaited, so the case lives in a coroutine
+            with tempfile.TemporaryDirectory() as temp_dir:
+                root = Path(temp_dir)
+                trusted = root / "trusted"
+                trusted.mkdir()
+                paper = trusted / "paper.txt"  # file located under the trusted root
+                paper.write_text("A useful mathematical note.", encoding="utf-8")
+
+                chunks = await IngestionPipeline().ingest_file(
+                    str(paper),
+                    chunk_sizes=[256],
+                    trusted_roots=[trusted],
+                )
+
+            self.assertIn(256, chunks)  # result is indexed by the requested chunk size
+            self.assertGreaterEqual(len(chunks[256]), 1)  # at least one chunk was produced
+
+        asyncio.run(run_case())  # drive the coroutine from the synchronous test method
+
+
+class UploadPathResolutionTests(unittest.TestCase):  # path confinement of _resolve_uploaded_user_file
+    def test_uploaded_user_file_rejects_traversal_and_untrusted_absolute_paths(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            root = Path(temp_dir)
+            uploads = root / "uploads"
+            data = root / "data"
+            outside = root / "outside.txt"  # sits beside uploads/ and data/, inside neither
+            uploads.mkdir()
+            data.mkdir()
+            outside.write_text("outside", encoding="utf-8")
+
+            with mock.patch.object(system_config, "user_uploads_dir", str(uploads)):  # redirect upload dir to temp
+                with mock.patch.object(system_config, "data_dir", str(data)):  # redirect data dir to temp
+                    self.assertIsNone(_resolve_uploaded_user_file("../outside.txt"))  # relative traversal -> None
+                    self.assertIsNone(_resolve_uploaded_user_file(str(outside)))  # absolute path outside both dirs -> None
+
+    def test_uploaded_user_file_allows_trusted_context_files_only_when_enabled(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            root = Path(temp_dir)
+            uploads = root / "uploads"
+            data = root / "data"
+            trusted_file = data / "paper.txt"  # under data_dir, not under user_uploads_dir
+            uploads.mkdir()
+            data.mkdir()
+            trusted_file.write_text("trusted", encoding="utf-8")
+
+            with mock.patch.object(system_config, "user_uploads_dir", str(uploads)):  # redirect upload dir to temp
+                with mock.patch.object(system_config, "data_dir", str(data)):  # redirect data dir to temp
+                    self.assertIsNone(
+                        _resolve_uploaded_user_file(
+                            str(trusted_file),
+                            allow_trusted_context_files=False,  # flag off: path under data_dir is not resolved
+                        )
+                    )
+                    self.assertEqual(
+                        _resolve_uploaded_user_file(
+                            str(trusted_file),
+                            allow_trusted_context_files=True,  # flag on: the same path is accepted
+                        ),
+                        trusted_file.resolve(),  # expected value is the fully resolved path
+                    )
+
+
+class PaperLibraryPathHardeningTests(unittest.TestCase):  # paper-id validation and prune output location
+    def _library_for(self, base_dir: Path) -> PaperLibrary:  # PaperLibrary with its directories redirected under base_dir
+        library = PaperLibrary()
+        library._base_dir = base_dir  # private attributes are overridden directly for the test
+        library._archive_dir = base_dir / "archive"
+        library._pruned_dir = base_dir / "pruned"
+        base_dir.mkdir(parents=True, exist_ok=True)
+        library._archive_dir.mkdir(parents=True, exist_ok=True)
+        library._pruned_dir.mkdir(parents=True, exist_ok=True)
+        return library
+
+    def test_paper_library_rejects_malicious_paper_ids(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            library = self._library_for(Path(temp_dir) / "papers")
+
+            for paper_id in ("../evil", "a/b", r"a\b", ".", ".."):  # traversal, separators, dot-only names
+                with self.subTest(paper_id=paper_id):  # report each id as its own sub-case
+                    with self.assertRaises(ValueError):  # every such id must be refused
+                        library.get_paper_path(paper_id)
+
+    def test_prune_paper_keeps_outputs_in_session_pruned_directory(self) -> None:
+        async def run_case() -> None:  # prune_paper is awaited, so the case lives in a coroutine
+            with tempfile.TemporaryDirectory() as temp_dir:
+                base_dir = Path(temp_dir) / "session" / "papers"
+                library = self._library_for(base_dir)
+                metadata = PaperMetadata(paper_id="paper_1", title="Test Paper")
+                (base_dir / "paper_paper_1.txt").write_text("paper content", encoding="utf-8")  # seed the paper body
+                (base_dir / "paper_paper_1_metadata.json").write_text(  # seed the matching metadata file
+                    json.dumps(metadata.model_dump(), default=str),  # default=str stringifies non-JSON values
+                    encoding="utf-8",
+                )
+
+                self.assertTrue(await library.prune_paper("paper_1", reason="duplicate", pruned_by="user"))  # must report success
+
+                self.assertTrue((base_dir / "pruned" / "pruned_paper_paper_1.txt").exists())  # body lands in base_dir/pruned
+                self.assertTrue((base_dir / "pruned" / "pruned_paper_paper_1_metadata.json").exists())  # metadata lands there too
+                self.assertFalse((base_dir / "paper_paper_1.txt").exists())  # original body is gone
+
+        asyncio.run(run_case())  # drive the coroutine from the synchronous test method
diff --git a/tests/test_moto_launcher.py b/tests/test_moto_launcher.py
index 3408cdd..1546f8e 100644
--- a/tests/test_moto_launcher.py
+++ b/tests/test_moto_launcher.py
@@ -1,8 +1,11 @@
+import io
 import os
 from pathlib import Path
+import tarfile
 import tempfile
 import unittest
 from unittest import mock
+import zipfile
 
 import moto_launcher
 
@@ -171,6 +174,22 @@ def test_explicit_override_does_not_read_last_record(self) -> None:
         # caller provided explicit overrides.
         loader.assert_not_called()
 
+    def test_resolve_instance_runtime_reads_keyring_namespace_field(self) -> None:  # saved "keyring_namespace" must reach the runtime
+        saved_record = {
+            "instance_id": "instance_20260101_000000_1111",
+            "data_root": r"C:\\custom\\data",
+            "log_root": r"C:\\custom\\logs",
+            "keyring_namespace": "stored_keyring_namespace",  # the field under test
+            "storage_prefix": "instance_20260101_000000_1111",
+        }
+        with mock.patch.dict(os.environ, {}, clear=True):  # empty environment for the duration of the call
+            with mock.patch.object(moto_launcher, "load_last_instance_record", return_value=saved_record):  # serve the record above
+                with mock.patch.object(moto_launcher, "cleanup_launcher_state", return_value=[]):  # no active instances
+                    with mock.patch.object(moto_launcher, "port_in_use", return_value=False):  # every port reports free
+                        runtime = moto_launcher.resolve_instance_runtime()
+
+        self.assertEqual(runtime.secret_namespace, "stored_keyring_namespace")  # value surfaces as runtime.secret_namespace
+
 
 class WindowsLauncherStrategyTests(unittest.TestCase):
     def test_build_windows_service_command_prefers_path_safe_executable_name(self) -> None:
@@ -259,5 +278,40 @@ def test_launch_service_falls_back_to_background_when_no_linux_terminal(self) ->
         popen.assert_called_once()
 
 
+class ArchiveExtractionTests(unittest.TestCase):  # _extract_archive must refuse members that leave the destination
+    def test_extract_archive_rejects_tar_path_traversal(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            root = Path(temp_dir)
+            archive_path = root / "archive.tar.gz"
+            destination = root / "extract"
+            outside = root / "evil.txt"  # where "../evil.txt" would land relative to destination
+
+            with tarfile.open(archive_path, "w:gz") as archive:
+                data = b"bad"
+                member = tarfile.TarInfo("../evil.txt")  # member name climbs out of destination
+                member.size = len(data)  # size is set to the length of the payload given to addfile
+                archive.addfile(member, io.BytesIO(data))
+
+            with self.assertRaises(RuntimeError):  # extraction must fail
+                moto_launcher._extract_archive(archive_path, destination)
+
+            self.assertFalse(outside.exists())  # and nothing was written outside destination
+
+    def test_extract_archive_rejects_zip_path_traversal(self) -> None:
+        with tempfile.TemporaryDirectory() as temp_dir:
+            root = Path(temp_dir)
+            archive_path = root / "archive.zip"
+            destination = root / "extract"
+            outside = root / "evil.txt"  # where "../evil.txt" would land relative to destination
+
+            with zipfile.ZipFile(archive_path, "w") as archive:
+                archive.writestr("../evil.txt", "bad")  # member name climbs out of destination
+
+            with self.assertRaises(RuntimeError):  # extraction must fail
+                moto_launcher._extract_archive(archive_path, destination)
+
+            self.assertFalse(outside.exists())  # and nothing was written outside destination
+
+
 if __name__ == "__main__":
     unittest.main()
diff --git a/tests/test_moto_updater.py b/tests/test_moto_updater.py
index cfe67ef..c9f98c5 100644
--- a/tests/test_moto_updater.py
+++ b/tests/test_moto_updater.py
@@ -4,6 +4,7 @@
 import unittest
 import urllib.error
 from unittest import mock
+import zipfile
 
 import moto_updater
 
@@ -20,6 +21,17 @@ def test_normalize_repo_slug_handles_common_github_formats(self) -> None:
             with self.subTest(raw=raw):
                 self.assertEqual(moto_updater._normalize_repo_slug(raw), expected)
 
+    def test_normalize_repo_slug_rejects_lookalike_or_untrusted_hosts(self) -> None:  # only the exact github.com host may yield a slug
+        cases = [
+            "https://github.com.evil/Intrafere/MOTO-Autonomous-ASI",  # host merely starts with github.com
+            "https://evil.example/github.com/Intrafere/MOTO-Autonomous-ASI",  # github.com appears only in the path
+            "ssh://git@github.com.evil/Intrafere/MOTO-Autonomous-ASI.git",  # ssh URL with a look-alike host
+            "https://example.com/Intrafere/MOTO-Autonomous-ASI",  # unrelated host
+        ]
+        for raw in cases:
+            with self.subTest(raw=raw):  # report each URL as its own sub-case
+                self.assertIsNone(moto_updater._normalize_repo_slug(raw))  # every case must be refused
+
 
 class InstallStateTests(unittest.TestCase):
     def test_classify_zip_install_when_repo_has_no_git_metadata(self) -> None:
@@ -120,6 +132,60 @@ def fake_is_pid_running(pid: int | None) -> bool:
             self.assertEqual(len(instances), 1)
             self.assertEqual(instances[0]["instance_id"], "alive")
 
+    def test_last_instance_record_does_not_persist_keyring_namespace(self) -> None:  # namespace must not be written to disk
+        with tempfile.TemporaryDirectory() as temp_dir:
+            record_path = Path(temp_dir) / ".moto_last_instance.json"
+
+            with mock.patch.object(moto_updater, "LAUNCHER_LAST_INSTANCE_PATH", record_path):  # redirect the record file to temp
+                moto_updater.save_last_instance_record(
+                    instance_id="instance_one",
+                    data_root="data",
+                    log_root="logs",
+                    keyring_namespace="instance_one",  # supplied, but expected to be absent from the file
+                    storage_prefix="instance_one",
+                )
+                payload = json.loads(record_path.read_text(encoding="utf-8"))  # read back before the temp dir is removed
+
+        self.assertNotIn("keyring_namespace", payload)  # new key is not persisted
+        self.assertNotIn("secret_namespace", payload)  # legacy key is not persisted either
+
+    def test_last_instance_record_reads_legacy_secret_namespace(self) -> None:  # records written with the old key must still load
+        with tempfile.TemporaryDirectory() as temp_dir:
+            record_path = Path(temp_dir) / ".moto_last_instance.json"
+            record_path.write_text(  # hand-write a record in the legacy layout
+                json.dumps(
+                    {
+                        "instance_id": "instance_one",
+                        "data_root": "data",
+                        "log_root": "logs",
+                        "secret_namespace": "legacy_namespace",  # legacy key name
+                        "storage_prefix": "instance_one",
+                    }
+                ),
+                encoding="utf-8",
+            )
+
+            with mock.patch.object(moto_updater, "LAUNCHER_LAST_INSTANCE_PATH", record_path):  # redirect the record file to temp
+                payload = moto_updater.load_last_instance_record()
+
+        self.assertIsNotNone(payload)  # the legacy record is accepted
+        self.assertEqual(payload["keyring_namespace"], "legacy_namespace")  # legacy value surfaces under the new key
+        self.assertNotIn("secret_namespace", payload)  # legacy key is dropped from the returned dict
+
+    def test_updater_extract_archive_rejects_zip_path_traversal(self) -> None:  # updater extraction must refuse escaping members
+        with tempfile.TemporaryDirectory() as temp_dir:
+            root = Path(temp_dir)
+            archive_path = root / "archive.zip"
+            destination = root / "extract"
+            outside = root / "evil.txt"  # where "../evil.txt" would land relative to destination
+            with zipfile.ZipFile(archive_path, "w") as archive:
+                archive.writestr("../evil.txt", "bad")  # member name climbs out of destination
+
+            with self.assertRaises(RuntimeError):  # extraction must fail
+                moto_updater._extract_archive(archive_path, destination)
+
+            self.assertFalse(outside.exists())  # and nothing was written outside destination
+
 
 class SnapshotSyncTests(unittest.TestCase):
     def test_collect_preserved_relatives_includes_explicit_instance_runtime_paths(self) -> None: