pras-ops
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
Lines changed: 8 additions & 0 deletions
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 3 additions & 1 deletion
diff --git a/requirements.txt b/requirements.txt
Lines changed: 2 additions & 0 deletions
diff --git a/scrapewizard/cli/commands/setup.py b/scrapewizard/cli/commands/setup.py
Lines changed: 139 additions & 28 deletions
diff --git a/scrapewizard/cli/commands/utils.py b/scrapewizard/cli/commands/utils.py
Lines changed: 58 additions & 2 deletions
diff --git a/scrapewizard/core/config.py b/scrapewizard/core/config.py
Lines changed: 9 additions & 3 deletions
diff --git a/scrapewizard/core/constants.py b/scrapewizard/core/constants.py
Lines changed: 6 additions & 0 deletions
diff --git a/scrapewizard/core/orchestrator.py b/scrapewizard/core/orchestrator.py
Lines changed: 6 additions & 2 deletions
@@ -85,6 +85,14 @@ jobs:
         working-directory: studio/frontend
         run: npm run lint
 
+      - name: Run type-check
+        working-directory: studio/frontend
+        run: npm run type-check
+
+      - name: Run test
+        working-directory: studio/frontend
+        run: npm run test
+
       - name: Run build
         working-directory: studio/frontend
         run: npm run build
 
@@ -36,7 +36,9 @@ dependencies = [
     "uvicorn",
     "python-dotenv",
     "aiohttp",
-    "pillow"
+    "pillow",
+    "anthropic>=0.39.0",
+    "httpx>=0.27.0"
 ]
 
 [project.scripts]
 
@@ -22,3 +22,5 @@ uvicorn
 python-dotenv
 aiohttp
 pillow
+anthropic>=0.39.0
+httpx>=0.27.0
@@ -26,37 +26,148 @@ def setup(
             default=current_config.get("provider", "openai")
         ).execute()
 
-    if not api_key:
-        # Check if we already have one
-        existing_key = current_config.get("api_key", "")
-        key_masked = f"{existing_key[:4]}...{existing_key[-4:]}" if len(existing_key) > 8 else "********" if existing_key else ""
+    if provider == "local":
+        import shutil
+        from scrapewizard.llm.local_runtime import LocalRuntime
 
-        api_key = inquirer.text(
-            message=f"Enter API Key (Current: {key_masked}):",
-            default=existing_key,
-            validate=lambda result: len(result) > 0 or "API Key cannot be empty"
-        ).execute()
-
-    if not model:
-        default_models = {
-            "openai": "gpt-4-turbo",
-            "anthropic": "claude-3-5-sonnet-20240620",
-            "openrouter": "google/gemini-pro",
-            "local": "llama3"
+        ollama_installed = shutil.which("ollama") is not None
+        if not ollama_installed:
+            print("⚠️ [yellow]Warning: 'ollama' executable not found on system PATH. Please ensure Ollama is installed.[/yellow]")
+            
+        local_base_url = current_config.get("local_base_url", "http://localhost:11434")
+        if not model:
+            local_base_url = inquirer.text(
+                message="Enter Ollama Base URL:",
+                default=local_base_url
+            ).execute()
+        
+        runtime = LocalRuntime(base_url=local_base_url)
+        daemon_status = runtime.check_daemon()
+        
+        if not daemon_status.running and not model:
+            print("❌ [red]Error: Ollama daemon is not running at configured URL.[/red]")
+            if not inquirer.confirm(message="Ollama daemon is down. Proceed anyway?", default=False).execute():
+                log("Setup aborted.")
+                return
+                
+        # Detect hardware
+        hw = runtime.detect_hardware()
+        if not model:
+            print(f"🖥️ [cyan]Hardware detected:[/cyan] {hw['ram_gb']} GB RAM, GPU: {hw['gpu_name']}")
+            print(f"📦 Suggested performance tier: [green]{hw['tier'].upper()}[/green]")
+        
+        recommended = runtime.recommend_model(hw['tier'])
+        
+        selected_model = model
+        if not selected_model:
+            installed = runtime.list_models()
+            if installed:
+                print("Installed models:")
+                for m in installed:
+                    print(f"  • {m}")
+            else:
+                print("No models found in Ollama.")
+                
+            choices = installed.copy()
+            if recommended not in choices:
+                choices.append(recommended)
+            choices.append("Other (enter custom name)")
+            
+            selected_model = inquirer.select(
+                message="Select Ollama model:",
+                choices=choices,
+                default=recommended if recommended in choices else (installed[0] if installed else choices[0])
+            ).execute()
+            
+            if selected_model == "Other (enter custom name)":
+                selected_model = inquirer.text(
+                    message="Enter custom model name:",
+                    default=recommended
+                ).execute()
+                
+            if selected_model not in installed:
+                if inquirer.confirm(message=f"Model '{selected_model}' is not downloaded. Pull it now?", default=True).execute():
+                    print(f"Downloading '{selected_model}' via Ollama. Please wait...")
+                    
+                    from rich.progress import Progress, SpinnerColumn, TextColumn, BarColumn, DownloadColumn
+                    with Progress(
+                        SpinnerColumn(),
+                        TextColumn("[progress.description]{task.description}"),
+                        BarColumn(),
+                        DownloadColumn(),
+                    ) as progress:
+                        task = progress.add_task(f"Pulling {selected_model}...", total=100)
+                        
+                        def callback(data):
+                            status = data.get("status", "")
+                            total = data.get("total", 0)
+                            completed = data.get("completed", 0)
+                            if total > 0:
+                                progress.update(task, completed=completed, total=total, description=f"Pulling {selected_model}: {status}")
+                            else:
+                                progress.update(task, description=f"Pulling {selected_model}: {status}")
+                                
+                        success = runtime.pull_model(selected_model, callback)
+                        if success:
+                            print(f"✅ Model '{selected_model}' pulled successfully.")
+                        else:
+                            print(f"❌ Failed to pull model '{selected_model}'.")
+                            
+        # Probe model latency
+        if daemon_status.running and not model:
+            print("Probing model response latency...")
+            probe_res = runtime.probe(selected_model)
+            if probe_res.success:
+                print(f"✅ Connection successful! Probe latency: [green]{probe_res.latency}s[/green]")
+            else:
+                print(f"⚠️ Probe check failed: {probe_res.error}")
+                
+        offline_only = current_config.get("offline_only", False)
+        if not model:
+            offline_only = inquirer.confirm(message="Enable offline-only mode (disable all cloud fallbacks)?", default=False).execute()
+            
+        new_config = {
+            "provider": "local",
+            "model": selected_model,
+            "local_base_url": local_base_url,
+            "local_model": selected_model,
+            "local_tier": hw['tier'],
+            "offline_only": offline_only
         }
-        model = inquirer.text(
-            message="Enter Model Name:",
-            default=current_config.get("model", default_models.get(provider, ""))
-        ).execute()
+        ConfigManager.save_config(new_config)
+        log("Configuration saved successfully.")
+
+    else:
+        if not api_key:
+            # Check if we already have one
+            existing_key = current_config.get("api_key", "")
+            key_masked = f"{existing_key[:4]}...{existing_key[-4:]}" if len(existing_key) > 8 else "********" if existing_key else ""
+            
+            api_key = inquirer.text(
+                message=f"Enter API Key (Current: {key_masked}):",
+                default=existing_key,
+                validate=lambda result: len(result) > 0 or "API Key cannot be empty"
+            ).execute()
 
-    # Save Config
-    new_config = {
-        "provider": provider,
-        "api_key": api_key,
-        "model": model
-    }
-    ConfigManager.save_config(new_config)
-    log("Configuration saved successfully.")
+        if not model:
+            default_models = {
+                "openai": "gpt-4-turbo",
+                "anthropic": "claude-3-5-sonnet-20240620",
+                "openrouter": "google/gemini-pro"
+            }
+            model = inquirer.text(
+                message="Enter Model Name:",
+                default=current_config.get("model", default_models.get(provider, ""))
+            ).execute()
+
+        # Save Config
+        new_config = {
+            "provider": provider,
+            "api_key": api_key,
+            "model": model
+        }
+        ConfigManager.save_config(new_config)
+        log("Configuration saved successfully.")
 
     # Proxy Setup
     if use_proxy or inquirer.confirm(message="Configure Proxy?", default=False).execute():
 
@@ -96,10 +96,66 @@ def doctor() -> None:
     if config_ok:
         try:
             from scrapewizard.llm.client import LLMClient
+            from scrapewizard.llm.local_runtime import LocalRuntime
+            from scrapewizard.core.constants import LOCAL_LLM_PROBE_TIMEOUT
+            
             client = LLMClient()
-            rprint(f"• LLM Client: [green]Initialized[/green] ({client.provider}/{client.model})")
+            provider = client.provider
+            
+            if provider == "local":
+                runtime = LocalRuntime()
+                daemon = runtime.check_daemon()
+                
+                if daemon.running:
+                    rprint(f"• Local AI Runtime: [green]Ollama {daemon.version}[/green]")
+                    models = runtime.list_models()
+                    model_name = client.model
+                    
+                    model_loaded = False
+                    for m in models:
+                        if m == model_name or m.startswith(model_name + ":") or model_name.startswith(m + ":"):
+                            model_loaded = True
+                            break
+                            
+                    if model_loaded:
+                        rprint(f"• Local Model: [green]{model_name}[/green]")
+                        # Run probe
+                        probe_res = runtime.probe(model_name, timeout=LOCAL_LLM_PROBE_TIMEOUT)
+                        if probe_res.success:
+                            rprint(f"• LLM Local: [green]✅ Ollama running, model {model_name} loaded, probe: {probe_res.latency}s[/green]")
+                        else:
+                            rprint(f"• LLM Local: [red]❌ Probe failed: {probe_res.error}[/red]")
+                    else:
+                        rprint(f"• Local Model: [yellow]Not pulled ({model_name})[/yellow]")
+                        rprint(f"• LLM Local: [yellow]⚠️ Model not pulled. Run 'scrapewizard setup'[/yellow]")
+                else:
+                    rprint(f"• Local AI Runtime: [red]Ollama not running[/red]")
+                    rprint(f"• LLM Local: [red]❌ Ollama daemon is down[/red]")
+                    
+                # Hardware Tier
+                hw = runtime.detect_hardware()
+                rprint(f"• Hardware Tier: [cyan]{hw['tier'].upper()}[/cyan] ({hw['ram_gb']} GB RAM, {hw['gpu_name']})")
+                
+            else:
+                # Cloud client probe check
+                import time
+                start_time = time.time()
+                try:
+                    # Let's run a small test call to verify cloud connectivity
+                    response = client.call(
+                        system_prompt="you are a health check assistant. reply with ok",
+                        user_prompt="ping",
+                        json_mode=False
+                    )
+                    latency = round(time.time() - start_time, 2)
+                    if "ok" in response.lower():
+                        rprint(f"• LLM Cloud: [green]✅ {client.provider}/{client.model}, probe: {latency}s[/green]")
+                    else:
+                        rprint(f"• LLM Cloud: [yellow]⚠️ {client.provider}/{client.model} responded but output was: {response} ({latency}s)[/yellow]")
+                except Exception as e:
+                    rprint(f"• LLM Cloud: [red]❌ Connection failed to {client.provider}/{client.model}: {e}[/red]")
         except Exception as e:
-            rprint(f"• LLM Client: [red]Error ({e})[/red]")
+            rprint(f"• LLM Client: [red]Error initializing client ({e})[/red]")
 
     rprint("\n[bold green]System check complete.[/bold green]")
 
 
@@ -21,7 +21,11 @@ class ConfigManager:
 
     DEFAULT_CONFIG = {
         "provider": "openai",
-        "model": "gpt-4-turbo"
+        "model": "gpt-4-turbo",
+        "local_base_url": "http://localhost:11434",
+        "local_model": "qwen2.5-coder:3b",
+        "local_tier": "balanced",
+        "offline_only": False,
     }
 
     @classmethod
@@ -51,7 +55,7 @@ def migrate_from_plaintext(cls):
                 migrated = True
 
             # Pattern 2: Provider-specific keys
-            for provider in ["openai", "anthropic", "openrouter", "local"]:
+            for provider in ["openai", "anthropic", "openrouter", "local", "local-embedded"]:
                 if provider in data and isinstance(data[provider], dict) and "api_key" in data[provider]:
                     cls.save_api_key(provider, data[provider]["api_key"])
                     del data[provider]["api_key"]
@@ -136,6 +140,8 @@ def save_proxy(cls, proxy_config: Dict[str, Any]):
 
     @classmethod
     def check_setup(cls) -> bool:
-        """Check if essential configuration (API key) is set."""
+        """Check if essential configuration (API key or local setup) is set."""
         config = cls.load_config()
+        if config.get("provider") == "local":
+            return True
         return bool(config.get("api_key"))
@@ -6,6 +6,12 @@
 PROBE_NAVIGATION_TIMEOUT = 30
 SCAN_NAVIGATION_TIMEOUT = 45
 
+# Local LLM timeouts (seconds)
+LOCAL_LLM_COLD_START_TIMEOUT = 60    # First call loads model into RAM
+LOCAL_LLM_WARM_TIMEOUT = 30          # Subsequent calls
+LOCAL_LLM_PROBE_TIMEOUT = 15         # Doctor/setup probe
+
+
 # LLM Thresholds
 LLM_CONFIDENCE_THRESHOLD = 0.5
 SCRAPING_POSSIBLE_MIN_CONFIDENCE = 0.4
 
@@ -855,7 +855,10 @@ def do_final():
                     print(f"🤖 [bold cyan]AI Usage Summary:[/bold cyan]")
                     print(f"   • Calls: {stats['calls']}")
                     print(f"   • Tokens: {stats['input_tokens'] + stats['output_tokens']} ({stats['input_tokens']} in, {stats['output_tokens']} out)")
-                    print(f"   • Est. Cost: ${cost:.4f}\n")
+                    if isinstance(cost, str):
+                        print(f"   • Est. Cost: {cost}\n")
+                    else:
+                        print(f"   • Est. Cost: ${cost:.4f}\n")
 
                 print(f"Your data is ready:")
                 print(f"{output_file}\n")
@@ -905,7 +908,8 @@ def _bundle_output(self) -> None:
         try:
             from scrapewizard.report.html_generator import ReportGenerator
             generator = ReportGenerator(self.project_dir)
-            generator.generate()
+            duration = time.time() - self.start_time
+            generator.generate(duration_seconds=duration)
             report_src = self.project_dir / "report.html"
             if report_src.exists():
                 shutil.copy2(report_src, output_dir / "report.html")