|
10 | 10 |
|
11 | 11 | # Sample metrics for demo (used when no eval has been run yet) |
12 | 12 | SAMPLE_METRICS = { |
13 | | - "openrouter/anthropic/claude-haiku-4-5-20251001": { |
14 | | - "model": "openrouter/anthropic/claude-haiku-4-5-20251001", |
| 13 | + "openrouter/anthropic/claude-haiku-4.5": { |
| 14 | + "model": "openrouter/anthropic/claude-haiku-4.5", |
15 | 15 | "pool": "pool-a + pool-b", |
16 | 16 | "total_cases": 48, |
17 | 17 | "accuracy": 0.938, |
|
34 | 34 | "avg_tokens_per_request": 850, |
35 | 35 | "error_rate": 0.021, |
36 | 36 | }, |
37 | | - "openrouter/anthropic/claude-sonnet-4-5-20250514": { |
38 | | - "model": "openrouter/anthropic/claude-sonnet-4-5-20250514", |
| 37 | + "openrouter/anthropic/claude-sonnet-4.5": { |
| 38 | + "model": "openrouter/anthropic/claude-sonnet-4.5", |
39 | 39 | "pool": "pool-b-upgrade", |
40 | 40 | "total_cases": 48, |
41 | 41 | "accuracy": 0.958, |
|
50 | 50 |
|
51 | 51 |
|
52 | 52 | POOL_MAP = { |
53 | | - "openrouter/anthropic/claude-haiku-4-5-20251001": "pool-a + pool-b", |
| 53 | + "openrouter/anthropic/claude-haiku-4.5": "pool-a + pool-b", |
54 | 54 | "gemini/gemini-2.5-flash": "fallback", |
55 | | - "openrouter/anthropic/claude-sonnet-4-5-20250514": "pool-b-upgrade", |
| 55 | + "openrouter/anthropic/claude-sonnet-4.5": "pool-b-upgrade", |
56 | 56 | } |
57 | 57 |
|
58 | 58 |
|
@@ -95,12 +95,12 @@ async def list_models(): |
95 | 95 | }, |
96 | 96 | "pool-b": { |
97 | 97 | "description": "Complex tasks — reasoning required", |
98 | | - "models": ["anthropic/claude-haiku-4-5-20251001"], |
| 98 | + "models": ["anthropic/claude-haiku-4.5"], |
99 | 99 | "tasks": ["detect_anomalies", "interpret_anomaly", "general_question"], |
100 | 100 | }, |
101 | 101 | "pool-b-upgrade": { |
102 | 102 | "description": "Deep reasoning — comprehensive analysis", |
103 | | - "models": ["anthropic/claude-sonnet-4-5-20250514"], |
| 103 | + "models": ["anthropic/claude-sonnet-4.5"], |
104 | 104 | "tasks": ["calibration_advice"], |
105 | 105 | }, |
106 | 106 | } |
|
0 commit comments