|
38 | 38 | {"id":"CodeContextBench-4zx","title":"US-003: Fix remaining Docker environments (qutebrowser, Teleport, vuls, others)","status":"closed","priority":2,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-11T23:41:41.094793432Z","created_by":"LoCoBench Bot","updated_at":"2026-02-11T23:47:40.236064552Z","closed_at":"2026-02-11T23:47:40.236064552Z","close_reason":"No Docker fixes needed. All 7 non-protonmail repos have healthy environments. 32 infra failures are rate-limit hits. Re-run plan documented."} |
39 | 39 | {"id":"CodeContextBench-54u","title":"US-003 Create codex_2config runner","status":"closed","priority":3,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-17T03:32:30.120181582Z","created_by":"LoCoBench Bot","updated_at":"2026-02-17T03:42:30.711156774Z","closed_at":"2026-02-17T03:42:30.711156774Z","close_reason":"done"} |
40 | 40 | {"id":"CodeContextBench-56k","title":"US-005: Enrich judge context with LoCoBench SE dimensions","status":"closed","priority":2,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-15T22:53:56.691202916Z","created_by":"LoCoBench Bot","updated_at":"2026-02-15T22:55:55.340453929Z","closed_at":"2026-02-15T22:55:55.340453929Z","close_reason":"Implemented _locobench_dimensions in judge_context.py with ACS/DTA/CFRD rubrics"} |
41 | | -{"id":"CodeContextBench-56s","title":"US-008 Add gpt-5.3-codex pricing support and unknown-model guard","status":"open","priority":2,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-17T03:33:21.651812464Z","created_by":"LoCoBench Bot","updated_at":"2026-02-17T03:33:21.651812464Z"} |
| 41 | +{"id":"CodeContextBench-56s","title":"US-008 Add gpt-5.3-codex pricing support and unknown-model guard","status":"closed","priority":2,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-17T03:33:21.651812464Z","created_by":"LoCoBench Bot","updated_at":"2026-02-17T04:03:46.456195307Z","closed_at":"2026-02-17T04:03:46.456195307Z","close_reason":"done"} |
42 | 42 | {"id":"CodeContextBench-5e7","title":"Run investigation benchmark (4 tasks x 3 configs)","status":"closed","priority":1,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-10T12:50:04.232906279Z","created_by":"LoCoBench Bot","updated_at":"2026-02-10T15:49:12.300132241Z","closed_at":"2026-02-10T15:49:12.300132241Z","close_reason":"All 12 runs complete (4 tasks x 3 configs). MANIFEST regenerated."} |
43 | 43 | {"id":"CodeContextBench-5kj","title":"US-002: Create workflow taxonomy module and methodology doc","status":"closed","priority":1,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-15T13:29:45.828982776Z","created_by":"LoCoBench Bot","updated_at":"2026-02-15T13:32:45.597491177Z","closed_at":"2026-02-15T13:32:45.597491177Z","close_reason":"US-002 complete: workflow taxonomy module + methodology doc"} |
44 | 44 | {"id":"CodeContextBench-5m5","title":"Document PyTorch sgt-025 as permanently excluded from SG_full","description":"sgt-025 Docker build fails because the referenced PyTorch commit is unreachable. Two attempts both failed with RuntimeError: Docker compose command failed. This is an unresolvable infrastructure issue. Document in TASK_CATALOG.md and potentially remove from SG_full task list.","status":"closed","priority":4,"issue_type":"task","owner":"locobench@anthropic.com","created_at":"2026-02-10T11:28:28.715732672Z","created_by":"LoCoBench Bot","updated_at":"2026-02-12T10:29:30.648519648Z","closed_at":"2026-02-12T10:29:30.648519648Z","close_reason":"Documented in benchmarks/ccb_pytorch/README.md — new Excluded Tasks section. sgt-025 Docker build fails due to unreachable pre_fix_rev commit. Permanently excluded from SG_full."} |
|
0 commit comments