fix: add SDLC/MCP-unique suite prefixes to promote_run.py

sjarmak · claude · sjarmak · commit c5b29a9fbe40 · 2026-03-01T22:58:12.000Z
DIR_PREFIX_TO_SUITE was missing all current suite prefixes (ccb_debug_,
ccb_feature_, ccb_fix_, ccb_test_, ccb_mcp_*, etc.), causing
"could not infer benchmark" errors that blocked promotion of valid runs.

Also adds selection-file fallback lookup for task IDs, and checks
longest prefixes first to avoid ccb_mcp_crossrepo_ matching before
ccb_mcp_crossrepo_tracing_.

23 staging batches promoted. Gap analysis re-run: 27 tasks remain
(was 26; ansible-abc-imports-fix-001 surfaced as a new gap after promotion).

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
diff --git a/configs/variance_reruns/variance_gap_all_sdlc.json b/configs/variance_reruns/variance_gap_all_sdlc.json
@@ -1,10 +1,9 @@
 {
   "metadata": {
-    "title": "Variance all gaps: 26 tasks (8 need 2 passes, 18 need 1)",
-    "description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",
+    "title": "Variance rerun: ALL SDLC gap tasks (27 tasks)",
+    "description": "Combined rerun config for all SDLC tasks with < 3 paired passes.",
     "generated_date": "2026-03-01",
-    "total_tasks": 26,
-    "note": "Run this config ONCE. Then run wave1 config once more to complete the 8 tasks that need 2 total additional passes. Total: 26*2 + 8*2 = 68 sandbox runs."
+    "total_tasks": 27
   },
   "methodology": {
     "sdlc_suites": [
@@ -15,11 +14,11 @@
     ]
   },
   "statistics": {
-    "total_tasks": 26,
+    "total_tasks": 27,
     "per_suite": {
       "ccb_debug": 2,
       "ccb_feature": 4,
-      "ccb_fix": 5,
+      "ccb_fix": 6,
       "ccb_test": 15
     }
   },
@@ -112,6 +111,20 @@
       "repo": "microsoft/vscode",
       "mcp_benefit_score": 0.87
     },
+    {
+      "task_id": "ansible-abc-imports-fix-001",
+      "benchmark": "ccb_fix",
+      "task_dir": "ccb_fix/ansible-abc-imports-fix-001",
+      "language": "python",
+      "difficulty": "medium",
+      "current_bl_runs": 3,
+      "current_mcp_runs": 2,
+      "current_paired": 2,
+      "runs_needed": 1,
+      "sdlc_phase": "fix",
+      "repo": "ansible/ansible",
+      "mcp_benefit_score": 0.75
+    },
     {
       "task_id": "flink-window-late-data-fix-001",
       "benchmark": "ccb_fix",
@@ -134,7 +147,7 @@
       "language": "javascript",
       "difficulty": "medium",
       "current_bl_runs": 2,
-      "current_mcp_runs": 4,
+      "current_mcp_runs": 3,
       "current_paired": 2,
       "runs_needed": 1,
       "sdlc_phase": "fix",
diff --git a/configs/variance_reruns/variance_gap_ccb_fix.json b/configs/variance_reruns/variance_gap_ccb_fix.json
@@ -1,9 +1,9 @@
 {
   "metadata": {
-    "title": "Variance rerun: ccb_fix gap tasks (5 tasks, target 3 pairs)",
+    "title": "Variance rerun: ccb_fix gap tasks (6 tasks, target 3 pairs)",
     "description": "Targeted rerun for ccb_fix tasks with < 3 paired passes. Generated by variance_gap_analysis.py.",
     "generated_date": "2026-03-01",
-    "total_tasks": 5,
+    "total_tasks": 6,
     "max_concurrency_needed": 1,
     "note": "Run with --concurrency 1 to fill all gaps in one batch. Or run with --concurrency 1 multiple times."
   },
@@ -13,12 +13,26 @@
     ]
   },
   "statistics": {
-    "total_tasks": 5,
+    "total_tasks": 6,
     "per_suite": {
-      "ccb_fix": 5
+      "ccb_fix": 6
     }
   },
   "tasks": [
+    {
+      "task_id": "ansible-abc-imports-fix-001",
+      "benchmark": "ccb_fix",
+      "task_dir": "ccb_fix/ansible-abc-imports-fix-001",
+      "language": "python",
+      "difficulty": "medium",
+      "current_bl_runs": 3,
+      "current_mcp_runs": 2,
+      "current_paired": 2,
+      "runs_needed": 1,
+      "sdlc_phase": "fix",
+      "repo": "ansible/ansible",
+      "mcp_benefit_score": 0.75
+    },
     {
       "task_id": "flink-window-late-data-fix-001",
       "benchmark": "ccb_fix",
@@ -41,7 +55,7 @@
       "language": "javascript",
       "difficulty": "medium",
       "current_bl_runs": 2,
-      "current_mcp_runs": 4,
+      "current_mcp_runs": 3,
       "current_paired": 2,
       "runs_needed": 1,
       "sdlc_phase": "fix",
diff --git a/configs/variance_reruns/variance_gap_daytona.json b/configs/variance_reruns/variance_gap_daytona.json
@@ -1,10 +1,10 @@
 {
   "metadata": {
-    "title": "Variance all gaps (Daytona): 22 tasks",
+    "title": "Variance gap: 22 Daytona-compatible tasks",
     "description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",
     "generated_date": "2026-03-01",
     "total_tasks": 22,
-    "note": "Run ONCE, then run wave1_daytona.json once more. 6 need 2 passes, 16 need 1. Total: 56 sandbox runs."
+    "note": "Run ONCE for all tasks. Then run wave1_daytona.json once more for tasks needing 2 passes."
   },
   "methodology": {
     "sdlc_suites": [
@@ -353,4 +353,4 @@
       "mcp_benefit_score": 0.72
     }
   ]
-}
+}
diff --git a/configs/variance_reruns/variance_gap_local.json b/configs/variance_reruns/variance_gap_local.json
@@ -1,10 +1,10 @@
 {
   "metadata": {
-    "title": "Variance gaps (local Docker): 4 sweap-images tasks",
+    "title": "Variance gap: 5 sweap-images tasks (local Docker only)",
     "description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",
     "generated_date": "2026-03-01",
-    "total_tasks": 4,
-    "note": "Run with LOCAL Docker (no Daytona). These tasks use jefzda/sweap-images. Run TWICE for tasks needing 2 passes."
+    "total_tasks": 5,
+    "note": "Daytona-incompatible. Run on local Docker. Tasks needing 2 passes must be run twice."
   },
   "methodology": {
     "sdlc_suites": [
@@ -13,10 +13,10 @@
     ]
   },
   "statistics": {
-    "total_tasks": 4,
+    "total_tasks": 5,
     "per_suite": {
       "ccb_debug": 2,
-      "ccb_fix": 2
+      "ccb_fix": 3
     }
   },
   "tasks": [
@@ -48,14 +48,28 @@
       "repo": "tutanota/tutanota",
       "mcp_benefit_score": 0.75
     },
+    {
+      "task_id": "ansible-abc-imports-fix-001",
+      "benchmark": "ccb_fix",
+      "task_dir": "ccb_fix/ansible-abc-imports-fix-001",
+      "language": "python",
+      "difficulty": "medium",
+      "current_bl_runs": 3,
+      "current_mcp_runs": 2,
+      "current_paired": 2,
+      "runs_needed": 1,
+      "sdlc_phase": "fix",
+      "repo": "ansible/ansible",
+      "mcp_benefit_score": 0.75
+    },
     {
       "task_id": "nodebb-plugin-validate-fix-001",
       "benchmark": "ccb_fix",
       "task_dir": "ccb_fix/nodebb-plugin-validate-fix-001",
       "language": "javascript",
       "difficulty": "medium",
       "current_bl_runs": 2,
-      "current_mcp_runs": 4,
+      "current_mcp_runs": 3,
       "current_paired": 2,
       "runs_needed": 1,
       "sdlc_phase": "fix",
@@ -78,4 +92,4 @@
       "mcp_benefit_score": 0.85
     }
   ]
-}
+}
diff --git a/configs/variance_reruns/wave1_daytona.json b/configs/variance_reruns/wave1_daytona.json
@@ -1,10 +1,10 @@
 {
   "metadata": {
-    "title": "Variance wave 1 (Daytona): 6 tasks needing 2+ passes",
+    "title": "Wave 1 Daytona: 6 tasks needing 2+ passes",
     "description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",
     "generated_date": "2026-03-01",
     "total_tasks": 6,
-    "note": "Run this config TWICE to fill gaps. Daytona-compatible only."
+    "note": "Run this config TWICE on Daytona to fill the gap."
   },
   "methodology": {
     "sdlc_suites": [
@@ -111,4 +111,4 @@
       "mcp_benefit_score": 0.72
     }
   ]
-}
+}
diff --git a/configs/variance_reruns/wave1_need2.json b/configs/variance_reruns/wave1_need2.json
@@ -1,10 +1,9 @@
 {
   "metadata": {
-    "title": "Variance wave 1: tasks needing 2+ passes (8 tasks)",
+    "title": "All tasks needing 2+ passes: 8 tasks",
     "description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",
     "generated_date": "2026-03-01",
-    "total_tasks": 8,
-    "note": "Run this config TWICE (--concurrency 1, two separate invocations) to fill all gaps. These 8 tasks have only 1 paired pass each."
+    "total_tasks": 8
   },
   "methodology": {
     "sdlc_suites": [
@@ -141,4 +140,4 @@
       "mcp_benefit_score": 0.72
     }
   ]
-}
+}
diff --git a/configs/variance_reruns/wave2_daytona.json b/configs/variance_reruns/wave2_daytona.json
@@ -1,10 +1,10 @@
 {
   "metadata": {
-    "title": "Variance wave 2 (Daytona): 16 tasks needing 1 pass",
+    "title": "Wave 2 Daytona: 16 tasks needing 1 pass",
     "description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",
     "generated_date": "2026-03-01",
     "total_tasks": 16,
-    "note": "Run this config ONCE to fill gaps. Daytona-compatible only."
+    "note": "Run this config ONCE on Daytona."
   },
   "methodology": {
     "sdlc_suites": [
@@ -263,4 +263,4 @@
       "mcp_benefit_score": 0.72
     }
   ]
-}
+}
diff --git a/configs/variance_reruns/wave2_need1.json b/configs/variance_reruns/wave2_need1.json
@@ -1,10 +1,9 @@
 {
   "metadata": {
-    "title": "Variance wave 2: tasks needing 1 pass (18 tasks)",
+    "title": "All tasks needing 1 pass: 19 tasks",
     "description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",
     "generated_date": "2026-03-01",
-    "total_tasks": 18,
-    "note": "Run this config ONCE to fill all gaps. These 18 tasks have 2 paired passes and need exactly 1 more."
+    "total_tasks": 19
   },
   "methodology": {
     "sdlc_suites": [
@@ -14,10 +13,10 @@
     ]
   },
   "statistics": {
-    "total_tasks": 18,
+    "total_tasks": 19,
     "per_suite": {
       "ccb_feature": 1,
-      "ccb_fix": 5,
+      "ccb_fix": 6,
       "ccb_test": 12
     }
   },
@@ -37,6 +36,20 @@
       "repo": "kubernetes/kubernetes",
       "mcp_benefit_score": 0.88
     },
+    {
+      "task_id": "ansible-abc-imports-fix-001",
+      "benchmark": "ccb_fix",
+      "task_dir": "ccb_fix/ansible-abc-imports-fix-001",
+      "language": "python",
+      "difficulty": "medium",
+      "current_bl_runs": 3,
+      "current_mcp_runs": 2,
+      "current_paired": 2,
+      "runs_needed": 1,
+      "sdlc_phase": "fix",
+      "repo": "ansible/ansible",
+      "mcp_benefit_score": 0.75
+    },
     {
       "task_id": "flink-window-late-data-fix-001",
       "benchmark": "ccb_fix",
@@ -59,7 +72,7 @@
       "language": "javascript",
       "difficulty": "medium",
       "current_bl_runs": 2,
-      "current_mcp_runs": 4,
+      "current_mcp_runs": 3,
       "current_paired": 2,
       "runs_needed": 1,
       "sdlc_phase": "fix",
@@ -292,4 +305,4 @@
       "mcp_benefit_score": 0.72
     }
   ]
-}
+}
diff --git a/scripts/promote_run.py b/scripts/promote_run.py

Original file line number	Diff line number	Diff line change
`@@ -1,10 +1,10 @@`
`1`	`1`	`{`
`2`	`2`	`"metadata": {`
`3`		`- "title": "Variance all gaps (Daytona): 22 tasks",`
	`3`	`+ "title": "Variance gap: 22 Daytona-compatible tasks",`
`4`	`4`	`"description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",`
`5`	`5`	`"generated_date": "2026-03-01",`
`6`	`6`	`"total_tasks": 22,`
`7`		`- "note": "Run ONCE, then run wave1_daytona.json once more. 6 need 2 passes, 16 need 1. Total: 56 sandbox runs."`
	`7`	`+ "note": "Run ONCE for all tasks. Then run wave1_daytona.json once more for tasks needing 2 passes."`
`8`	`8`	`},`
`9`	`9`	`"methodology": {`
`10`	`10`	`"sdlc_suites": [`
`@@ -353,4 +353,4 @@`
`353`	`353`	`"mcp_benefit_score": 0.72`
`354`	`354`	`}`
`355`	`355`	`]`
`356`		`-}`
	`356`	`+}`
Original file line number	Diff line number	Diff line change
`@@ -1,10 +1,10 @@`
`1`	`1`	`{`
`2`	`2`	`"metadata": {`
`3`		`- "title": "Variance wave 1 (Daytona): 6 tasks needing 2+ passes",`
	`3`	`+ "title": "Wave 1 Daytona: 6 tasks needing 2+ passes",`
`4`	`4`	`"description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",`
`5`	`5`	`"generated_date": "2026-03-01",`
`6`	`6`	`"total_tasks": 6,`
`7`		`- "note": "Run this config TWICE to fill gaps. Daytona-compatible only."`
	`7`	`+ "note": "Run this config TWICE on Daytona to fill the gap."`
`8`	`8`	`},`
`9`	`9`	`"methodology": {`
`10`	`10`	`"sdlc_suites": [`
`@@ -111,4 +111,4 @@`
`111`	`111`	`"mcp_benefit_score": 0.72`
`112`	`112`	`}`
`113`	`113`	`]`
`114`		`-}`
	`114`	`+}`
Original file line number	Diff line number	Diff line change
`@@ -1,10 +1,9 @@`
`1`	`1`	`{`
`2`	`2`	`"metadata": {`
`3`		`- "title": "Variance wave 1: tasks needing 2+ passes (8 tasks)",`
	`3`	`+ "title": "All tasks needing 2+ passes: 8 tasks",`
`4`	`4`	`"description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",`
`5`	`5`	`"generated_date": "2026-03-01",`
`6`		`- "total_tasks": 8,`
`7`		`- "note": "Run this config TWICE (--concurrency 1, two separate invocations) to fill all gaps. These 8 tasks have only 1 paired pass each."`
	`6`	`+ "total_tasks": 8`
`8`	`7`	`},`
`9`	`8`	`"methodology": {`
`10`	`9`	`"sdlc_suites": [`
`@@ -141,4 +140,4 @@`
`141`	`140`	`"mcp_benefit_score": 0.72`
`142`	`141`	`}`
`143`	`142`	`]`
`144`		`-}`
	`143`	`+}`
Original file line number	Diff line number	Diff line change
`@@ -1,10 +1,10 @@`
`1`	`1`	`{`
`2`	`2`	`"metadata": {`
`3`		`- "title": "Variance wave 2 (Daytona): 16 tasks needing 1 pass",`
	`3`	`+ "title": "Wave 2 Daytona: 16 tasks needing 1 pass",`
`4`	`4`	`"description": "Targeted variance rerun. Generated by variance_gap_analysis.py.",`
`5`	`5`	`"generated_date": "2026-03-01",`
`6`	`6`	`"total_tasks": 16,`
`7`		`- "note": "Run this config ONCE to fill gaps. Daytona-compatible only."`
	`7`	`+ "note": "Run this config ONCE on Daytona."`
`8`	`8`	`},`
`9`	`9`	`"methodology": {`
`10`	`10`	`"sdlc_suites": [`
`@@ -263,4 +263,4 @@`
`263`	`263`	`"mcp_benefit_score": 0.72`
`264`	`264`	`}`
`265`	`265`	`]`
`266`		`-}`
	`266`	`+}`