sourcegraph
diff --git a/configs/selected_benchmark_tasks.json b/configs/selected_benchmark_tasks.json
Lines changed: 67 additions & 56 deletions
@@ -1,15 +1,15 @@
 {
   "metadata": {
-    "title": "CodeContextBench Selected Benchmark Tasks (SDLC Suite Reorganization)",
-    "version": "2.0",
+    "title": "CodeScaleBench Selected Benchmark Tasks",
+    "version": "3.0",
     "generated_by": "SDLC suite migration from migration_map.json",
     "generated_date": "2026-02-18",
     "total_available": 835,
     "total_selected": 370,
     "migration_source": "migration_map.json (157 mapped tasks across 8 SDLC suites)",
     "target_total": 370,
     "target_note": "150 SDLC tasks (9 suites, Neyman-optimal) + 220 MCP-unique tasks (11 suites, Neyman-optimal) = 370 active.",
-    "last_updated": "2026-03-01",
+    "last_updated": "2026-03-03",
     "note": "DOE-driven rebalance: 150 SDLC (Neyman-optimal) + 220 MCP-unique (Neyman-optimal). MCP-unique rebalance: 13 scaffolded (IDs 272-284), 7 promoted from onboarding_extra, 20 low-IV tasks moved to benchmarks/backups/*_doe_trim/.",
     "per_suite": {
       "csb_sdlc_debug": 18,
@@ -103,73 +103,84 @@
   },
   "statistics": {
     "tasks_per_sdlc_phase": {
-      "Analysis": 8,
-      "Architecture & Design": 1,
-      "Compliance audit": 2,
-      "Cross-org discovery": 2,
-      "Cross-repo tracing": 3,
-      "Debugging": 5,
-      "Documentation": 16,
-      "Implementation (bug fix)": 1,
-      "Implementation (feature)": 26,
+      "unknown": 61,
+      "Requirements & Discovery": 28,
+      "cross-repo-dep-trace": 24,
+      "Implementation (feature)": 21,
+      "Testing & QA": 18,
+      "fix": 15,
+      "Refactoring": 13,
+      "debug": 13,
+      "migration-inventory": 13,
+      "platform-knowledge": 13,
+      "compliance-audit": 12,
+      "cross-org-discovery": 12,
+      "Documentation": 11,
+      "domain-lineage": 10,
+      "vuln-remediation": 10,
+      "agentic-correctness": 10,
+      "secure": 9,
+      "Onboarding & comprehension": 9,
+      "incident-debug": 9,
+      "design": 8,
+      "Migration analysis": 8,
+      "Implementation (bug fix)": 7,
+      "Analysis": 6,
+      "Security remediation": 6,
+      "Cross-repo tracing": 5,
+      "Debugging": 4,
+      "Incident investigation": 3,
       "Implementation (refactor)": 2,
+      "Platform engineering": 2,
+      "Onboarding comprehension": 2,
+      "Bug Repair": 2,
       "Implementation (refactoring)": 1,
-      "Incident investigation": 3,
-      "Migration analysis": 2,
-      "Onboarding & comprehension": 3,
-      "Platform engineering": 3,
-      "Refactoring": 17,
-      "Requirements & Discovery": 34,
-      "Security remediation": 2,
-      "Security review": 3,
-      "Testing & QA": 18,
-      "debug": 14,
-      "design": 11,
-      "fix": 19,
-      "secure": 14
+      "Security review": 1,
+      "Compliance audit": 1,
+      "Platform knowledge": 1
     },
     "tasks_per_benchmark": {
-      "csb_sdlc_debug": 20,
-      "csb_sdlc_design": 20,
-      "csb_sdlc_document": 20,
-      "csb_sdlc_fix": 25,
-      "csb_org_compliance": 7,
-      "csb_org_crossorg": 5,
-      "csb_org_crossrepo": 1,
-      "csb_org_crossrepo_tracing": 9,
-      "csb_org_domain": 10,
-      "csb_org_incident": 11,
-      "csb_org_migration": 7,
-      "csb_org_onboarding": 11,
-      "csb_org_org": 5,
-      "csb_org_platform": 5,
-      "csb_org_security": 10,
-      "csb_sdlc_secure": 20,
-      "csb_sdlc_test": 20,
-      "csb_sdlc_understand": 20,
-      "csb_sdlc_feature": 20,
-      "csb_sdlc_refactor": 20
+      "csb_org_compliance": 18,
+      "csb_org_crossorg": 15,
+      "csb_org_crossrepo": 14,
+      "csb_org_crossrepo_tracing": 22,
+      "csb_org_domain": 20,
+      "csb_org_incident": 20,
+      "csb_org_migration": 26,
+      "csb_org_onboarding": 28,
+      "csb_org_org": 15,
+      "csb_org_platform": 18,
+      "csb_org_security": 24,
+      "csb_sdlc_debug": 18,
+      "csb_sdlc_design": 14,
+      "csb_sdlc_document": 13,
+      "csb_sdlc_feature": 23,
+      "csb_sdlc_fix": 26,
+      "csb_sdlc_refactor": 16,
+      "csb_sdlc_secure": 12,
+      "csb_sdlc_test": 18,
+      "csb_sdlc_understand": 10
     },
     "tasks_per_language": {
-      "java": 56,
-      "go": 138,
+      "go": 134,
+      "cpp": 73,
+      "java": 57,
+      "python": 55,
       "rust": 12,
+      "c": 10,
+      "javascript": 8,
+      "typescript": 7,
+      "java,cpp": 5,
+      "cpp,c,javascript": 3,
       "python,cpp": 1,
-      "typescript": 4,
-      "python": 52,
       "csharp": 1,
-      "cpp": 75,
-      "javascript": 6,
-      "c": 9,
       "go,protobuf": 1,
       "go,cpp": 1,
       "mixed": 1,
-      "java,cpp": 5,
-      "cpp,c,javascript": 3,
       "unknown": 1
     },
-    "avg_mcp_benefit_score": 0.868,
-    "total_tasks": 390,
+    "avg_mcp_benefit_score": 0.891,
+    "total_tasks": 370,
     "per_suite": {
       "csb_sdlc_feature": 23,
       "csb_sdlc_refactor": 16,