|
50 | 50 | "language": "python", |
51 | 51 | "summary": "Scans run directories, classifies task status, and supports watch mode for active runs." |
52 | 52 | }, |
53 | | - { |
54 | | - "name": "analyze_harness_design.py", |
55 | | - "path": "scripts/analyze_harness_design.py", |
56 | | - "category": "analysis_comparison", |
57 | | - "status": "maintained", |
58 | | - "language": "python", |
59 | | - "summary": "Analysis/comparison script for analyze harness design." |
60 | | - }, |
61 | 53 | { |
62 | 54 | "name": "analyze_mcp_unique_haiku.py", |
63 | 55 | "path": "scripts/analyze_mcp_unique_haiku.py", |
|
66 | 58 | "language": "python", |
67 | 59 | "summary": "Analysis/comparison script for analyze mcp unique haiku." |
68 | 60 | }, |
69 | | - { |
70 | | - "name": "analyze_minimum_subset.py", |
71 | | - "path": "scripts/analyze_minimum_subset.py", |
72 | | - "category": "analysis_comparison", |
73 | | - "status": "maintained", |
74 | | - "language": "python", |
75 | | - "summary": "Analysis/comparison script for analyze minimum subset." |
76 | | - }, |
77 | 61 | { |
78 | 62 | "name": "analyze_paired_cost_official_raw.py", |
79 | 63 | "path": "scripts/analyze_paired_cost_official_raw.py", |
|
82 | 66 | "language": "python", |
83 | 67 | "summary": "Analysis/comparison script for analyze paired cost official raw." |
84 | 68 | }, |
85 | | - { |
86 | | - "name": "analyze_rq_power.py", |
87 | | - "path": "scripts/analyze_rq_power.py", |
88 | | - "category": "analysis_comparison", |
89 | | - "status": "maintained", |
90 | | - "language": "python", |
91 | | - "summary": "Analysis/comparison script for analyze rq power." |
92 | | - }, |
93 | 69 | { |
94 | 70 | "name": "analyze_run_coverage.py", |
95 | 71 | "path": "scripts/analyze_run_coverage.py", |
|
98 | 74 | "language": "python", |
99 | 75 | "summary": "Analysis/comparison script for analyze run coverage." |
100 | 76 | }, |
101 | | - { |
102 | | - "name": "analyze_size_effects.py", |
103 | | - "path": "scripts/analyze_size_effects.py", |
104 | | - "category": "analysis_comparison", |
105 | | - "status": "maintained", |
106 | | - "language": "python", |
107 | | - "summary": "Analysis/comparison script for analyze size effects." |
108 | | - }, |
109 | 77 | { |
110 | 78 | "name": "answer_json_verifier_lib.sh", |
111 | 79 | "path": "scripts/answer_json_verifier_lib.sh", |
|
218 | 186 | "language": "python", |
219 | 187 | "summary": "Historical one-off script: backfill triage from manifest." |
220 | 188 | }, |
221 | | - { |
222 | | - "name": "build_conversation_db.py", |
223 | | - "path": "scripts/build_conversation_db.py", |
224 | | - "category": "infra_mirrors", |
225 | | - "status": "maintained", |
226 | | - "language": "python", |
227 | | - "summary": "Infrastructure or mirror management script for build conversation db." |
228 | | - }, |
229 | 189 | { |
230 | 190 | "name": "build_core_manifest.py", |
231 | 191 | "path": "scripts/build_core_manifest.py", |
|
298 | 258 | "language": "python", |
299 | 259 | "summary": "Utility script for compare contextbench results." |
300 | 260 | }, |
301 | | - { |
302 | | - "name": "compare_old_new_ground_truth.py", |
303 | | - "path": "scripts/compare_old_new_ground_truth.py", |
304 | | - "category": "misc", |
305 | | - "status": "maintained", |
306 | | - "language": "python", |
307 | | - "summary": "Utility script for compare old new ground truth." |
308 | | - }, |
309 | 261 | { |
310 | 262 | "name": "comprehensive_analysis.py", |
311 | 263 | "path": "scripts/comprehensive_analysis.py", |
|
314 | 266 | "language": "python", |
315 | 267 | "summary": "Analysis/comparison script for comprehensive analysis." |
316 | 268 | }, |
317 | | - { |
318 | | - "name": "compute_analysis_ir_metrics.py", |
319 | | - "path": "scripts/compute_analysis_ir_metrics.py", |
320 | | - "category": "misc", |
321 | | - "status": "maintained", |
322 | | - "language": "python", |
323 | | - "summary": "Utility script for compute analysis ir metrics." |
324 | | - }, |
325 | 269 | { |
326 | 270 | "name": "compute_bootstrap_cis.py", |
327 | 271 | "path": "scripts/compute_bootstrap_cis.py", |
|
506 | 450 | "language": "python", |
507 | 451 | "summary": "Utility script for daytona runner." |
508 | 452 | }, |
509 | | - { |
510 | | - "name": "daytona_snapshot_cleanup.py", |
511 | | - "path": "scripts/daytona_snapshot_cleanup.py", |
512 | | - "category": "misc", |
513 | | - "status": "maintained", |
514 | | - "language": "python", |
515 | | - "summary": "Utility script for daytona snapshot cleanup." |
516 | | - }, |
517 | 453 | { |
518 | 454 | "name": "dependeval_eval_dr.py", |
519 | 455 | "path": "scripts/dependeval_eval_dr.py", |
|
618 | 554 | "language": "python", |
619 | 555 | "summary": "Helper library/wrapper used by other scripts (eval matrix)." |
620 | 556 | }, |
621 | | - { |
622 | | - "name": "export_conversation_blog_assets.py", |
623 | | - "path": "scripts/export_conversation_blog_assets.py", |
624 | | - "category": "misc", |
625 | | - "status": "maintained", |
626 | | - "language": "python", |
627 | | - "summary": "Utility script for export conversation blog assets." |
628 | | - }, |
629 | | - { |
630 | | - "name": "export_engineering_diary_assets.py", |
631 | | - "path": "scripts/export_engineering_diary_assets.py", |
632 | | - "category": "misc", |
633 | | - "status": "maintained", |
634 | | - "language": "python", |
635 | | - "summary": "Utility script for export engineering diary assets." |
636 | | - }, |
637 | 557 | { |
638 | 558 | "name": "export_official_results.py", |
639 | 559 | "path": "scripts/export_official_results.py", |
|
1194 | 1114 | "language": "python", |
1195 | 1115 | "summary": "Utility script for plot build narrative." |
1196 | 1116 | }, |
1197 | | - { |
1198 | | - "name": "plot_conversation_blog_svgs.py", |
1199 | | - "path": "scripts/plot_conversation_blog_svgs.py", |
1200 | | - "category": "misc", |
1201 | | - "status": "maintained", |
1202 | | - "language": "python", |
1203 | | - "summary": "Utility script for plot conversation blog svgs." |
1204 | | - }, |
1205 | | - { |
1206 | | - "name": "plot_csb_mcp_blog_figures.py", |
1207 | | - "path": "scripts/plot_csb_mcp_blog_figures.py", |
1208 | | - "category": "misc", |
1209 | | - "status": "maintained", |
1210 | | - "language": "python", |
1211 | | - "summary": "Utility script for plot csb mcp blog figures." |
1212 | | - }, |
1213 | 1117 | { |
1214 | 1118 | "name": "prebuild_images.sh", |
1215 | 1119 | "path": "scripts/prebuild_images.sh", |
|
1482 | 1386 | "language": "shell", |
1483 | 1387 | "summary": "Utility script for run scaling gap oracles." |
1484 | 1388 | }, |
1485 | | - { |
1486 | | - "name": "run_sg_local.sh", |
1487 | | - "path": "scripts/run_sg_local.sh", |
1488 | | - "category": "misc", |
1489 | | - "status": "maintained", |
1490 | | - "language": "shell", |
1491 | | - "summary": "Utility script for run sg local." |
1492 | | - }, |
1493 | | - { |
1494 | | - "name": "run_sg_validation.py", |
1495 | | - "path": "scripts/run_sg_validation.py", |
1496 | | - "category": "misc", |
1497 | | - "status": "maintained", |
1498 | | - "language": "python", |
1499 | | - "summary": "Utility script for run sg validation." |
1500 | | - }, |
1501 | 1389 | { |
1502 | 1390 | "name": "scaffold_contextbench_tasks.py", |
1503 | 1391 | "path": "scripts/scaffold_contextbench_tasks.py", |
|
1820 | 1708 | } |
1821 | 1709 | ], |
1822 | 1710 | "category_counts": { |
1823 | | - "analysis_comparison": 28, |
| 1711 | + "analysis_comparison": 24, |
1824 | 1712 | "core_operations": 13, |
1825 | 1713 | "data_management": 10, |
1826 | 1714 | "generation": 9, |
1827 | | - "infra_mirrors": 23, |
| 1715 | + "infra_mirrors": 22, |
1828 | 1716 | "library_helpers": 7, |
1829 | 1717 | "migration": 5, |
1830 | | - "misc": 99, |
| 1718 | + "misc": 90, |
1831 | 1719 | "qa_quality": 10, |
1832 | 1720 | "submission_reporting": 7, |
1833 | 1721 | "task_creation_selection": 13, |
|
0 commit comments