Add tuning progress report for harness evaluation

This commit is contained in:
2026-06-21 00:48:21 +08:00
parent 426151bc9f
commit 488fae7e63
4 changed files with 752 additions and 0 deletions

View File

@@ -0,0 +1,26 @@
{
  "report_id": "qwen27b-abl12-harness-vs-naive",
  "output_root": "../../.aituner-reports/qwen27b-abl12-harness-vs-naive",
  "target_fraction": 0.95,
  "min_final_ratio": 0.98,
  "cases": [
    {
      "case_id": "qwen27b-chat-0-8k-real-output",
      "description": "12-trial harness-vs-naive ablation on the 0-8k chat window with real output lengths.",
      "tags": ["qwen27b", "chat", "0-8k", "h20", "real-output"],
      "budgets": [1, 2, 3, 4, 6, 8, 12],
      "arms": [
        {
          "name": "harness",
          "kind": "harness",
          "study_root": "../../.aituner/abl12-harness/dash0-qwen27b-ablation-harness-on"
        },
        {
          "name": "naive",
          "kind": "naive",
          "study_root": "../../.aituner/abl12-naive/dash0-qwen27b-ablation-naive-off"
        }
      ]
    }
  ]
}