Initial AITuner study orchestrator

This commit is contained in:
gahow
2026-04-04 21:26:37 +08:00
commit cdcca1d9d7
24 changed files with 3357 additions and 0 deletions

View File

@@ -0,0 +1,14 @@
{
"prefill_service_by_bucket": {
"4k": {
"tp4_ms": 320,
"tp8_ms": 240
}
},
"queueing_knee_by_bucket": {
"4k": {
"tp4_tok_s_per_gpu": 1000,
"tp8_tok_s_per_gpu": 1100
}
}
}