Initial AITuner study orchestrator
This commit is contained in:
14
configs/examples/capability.example.json
Normal file
14
configs/examples/capability.example.json
Normal file
@@ -0,0 +1,14 @@
|
||||
{
|
||||
"prefill_service_by_bucket": {
|
||||
"4k": {
|
||||
"tp4_ms": 320,
|
||||
"tp8_ms": 240
|
||||
}
|
||||
},
|
||||
"queueing_knee_by_bucket": {
|
||||
"4k": {
|
||||
"tp4_tok_s_per_gpu": 1000,
|
||||
"tp8_tok_s_per_gpu": 1100
|
||||
}
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user