feat: add bucketed service and strict global routing

This commit is contained in:
2026-04-17 15:03:10 +08:00
parent 96019082cc
commit fa381b5db3
19 changed files with 533 additions and 128 deletions

View File

@@ -89,13 +89,13 @@ impl Router for EstimatedTtftRouter {
}
}
RouteDecision {
req_id: req.req_id,
mode: "estimated_ttft",
chosen: best,
probe_overhead_s: 0.0,
crate::router::local_route_decision(
req.req_id,
"estimated_ttft",
best,
0.0,
candidates,
reason: "argmin(drain + scheduler + kv_prepare + prefill + first_token_tail)",
}
"argmin(drain + scheduler + kv_prepare + prefill + first_token_tail)",
)
}
}