fix: kvcache evict workflow
This commit is contained in:
@@ -14,11 +14,12 @@ model:
|
||||
hardware:
|
||||
type: 8xb300
|
||||
hbm_bytes: 1900.0e9 # KV-cache budget: HBM remaining after ~372 GB of FP4 weights
|
||||
dram_bytes: 1.5e12 # ~1.5 TB usable CPU DRAM per node
|
||||
|
||||
cluster:
|
||||
num_instances: 32
|
||||
num_instances: 8
|
||||
meta_store:
|
||||
ttl_seconds: 120.0
|
||||
ttl_seconds: 300.0
|
||||
router:
|
||||
mode: prefix_affinity
|
||||
prefix_k: 8
|
||||
|
||||
Reference in New Issue
Block a user