Pin 27B A/B to GPUs 2-7 (route around leaked GPU0/1 memory)
Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
This commit is contained in:
@@ -48,7 +48,8 @@
|
|||||||
"VLLM_DP_MASTER_PORT": "9528",
|
"VLLM_DP_MASTER_PORT": "9528",
|
||||||
"VLLM_RESPONSE_TIMEOUT": "300",
|
"VLLM_RESPONSE_TIMEOUT": "300",
|
||||||
"VLLM_LOG_REQ_KV_LENS": "1",
|
"VLLM_LOG_REQ_KV_LENS": "1",
|
||||||
"DS_LLM_GRACEFUL_SHUTDOWN_KEEP_SECONDS": "600"
|
"DS_LLM_GRACEFUL_SHUTDOWN_KEEP_SECONDS": "600",
|
||||||
|
"CUDA_VISIBLE_DEVICES": "2,3,4,5,6,7"
|
||||||
},
|
},
|
||||||
"base_flags": {
|
"base_flags": {
|
||||||
"host": "127.0.0.1",
|
"host": "127.0.0.1",
|
||||||
|
|||||||
Reference in New Issue
Block a user