Fix Stop-A validation config: use system vllm, cap max-model-len

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
This commit is contained in:
2026-06-15 15:22:48 +08:00
parent 0f57ee96a9
commit 958739027a
2 changed files with 108 additions and 3 deletions

View File

@@ -14,7 +14,7 @@
"engine": {
"engine_name": "vllm",
"engine_version": "0.20.0",
"exec_path": "/tmp/wjh/venvs/vllm-0.20.0-cu129/bin/vllm",
"exec_path": "/usr/local/bin/vllm",
"cwd": "/home/admin/cpfs/wjh/aituner/aituner",
"host": "127.0.0.1",
"port": 18230,
@@ -33,7 +33,11 @@
"base_flags": {
"host": "127.0.0.1",
"port": 18230,
"served-model-name": "qwen3-30b-a3b-community"
"served-model-name": "qwen3-30b-a3b-community",
"gpu-memory-utilization": 0.9,
"max-model-len": 16384,
"trust-remote-code": true,
"enable-prefix-caching": true
},
"tunable_envs": [],
"tunable_flags": [
@@ -123,7 +127,7 @@
"low": 0.0,
"high": 0.125,
"tolerance": 0.001,
"max_probes": 5,
"max_probes": 4,
"sample_seed": 20260325
},
"llm": {