third_party/vllm/ now tracked in git for direct patch management.
Based on vLLM v0.18.1 release with one patch applied:
vllm/v1/core/sched/scheduler.py:
Replace the fatal assert with a graceful skip when a KV transfer callback
arrives for an already-aborted request during PD (prefill/decode)
disaggregated serving.
Future vLLM modifications should be made directly in third_party/vllm/
and committed normally. The patches/ directory is kept as documentation
of what changed from upstream.
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
26 lines
584 B
YAML
26 lines
584 B
YAML
# CI configuration named `vllm_ci`.
# NOTE(review): the tool that consumes this file is not visible here; the
# per-key notes below are inferred from key names — confirm against it.
name: vllm_ci

# Directories (all under .buildkite/) listed as job locations.
job_dirs:
  - ".buildkite/image_build"
  - ".buildkite/test_areas"
  - ".buildkite/hardware_tests"

# Path patterns for build-wide inputs (Dockerfile, CMake, requirements,
# setup.py, native sources).
# NOTE(review): presumably a change matching any of these triggers the full
# job set — confirm. Entries ending in "/" look like directory prefixes.
run_all_patterns:
  - "docker/Dockerfile"
  - "CMakeLists.txt"
  - "requirements/common.txt"
  - "requirements/cuda.txt"
  - "requirements/build.txt"
  - "requirements/test.txt"
  - "setup.py"
  - "csrc/"
  - "cmake/"

# Path patterns carved out of run_all_patterns above (each entry here is a
# more specific form of an entry there, e.g. "csrc/cpu/" vs "csrc/").
# NOTE(review): "docker/Dockerfile." (trailing dot) presumably excludes
# suffixed variants such as docker/Dockerfile.<target> — confirm the
# matching semantics (prefix vs. glob) with the consumer.
run_all_exclude_patterns:
  - "docker/Dockerfile."
  - "csrc/cpu/"
  - "csrc/rocm/"
  - "cmake/hipify.py"
  - "cmake/cpu_extension.cmake"

# Container registry host and namespace.
registries: public.ecr.aws/q9t5s3a7

# Image repository names keyed by `main` and `premerge`.
# NOTE(review): main/premerge are assumed to be children of `repositories`
# (the key has no value of its own) — confirm against upstream.
repositories:
  main: "vllm-ci-postmerge-repo"
  premerge: "vllm-ci-test-repo"