third_party/vllm/ now tracked in git for direct patch management.
Based on vLLM v0.18.1 release with one patch applied:
vllm/v1/core/sched/scheduler.py:
Replace fatal assert with graceful skip when KV transfer callback
arrives for an already-aborted request during PD disaggregated serving.
Future vLLM modifications should be made directly in third_party/vllm/
and committed normally. The patches/ directory is kept as documentation
of what changed from upstream.
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
32 lines
912 B
YAML
32 lines
912 B
YAML
# Dependabot configuration (schema version 2): weekly update checks for
# GitHub Actions workflows and for pip dependencies rooted at "/".
version: 2
updates:
  # Maintain dependencies for GitHub Actions
  - package-ecosystem: "github-actions"
    directory: "/"
    schedule:
      interval: "weekly"
  # Maintain Python (pip) dependencies
  - package-ecosystem: "pip"
    directory: "/"
    schedule:
      interval: "weekly"
    labels: ["dependencies"]
    open-pull-requests-limit: 5
    # NOTE(review): GitHub has announced that `reviewers` is being replaced
    # by CODEOWNERS; confirm this key is still honored before relying on it.
    reviewers: ["khluu", "simon-mo"]
    allow:
      - dependency-type: "all"
    ignore:
      # Skip patch-level bumps for every dependency.
      - dependency-name: "*"
        update-types: ["version-update:semver-patch"]
      # The entries below carry no `versions`/`update-types` filter, so all
      # updates for these packages are ignored.
      - dependency-name: "torch"
      - dependency-name: "torchvision"
      - dependency-name: "xformers"
      - dependency-name: "lm-format-enforcer"
      - dependency-name: "gguf"
      - dependency-name: "compressed-tensors"
      - dependency-name: "ray[cgraph]"  # Ray Compiled Graph
      - dependency-name: "lm-eval"
    groups:
      # Collect minor version updates into a single grouped pull request.
      minor-update:
        applies-to: version-updates
        update-types: ["minor"]