# agentic-kvc/tests/test_scheduler_step_log_patch.py

"""Tests for A3 vLLM scheduler patch: per-step JSONL log hooks.

The vendored vLLM at third_party/vllm/vllm/v1/core/sched/scheduler.py must
contain the agentic-kv hooks. We test by inspecting the file on disk because
importing vllm.Scheduler requires the full GPU runtime — those imports are
expensive and not portable to CI. Hooks are anchor strings we control.
"""

from __future__ import annotations

import py_compile
from pathlib import Path

# Absolute path of the vendored vLLM v1 scheduler module, resolved relative to
# the parent of the directory that contains this test file.
SCHEDULER_PATH = Path(__file__).resolve().parent.parent.joinpath(
    "third_party", "vllm", "vllm", "v1", "core", "sched", "scheduler.py"
)


def test_scheduler_file_exists():
    """Fail, naming the expected path, when the scheduler file is not on disk."""
    present = SCHEDULER_PATH.exists()
    assert present, f"missing {SCHEDULER_PATH}"


def test_scheduler_syntactically_valid():
    """Byte-compile the scheduler source to prove it is valid Python.

    ``py_compile.compile`` writes its bytecode next to the source (under
    ``__pycache__``) unless ``cfile`` is given. That would leave artifacts in
    the vendored tree and could fail on a read-only checkout for reasons that
    have nothing to do with syntax, so the output is redirected to a
    throwaway directory that is removed when the test finishes.

    Raises:
        py_compile.PyCompileError: if the scheduler source does not compile.
    """
    import tempfile

    with tempfile.TemporaryDirectory() as scratch_dir:
        py_compile.compile(
            str(SCHEDULER_PATH),
            cfile=str(Path(scratch_dir) / "scheduler.pyc"),
            doraise=True,
        )


def test_scheduler_has_agentic_step_log_init_hook():
    """Check that the scheduler source contains the step-log init anchors.

    Each anchor is matched as a plain substring anywhere in the file; the
    test does not verify where or how the names are used.
    """
    # Python source is UTF-8 by default, so decode explicitly instead of
    # relying on the locale's preferred encoding.
    src = SCHEDULER_PATH.read_text(encoding="utf-8")
    anchors = (
        "AGENTIC_STEP_LOG_PATH",
        "AGENTIC_WORKER_ID",
        "self._agentic_step_log_fh",
        "self._agentic_worker_id",
    )
    for anchor in anchors:
        # Explicit message: name the missing anchor rather than leaving the
        # failure report to describe a comparison against the whole file.
        assert anchor in src, f"missing anchor {anchor!r} in {SCHEDULER_PATH}"


def test_scheduler_has_step_emit_helper():
    """Check that the emit helper definition and its field names are present.

    Each anchor is matched as a plain substring anywhere in the file, so this
    confirms the names exist but not that they appear inside the helper.
    """
    # Python source is UTF-8 by default, so decode explicitly instead of
    # relying on the locale's preferred encoding.
    src = SCHEDULER_PATH.read_text(encoding="utf-8")
    anchors = (
        "def _agentic_emit_step_log(",
        "prefill_tokens",
        "decode_tokens",
        "n_running_total",
        "n_waiting",
        "per_req",
    )
    for anchor in anchors:
        # Explicit message: name the missing anchor rather than leaving the
        # failure report to describe a comparison against the whole file.
        assert anchor in src, f"missing anchor {anchor!r} in {SCHEDULER_PATH}"


def test_scheduler_emit_is_invoked_in_schedule_return_path():
    """The emit call must sit between _update_after_schedule and return.

    The check is textual: starting from the first
    ``self._update_after_schedule(scheduler_output)`` call, the next emit
    call must come before the next ``return scheduler_output``.
    """
    # Python source is UTF-8 by default, so decode explicitly instead of
    # relying on the locale's preferred encoding.
    src = SCHEDULER_PATH.read_text(encoding="utf-8")
    update_call = "self._update_after_schedule(scheduler_output)"
    emit_call = "self._agentic_emit_step_log("
    return_stmt = "return scheduler_output"

    # str.find + assert gives a readable failure; str.index would surface a
    # bare ValueError that does not say which anchor is missing.
    update_idx = src.find(update_call)
    assert update_idx != -1, f"{update_call!r} not found in {SCHEDULER_PATH}"

    # Search for the emit call from the update call onward, the same origin
    # used for the return statement, so an unrelated earlier call site cannot
    # mask a correctly placed hook.
    emit_idx = src.find(emit_call, update_idx)
    assert emit_idx != -1, (
        f"{emit_call!r} not found after {update_call!r} in {SCHEDULER_PATH}"
    )

    return_idx = src.find(return_stmt, update_idx)
    assert return_idx != -1, (
        f"{return_stmt!r} not found after {update_call!r} in {SCHEDULER_PATH}"
    )

    assert update_idx < emit_idx < return_idx, (
        "emit hook must be after update_after_schedule and before return"
    )


def test_bench_script_threads_step_log_env():
    """Check that scripts/bench.sh mentions the step-log variable names.

    Each name is matched as a plain substring of the script text; the test
    does not verify how the script uses them.
    """
    bench_path = Path(__file__).resolve().parent.parent / "scripts" / "bench.sh"
    # Decode explicitly so the result does not depend on the locale encoding.
    bench = bench_path.read_text(encoding="utf-8")
    for name in (
        "AGENTIC_STEP_LOG_DIR",
        "AGENTIC_STEP_LOG_PATH",
        "AGENTIC_WORKER_ID",
    ):
        assert name in bench, f"{name} not referenced in {bench_path}"