diff --git a/scripts/bench.sh b/scripts/bench.sh index c5c6e97..207c0ae 100755 --- a/scripts/bench.sh +++ b/scripts/bench.sh @@ -133,6 +133,7 @@ launch_instances() { local logfile="$OUTDIR/vllm_inst_${i}.log" if [ "$MODE" = "elastic" ]; then + PYTHONHASHSEED=42 \ VLLM_MOONCAKE_BOOTSTRAP_PORT=$((8998 + i)) \ MASTER_PORT=$master \ CUDA_VISIBLE_DEVICES=$i \ diff --git a/third_party/vllm/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_utils.py b/third_party/vllm/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_utils.py index 0620b72..afc7ead 100644 --- a/third_party/vllm/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_utils.py +++ b/third_party/vllm/vllm/distributed/kv_transfer/kv_connector/v1/mooncake/mooncake_utils.py @@ -252,11 +252,17 @@ class MooncakeBootstrapServer: prev_hash = block_hash bid = self._hash_table.get(block_hash.hex()) + if i == 0: + table_sample = next(iter(self._hash_table)) if self._hash_table else "empty" + logger.info( + "_lookup_by_tokens: block0 hash=%s, NONE_HASH=%s, table_sample=%s", + block_hash.hex()[:16], NONE_HASH.hex()[:16], table_sample[:16]) if bid is not None: block_ids.append(bid) pinned_ids.append(bid) else: - block_ids.append(None) + if i == 0: + block_ids.append(None) break return block_ids, pinned_ids