Skip to content

Commit a0c03cd

Browse files
committed
more simple immediate retry
Signed-off-by: Will Eaton <weaton@redhat.com>
1 parent 9dd2c1c commit a0c03cd

File tree

1 file changed

+14
-4
lines changed

1 file changed

+14
-4
lines changed

vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py

Lines changed: 14 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -923,12 +923,22 @@ def _process_completed_handshakes(self):
923 923
if engine_id in self._pending_requests:
924 924
pending_reqs = self._pending_requests[engine_id]
925 925
logger.debug(
926-
"Handshake completed for %s, clearing %d pending requests "
927-
"(will retry naturally on next start_load_kv)",
926+
"Handshake completed for %s, immediately retrying %d pending requests",
928 927
engine_id, len(pending_reqs))
929 928

930-
# clear pending requests - they'll be retried naturally
931-
# by the event loop on the next start_load_kv() call
929+
for req_id, meta in pending_reqs:
930+
logger.debug("Immediately retrying request %s for engine %s",
931+
req_id, engine_id)
932+
try:
933+
self._read_blocks(
934+
request_id=req_id,
935+
dst_engine_id=meta.remote_engine_id,
936+
local_block_ids=meta.local_block_ids,
937+
remote_block_ids=meta.remote_block_ids,
938+
)
939+
except Exception as e:
940+
logger.error("Failed to retry request %s: %s", req_id, e)
941+
932 942
del self._pending_requests[engine_id]
933 943

934 944
for engine_id in completed_engines:

0 commit comments

Comments
 (0)