We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 110df74, commit edd270b (Copy full SHA for edd270b)
vllm/v1/core/sched/scheduler.py
@@ -635,6 +635,8 @@ def _make_cached_request_data(
635
token_ids = req.all_token_ids[req.num_computed_tokens:req.
636
num_computed_tokens + num_tokens]
637
new_token_ids.append(token_ids)
638
+ else:
639
+ new_token_ids.append([])
640
new_block_ids.append(req_to_new_block_ids[req_id])
641
num_computed_tokens.append(req.num_computed_tokens)
642
# Because resumed_reqs is usually empty, it is more efficient to do
0 commit comments