Skip to content

Commit de379a5

Browse files
committed
Fixed: v0-style scheduling breakage on the vLLM main branch.
1 parent 68fb634 commit de379a5

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

vllm_ascend/core/scheduler.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -132,7 +132,7 @@ def skip_cur_request():
132132
continue
133133

134134
new_blocks = self.kv_cache_manager.allocate_slots(
135-
request, num_new_tokens, computed_blocks)
135+
request, num_new_tokens, num_computed_tokens, computed_blocks)
136136
if new_blocks is None:
137137
# The request cannot be scheduled.
138138
break
@@ -151,7 +151,7 @@ def skip_cur_request():
151151
if self.lora_config and request.lora_request:
152152
scheduled_loras.add(request.lora_request.lora_int_id)
153153
req_to_new_block_ids[request.request_id] = [
154-
b.block_id for b in computed_blocks + new_blocks
154+
b.block_id for b in computed_blocks.blocks + new_blocks.blocks
155155
]
156156
# Update request info.
157157
num_scheduled_tokens[request.request_id] = num_new_tokens
@@ -211,7 +211,7 @@ def skip_cur_request():
211211
scheduled_running_reqs.append(request)
212212
self.scheduled_req_ids.add(request.request_id)
213213
req_to_new_block_ids[request.request_id] = [
214-
b.block_id for b in new_blocks
214+
b.block_id for b in new_blocks.blocks
215215
]
216216
num_scheduled_tokens[request.request_id] = num_new_tokens
217217
token_budget -= num_new_tokens
@@ -307,7 +307,7 @@ def _check_watermark_for_prefill(self,
307307
num_new_tokens,
308308
computed_blocks,
309309
watermark=0.01):
310-
computed_blocks = computed_blocks or []
310+
computed_blocks = computed_blocks.blocks() or []
311311
watermark_blocks = self.kv_cache_config.num_blocks * watermark
312312
num_computed_tokens = (request.num_computed_tokens +
313313
len(computed_blocks) * self.block_size)

0 commit comments

Comments
 (0)