We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b97baf4, commit d232d49 (Copy full SHA for d232d49)
vllm_ascend/multistream/ms_split.py
@@ -313,7 +313,7 @@ def model_input_split_v1_attn(
313
# chunked prefill
314
assert attn_metadata.attn_mask is not None
315
if has_prefill_pre:
316
- attn_state_pre = attn_state_post = AscendAttentionState.ChunkedPrefill # noqa
+ attn_state_pre = attn_state_post = AscendAttentionState.ChunkedPrefill # noqa
317
attn_mask_pre = attn_metadata.attn_mask[:token_index, :max(
318
seq_lens_pre)].contiguous()
319
attn_state_post = AscendAttentionState.ChunkedPrefill # noqa
0 commit comments