```diff
@@ -304,25 +304,24 @@ def model_input_split_v1_attn(
         # the attn_mla kernel in torch npu only accept 128*128 attn mask
         attn_mask_pre = attn_mask_post = attn_metadata.attn_mask
         attn_state_pre = attn_state_post = attn_metadata.attn_state
-
     elif attn_metadata.attn_state == AscendAttentionState.DecodeOnly:
         # should be none in decode only state
         attn_mask_pre = attn_mask_post = attn_metadata.attn_mask
-        attn_state_pre = attn_state_post = AscendAttentionState.DecodeOnly  # noqa
+        attn_state_pre = attn_state_post = AscendAttentionState.DecodeOnly  # type: ignore
     else:
         # chunked prefill
         assert attn_metadata.attn_mask is not None
         if has_prefill_pre:
-            attn_state_pre = attn_state_post = AscendAttentionState.ChunkedPrefill  # noqa
+            attn_state_pre = attn_state_post = AscendAttentionState.ChunkedPrefill  # type: ignore
             attn_mask_pre = attn_metadata.attn_mask[:token_index, :max(
                 seq_lens_pre)].contiguous()
-            attn_state_post = AscendAttentionState.ChunkedPrefill  # noqa
+            attn_state_post = AscendAttentionState.ChunkedPrefill  # type: ignore
             attn_mask_post = attn_metadata.attn_mask[
                 token_index:, :max(seq_lens_post)].contiguous()
         else:
-            attn_state_pre = AscendAttentionState.DecodeOnly  # noqa
+            attn_state_pre = AscendAttentionState.DecodeOnly  # type: ignore
             attn_mask_pre = None
-            attn_state_post = AscendAttentionState.ChunkedPrefill  # noqa
+            attn_state_post = AscendAttentionState.ChunkedPrefill  # type: ignore
             attn_mask_post = attn_metadata.attn_mask[
                 token_index:, :max(seq_lens_post)].contiguous()
```
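For context, here is a minimal, self-contained sketch (not part of the PR) of what the chunked-prefill branch above does: it splits a shared attention mask at `token_index` into a "pre" slice and a "post" slice, each truncated to its own maximum sequence length. The mask shape, `token_index`, `seq_lens_pre`, and `seq_lens_post` values below are illustrative assumptions, not values taken from vllm-ascend.

```python
import torch

# Hypothetical inputs for illustration only.
token_index = 4          # split point along the token dimension
seq_lens_pre = [3, 4]    # per-request sequence lengths before the split
seq_lens_post = [2, 5]   # per-request sequence lengths after the split

# Assume a (num_tokens, max_seq_len) boolean mask, as the slicing in the diff implies.
attn_mask = torch.ones(10, 8, dtype=torch.bool)

# Mirrors `attn_metadata.attn_mask[:token_index, :max(seq_lens_pre)].contiguous()`
attn_mask_pre = attn_mask[:token_index, :max(seq_lens_pre)].contiguous()
# Mirrors `attn_metadata.attn_mask[token_index:, :max(seq_lens_post)].contiguous()`
attn_mask_post = attn_mask[token_index:, :max(seq_lens_post)].contiguous()

print(attn_mask_pre.shape)   # torch.Size([4, 4])
print(attn_mask_post.shape)  # torch.Size([6, 5])
```

`.contiguous()` is used so each slice owns its own densely laid-out storage rather than a strided view of the original mask, which kernels generally expect.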