Skip to content

Commit c4e6875

Browse files
committed
add mc2 mask
Signed-off-by: weiguihua2 <weiguihua2@huawei.com>
1 parent 9126969 commit c4e6875

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

vllm_ascend/attention/mla_v1.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -208,7 +208,7 @@ def __init__(self,
208 208   ascend_config = get_ascend_config()
209 209   self.torchair_graph_enabled = ascend_config.torchair_graph_config.enabled
210 210
211     - def generate_active_mask(self, actual_seqs_num, batch_size):
    211 + def generate_activate_mask(self, actual_seqs_num, batch_size):
212 212   mc2_mask = torch.zeros(batch_size,
213 213   dtype=torch.bool,
214 214   device=current_platform.device_type)
@@ -345,7 +345,7 @@ def build_torchair_graph_dummy(
345 345   else:
346 346   attn_state = AscendAttentionState.DecodeOnly
347 347   num_decode_tokens = 1
348     - mc2_mask = self.generate_active_mask(num_actual_tokens, num_reqs)
    348 + mc2_mask = self.generate_activate_mask(num_actual_tokens, num_reqs)
349 349   decode_metadata = AscendMLADecodeMetadata(
350 350   input_positions=input_positions,
351 351   block_table=block_table,
@@ -511,7 +511,7 @@ def build(
511 511   num_reqs_pad_size]
512 512   else:
513 513   seq_lens_list = seq_lens.tolist()
514     - mc2_mask = self.generate_active_mask(num_actual_tokens,
    514 + mc2_mask = self.generate_activate_mask(num_actual_tokens,
515 515   num_reqs + num_reqs_pad_size)
516 516
517 517   decode_metadata = AscendMLADecodeMetadata(

0 commit comments

Comments
 (0)