Skip to content

Commit 8058c91

Browse files
authored
[HOT-FIX] Add kv_sharing_target_layer_name argument to cutlass_mla backend (#19374)
Signed-off-by: Pavani Majety <pmajety@nvidia.com>
1 parent 7d44c46 commit 8058c91

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

vllm/v1/attention/backends/mla/cutlass_mla.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -40,12 +40,13 @@ def __init__(
4040
blocksparse_params: Optional[dict[str, Any]],
4141
logits_soft_cap: Optional[float],
4242
attn_type: str,
43+
kv_sharing_target_layer_name: Optional[str],
4344
# MLA Specific Arguments
4445
**mla_args) -> None:
4546
super().__init__(num_heads, head_size, scale, num_kv_heads,
4647
alibi_slopes, sliding_window, kv_cache_dtype,
4748
blocksparse_params, logits_soft_cap, attn_type,
48-
**mla_args)
49+
kv_sharing_target_layer_name, **mla_args)
4950

5051
unsupported_features = [
5152
alibi_slopes, sliding_window, blocksparse_params, logits_soft_cap

0 commit comments

Comments
 (0)