Skip to content

Commit 9a2821d

Browse files
committed
refactor(mla_cp): remove unused layer_name parameter from _forward_prefill method
Signed-off-by: F.Liu <1661888967@qq.com>
1 parent 16d93f0 commit 9a2821d

1 file changed

Lines changed: 1 addition & 4 deletions

File tree

  • vllm_ascend/attention/context_parallel

vllm_ascend/attention/context_parallel/mla_cp.py

Lines changed: 1 addition & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -505,12 +505,9 @@ def _forward_prefill(
505 505          value: torch.Tensor,
506 506          kv_c_and_k_pe_cache: tuple[torch.Tensor],
507 507          attn_metadata: AscendMLAMetadata,
508     -        layer_name,
509 508      ) -> torch.Tensor:
510 509          if not self.pcp_size > 1:
511     -            return super()._forward_prefill(
512     -                q_nope, q_pe, k_nope, k_pe, value, kv_c_and_k_pe_cache, attn_metadata, layer_name
513     -            )
    510 +            return super()._forward_prefill(q_nope, q_pe, k_nope, k_pe, value, kv_c_and_k_pe_cache, attn_metadata)
514 511          assert attn_metadata.prefill is not None
515 512          assert attn_metadata.prefill.pcp_metadata is not None
516 513          num_tokens = q_nope.size(0)

0 commit comments

Comments
 (0)