Skip to content

Commit 52dc355

Browse files
author
hanxudong.hxd
committed
fix glm5
1 parent a2b16da commit 52dc355

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

slime_plugins/models/glm5/glm5.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -421,14 +421,15 @@ def get_absorb_query_key_value_tensors(
421421
assert hidden_states.ndim == 3, f"hidden_states should be 3D, [s, b, n*h], got {hidden_states.ndim}D"
422422
assert packed_seq_params is not None
423423

424+
packed_seq = packed_seq_params is not None and packed_seq_params.qkv_format == 'thd'
424425
# =========================================
425426
# Prepare RoPE and seqlen related params
426427
# =========================================
427428
rotary_seq_len = self.rotary_pos_emb.get_rotary_seq_len(
428429
inference_context, None, hidden_states, self.config, packed_seq_params
429430
)
430431
# TODO: support apply_rope_fusion
431-
rotary_pos_emb, mscale = self.rotary_pos_emb(rotary_seq_len, packed_seq_params=packed_seq_params)
432+
rotary_pos_emb, mscale = self.rotary_pos_emb(rotary_seq_len, packed_seq=packed_seq)
432433

433434
cu_seqlens_q = packed_seq_params.cu_seqlens_q
434435
cu_seqlens_kv = packed_seq_params.cu_seqlens_kv

0 commit comments

Comments
 (0)