From d5abb9c70a853ed7fc3ef67e163c28b6f76b509d Mon Sep 17 00:00:00 2001 From: tomzw11 Date: Thu, 4 Jun 2026 14:59:49 +0800 Subject: [PATCH] Fix assertion error when packed_seq_params is passed without proper qkv_format Only set cu_seqlens when all conditions are met: - packed_seq_params is not None - qkv_format is 'thd' - cu_seqlens_q is not None --- src/mcore_bridge/model/modules/gated_delta_net.py | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/src/mcore_bridge/model/modules/gated_delta_net.py b/src/mcore_bridge/model/modules/gated_delta_net.py index d2ee0dd..84dd0fd 100644 --- a/src/mcore_bridge/model/modules/gated_delta_net.py +++ b/src/mcore_bridge/model/modules/gated_delta_net.py @@ -184,7 +184,13 @@ def forward( # TODO: support inference raise NotImplementedError('GDN does not support inference for now.') - cu_seqlens = None if packed_seq_params is None else packed_seq_params.cu_seqlens_q + # Only use packed sequences when qkv_format is 'thd' and cu_seqlens_q is present + cu_seqlens = None + if (packed_seq_params is not None and + hasattr(packed_seq_params, 'qkv_format') and + packed_seq_params.qkv_format == 'thd' and + packed_seq_params.cu_seqlens_q is not None): + cu_seqlens = packed_seq_params.cu_seqlens_q # Input projection num_key_heads_per_device = self.num_key_heads // self.tp_size // cp_size nvtx_range_push(suffix='in_proj')