Skip to content

Commit bc937a8

Browse files
fix error info
Signed-off-by: shikang-hangzhou <459956190@qq.com>
1 parent e8037d5 commit bc937a8

File tree

1 file changed

+5 -3 lines changed

1 file changed

+5 -3 lines changed

vllm_ascend/multistream/ms_split.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -95,8 +95,10 @@ def model_input_split_v1_mla_attn(
9595
[num_prefills_pre, num_prefills_post
9696
] = split_attn_int_type(attn_metadata.num_prefills,
9797
max(0, seq_index - attn_metadata.num_decodes))
98-
seq_lens = attn_metadata.prefill.seq_lens if attn_metadata.num_prefills > 0 else attn_metadata.decode.seq_lens
99-
[seq_lens_pre, seq_lens_post] = split_attn_tensor_type(seq_lens, seq_index)
98+
seq_lens = attn_metadata.seq_lens if attn_metadata.num_prefills > 0 else attn_metadata.decode.seq_lens
99+
[seq_lens_pre, seq_lens_post
100+
] = split_attn_tensor_type(seq_lens,
101+
max(0, seq_index - attn_metadata.num_decodes))
100102

101103
query_start_loc_pre = query_start_loc_post = None
102104
if attn_metadata.query_start_loc is not None:
@@ -153,7 +155,7 @@ def model_input_split_v1_mla_attn(
153155
attn_metadata.num_decodes:]
154156
) - attn_metadata.prefill.query_start_loc[seq_index -
155157
attn_metadata.num_decodes]
156-
context_len_pre = seq_lens_pre[attn_metadata.num_decodes:]
158+
context_len_pre = seq_lens_pre
157159
context_len_post = seq_lens_post
158160
prefill_max_query_len_pre = max(prefill_query_lens_pre)
159161
prefill_max_query_len_post = max(prefill_query_lens_post)

0 commit comments

Comments
 (0)