Skip to content

Commit 91b22c9

Browse files
fix verify rules
Signed-off-by: SunnyLee219 <3294305115@qq.com>
1 parent 64c8ca6 commit 91b22c9

File tree

1 file changed

+5
-1
lines changed

1 file changed

+5
-1
lines changed

vllm_ascend/core/schedule_config.py

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,11 @@ def __post_init__(self) -> None:
         self.max_num_encoder_input_tokens = self.max_num_batched_tokens
         self.encoder_cache_size = self.max_num_batched_tokens
         self.chunked_prefill_enabled = self.enable_chunked_prefill
-        if (self.max_num_batched_tokens < self.max_model_len
+        if self.enable_sequence_parallel:
+            model_len_per_sp_cp = self.max_model_len // self.context_parallel_size // self.tensor_parallel_size
+        else:
+            model_len_per_sp_cp = self.max_model_len // self.context_parallel_size
+        if (self.max_num_batched_tokens < model_len_per_sp_cp
                 and not self.chunked_prefill_enabled):
             raise ValueError(
                 "Ascend scheduler is enabled without chunked prefill feature. "

0 commit comments

Comments
 (0)