File tree Expand file tree Collapse file tree 1 file changed +5
-1
lines changed Expand file tree Collapse file tree 1 file changed +5
-1
lines changed Original file line number Diff line number Diff line change @@ -55,7 +55,11 @@ def __post_init__(self) -> None:
55
55
self .max_num_encoder_input_tokens = self .max_num_batched_tokens
56
56
self .encoder_cache_size = self .max_num_batched_tokens
57
57
self .chunked_prefill_enabled = self .enable_chunked_prefill
58
- if (self .max_num_batched_tokens < self .max_model_len
58
+ if self .enable_sequence_parallel :
59
+ model_len_per_sp_cp = self .max_model_len // self .context_parallel_size // self .tensor_parallel_size
60
+ else :
61
+ model_len_per_sp_cp = self .max_model_len // self .context_parallel_size
62
+ if (self .max_num_batched_tokens < model_len_per_sp_cp
59
63
and not self .chunked_prefill_enabled ):
60
64
raise ValueError (
61
65
"Ascend scheduler is enabled without chunked prefill feature. "
You can’t perform that action at this time.
0 commit comments