Skip to content

Commit 4dd626f

Browse files
committed
don't enable AscendScheduler when async_scheduling is enabled
Signed-off-by: Ronald1995 <ronaldautomobile@163.com>
1 parent d01fd1d commit 4dd626f

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

vllm_ascend/platform.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -135,7 +135,8 @@ def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
135 135
else:
136 136
structured_outputs_config = vllm_config.structured_outputs_config
137 137

138 -
if model_config is not None and not model_config.use_mla:
138 +
if (model_config is not None and not model_config.use_mla
139 +
and not scheduler_config.async_scheduling):
139 140
logger.info(
140 141
"Non-MLA LLMs forcibly disable the chunked prefill feature,"
141 142
"as the performance of operators supporting this feature "

0 commit comments

Comments
 (0)