Skip to content

Commit e8bb2cd

Browse files
committed
modify parallel_factor
Signed-off-by: whx-sjtu <2952154980@qq.com>
1 parent e939ddd commit e8bb2cd

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

vllm_ascend/utils.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -321,7 +321,8 @@ def update_aclgraph_sizes(vllm_config: VllmConfig) -> None:
321 321
if os.getenv("HCCL_OP_EXPANSION_MODE") == 'AIV':
322 322
# TODO: Find out whether we need to take into account the pp_size
323 323
parallel_factor = 1 + num_comm_groups + int(
324-
parallel_config.enable_expert_parallel)
324+
parallel_config.enable_expert_parallel) + int(
325+
vllm_config.additional_config.get("multistream_overlap_shared_expert", False))
325 326
if is_moe_model(vllm_config):
326 327
parallel_factor += (parallel_config.data_parallel_size > 1)
327 328
# Calculate maximum supported batch sizes considering model architecture on the A2 Hardware Device

0 commit comments

Comments
 (0)