File tree Expand file tree Collapse file tree 2 files changed +3
-1
lines changed Expand file tree Collapse file tree 2 files changed +3
-1
lines changed Original file line number Diff line number Diff line change @@ -129,6 +129,7 @@ def _pangu_torchair_test_fixture(
129
129
distributed_executor_backend = "mp" ,
130
130
enforce_eager = False ,
131
131
additional_config = additional_config ,
132
+ enable_expert_parallel = True ,
132
133
) as vllm_model :
133
134
# use greedy sampler to make sure the generated results are fixed
134
135
vllm_output = vllm_model .generate_greedy (example_prompts , 5 )
Original file line number Diff line number Diff line change @@ -356,7 +356,7 @@ def pangu_group8_topk(
356
356
num_tokens = scores .shape [0 ]
357
357
router_scale = _ROUTER_SCALE .squeeze ( # type: ignore
358
358
)
359
-
359
+ # TODO: support disabling expert parallel
360
360
ep_size = get_ep_group ().world_size
361
361
local_num_experts = global_num_experts // ep_size
362
362
local_num_group = topk // ep_size
@@ -463,6 +463,7 @@ def __init__(
463
463
custom_routing_function = topk_wrapper (num_voted_experts ),
464
464
prefix = f"{ prefix } .experts" ,
465
465
)
466
+ self .use_ep = self .experts .use_ep
466
467
467
468
self .gate = ReplicatedLinear (
468
469
config .hidden_size ,
You can’t perform that action at this time.
0 commit comments