Skip to content

Commit ad76e33

Browse files
committed
feat(moe): Add patch for Shared Fused MoE integration with DeepSeek-V2 and Llama4
Signed-off-by: Yizhou Liu <liu_yizhou@outlook.com>
1 parent 7a4854b commit ad76e33

File tree

3 files changed

+22
-4
lines changed

3 files changed

+22
-4
lines changed

vllm_ascend/models/deepseek_v2.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,6 @@
5555
ParallelLMHead, VocabParallelEmbedding)
5656
from vllm.model_executor.model_loader.weight_utils import (
5757
default_weight_loader, maybe_remap_kv_scale_name)
58-
from vllm.model_executor.models import deepseek_v2
5958
from vllm.model_executor.models.deepseek_v2 import \
6059
DeepseekV2ForCausalLM # noqa: E501
6160
from vllm.model_executor.models.deepseek_v2 import \
@@ -69,14 +68,11 @@
6968
from vllm.sequence import IntermediateTensors
7069

7170
from vllm_ascend.ascend_config import get_ascend_config
72-
from vllm_ascend.ops.common_fused_moe import AscendSharedFusedMoE
7371
from vllm_ascend.ops.fused_moe import AscendFusedMoE
7472
from vllm_ascend.quantization.quant_config import AscendLinearMethod
7573
from vllm_ascend.quantization.w8a8_dynamic import AscendW8A8DynamicLinearMethod
7674
from vllm_ascend.utils import dispose_tensor
7775

78-
deepseek_v2.SharedFusedMoE = AscendSharedFusedMoE
79-
8076

8177
class CustomDeepseekV2SiluAndMul(SiluAndMul):
8278

vllm_ascend/patch/platform/patch_common/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,3 +16,4 @@
1616
#
1717

1818
import vllm_ascend.patch.platform.patch_common.patch_distributed # noqa
19+
import vllm_ascend.patch.platform.patch_common.patch_shared_fused_moe # noqa
vllm_ascend/patch/platform/patch_common/patch_shared_fused_moe.py

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,21 @@
1+
# Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
2+
# Copyright 2023 The vLLM team.
3+
#
4+
# Licensed under the Apache License, Version 2.0 (the "License");
5+
# you may not use this file except in compliance with the License.
6+
# You may obtain a copy of the License at
7+
#
8+
# http://www.apache.org/licenses/LICENSE-2.0
9+
#
10+
# Unless required by applicable law or agreed to in writing, software
11+
# distributed under the License is distributed on an "AS IS" BASIS,
12+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
# See the License for the specific language governing permissions and
14+
# limitations under the License.
15+
16+
from vllm.model_executor.models import deepseek_v2, llama4
17+
18+
from vllm_ascend.ops.common_fused_moe import AscendSharedFusedMoE
19+
20+
deepseek_v2.SharedFusedMoE = AscendSharedFusedMoE
21+
llama4.SharedFusedMoE = AscendSharedFusedMoE

0 commit comments

Comments
 (0)