Skip to content

Commit 464270e

Browse files
Remove useless PD check in deepseek (#3161)
### What this PR does / why we need it?

Remove useless PD check in deepseek

### How was this patch tested?

- vLLM version: v0.10.2
- vLLM main: vllm-project/vllm@f225ea7

Signed-off-by: wangxiaoteng <wangxiaoteng@huawei.com>
Co-authored-by: wangxiaoteng <wangxiaoteng@huawei.com>
1 parent 4ee58e2 commit 464270e

File tree

1 file changed

+1
-12
lines changed

1 file changed

+1
-12
lines changed

vllm_ascend/torchair/models/torchair_deepseek_v2.py

Lines changed: 1 addition & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -32,8 +32,7 @@
3232
from torch import nn
3333
from transformers import PretrainedConfig
3434
from vllm.attention import Attention, AttentionMetadata
35-
from vllm.config import (CacheConfig, ModelConfig, VllmConfig,
36-
get_current_vllm_config)
35+
from vllm.config import CacheConfig, ModelConfig, VllmConfig
3736
from vllm.distributed import (get_pp_group, get_tensor_model_parallel_rank,
3837
get_tensor_model_parallel_world_size,
3938
get_tp_group, split_tensor_along_last_dim,
@@ -376,10 +375,6 @@ def __init__(
376375
self.tp_group = get_tp_group().device_group
377376
self.tp_rank = get_tp_group().rank_in_group
378377
self.ep_group = get_ep_group()
379-
self.kv_consumer = None
380-
transfer_config = get_current_vllm_config().kv_transfer_config
381-
if transfer_config is not None:
382-
self.kv_consumer = transfer_config.kv_role == "kv_consumer"
383378

384379
self.params_dtype = torch.get_default_dtype()
385380
self.rm_router_logits = self.experts.rm_router_logits
@@ -397,12 +392,6 @@ def forward(self,
397392

398393
is_prefill = forward_context.with_prefill
399394

400-
# If this node is kv_consumer, we force the moe always runs in decode path to make sure
401-
# the behaviour aligned between dummy_run and normal model_execute.
402-
if self.kv_consumer:
403-
is_prefill = False
404-
enable_force_load_balance = False
405-
406395
# router_logits: (num_tokens, n_experts)
407396
router_logits = None
408397
if not self.rm_router_logits and not self.multistream_overlap_shared_expert:

0 commit comments

Comments
 (0)