Skip to content

Commit 46f1b64

Browse files
committed
fix sleepmode level2 e2e test
Signed-off-by: wangx700 <wangxin700@huawei.com>
1 parent 737cad2 commit 46f1b64

File tree

5 files changed

+14
-2
lines changed

5 files changed

+14
-2
lines changed

.github/workflows/_e2e_test.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -182,7 +182,7 @@ jobs:
182182
pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py
183183
pytest -sv tests/e2e/multicard/test_data_parallel.py
184184
pytest -sv tests/e2e/multicard/test_expert_parallel.py
185-
# pytest -sv tests/e2e/multicard/test_external_launcher.py
185+
pytest -sv tests/e2e/multicard/test_external_launcher.py
186186
pytest -sv tests/e2e/multicard/test_single_request_aclgraph.py
187187
pytest -sv tests/e2e/multicard/test_fused_moe_allgather_ep.py
188188
pytest -sv tests/e2e/multicard/test_ilama_lora_tp2.py

tests/e2e/multicard/test_external_launcher.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -108,6 +108,7 @@ def test_moe_external_launcher(model):
108108
assert proc.returncode == 0
109109

110110

111+
@patch.dict(os.environ, {"VLLM_ASCEND_ENABLE_NZ": "0"})
111112
def test_external_launcher_and_sleepmode():
112113
script = Path(
113114
__file__
@@ -154,6 +155,7 @@ def test_external_launcher_and_sleepmode():
154155
assert proc.returncode == 0
155156

156157

158+
@patch.dict(os.environ, {"VLLM_ASCEND_ENABLE_NZ": "0"})
157159
def test_external_launcher_and_sleepmode_level2():
158160
script = Path(
159161
__file__

tests/e2e/singlecard/test_camem.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,8 @@
1818
#
1919

2020
import gc
21+
import os
22+
from unittest.mock import patch
2123

2224
import torch
2325
from vllm import SamplingParams
@@ -71,6 +73,7 @@ def test_basic_camem():
7173

7274

7375
@fork_new_process_for_each_test
76+
@patch.dict(os.environ, {"VLLM_ASCEND_ENABLE_NZ": "0"})
7477
def test_end_to_end():
7578
free, total = torch.npu.mem_get_info()
7679
used_bytes_baseline = total - free # in case other process is running

tests/ut/worker/test_worker_v1.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -273,6 +273,7 @@ def test_sleep_mode_disabled_raises_error(self, mock_sleep_mode_enabled):
273273

274274
@patch("vllm_ascend.worker.worker_v1.sleep_mode_enabled")
275275
@patch("vllm_ascend.worker.worker_v1.CaMemAllocator")
276+
@patch.dict(os.environ, {"VLLM_ASCEND_ENABLE_NZ": "0"})
276277
def test_wake_up_mode_enabled(self, mock_allocator_class,
277278
mock_sleep_mode_enabled):
278279
"""Test wake_up method when sleep mode is enabled"""
@@ -295,6 +296,7 @@ def test_wake_up_mode_enabled(self, mock_allocator_class,
295296
mock_allocator.wake_up.assert_called_once_with(tags=["test_tag"])
296297

297298
@patch("vllm_ascend.worker.worker_v1.sleep_mode_enabled")
299+
@patch.dict(os.environ, {"VLLM_ASCEND_ENABLE_NZ": "0"})
298300
def test_wake_up_mode_disabled_raises_error(self, mock_sleep_mode_enabled):
299301
"""Test wake_up method raises exception when sleep mode is disabled"""
300302
from vllm_ascend.worker.worker_v1 import NPUWorker

vllm_ascend/worker/worker_v1.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -47,7 +47,7 @@
4747
from vllm_ascend.device_allocator.camem import CaMemAllocator
4848
from vllm_ascend.distributed.parallel_state import init_ascend_model_parallel
4949
from vllm_ascend.platform import NPUPlatform
50-
from vllm_ascend.utils import (init_ascend_soc_version,
50+
from vllm_ascend.utils import (init_ascend_soc_version, is_enable_nz,
5151
prefill_context_parallel_enable,
5252
register_ascend_customop, sleep_mode_enabled,
5353
try_register_lib, vllm_version_is)
@@ -184,6 +184,11 @@ def wake_up(self, tags: Optional[list[str]] = None) -> None:
184184
raise ValueError(
185185
"Sleep mode is not enabled. Please compile vllm-ascend with COMPILE_CUSTOM_KERNELS=1."
186186
)
187+
188+
if is_enable_nz():
189+
raise ValueError(
190+
"FRACTAL_NZ mode is enabled. This may cause model parameter precision issues "
191+
"in the RL scenarios. Please set VLLM_ASCEND_ENABLE_NZ=0.")
187192
allocator = CaMemAllocator.get_instance()
188193
allocator.wake_up(tags=tags)
189194

0 commit comments

Comments
 (0)