@@ -179,23 +179,24 @@ jobs:
179
179
VLLM_WORKER_MULTIPROC_METHOD : spawn
180
180
run : |
181
181
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
182
- VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
183
- # guided decoding doesn't work, fix it later
184
- # pytest -sv tests/singlecard/test_guided_decoding.py.py
185
- # test_ascend_config.py should be ran separately because it will regenerate the global config many times.
186
- pytest -sv tests/singlecard/test_ascend_config.py
187
- pytest -sv tests/singlecard/test_camem.py
188
- pytest -sv tests/singlecard/core/test_ascend_scheduler.py
189
- pytest -sv tests/singlecard/core/test_ascend_scheduler_e2e.py
190
- pytest -sv tests/singlecard/ \
191
- --ignore=tests/singlecard/test_offline_inference.py \
192
- --ignore=tests/singlecard/test_guided_decoding.py \
193
- --ignore=tests/singlecard/test_ascend_config.py \
194
- --ignore=tests/singlecard/test_camem.py \
195
- --ignore=tests/singlecard/core/test_ascend_scheduler.py \
196
- --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
182
+ echo "skip single card"
183
+ # VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
184
+ # # guided decoding doesn't work, fix it later
185
+ # # pytest -sv tests/singlecard/test_guided_decoding.py.py
186
+ # # test_ascend_config.py should be ran separately because it will regenerate the global config many times.
187
+ # pytest -sv tests/singlecard/test_ascend_config.py
188
+ # pytest -sv tests/singlecard/test_camem.py
189
+ # pytest -sv tests/singlecard/core/test_ascend_scheduler.py
190
+ # pytest -sv tests/singlecard/core/test_ascend_scheduler_e2e.py
191
+ # pytest -sv tests/singlecard/ \
192
+ # --ignore=tests/singlecard/test_offline_inference.py \
193
+ # --ignore=tests/singlecard/test_guided_decoding.py \
194
+ # --ignore=tests/singlecard/test_ascend_config.py \
195
+ # --ignore=tests/singlecard/test_camem.py \
196
+ # --ignore=tests/singlecard/core/test_ascend_scheduler.py \
197
+ # --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
197
198
else
198
- pytest -sv tests/multicard/test_ilama_lora_tp2.py
199
+ # pytest -sv tests/multicard/test_ilama_lora_tp2.py
199
200
# To avoid oom, we need to run the test in a single process.
200
201
VLLM_USE_MODELSCOPE=True pytest -sv tests/multicard/test_offline_inference_distributed.py::test_models_distributed_QwQ
201
202
VLLM_USE_MODELSCOPE=True pytest -sv tests/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek
@@ -210,21 +211,22 @@ jobs:
210
211
VLLM_USE_V1 : 0
211
212
run : |
212
213
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
213
- VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
214
- # guided decoding doesn't work, fix it later
215
- # pytest -sv tests/singlecard/test_guided_decoding.py.py
216
- pytest -sv tests/singlecard/test_camem.py
217
- # test_ascend_config.py should be ran separately because it will regenerate the global config many times.
218
- pytest -sv tests/singlecard/test_ascend_config.py
219
- pytest -sv tests/singlecard/test_prompt_embedding.py
220
- pytest -sv tests/singlecard/ \
221
- --ignore=tests/singlecard/test_offline_inference.py \
222
- --ignore=tests/singlecard/test_guided_decoding.py \
223
- --ignore=tests/singlecard/test_camem.py \
224
- --ignore=tests/singlecard/test_ascend_config.py \
225
- --ignore=tests/singlecard/test_prompt_embedding.py \
226
- --ignore=tests/singlecard/core/test_ascend_scheduler.py \
227
- --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
214
+ echo "skip single card"
215
+ # VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
216
+ # # guided decoding doesn't work, fix it later
217
+ # # pytest -sv tests/singlecard/test_guided_decoding.py.py
218
+ # pytest -sv tests/singlecard/test_camem.py
219
+ # # test_ascend_config.py should be ran separately because it will regenerate the global config many times.
220
+ # pytest -sv tests/singlecard/test_ascend_config.py
221
+ # pytest -sv tests/singlecard/test_prompt_embedding.py
222
+ # pytest -sv tests/singlecard/ \
223
+ # --ignore=tests/singlecard/test_offline_inference.py \
224
+ # --ignore=tests/singlecard/test_guided_decoding.py \
225
+ # --ignore=tests/singlecard/test_camem.py \
226
+ # --ignore=tests/singlecard/test_ascend_config.py \
227
+ # --ignore=tests/singlecard/test_prompt_embedding.py \
228
+ # --ignore=tests/singlecard/core/test_ascend_scheduler.py \
229
+ # --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
228
230
else
229
231
pytest -sv tests/multicard/test_ilama_lora_tp2.py
230
232
# Fixme: run VLLM_USE_MODELSCOPE=True pytest -sv tests/multicard/test_offline_inference_distributed.py will raise error.
0 commit comments