@@ -179,24 +179,23 @@ jobs:
179
179
VLLM_WORKER_MULTIPROC_METHOD : spawn
180
180
run : |
181
181
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
182
- echo "skip single card"
183
- # VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
184
- # # guided decoding doesn't work, fix it later
185
- # # pytest -sv tests/singlecard/test_guided_decoding.py.py
186
- # # test_ascend_config.py should be ran separately because it will regenerate the global config many times.
187
- # pytest -sv tests/singlecard/test_ascend_config.py
188
- # pytest -sv tests/singlecard/test_camem.py
189
- # pytest -sv tests/singlecard/core/test_ascend_scheduler.py
190
- # pytest -sv tests/singlecard/core/test_ascend_scheduler_e2e.py
191
- # pytest -sv tests/singlecard/ \
192
- # --ignore=tests/singlecard/test_offline_inference.py \
193
- # --ignore=tests/singlecard/test_guided_decoding.py \
194
- # --ignore=tests/singlecard/test_ascend_config.py \
195
- # --ignore=tests/singlecard/test_camem.py \
196
- # --ignore=tests/singlecard/core/test_ascend_scheduler.py \
197
- # --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
182
+ VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
183
+ # guided decoding doesn't work, fix it later
184
+ # pytest -sv tests/singlecard/test_guided_decoding.py
185
+ # test_ascend_config.py should be run separately because it regenerates the global config many times.
186
+ pytest -sv tests/singlecard/test_ascend_config.py
187
+ pytest -sv tests/singlecard/test_camem.py
188
+ pytest -sv tests/singlecard/core/test_ascend_scheduler.py
189
+ pytest -sv tests/singlecard/core/test_ascend_scheduler_e2e.py
190
+ pytest -sv tests/singlecard/ \
191
+ --ignore=tests/singlecard/test_offline_inference.py \
192
+ --ignore=tests/singlecard/test_guided_decoding.py \
193
+ --ignore=tests/singlecard/test_ascend_config.py \
194
+ --ignore=tests/singlecard/test_camem.py \
195
+ --ignore=tests/singlecard/core/test_ascend_scheduler.py \
196
+ --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
198
197
else
199
- # pytest -sv tests/multicard/test_ilama_lora_tp2.py
198
+ pytest -sv tests/multicard/test_ilama_lora_tp2.py
200
199
# To avoid oom, we need to run the test in a single process.
201
200
VLLM_USE_MODELSCOPE=True pytest -sv tests/multicard/test_offline_inference_distributed.py::test_models_distributed_QwQ
202
201
VLLM_USE_MODELSCOPE=True pytest -sv tests/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek
@@ -211,22 +210,21 @@ jobs:
211
210
VLLM_USE_V1 : 0
212
211
run : |
213
212
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
214
- echo "skip single card"
215
- # VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
216
- # # guided decoding doesn't work, fix it later
217
- # # pytest -sv tests/singlecard/test_guided_decoding.py.py
218
- # pytest -sv tests/singlecard/test_camem.py
219
- # # test_ascend_config.py should be ran separately because it will regenerate the global config many times.
220
- # pytest -sv tests/singlecard/test_ascend_config.py
221
- # pytest -sv tests/singlecard/test_prompt_embedding.py
222
- # pytest -sv tests/singlecard/ \
223
- # --ignore=tests/singlecard/test_offline_inference.py \
224
- # --ignore=tests/singlecard/test_guided_decoding.py \
225
- # --ignore=tests/singlecard/test_camem.py \
226
- # --ignore=tests/singlecard/test_ascend_config.py \
227
- # --ignore=tests/singlecard/test_prompt_embedding.py \
228
- # --ignore=tests/singlecard/core/test_ascend_scheduler.py \
229
- # --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
213
+ VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
214
+ # guided decoding doesn't work, fix it later
215
+ # pytest -sv tests/singlecard/test_guided_decoding.py
216
+ pytest -sv tests/singlecard/test_camem.py
217
+ # test_ascend_config.py should be run separately because it regenerates the global config many times.
218
+ pytest -sv tests/singlecard/test_ascend_config.py
219
+ pytest -sv tests/singlecard/test_prompt_embedding.py
220
+ pytest -sv tests/singlecard/ \
221
+ --ignore=tests/singlecard/test_offline_inference.py \
222
+ --ignore=tests/singlecard/test_guided_decoding.py \
223
+ --ignore=tests/singlecard/test_camem.py \
224
+ --ignore=tests/singlecard/test_ascend_config.py \
225
+ --ignore=tests/singlecard/test_prompt_embedding.py \
226
+ --ignore=tests/singlecard/core/test_ascend_scheduler.py \
227
+ --ignore=tests/singlecard/core/test_ascend_scheduler_e2e.py
230
228
else
231
229
pytest -sv tests/multicard/test_ilama_lora_tp2.py
232
230
# FIXME: running `VLLM_USE_MODELSCOPE=True pytest -sv tests/multicard/test_offline_inference_distributed.py` raises an error.
0 commit comments