|
25 | 25 | branches:
|
26 | 26 | - 'main'
|
27 | 27 | - '*-dev'
|
28 |
| - |
29 | 28 | # Bash shells do not use ~/.profile or ~/.bashrc so these shells need to be explicitly
|
30 | 29 | # declared as "shell: bash -el {0}" on steps that need to be properly activated.
|
31 | 30 | # It's used to activate ascend-toolkit environment variables.
|
|
44 | 43 | uses: ./.github/workflows/pre-commit.yml
|
45 | 44 |
|
46 | 45 | changes:
|
47 |
| - runs-on: ubuntu-latest |
| 46 | + runs-on: linux-amd64-cpu-0 |
| 47 | + container: |
| 48 | + image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11 |
48 | 49 | outputs:
|
49 | 50 | e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }}
|
50 | 51 | ut_tracker: ${{ steps.filter.outputs.ut_tracker }}
|
|
68 | 69 | - 'packages.txt'
|
69 | 70 | ut_tracker:
|
70 | 71 | - 'tests/ut/**'
|
| 72 | +
|
71 | 73 | ut:
|
72 | 74 | needs: [lint, changes]
|
73 | 75 | name: unit test
|
|
81 | 83 | VLLM_USE_MODELSCOPE: True
|
82 | 84 | strategy:
|
83 | 85 | matrix:
|
84 |
| - vllm_version: [v0.10.1.1, main] |
| 86 | + vllm_version: [main] |
85 | 87 | steps:
|
86 | 88 | - name: Install packages
|
87 | 89 | run: |
|
@@ -129,16 +131,16 @@ jobs:
|
129 | 131 | name: vllm-ascend
|
130 | 132 | verbose: true
|
131 | 133 |
|
132 |
| - e2e: |
| 134 | + e2e-light: |
133 | 135 | needs: [lint, changes]
|
134 | 136 | # only trigger e2e test after lint passed and the change is e2e related with pull request.
|
135 |
| - if: ${{ github.event_name == 'pull_request' && needs.lint.result == 'success' && needs.changes.outputs.e2e_tracker == 'true' }} |
| 137 | + if: ${{ github.event_name == 'pull_request' && needs.lint.result == 'success' && needs.changes.outputs.e2e_tracker == 'true' && !contains(github.event.pull_request.labels.*.name, 'ready') }} |
136 | 138 | strategy:
|
137 | 139 | max-parallel: 2
|
138 | 140 | matrix:
|
139 | 141 | os: [linux-aarch64-a2-1]
|
140 |
| - vllm_version: [v0.10.1.1, main] |
141 |
| - name: singlecard e2e test |
| 142 | + vllm_version: [main] |
| 143 | + name: singlecard e2e test - light |
142 | 144 | runs-on: ${{ matrix.os }}
|
143 | 145 | container:
|
144 | 146 | image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
|
@@ -191,38 +193,19 @@ jobs:
|
191 | 193 | VLLM_WORKER_MULTIPROC_METHOD: spawn
|
192 | 194 | VLLM_USE_MODELSCOPE: True
|
193 | 195 | run: |
|
194 |
| - # We found that if running aclgraph tests in batch, it will cause AclmdlRICaptureBegin error. So we run |
195 |
| - # the test separately. |
196 |
| -
|
197 | 196 | pytest -sv tests/e2e/singlecard/test_aclgraph.py
|
198 |
| - pytest -sv tests/e2e/singlecard/test_ascend_scheduler.py |
199 |
| - pytest -sv tests/e2e/singlecard/test_camem.py |
200 |
| - pytest -sv tests/e2e/singlecard/test_chunked.py |
201 |
| - pytest -sv tests/e2e/singlecard/test_embedding.py |
202 |
| - pytest -sv tests/e2e/singlecard/test_guided_decoding.py |
203 |
| - # TODO: Fix lora accuracy error |
204 |
| - pytest -sv tests/e2e/singlecard/test_ilama_lora.py |
205 |
| - pytest -sv tests/e2e/singlecard/test_profile_execute_duration.py |
206 | 197 | pytest -sv tests/e2e/singlecard/test_quantization.py
|
207 |
| - pytest -sv tests/e2e/singlecard/test_sampler.py |
208 |
| - pytest -sv tests/e2e/singlecard/test_vlm.py |
209 |
| -
|
210 |
| - # ------------------------------------ v1 spec decode test ------------------------------------ # |
211 |
| - pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_correctness.py |
212 |
| - pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_torchair_correctness.py |
213 |
| - pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py |
214 |
| -
|
215 |
| - pytest -sv tests/e2e/singlecard/ops/ |
| 198 | + pytest -sv tests/e2e/singlecard/test_vlm.py::test_multimodal_vl |
216 | 199 |
|
217 |
| - e2e-2-cards: |
218 |
| - needs: [e2e] |
219 |
| - if: ${{ needs.e2e.result == 'success' }} |
| 200 | + e2e-2-cards-light: |
| 201 | + needs: [e2e-light] |
| 202 | + if: ${{ needs.e2e-light.result == 'success' }} |
220 | 203 | strategy:
|
221 | 204 | max-parallel: 2
|
222 | 205 | matrix:
|
223 | 206 | os: [linux-aarch64-a2-2]
|
224 |
| - vllm_version: [v0.10.1.1, main] |
225 |
| - name: multicard e2e test |
| 207 | + vllm_version: [main] |
| 208 | + name: multicard e2e test - light |
226 | 209 | runs-on: ${{ matrix.os }}
|
227 | 210 | container:
|
228 | 211 | image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
|
@@ -275,22 +258,4 @@ jobs:
|
275 | 258 | VLLM_WORKER_MULTIPROC_METHOD: spawn
|
276 | 259 | VLLM_USE_MODELSCOPE: True
|
277 | 260 | run: |
|
278 |
| - pytest -sv tests/e2e/multicard/test_data_parallel.py |
279 |
| - pytest -sv tests/e2e/multicard/test_expert_parallel.py |
280 |
| - # external_launcher test is not stable enough. Fix it later |
281 |
| - # pytest -sv tests/e2e/multicard/test_external_launcher.py |
282 |
| - pytest -sv tests/e2e/multicard/test_fused_moe_allgather_ep.py |
283 |
| - pytest -sv tests/e2e/multicard/test_ilama_lora_tp2.py |
284 |
| -
|
285 |
| - # To avoid oom, we need to run the test in a single process. |
286 |
| - pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_QwQ |
287 |
| - pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_multistream_moe |
288 |
| - pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W8A8 |
289 |
| - pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_Qwen3_W4A8DYNAMIC |
290 |
| - pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_DeepSeek_W4A8DYNAMIC |
291 |
| - pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_sp_for_qwen3_moe |
292 |
| -
|
293 |
| - #pytest -sv tests/e2e/multicard/test_pipeline_parallel.py |
294 |
| - pytest -sv tests/e2e/multicard/test_prefix_caching.py |
295 |
| - pytest -sv tests/e2e/multicard/test_qwen3_moe.py |
296 |
| - pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py |
| 261 | + pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_TP2_WITH_EP |
0 commit comments