|
47 | 47 | runs-on: ubuntu-latest
|
48 | 48 | strategy:
|
49 | 49 | matrix:
|
50 |
| - python-version: ["3.10"] |
| 50 | + python-version: ["3.11"] |
51 | 51 | vllm_version: [v0.9.1]
|
52 | 52 | steps:
|
53 | 53 | - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
|
@@ -114,12 +114,12 @@ jobs:
|
114 | 114 | strategy:
|
115 | 115 | max-parallel: 2
|
116 | 116 | matrix:
|
117 |
| - os: [linux-arm64-npu-1, linux-arm64-npu-4] |
| 117 | + os: [linux-aarch64-a2-1, linux-aarch64-a2-4] |
118 | 118 | vllm_version: [v0.9.1]
|
119 | 119 | concurrency:
|
120 | 120 | group: >
|
121 | 121 | ${{
|
122 |
| - matrix.os == 'linux-arm64-npu-4' |
| 122 | + matrix.os == 'linux-aarch64-a2-4' |
123 | 123 | && github.event.pull_request.number
|
124 | 124 | && format('pr-{0}-limit-npu-4', github.event.pull_request.number)
|
125 | 125 | || format('job-{0}-{1}-{2}', matrix.os, matrix.vllm_version, github.event.pull_request.number)
|
@@ -179,7 +179,7 @@ jobs:
|
179 | 179 | VLLM_USE_V1: 1
|
180 | 180 | VLLM_WORKER_MULTIPROC_METHOD: spawn
|
181 | 181 | run: |
|
182 |
| - if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then |
| 182 | + if [[ "${{ matrix.os }}" == "linux-aarch64-a2-1" ]]; then |
183 | 183 | VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
|
184 | 184 | # guided decoding doesn't work, fix it later
|
185 | 185 | # pytest -sv tests/singlecard/test_guided_decoding.py
|
@@ -216,7 +216,7 @@ jobs:
|
216 | 216 | env:
|
217 | 217 | VLLM_USE_V1: 0
|
218 | 218 | run: |
|
219 |
| - if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then |
| 219 | + if [[ "${{ matrix.os }}" == "linux-aarch64-a2-1" ]]; then |
220 | 220 | VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
|
221 | 221 | # guided decoding doesn't work, fix it later
|
222 | 222 | # pytest -sv tests/singlecard/test_guided_decoding.py
|
|
0 commit comments