Skip to content

Commit cf9ffd4

Browse files
committed
Switch Infra to linux-aarch64-a2 and python to 3.11
Signed-off-by: Yikun Jiang <yikunkero@gmail.com>
1 parent 8129317 commit cf9ffd4

File tree

7 files changed

+17
-15
lines changed

7 files changed

+17
-15
lines changed

.github/Dockerfile.buildwheel

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
# limitations under the License.
1515
# This file is a part of the vllm-ascend project.
1616
#
17-
ARG PY_VERSION=3.10
17+
ARG PY_VERSION=3.11
1818
FROM quay.io/ascend/manylinux:8.0.0-910b-manylinux_2_28-py${PY_VERSION}
1919

2020
ARG COMPILE_CUSTOM_KERNELS=1

.github/actionlint.yaml

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,10 @@
11
self-hosted-runner:
22
# Labels of self-hosted runner in array of strings.
33
labels:
4-
- linux-arm64-npu-1
5-
- linux-arm64-npu-2
6-
- linux-arm64-npu-4
4+
- linux-aarch64-a2-0
5+
- linux-aarch64-a2-1
6+
- linux-aarch64-a2-2
7+
- linux-aarch64-a2-4
8+
- linux-aarch64-a2-8
79
- linux-arm64-npu-static-8
810
- ubuntu-24.04-arm

.github/workflows/accuracy_test.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -79,8 +79,8 @@ jobs:
7979
}}
8080
runs-on: >-
8181
${{
82-
(matrix.model_name == 'Qwen/Qwen2.5-VL-7B-Instruct' && 'linux-arm64-npu-4') ||
83-
'linux-arm64-npu-2'
82+
(matrix.model_name == 'Qwen/Qwen2.5-VL-7B-Instruct' && 'linux-aarch64-a2-4') ||
83+
'linux-aarch64-a2-2'
8484
}}
8585
strategy:
8686
matrix:

.github/workflows/release_code.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,7 @@ jobs:
5353
runs-on: ubuntu-latest
5454
strategy:
5555
matrix:
56-
python-version: ["3.10"]
56+
python-version: ["3.11"]
5757
steps:
5858
- uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
5959

.github/workflows/vllm_ascend_doctest.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,7 @@ jobs:
4545
matrix:
4646
vllm_verison: [main, v0.7.3-dev, main-openeuler, v0.7.3-dev-openeuler]
4747
name: vLLM Ascend test
48-
runs-on: linux-arm64-npu-1
48+
runs-on: linux-aarch64-a2-1
4949
container:
5050
image: m.daocloud.io/quay.io/ascend/vllm-ascend:${{ matrix.vllm_verison }}
5151
steps:

.github/workflows/vllm_ascend_test.yaml

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,7 @@ jobs:
4747
runs-on: ubuntu-latest
4848
strategy:
4949
matrix:
50-
python-version: ["3.10"]
50+
python-version: ["3.11"]
5151
vllm_version: [v0.9.1]
5252
steps:
5353
- uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
@@ -114,12 +114,12 @@ jobs:
114114
strategy:
115115
max-parallel: 2
116116
matrix:
117-
os: [linux-arm64-npu-1, linux-arm64-npu-4]
117+
os: [linux-aarch64-a2-1, linux-aarch64-a2-4]
118118
vllm_version: [v0.9.1]
119119
concurrency:
120120
group: >
121121
${{
122-
matrix.os == 'linux-arm64-npu-4'
122+
matrix.os == 'linux-aarch64-a2-4'
123123
&& github.event.pull_request.number
124124
&& format('pr-{0}-limit-npu-4', github.event.pull_request.number)
125125
|| format('job-{0}-{1}-{2}', matrix.os, matrix.vllm_version, github.event.pull_request.number)
@@ -179,7 +179,7 @@ jobs:
179179
VLLM_USE_V1: 1
180180
VLLM_WORKER_MULTIPROC_METHOD: spawn
181181
run: |
182-
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
182+
if [[ "${{ matrix.os }}" == "linux-aarch64-a2-1" ]]; then
183183
VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
184184
# guided decoding doesn't work, fix it later
185185
# pytest -sv tests/singlecard/test_guided_decoding.py
@@ -216,7 +216,7 @@ jobs:
216216
env:
217217
VLLM_USE_V1: 0
218218
run: |
219-
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
219+
if [[ "${{ matrix.os }}" == "linux-aarch64-a2-1" ]]; then
220220
VLLM_USE_MODELSCOPE=True pytest -sv tests/singlecard/test_offline_inference.py
221221
# guided decoding doesn't work, fix it later
222222
# pytest -sv tests/singlecard/test_guided_decoding.py

.github/workflows/vllm_ascend_test_long_term.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ jobs:
3939
strategy:
4040
max-parallel: 2
4141
matrix:
42-
os: [linux-arm64-npu-1, linux-arm64-npu-4]
42+
os: [linux-aarch64-a2-1, linux-aarch64-a2-4]
4343
vllm_version: [v0.9.1]
4444
name: vLLM Ascend long term test
4545
runs-on: ${{ matrix.os }}
@@ -93,7 +93,7 @@ jobs:
9393
9494
- name: Run vllm-project/vllm-ascend long term test
9595
run: |
96-
if [[ "${{ matrix.os }}" == "linux-arm64-npu-1" ]]; then
96+
if [[ "${{ matrix.os }}" == "linux-aarch64-a2-1" ]]; then
9797
# v0 spec decode test
9898
# VLLM_USE_MODELSCOPE=True pytest -sv tests/long_term/spec_decode_v0/e2e/test_mtp_correctness.py # it needs a clean process
9999
# pytest -sv tests/long_term/spec_decode_v0 --ignore=tests/long_term/spec_decode_v0/e2e/test_mtp_correctness.py

0 commit comments

Comments
 (0)