[Doc] eval-type not support service but server, and test the result b… #12344

Workflow file for this run

.github/workflows/vllm_ascend_test.yaml at 56efa2d

	#
	# Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.
	# This file is a part of the vllm-ascend project.
	#

	# Workflow name.
	name: 'test'

	# Triggers: pushes to main, and pull requests targeting main or any '*-dev' branch.
	on:
	  push:
	    branches:
	      - 'main'
	  pull_request:
	    branches:
	      - 'main'
	      - '*-dev'
	# Bash shells do not read ~/.profile or ~/.bashrc by default, so every `run`
	# step is declared as "shell: bash -el {0}" (login shell, exit on error).
	# This is what activates the ascend-toolkit environment variables.
	defaults:
	  run:
	    shell: bash -el {0}

	# Only cancel in-progress runs of the same workflow on the same ref.
	# The group key does not distinguish the test type (lint / 1 card / 4 cards).
	concurrency:
	  group: ${{ github.workflow }}-${{ github.ref }}
	  cancel-in-progress: true

	jobs:
	  # Lint gate: delegates to the reusable pre-commit workflow in this repository.
	  lint:
	    uses: ./.github/workflows/pre-commit.yml

	  # Path filter (pull requests only): exposes two outputs, 'e2e_tracker' and
	  # 'ut_tracker', that the jobs below use to decide whether they need to run.
	  changes:
	    if: github.event_name == 'pull_request'
	    runs-on: ubuntu-latest
	    outputs:
	      e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }}
	      ut_tracker: ${{ steps.filter.outputs.ut_tracker }}
	    steps:
	      - uses: actions/checkout@v4
	      - uses: dorny/paths-filter@v3
	        id: filter
	        with:
	          # The filter definition is itself a YAML document passed as a literal string.
	          filters: |
	            e2e_tracker:
	              - '.github/workflows/vllm_ascend_test.yaml'
	              - 'vllm_ascend/**'
	              - 'csrc/**'
	              - 'cmake/**'
	              - 'tests/e2e/**'
	              - 'CMakeLists.txt'
	              - 'setup.py'
	              - 'requirements.txt'
	              - 'requirements-dev.txt'
	              - 'requirements-lint.txt'
	              - 'packages.txt'
	            ut_tracker:
	              - 'tests/ut/**'

	  # Unit tests on a GitHub-hosted runner inside the CANN container.
	  ut:
	    needs: [lint, changes]
	    name: unit test
	    # Only trigger unit tests after lint passed and the change is e2e or ut related.
	    if: ${{ needs.lint.result == 'success' && (needs.changes.outputs.e2e_tracker == 'true' || needs.changes.outputs.ut_tracker == 'true') }}
	    runs-on: ubuntu-latest
	    container:
	      image: quay.io/ascend/cann:8.2.rc1-910b-ubuntu22.04-py3.11
	      env:
	        VLLM_LOGGING_LEVEL: ERROR
	        VLLM_USE_MODELSCOPE: True
	    strategy:
	      matrix:
	        vllm_version: [v0.10.2]
	    steps:
	      - name: Install packages
	        run: |
	          apt-get update -y
	          apt-get install -y python3-pip git vim wget net-tools gcc g++ cmake libnuma-dev curl gnupg2

	      # vLLM is checked out into ./vllm-empty at the version selected by the matrix.
	      - name: Checkout vllm-project/vllm repo
	        uses: actions/checkout@v4
	        with:
	          repository: vllm-project/vllm
	          ref: ${{ matrix.vllm_version }}
	          path: ./vllm-empty

	      - name: Install vllm-project/vllm from source
	        working-directory: ./vllm-empty
	        run: |
	          VLLM_TARGET_DEVICE=empty python3 -m pip install . --extra-index https://download.pytorch.org/whl/cpu/
	          python3 -m pip uninstall -y triton

	      - name: Checkout vllm-project/vllm-ascend repo
	        uses: actions/checkout@v4

	      - name: Install vllm-project/vllm-ascend
	        run: |
	          export PIP_EXTRA_INDEX_URL=https://mirrors.huaweicloud.com/ascend/repos/pypi
	          export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/Ascend/ascend-toolkit/latest/x86_64-linux/devlib
	          python3 -m pip install -r requirements-dev.txt --extra-index https://download.pytorch.org/whl/cpu/
	          python3 -m pip install -v . --extra-index https://download.pytorch.org/whl/cpu/

	      - name: Run unit test
	        env:
	          VLLM_WORKER_MULTIPROC_METHOD: spawn
	          TORCH_DEVICE_BACKEND_AUTOLOAD: 0
	        run: |
	          export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/Ascend/ascend-toolkit/latest/x86_64-linux/devlib
	          pytest -sv --cov --cov-report=xml:unittests-coverage.xml tests/ut --ignore=tests/ut/test_platform.py --ignore=tests/ut/ops/test_vocab_parallel_embedding.py

	      # NOTE(review): the matrix above only contains 'v0.10.2', so this condition
	      # is never true and coverage is not uploaded -- confirm whether 'main'
	      # should be part of the matrix or the condition should change.
	      - name: Upload coverage to Codecov
	        if: ${{ matrix.vllm_version == 'main' }}
	        uses: codecov/codecov-action@v5
	        env:
	          CODECOV_TOKEN: ${{ secrets.CODECOV_TOKEN }}
	        with:
	          flags: unittests
	          name: vllm-ascend
	          verbose: true

	  # Light single-card e2e tests on a self-hosted Ascend runner.
	  e2e-light:
	    needs: [lint, changes]
	    # Only trigger e2e tests on pull requests, after lint passed, when the change
	    # is e2e related and the PR does not carry the 'ready' label.
	    if: ${{ github.event_name == 'pull_request' && needs.lint.result == 'success' && needs.changes.outputs.e2e_tracker == 'true' && !contains(github.event.pull_request.labels.*.name, 'ready') }}
	    strategy:
	      max-parallel: 2
	      matrix:
	        os: [linux-aarch64-a2-1]
	        vllm_version: [v0.10.2]
	    name: singlecard e2e test - light
	    runs-on: ${{ matrix.os }}
	    container:
	      image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
	      env:
	        VLLM_LOGGING_LEVEL: ERROR
	        VLLM_USE_MODELSCOPE: True
	    steps:
	      - name: Check npu and CANN info
	        run: |
	          npu-smi info
	          cat /usr/local/Ascend/ascend-toolkit/latest/"$(uname -i)"-linux/ascend_toolkit_install.info

	      # Point apt and pip at the in-cluster cache service before installing anything.
	      - name: Config mirrors
	        run: |
	          sed -Ei 's@(ports|archive).ubuntu.com@cache-service.nginx-pypi-cache.svc.cluster.local:8081@g' /etc/apt/sources.list
	          pip config set global.index-url http://cache-service.nginx-pypi-cache.svc.cluster.local/pypi/simple
	          pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
	          apt-get update -y
	          apt install git -y

	      - name: Checkout vllm-project/vllm-ascend repo
	        uses: actions/checkout@v4

	      # packages.txt comes from the vllm-ascend checkout above.
	      - name: Install system dependencies
	        run: |
	          apt-get -y install `cat packages.txt`
	          apt-get -y install gcc g++ cmake libnuma-dev

	      - name: Checkout vllm-project/vllm repo
	        uses: actions/checkout@v4
	        with:
	          repository: vllm-project/vllm
	          ref: ${{ matrix.vllm_version }}
	          path: ./vllm-empty

	      - name: Install vllm-project/vllm from source
	        working-directory: ./vllm-empty
	        run: |
	          VLLM_TARGET_DEVICE=empty pip install -e .

	      - name: Install vllm-project/vllm-ascend
	        env:
	          PIP_EXTRA_INDEX_URL: https://mirrors.huaweicloud.com/ascend/repos/pypi
	        run: |
	          pip install -r requirements-dev.txt
	          pip install -v -e .

	      - name: Run e2e test
	        env:
	          VLLM_WORKER_MULTIPROC_METHOD: spawn
	          VLLM_USE_MODELSCOPE: True
	        run: |
	          pytest -sv tests/e2e/singlecard/test_aclgraph.py
	          pytest -sv tests/e2e/singlecard/test_quantization.py
	          pytest -sv tests/e2e/singlecard/test_vlm.py::test_multimodal_vl

	  # Light multi-card e2e test; runs only after the single-card light job succeeded.
	  e2e-2-cards-light:
	    needs: [e2e-light]
	    if: ${{ needs.e2e-light.result == 'success' }}
	    strategy:
	      max-parallel: 2
	      matrix:
	        os: [linux-aarch64-a2-2]
	        vllm_version: [v0.10.2]
	    name: multicard e2e test - light
	    runs-on: ${{ matrix.os }}
	    container:
	      image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
	      env:
	        VLLM_LOGGING_LEVEL: ERROR
	        VLLM_USE_MODELSCOPE: True
	    steps:
	      - name: Check npu and CANN info
	        run: |
	          npu-smi info
	          cat /usr/local/Ascend/ascend-toolkit/latest/"$(uname -i)"-linux/ascend_toolkit_install.info

	      # Point apt and pip at the in-cluster cache service before installing anything.
	      - name: Config mirrors
	        run: |
	          sed -Ei 's@(ports|archive).ubuntu.com@cache-service.nginx-pypi-cache.svc.cluster.local:8081@g' /etc/apt/sources.list
	          pip config set global.index-url http://cache-service.nginx-pypi-cache.svc.cluster.local/pypi/simple
	          pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
	          apt-get update -y
	          apt install git -y

	      - name: Checkout vllm-project/vllm-ascend repo
	        uses: actions/checkout@v4

	      # packages.txt comes from the vllm-ascend checkout above.
	      - name: Install system dependencies
	        run: |
	          apt-get -y install `cat packages.txt`
	          apt-get -y install gcc g++ cmake libnuma-dev

	      - name: Checkout vllm-project/vllm repo
	        uses: actions/checkout@v4
	        with:
	          repository: vllm-project/vllm
	          ref: ${{ matrix.vllm_version }}
	          path: ./vllm-empty

	      - name: Install vllm-project/vllm from source
	        working-directory: ./vllm-empty
	        run: |
	          VLLM_TARGET_DEVICE=empty pip install -e .

	      - name: Install vllm-project/vllm-ascend
	        env:
	          PIP_EXTRA_INDEX_URL: https://mirrors.huaweicloud.com/ascend/repos/pypi
	        run: |
	          pip install -r requirements-dev.txt
	          pip install -v -e .

	      - name: Run vllm-project/vllm-ascend test
	        env:
	          VLLM_WORKER_MULTIPROC_METHOD: spawn
	          VLLM_USE_MODELSCOPE: True
	        run: |
	          pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_TP2_WITH_EP

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

[Doc] eval-type not support service but server, and test the result b… #12344

Workflow file

[Doc] eval-type not support service but server, and test the result b… #12344

Uh oh!

Jobs

Run details

Workflow file for this run