Skip to content

Commit 840da0d

Browse files
committed
Upgrade to 0.11.1 newest vllm commit
Signed-off-by: 22dimensions <waitingwind@foxmail.com>
1 parent 5f08e07 commit 840da0d

File tree

17 files changed

+104
-20
lines changed

17 files changed

+104
-20
lines changed

.github/workflows/format_pr_body.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,7 @@ jobs:
3636

3737
- name: Get vLLM version
3838
run: |
39-
VLLM_COMMIT=83f478bb19489b41e9d208b47b4bb5a95ac171ac
39+
VLLM_COMMIT=releases/v0.11.1
4040
echo "VLLM_COMMIT=https://github.com/vllm-project/vllm/commit/$VLLM_COMMIT" >> $GITHUB_ENV
4141
4242
- name: Checkout repository

.github/workflows/vllm_ascend_test.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,7 @@ jobs:
4242
lint:
4343
uses: ./.github/workflows/pre-commit.yml
4444
with:
45-
vllm: 83f478bb19489b41e9d208b47b4bb5a95ac171ac
45+
vllm: releases/v0.11.1
4646
changes:
4747
runs-on: ubuntu-latest
4848
outputs:
@@ -83,7 +83,7 @@ jobs:
8383
VLLM_USE_MODELSCOPE: True
8484
strategy:
8585
matrix:
86-
vllm_version: [83f478bb19489b41e9d208b47b4bb5a95ac171ac, v0.11.0]
86+
vllm_version: [releases/v0.11.1, v0.11.0]
8787
steps:
8888
- name: Install packages
8989
run: |
@@ -138,7 +138,7 @@ jobs:
138138
name: e2e-light
139139
strategy:
140140
matrix:
141-
vllm_version: [83f478bb19489b41e9d208b47b4bb5a95ac171ac, v0.11.0]
141+
vllm_version: [releases/v0.11.1, v0.11.0]
142142
# Note (yikun): If CI resources are limited, we can split the job into two chained jobs
143143
needs: [lint, changes]
144144
# only trigger e2e test after lint passed and the change is e2e related with pull request.

.github/workflows/vllm_ascend_test_full.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -69,7 +69,7 @@ jobs:
6969
name: e2e-full
7070
strategy:
7171
matrix:
72-
vllm_version: [83f478bb19489b41e9d208b47b4bb5a95ac171ac, v0.11.0]
72+
vllm_version: [releases/v0.11.1, v0.11.0]
7373
needs: [changes]
7474
if: ${{ needs.changes.outputs.e2e_tracker == 'true' }}
7575
uses: ./.github/workflows/_e2e_test.yaml

tests/ut/worker/test_worker_v1.py

Lines changed: 6 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,9 @@
77
from tests.ut.base import TestBase
88
from vllm_ascend.utils import vllm_version_is
99

10+
init_cached_hf_modules_path = "vllm.utils.init_cached_hf_modules" if vllm_version_is(
11+
"0.11.0") else "vllm.utils.import_utils.init_cached_hf_modules"
12+
1013

1114
class TestNPUWorker(TestBase):
1215

@@ -46,7 +49,7 @@ def setUp(self):
4649
@patch("vllm_ascend.worker.worker_v1.init_ascend_config")
4750
@patch("vllm_ascend.worker.worker_v1.init_ascend_soc_version")
4851
@patch("vllm_ascend.worker.worker_v1.try_register_lib")
49-
@patch("vllm.utils.init_cached_hf_modules")
52+
@patch(init_cached_hf_modules_path)
5053
@patch("vllm_ascend.worker.worker_v1.NPUWorker._init_profiler")
5154
def test_init_npu_worker_normal_case(
5255
self,
@@ -108,7 +111,7 @@ def test_init_npu_worker_normal_case(
108111
@patch("vllm_ascend.worker.worker_v1.init_ascend_config")
109112
@patch("vllm_ascend.worker.worker_v1.init_ascend_soc_version")
110113
@patch("vllm_ascend.worker.worker_v1.try_register_lib")
111-
@patch("vllm.utils.init_cached_hf_modules")
114+
@patch(init_cached_hf_modules_path)
112115
@patch("vllm_ascend.worker.worker_v1.NPUWorker._init_profiler")
113116
def test_init_npu_worker_with_trust_remote_code(
114117
self,
@@ -153,7 +156,7 @@ def test_init_npu_worker_with_trust_remote_code(
153156
@patch("vllm_ascend.worker.worker_v1.init_ascend_config")
154157
@patch("vllm_ascend.worker.worker_v1.init_ascend_soc_version")
155158
@patch("vllm_ascend.worker.worker_v1.try_register_lib")
156-
@patch("vllm.utils.init_cached_hf_modules")
159+
@patch(init_cached_hf_modules_path)
157160
@patch("vllm_ascend.worker.worker_v1.NPUWorker._init_profiler")
158161
def test_init_npu_worker_with_custom_cache_dtype(
159162
self,

vllm_ascend/attention/attention_v1.py

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,14 @@
3131
get_decode_context_model_parallel_rank,
3232
get_decode_context_model_parallel_world_size)
3333
from vllm.forward_context import ForwardContext, get_forward_context
34-
from vllm.utils import cdiv
34+
35+
from vllm_ascend.utils import vllm_version_is
36+
37+
if vllm_version_is("0.11.0"):
38+
from vllm.utils import cdiv
39+
else:
40+
from vllm.utils.math_utils import cdiv
41+
3542
from vllm.v1.attention.backends.utils import AttentionCGSupport
3643
from vllm.v1.core.sched.output import SchedulerOutput
3744
from vllm.v1.kv_cache_interface import AttentionSpec

vllm_ascend/attention/mla_v1.py

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,14 @@
2222
from vllm.logger import logger
2323
from vllm.model_executor.layers.linear import (LinearBase,
2424
UnquantizedLinearMethod)
25-
from vllm.utils import cdiv, round_down
25+
26+
from vllm_ascend.utils import vllm_version_is
27+
28+
if vllm_version_is("0.11.0"):
29+
from vllm.utils import cdiv, round_down
30+
else:
31+
from vllm.utils.math_utils import cdiv, round_down
32+
2633
from vllm.v1.attention.backends.utils import AttentionCGSupport
2734

2835
from vllm_ascend import envs

vllm_ascend/core/scheduler.py

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,14 @@
2222
from vllm.distributed.kv_events import KVEventBatch
2323
from vllm.logger import logger
2424
from vllm.multimodal import MULTIMODAL_REGISTRY, MultiModalRegistry
25-
from vllm.utils import cdiv
25+
26+
from vllm_ascend.utils import vllm_version_is
27+
28+
if vllm_version_is("0.11.0"):
29+
from vllm.utils import cdiv
30+
else:
31+
from vllm.utils.math_utils import cdiv
32+
2633
from vllm.v1.core.kv_cache_manager import KVCacheBlocks
2734
from vllm.v1.core.sched.output import NewRequestData, SchedulerOutput
2835
from vllm.v1.core.sched.scheduler import Scheduler

vllm_ascend/distributed/mooncake/config_data.py

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,15 @@
88
import torch
99
from vllm.distributed.kv_transfer.kv_connector.v1.base import \
1010
KVConnectorMetadata
11-
from vllm.utils import cdiv, logger
11+
from vllm.utils import logger
12+
13+
from vllm_ascend.utils import vllm_version_is
14+
15+
if vllm_version_is("0.11.0"):
16+
from vllm.utils import cdiv
17+
else:
18+
from vllm.utils.math_utils import cdiv
19+
1220
from vllm.v1.core.sched.output import NewRequestData
1321

1422

vllm_ascend/patch/platform/patch_mamba_config.py

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,14 @@
33
from vllm.logger import init_logger
44
from vllm.model_executor.models import ModelRegistry
55
from vllm.model_executor.models.config import MambaModelConfig
6-
from vllm.utils import cdiv
6+
7+
from vllm_ascend.utils import vllm_version_is
8+
9+
if vllm_version_is("0.11.0"):
10+
from vllm.utils import cdiv
11+
else:
12+
from vllm.utils.math_utils import cdiv
13+
714
from vllm.v1.kv_cache_interface import FullAttentionSpec, MambaSpec
815

916
from vllm_ascend.utils import vllm_version_is

vllm_ascend/spec_decode/mtp_proposer.py

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,14 @@
1515
from vllm.model_executor.models.deepseek_mtp import DeepSeekMTP
1616
from vllm.model_executor.models.deepseek_v2 import DeepseekV32IndexerCache
1717
from vllm.model_executor.models.llama_eagle3 import Eagle3LlamaForCausalLM
18-
from vllm.utils import cdiv
18+
19+
from vllm_ascend.utils import vllm_version_is
20+
21+
if vllm_version_is("0.11.0"):
22+
from vllm.utils import cdiv
23+
else:
24+
from vllm.utils.math_utils import cdiv
25+
1926
from vllm.v1.attention.backends.utils import (AttentionMetadataBuilder,
2027
CommonAttentionMetadata)
2128
from vllm.v1.core.sched.output import SchedulerOutput

0 commit comments

Comments
 (0)