Skip to content

Commit 82a3644

Browse files
committed
Fix: initialize kv_rank and kv_parallel_size based on kv_transfer_config
Signed-off-by: luolun <luolun1995@cmbchina.com>
1 parent 4331bc8 commit 82a3644

File tree

1 file changed

+7
-0
lines changed

1 file changed

+7
-0
lines changed

vllm_ascend/worker/worker_v1.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -87,6 +87,13 @@ def __init__(
8787
distributed_init_method=distributed_init_method,
8888
is_driver_worker=is_driver_worker)
8989

90+
if vllm_config.kv_transfer_config is not None:
91+
self.kv_rank = vllm_config.kv_transfer_config.kv_rank
92+
self.kv_parallel_size = vllm_config.kv_transfer_config.kv_parallel_size
93+
else:
94+
self.kv_rank = 0
95+
self.kv_parallel_size = 0
96+
9097
# Try to import mindie_turbo to accelerate vLLM inference.
9198
try_register_lib(
9299
"mindie_turbo",

0 commit comments

Comments
 (0)