We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4331bc8 commit 82a3644 Copy full SHA for 82a3644
vllm_ascend/worker/worker_v1.py
@@ -87,6 +87,13 @@ def __init__(
87
distributed_init_method=distributed_init_method,
88
is_driver_worker=is_driver_worker)
89
90
+ if vllm_config.kv_transfer_config is not None:
91
+ self.kv_rank = vllm_config.kv_transfer_config.kv_rank
92
+ self.kv_parallel_size = vllm_config.kv_transfer_config.kv_parallel_size
93
+ else:
94
+ self.kv_rank = 0
95
+ self.kv_parallel_size = 0
96
+
97
# Try to import mindie_turbo to accelerate vLLM inference.
98
try_register_lib(
99
"mindie_turbo",
0 commit comments