We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent adcbd5a commit 874625d Copy full SHA for 874625d
vllm_ascend/distributed/mooncake_connector.py
@@ -109,7 +109,7 @@ def _retrieve_expired_requests(self):
109
request_id = next(iter(self.delayed_free_requests))
110
delay_start_time = self.delayed_free_requests[request_id]
111
if (current_time - delay_start_time
112
- > envs_ascend.VLLM_ASCEND_KVCACHE_DELAY_FREE_TIMEOUT):
+ > envs_ascend.VLLM_NIXL_ABORT_REQUEST_TIMEOUT):
113
self.delayed_free_requests.popitem(last=False)
114
expired_requests.add(request_id)
115
logger.info("Force freed request: %s", request_id)
0 commit comments