We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent dce78b8 · commit 98d234a (copy full SHA for 98d234a)
vllm_ascend/worker/worker_v1.py
@@ -181,7 +181,8 @@ def determine_available_memory(self) -> int:
181
peak_memory = torch_npu.npu.memory_stats()["allocated_bytes.all.peak"] + \
182
chuked_prefill_work_space_size
183
else:
184
- peak_memory = torch_npu.npu.memory_stats()["allocated_bytes.all.peak"]
+ peak_memory = torch_npu.npu.memory_stats(
185
+ )["allocated_bytes.all.peak"]
186
# TODO: don`t need impl this func after empty_cache in
187
# Worker.determine_num_available_blocks() unified`
188
NPUPlatform.empty_cache()
0 commit comments