We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9a3963a, commit 60c0a7f (Copy full SHA for 60c0a7f)
vllm_ascend/attention/mla_v1.py
@@ -482,7 +482,7 @@ def __init__(
482
ascend_config = get_ascend_config()
483
self.enable_shared_expert_dp = ascend_config.enable_shared_expert_dp
484
self.enable_mla_prefetch = ascend_config.enable_mla_prefetch
485
- self.exable_kv_nz = ascend_config.enable_kv_nz
+ self.exable_kv_nz = ascend_config.torchair_graph_config.enable_kv_nz
486
487
# Adapt torch air graph mode with spec decoding.
488
speculative_config = get_current_vllm_config().speculative_config
0 commit comments