We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a5d37e2, commit 0b852f1 (Copy full SHA for 0b852f1)
vllm_ascend/ascend_config.py
@@ -71,7 +71,7 @@ def __init__(self, torchair_graph_config):
71
"enable_multistream_moe", False)
72
self.enable_view_optimize = torchair_graph_config.get(
73
"enable_view_optimize", True)
74
- self.enable_kv_nz = additional_config.get("enable_kv_nz", False)
+ self.enable_kv_nz = torchair_graph_config.get("enable_kv_nz", False)
75
76
if not isinstance(self.graph_batch_sizes, list):
77
raise TypeError("graph_batch_sizes must be list[int]")
0 commit comments