We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent aa7ea20 commit 5473fb6Copy full SHA for 5473fb6
vllm_ascend/ascend_config.py
@@ -56,7 +56,8 @@ def __init__(self, torchair_graph_config):
56
"graph_batch_sizes_init", False)
57
self.enable_multistream_shared_expert = torchair_graph_config.get(
58
"enable_multistream_shared_expert", False)
59
- self.enable_kv_nz = bool(int(os.getenv("VLLM_ASCEND_ENABLE_KV_NZ", '0')))
+ self.enable_kv_nz = bool(
60
+ int(os.getenv("VLLM_ASCEND_ENABLE_KV_NZ", '0')))
61
62
if not isinstance(self.graph_batch_sizes, list):
63
raise TypeError("graph_batch_sizes must be list[int]")
0 commit comments