Skip to content

Commit 9757e24

Browse files
committed
tiny_fix
Signed-off-by: Icey <1790571317@qq.com>
1 parent 45cf486 commit 9757e24

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

vllm_ascend/worker/model_runner_v1.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2644,6 +2644,7 @@ def initialize_kv_cache(self, kv_cache_config: KVCacheConfig) -> None:
2644 2644
"""
2645 2645
kv_cache_config = deepcopy(kv_cache_config)
2646 2646
self.kv_cache_config = kv_cache_config
2647+
self.initialize_attn_backend(kv_cache_config)
2647 2648
self.use_hybrid_blocks = (len(self.attn_groups) > 1)
2648 2649
# NOTE: Currently, we determine whether we need `num_accepted_tokens` through `MambaSpec`.
2649 2650
self.need_accepted_tokens = any([
@@ -2653,7 +2654,6 @@ def initialize_kv_cache(self, kv_cache_config: KVCacheConfig) -> None:
2653 2654

2654 2655
self.may_reinitialize_input_batch(kv_cache_config)
2655 2656
self.may_add_encoder_only_layers_to_kv_cache_config()
2656-
self.initialize_attn_backend(kv_cache_config)
2657 2657

2658 2658
if self.ascend_config.is_deepseek_sfa:
2659 2659
kv_caches = self.initialize_kv_cache_tensors_deepseek_sfa(

0 commit comments

Comments
 (0)