Skip to content

Commit 682865e

Browse files
author
wucong25
committed
add attn_groups judge
1 parent 2b4f7a5 commit 682865e

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

vllm_ascend/worker/model_runner_v1.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2697,7 +2697,8 @@ def initialize_kv_cache(self, kv_cache_config: KVCacheConfig) -> None:
26972697
self.kv_cache_config = kv_cache_config
26982698
self.may_add_encoder_only_layers_to_kv_cache_config()
26992699
# NOTE(cmq): initialize_attn_backend must be called before using self.attn_groups
2700-
self.initialize_attn_backend(kv_cache_config)
2700+
if not self.attn_groups:
2701+
self.initialize_attn_backend(kv_cache_config)
27012702
self.use_hybrid_blocks = (len(self.attn_groups) > 1)
27022703
# NOTE: Currently, we determine whether we need `num_accepted_tokens` through `MambaSpec`.
27032704
self.need_accepted_tokens = any([

0 commit comments

Comments
 (0)