Fix draft attention metadata mapping for non-EAGLE drafters

jiahanc · jiahanc · commit 677ebddf6746 · 2025-09-23T09:26:35.000-07:00
Signed-off-by: jiahanc <173873397+jiahanc@users.noreply.github.com>
diff --git a/vllm/v1/worker/gpu_model_runner.py b/vllm/v1/worker/gpu_model_runner.py
@@ -1178,11 +1178,13 @@ def _prepare_inputs(
             )
 
             if (self.speculative_config
-                    and spec_decode_common_attn_metadata is None
-                    and isinstance(self.drafter, EagleProposer)
-                    and self.drafter.attn_layer_names[0]
-                    in kv_cache_group_spec.layer_names):
-                spec_decode_common_attn_metadata = common_attn_metadata
+                    and spec_decode_common_attn_metadata is None):
+                if isinstance(self.drafter, EagleProposer):
+                    if (self.drafter.attn_layer_names[0]
+                            in kv_cache_group_spec.layer_names):
+                        spec_decode_common_attn_metadata = common_attn_metadata
+                else:
+                    spec_decode_common_attn_metadata = common_attn_metadata
 
             for attn_group in self.attn_groups[kv_cache_group_id]:
                 # Prepare for cascade attention if enabled & beneficial.