File tree Expand file tree Collapse file tree 1 file changed +1
-3
lines changed Expand file tree Collapse file tree 1 file changed +1
-3
lines changed Original file line number Diff line number Diff line change 2222from vllm .platforms import current_platform
2323from vllm .utils import is_pin_memory_available
2424from vllm .v1 .attention .backends .flash_attn import FlashAttentionMetadata
25- from vllm .v1 .attention .backends .flashinfer import FlashInferMetadata
2625from vllm .v1 .attention .backends .tree_attn import (TreeAttentionMetadata ,
2726 TreeAttentionMetadataBuilder )
2827from vllm .v1 .attention .backends .triton_attn import TritonAttentionMetadata
@@ -133,8 +132,7 @@ def __init__(
133132 self .allowed_attn_types = tuple (rocm_types )
134133 else :
135134 self .allowed_attn_types = (FlashAttentionMetadata ,
136- TreeAttentionMetadata ,
137- FlashInferMetadata )
135+ TreeAttentionMetadata )
138136
139137 # Parse the speculative token tree.
140138 spec_token_tree = self .speculative_config .speculative_token_tree
You can’t perform that action at this time.
0 commit comments