1 file changed: +5 -3 lines changed
Original file line number | Diff line number | Diff line change
11# SPDX-License-Identifier: Apache-2.0
22# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
33import functools
4- from typing import List , Optional
4+ from typing import ClassVar , List , Optional
55
66import torch
77
1111from vllm .attention .selector import get_attn_backend
1212from vllm .config import CacheConfig , QuantizationConfig
1313from vllm .v1 .attention .backends .utils import (
14- CommonAttentionMetadata , make_local_attention_virtual_batches ,
15- subclass_attention_backend )
14+ AttentionCGSupport , CommonAttentionMetadata ,
15+ make_local_attention_virtual_batches , subclass_attention_backend )
1616
1717from ..layer import Attention
1818
@@ -28,6 +28,8 @@ def create_chunked_local_attention_backend(
2828 underlying_builder = underlying_attn_backend .get_builder_cls ()
2929
3030 class ChunkedLocalAttentionBuilder (underlying_builder ): # type: ignore
31+ cudagraph_support : ClassVar [AttentionCGSupport ] = \
32+ AttentionCGSupport .NEVER
3133
3234 def build (self ,
3335 common_prefix_len : int ,
You can’t perform that action at this time.
0 commit comments