1 file changed: +5 -3 lines changed
Original file line number | Diff line number | Diff line change
11# SPDX-License-Identifier: Apache-2.0
22# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
33import functools
4- from typing import List , Optional
4+ from typing import ClassVar , List , Optional
55
66import torch
77
1212from vllm .config import CacheConfig
1313from vllm .model_executor .layers .quantization import QuantizationConfig
1414from vllm .v1 .attention .backends .utils import (
15- CommonAttentionMetadata , make_local_attention_virtual_batches ,
16- subclass_attention_backend )
15+ AttentionCGSupport , CommonAttentionMetadata ,
16+ make_local_attention_virtual_batches , subclass_attention_backend )
1717
1818from ..layer import Attention
1919
@@ -29,6 +29,8 @@ def create_chunked_local_attention_backend(
2929 underlying_builder = underlying_attn_backend .get_builder_cls ()
3030
3131 class ChunkedLocalAttentionBuilder (underlying_builder ): # type: ignore
32+ cudagraph_support : ClassVar [AttentionCGSupport ] = \
33+ AttentionCGSupport .NEVER
3234
3335 def build (self ,
3436 common_prefix_len : int ,
You can’t perform that action at this time.
0 commit comments