diff --git a/vllm/attention/backends/sage_attention.py b/vllm/attention/backends/sage_attention.py index 4ecd5974d3103..fe32aacd5fb18 100644 --- a/vllm/attention/backends/sage_attention.py +++ b/vllm/attention/backends/sage_attention.py @@ -275,7 +275,7 @@ def get_seq_len_block_table_args( class SageAttentionMetadataBuilder( - AttentionMetadataBuilder[SageAttentionMetadata]): + AttentionMetadataBuilder[SageAttentionMetadata]): def __init__(self, input_builder: ModelInputForCPUBuilder) -> None: self.chunked_prefill = input_builder.chunked_prefill