[Misc] Minor type annotation fix (#3716)
parent 26422e477b
commit 395aa823ea
@@ -1,4 +1,5 @@
 from functools import lru_cache
+from typing import Type
 
 import torch
 
@@ -10,7 +11,7 @@ logger = init_logger(__name__)
 
 
 @lru_cache(maxsize=None)
-def get_attn_backend(dtype: torch.dtype) -> AttentionBackend:
+def get_attn_backend(dtype: torch.dtype) -> Type[AttentionBackend]:
     if _can_use_flash_attn(dtype):
         logger.info("Using FlashAttention backend.")
         from vllm.attention.backends.flash_attn import (  # noqa: F401
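For context, the new return annotation reflects how the selector is used: get_attn_backend returns a backend class rather than an instance, so Type[AttentionBackend] is the accurate hint. A minimal caller sketch follows; the vllm.attention.selector and vllm.attention.backends.abstract module paths are assumptions for illustration and are not taken from this diff.

from typing import Type

import torch

# Assumed module paths; only get_attn_backend and AttentionBackend
# appear in the diff above.
from vllm.attention.backends.abstract import AttentionBackend
from vllm.attention.selector import get_attn_backend

# The selector returns the backend *class*, not an instance, which is
# why the annotation is Type[AttentionBackend] rather than AttentionBackend.
backend_cls: Type[AttentionBackend] = get_attn_backend(torch.float16)
print(backend_cls.__name__)  # e.g. a FlashAttention backend class when flash-attn is usable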