# vllm/vllm/platforms/__init__.py

from .interface import _Backend  # noqa: F401
from .interface import Platform, PlatformEnum, UnspecifiedPlatform

current_platform: Platform

# NOTE: we don't use `torch.version.cuda` / `torch.version.hip` because
# they only indicate the build configuration, not the runtime environment.
# For example, people can install a cuda build of pytorch but run on tpu.

# TPU probe: being able to import `libtpu` is treated as proof that the
# machine has TPUs. libtpu *can* be installed on a non-TPU host, but that is
# rare enough that "installed" is assumed to mean "TPU present".
# Any failure while importing counts as "no TPU".
try:
    import libtpu  # noqa: F401
except Exception:
    is_tpu = False
else:
    is_tpu = True

# CUDA probe: initialise NVML and check whether it reports at least one
# device. The flag starts out False so that any failure (pynvml missing,
# NVML failing to initialise, the device query raising) leaves it untouched.
is_cuda = False

try:
    import pynvml
    pynvml.nvmlInit()
    try:
        is_cuda = pynvml.nvmlDeviceGetCount() > 0
    finally:
        # Always release NVML once it has been initialised, even if the
        # device query above raised.
        pynvml.nvmlShutdown()
except Exception:
    # Best-effort detection: keep whatever value the flag currently has.
    pass

# ROCm probe: initialise the AMD SMI library and check whether it hands back
# at least one processor handle. The flag starts out False so that any
# failure (amdsmi missing, init failing, the query raising) leaves it as is.
is_rocm = False

try:
    import amdsmi
    amdsmi.amdsmi_init()
    try:
        is_rocm = len(amdsmi.amdsmi_get_processor_handles()) > 0
    finally:
        # Always shut the library down once it has been initialised, even if
        # the handle query above raised.
        amdsmi.amdsmi_shut_down()
except Exception:
    # Best-effort detection: keep whatever value the flag currently has.
    pass

# HPU probe: only checks whether a module spec for `habana_frameworks` can be
# found; the package itself is not imported here.
try:
    from importlib import util
    is_hpu = util.find_spec('habana_frameworks') is not None
except Exception:
    # Any failure during the lookup is treated as "not an HPU machine".
    is_hpu = False

# XPU probe: both Intel packages (IPEX and the oneCCL bindings) must import
# successfully, and torch must expose an `xpu` attribute that reports an
# available device. Any import error or runtime failure means "no XPU".
try:
    import intel_extension_for_pytorch  # noqa: F401
    import oneccl_bindings_for_pytorch  # noqa: F401
    import torch
    is_xpu = bool(hasattr(torch, 'xpu') and torch.xpu.is_available())
except Exception:
    is_xpu = False

# CPU probe: the CPU backend is recognised by the substring "cpu" appearing
# in the installed vllm distribution's version string.
try:
    from importlib.metadata import version
    is_cpu = "cpu" in version("vllm")
except Exception:
    # Covers vllm metadata not being available, among other failures.
    is_cpu = False

# Neuron probe: the platform is considered available when the
# `transformers_neuronx` package can be imported.
is_neuron = False
try:
    import transformers_neuronx  # noqa: F401
    is_neuron = True
except Exception:
    # Catch everything, not just ImportError, to match the other probes in
    # this module: a present-but-broken install can fail with errors other
    # than ImportError while its module body executes, and platform detection
    # must fall through to the next candidate rather than crash the import of
    # this package.
    pass

# OpenVINO probe: the OpenVINO backend is recognised by the substring
# "openvino" appearing in the installed vllm distribution's version string.
try:
    from importlib.metadata import version
    is_openvino = "openvino" in version("vllm")
except Exception:
    # Covers vllm metadata not being available, among other failures.
    is_openvino = False

# Select the single platform object for this process. The detection flags
# computed above are consulted in a fixed priority order and the first one
# that is set wins. Each backend module is imported inside its own branch, so
# only the module of the selected platform is imported by this chain.
if is_tpu:
    # people might install pytorch built with cuda but run on tpu
    # so we need to check tpu first
    from .tpu import TpuPlatform
    current_platform = TpuPlatform()
elif is_cuda:
    from .cuda import CudaPlatform
    current_platform = CudaPlatform()
elif is_rocm:
    from .rocm import RocmPlatform
    current_platform = RocmPlatform()
elif is_hpu:
    from .hpu import HpuPlatform
    current_platform = HpuPlatform()
elif is_xpu:
    from .xpu import XPUPlatform
    current_platform = XPUPlatform()
elif is_cpu:
    from .cpu import CpuPlatform
    current_platform = CpuPlatform()
elif is_neuron:
    from .neuron import NeuronPlatform
    current_platform = NeuronPlatform()
elif is_openvino:
    from .openvino import OpenVinoPlatform
    current_platform = OpenVinoPlatform()
else:
    # None of the probes succeeded: fall back to the placeholder platform.
    current_platform = UnspecifiedPlatform()

# Public names of this package. `_Backend` is imported above but is
# deliberately not listed here.
__all__ = ['Platform', 'PlatformEnum', 'current_platform']
[Platform][Refactor] Extract func `get_default_attn_backend` to `Platform` (#10358) Signed-off-by: Mengqing Cao <cmq0113@163.com> 2024-11-19 11:22:26 +08:00			`from .interface import _Backend # noqa: F401`
[Misc] Add a wrapper for torch.inference_mode (#6618) 2024-07-22 09:43:11 +08:00			`from .interface import Platform, PlatformEnum, UnspecifiedPlatform`
[hardware][misc] introduce platform abstraction (#6080) 2024-07-03 11:12:22 +08:00
[hardware] unify usage of is_tpu to current_platform.is_tpu() (#7102) 2024-08-13 15:16:42 +08:00			`current_platform: Platform`
[hardware][misc] introduce platform abstraction (#6080) 2024-07-03 11:12:22 +08:00
[doc] fix doc build error caused by msgspec (#7659) 2024-08-20 08:50:59 +08:00			# NOTE: we don't use `torch.version.cuda` / `torch.version.hip` because
			`# they only indicate the build configuration, not the runtime environment.`
			`# For example, people can install a cuda build of pytorch but run on tpu.`

			`is_tpu = False`
			`try:`
[TPU] Avoid initializing TPU runtime in is_tpu (#7763) 2024-08-22 12:31:49 +08:00			`# While it's technically possible to install libtpu on a non-TPU machine,`
			`# this is a very uncommon scenario. Therefore, we assume that libtpu is`
			`# installed if and only if the machine has TPUs.`
			`import libtpu # noqa: F401`
[doc] fix doc build error caused by msgspec (#7659) 2024-08-20 08:50:59 +08:00			`is_tpu = True`
			`except Exception:`
			`pass`

			`is_cuda = False`

			`try:`
			`import pynvml`
			`pynvml.nvmlInit()`
			`try:`
			`if pynvml.nvmlDeviceGetCount() > 0:`
			`is_cuda = True`
			`finally:`
			`pynvml.nvmlShutdown()`
			`except Exception:`
			`pass`

			`is_rocm = False`

[hardware] unify usage of is_tpu to current_platform.is_tpu() (#7102) 2024-08-13 15:16:42 +08:00			`try:`
[doc] fix doc build error caused by msgspec (#7659) 2024-08-20 08:50:59 +08:00			`import amdsmi`
			`amdsmi.amdsmi_init()`
			`try:`
			`if len(amdsmi.amdsmi_get_processor_handles()) > 0:`
			`is_rocm = True`
			`finally:`
			`amdsmi.amdsmi_shut_down()`
			`except Exception:`
			`pass`
[hardware] unify usage of is_tpu to current_platform.is_tpu() (#7102) 2024-08-13 15:16:42 +08:00
[Hardware][Intel-Gaudi] Add Intel Gaudi (HPU) inference backend (#6143) Signed-off-by: yuwenzho <yuwen.zhou@intel.com> Signed-off-by: Chendi.Xue <chendi.xue@intel.com> Signed-off-by: Bob Zhu <bob.zhu@intel.com> Signed-off-by: zehao-intel <zehao.huang@intel.com> Signed-off-by: Konrad Zawora <kzawora@habana.ai> Co-authored-by: Kunshang Ji <kunshang.ji@intel.com> Co-authored-by: Sanju C Sudhakaran <scsudhakaran@habana.ai> Co-authored-by: Michal Adamczyk <madamczyk@habana.ai> Co-authored-by: Marceli Fylcek <mfylcek@habana.ai> Co-authored-by: Himangshu Lahkar <49579433+hlahkar@users.noreply.github.com> Co-authored-by: Vivek Goel <vgoel@habana.ai> Co-authored-by: yuwenzho <yuwen.zhou@intel.com> Co-authored-by: Dominika Olszewska <dolszewska@habana.ai> Co-authored-by: barak goldberg <149692267+bgoldberg-habana@users.noreply.github.com> Co-authored-by: Michal Szutenberg <37601244+szutenberg@users.noreply.github.com> Co-authored-by: Jan Kaniecki <jkaniecki@habana.ai> Co-authored-by: Agata Dobrzyniewicz <160237065+adobrzyniewicz-habana@users.noreply.github.com> Co-authored-by: Krzysztof Wisniewski <kwisniewski@habana.ai> Co-authored-by: Dudi Lester <160421192+dudilester@users.noreply.github.com> Co-authored-by: Ilia Taraban <tarabanil@gmail.com> Co-authored-by: Chendi.Xue <chendi.xue@intel.com> Co-authored-by: Michał Kuligowski <mkuligowski@habana.ai> Co-authored-by: Jakub Maksymczuk <jmaksymczuk@habana.ai> Co-authored-by: Tomasz Zielinski <85164140+tzielinski-habana@users.noreply.github.com> Co-authored-by: Sun Choi <schoi@habana.ai> Co-authored-by: Iryna Boiko <iboiko@habana.ai> Co-authored-by: Bob Zhu <41610754+czhu15@users.noreply.github.com> Co-authored-by: hlin99 <73271530+hlin99@users.noreply.github.com> Co-authored-by: Zehao Huang <zehao.huang@intel.com> Co-authored-by: Andrzej Kotłowski <Andrzej.Kotlowski@intel.com> Co-authored-by: Yan Tomsinsky <73292515+Yantom1@users.noreply.github.com> Co-authored-by: Nir David <ndavid@habana.ai> Co-authored-by: Yu-Zhou 
<yu.zhou@intel.com> Co-authored-by: Ruheena Suhani Shaik <rsshaik@habana.ai> Co-authored-by: Karol Damaszke <kdamaszke@habana.ai> Co-authored-by: Marcin Swiniarski <mswiniarski@habana.ai> Co-authored-by: Woosuk Kwon <woosuk.kwon@berkeley.edu> Co-authored-by: Jacek Czaja <jacek.czaja@intel.com> Co-authored-by: Jacek Czaja <jczaja@habana.ai> Co-authored-by: Yuan <yuan.zhou@outlook.com> 2024-11-06 17:09:10 +08:00			`is_hpu = False`
			`try:`
			`from importlib import util`
			`is_hpu = util.find_spec('habana_frameworks') is not None`
			`except Exception:`
			`pass`

[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-28 14:45:50 +08:00			`is_xpu = False`

			`try:`
[Bugfix] Fix multi nodes TP+PP for XPU (#8884) Signed-off-by: YiSheng5 <syhm@mail.ustc.edu.cn> Signed-off-by: yan ma <yan.ma@intel.com> Co-authored-by: YiSheng5 <syhm@mail.ustc.edu.cn> 2024-10-30 12:34:45 +08:00			`# installed IPEX if the machine has XPUs.`
			`import intel_extension_for_pytorch # noqa: F401`
			`import oneccl_bindings_for_pytorch # noqa: F401`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-28 14:45:50 +08:00			`import torch`
			`if hasattr(torch, 'xpu') and torch.xpu.is_available():`
			`is_xpu = True`
			`except Exception:`
			`pass`

[Hardware][Intel] Support compressed-tensor W8A8 for CPU backend (#7257) 2024-09-12 00:46:46 +08:00			`is_cpu = False`
			`try:`
			`from importlib.metadata import version`
			`is_cpu = "cpu" in version("vllm")`
			`except Exception:`
			`pass`

[Neuron] [Bugfix] Fix neuron startup (#9374) Co-authored-by: Jerzy Zagorski <jzagorsk@amazon.com> 2024-10-22 20:51:41 +08:00			`is_neuron = False`
			`try:`
			`import transformers_neuronx # noqa: F401`
			`is_neuron = True`
			`except ImportError:`
			`pass`

[Hardware][openvino] is_openvino --> current_platform.is_openvino (#9716) 2024-10-26 18:59:06 +08:00			`is_openvino = False`
			`try:`
			`from importlib.metadata import version`
			`is_openvino = "openvino" in version("vllm")`
			`except Exception:`
			`pass`

[doc] fix doc build error caused by msgspec (#7659) 2024-08-20 08:50:59 +08:00			`if is_tpu:`
[hardware] unify usage of is_tpu to current_platform.is_tpu() (#7102) 2024-08-13 15:16:42 +08:00			`# people might install pytorch built with cuda but run on tpu`
			`# so we need to check tpu first`
			`from .tpu import TpuPlatform`
			`current_platform = TpuPlatform()`
[doc] fix doc build error caused by msgspec (#7659) 2024-08-20 08:50:59 +08:00			`elif is_cuda:`
[hardware][misc] introduce platform abstraction (#6080) 2024-07-03 11:12:22 +08:00			`from .cuda import CudaPlatform`
			`current_platform = CudaPlatform()`
[doc] fix doc build error caused by msgspec (#7659) 2024-08-20 08:50:59 +08:00			`elif is_rocm:`
[hardware][misc] introduce platform abstraction (#6080) 2024-07-03 11:12:22 +08:00			`from .rocm import RocmPlatform`
			`current_platform = RocmPlatform()`
[Hardware][Intel-Gaudi] Add Intel Gaudi (HPU) inference backend (#6143) Signed-off-by: yuwenzho <yuwen.zhou@intel.com> Signed-off-by: Chendi.Xue <chendi.xue@intel.com> Signed-off-by: Bob Zhu <bob.zhu@intel.com> Signed-off-by: zehao-intel <zehao.huang@intel.com> Signed-off-by: Konrad Zawora <kzawora@habana.ai> Co-authored-by: Kunshang Ji <kunshang.ji@intel.com> Co-authored-by: Sanju C Sudhakaran <scsudhakaran@habana.ai> Co-authored-by: Michal Adamczyk <madamczyk@habana.ai> Co-authored-by: Marceli Fylcek <mfylcek@habana.ai> Co-authored-by: Himangshu Lahkar <49579433+hlahkar@users.noreply.github.com> Co-authored-by: Vivek Goel <vgoel@habana.ai> Co-authored-by: yuwenzho <yuwen.zhou@intel.com> Co-authored-by: Dominika Olszewska <dolszewska@habana.ai> Co-authored-by: barak goldberg <149692267+bgoldberg-habana@users.noreply.github.com> Co-authored-by: Michal Szutenberg <37601244+szutenberg@users.noreply.github.com> Co-authored-by: Jan Kaniecki <jkaniecki@habana.ai> Co-authored-by: Agata Dobrzyniewicz <160237065+adobrzyniewicz-habana@users.noreply.github.com> Co-authored-by: Krzysztof Wisniewski <kwisniewski@habana.ai> Co-authored-by: Dudi Lester <160421192+dudilester@users.noreply.github.com> Co-authored-by: Ilia Taraban <tarabanil@gmail.com> Co-authored-by: Chendi.Xue <chendi.xue@intel.com> Co-authored-by: Michał Kuligowski <mkuligowski@habana.ai> Co-authored-by: Jakub Maksymczuk <jmaksymczuk@habana.ai> Co-authored-by: Tomasz Zielinski <85164140+tzielinski-habana@users.noreply.github.com> Co-authored-by: Sun Choi <schoi@habana.ai> Co-authored-by: Iryna Boiko <iboiko@habana.ai> Co-authored-by: Bob Zhu <41610754+czhu15@users.noreply.github.com> Co-authored-by: hlin99 <73271530+hlin99@users.noreply.github.com> Co-authored-by: Zehao Huang <zehao.huang@intel.com> Co-authored-by: Andrzej Kotłowski <Andrzej.Kotlowski@intel.com> Co-authored-by: Yan Tomsinsky <73292515+Yantom1@users.noreply.github.com> Co-authored-by: Nir David <ndavid@habana.ai> Co-authored-by: Yu-Zhou 
<yu.zhou@intel.com> Co-authored-by: Ruheena Suhani Shaik <rsshaik@habana.ai> Co-authored-by: Karol Damaszke <kdamaszke@habana.ai> Co-authored-by: Marcin Swiniarski <mswiniarski@habana.ai> Co-authored-by: Woosuk Kwon <woosuk.kwon@berkeley.edu> Co-authored-by: Jacek Czaja <jacek.czaja@intel.com> Co-authored-by: Jacek Czaja <jczaja@habana.ai> Co-authored-by: Yuan <yuan.zhou@outlook.com> 2024-11-06 17:09:10 +08:00			`elif is_hpu:`
			`from .hpu import HpuPlatform`
			`current_platform = HpuPlatform()`
[Bugfix][Intel] Fix XPU Dockerfile Build (#7824) Signed-off-by: tylertitsworth <tyler.titsworth@intel.com> Co-authored-by: youkaichao <youkaichao@126.com> 2024-09-28 14:45:50 +08:00			`elif is_xpu:`
			`from .xpu import XPUPlatform`
			`current_platform = XPUPlatform()`
[Hardware][Intel] Support compressed-tensor W8A8 for CPU backend (#7257) 2024-09-12 00:46:46 +08:00			`elif is_cpu:`
			`from .cpu import CpuPlatform`
			`current_platform = CpuPlatform()`
[Neuron] [Bugfix] Fix neuron startup (#9374) Co-authored-by: Jerzy Zagorski <jzagorsk@amazon.com> 2024-10-22 20:51:41 +08:00			`elif is_neuron:`
			`from .neuron import NeuronPlatform`
			`current_platform = NeuronPlatform()`
[Hardware][openvino] is_openvino --> current_platform.is_openvino (#9716) 2024-10-26 18:59:06 +08:00			`elif is_openvino:`
			`from .openvino import OpenVinoPlatform`
			`current_platform = OpenVinoPlatform()`
[hardware][misc] introduce platform abstraction (#6080) 2024-07-03 11:12:22 +08:00			`else:`
[Misc] Add a wrapper for torch.inference_mode (#6618) 2024-07-22 09:43:11 +08:00			`current_platform = UnspecifiedPlatform()`
[hardware][misc] introduce platform abstraction (#6080) 2024-07-03 11:12:22 +08:00
			`__all__ = ['Platform', 'PlatformEnum', 'current_platform']`