Skip to content

vllm.v1.worker.xpu_model_runner

logger module-attribute

# Module-level logger, created by init_logger from this module's __name__.
logger = init_logger(__name__)

XPUModelRunner

Bases: GPUModelRunner

A model runner for XPU devices.

Source code in vllm/v1/worker/xpu_model_runner.py
class XPUModelRunner(GPUModelRunner):
    """Model runner for XPU devices, derived from GPUModelRunner."""

    def __init__(self, vllm_config: VllmConfig, device: torch.device):
        """Initialize via the base class, then disable cascade attention.

        Args:
            vllm_config: Configuration object forwarded to the base class.
            device: Torch device forwarded to the base class.
        """
        super().__init__(vllm_config, device)
        # FIXME: To be verified.
        self.cascade_attn_enabled = False

    def _init_device_properties(self) -> None:
        """Do nothing; this implementation has an empty body."""
        return None

    def _sync_device(self) -> None:
        """Synchronize by calling ``torch.xpu.synchronize()``."""
        torch.xpu.synchronize()

cascade_attn_enabled instance-attribute

cascade_attn_enabled = False

__init__

__init__(vllm_config: VllmConfig, device: device)
Source code in vllm/v1/worker/xpu_model_runner.py
def __init__(self, vllm_config: VllmConfig, device: torch.device):
    """Initialize via the base class, then disable cascade attention.

    Args:
        vllm_config: Configuration object forwarded to the base class.
        device: Torch device forwarded to the base class.
    """
    super().__init__(vllm_config, device)
    # FIXME: To be verified.
    self.cascade_attn_enabled = False

_init_device_properties

_init_device_properties() -> None
Source code in vllm/v1/worker/xpu_model_runner.py
def _init_device_properties(self) -> None:
    """Do nothing; this implementation has an empty body."""
    return None

_sync_device

_sync_device() -> None
Source code in vllm/v1/worker/xpu_model_runner.py
def _sync_device(self) -> None:
    """Synchronize by calling ``torch.xpu.synchronize()``."""
    torch.xpu.synchronize()