Bases: GPUModelRunner
A model runner for XPU devices.
Source code in vllm/v1/worker/xpu_model_runner.py
class XPUModelRunner(GPUModelRunner):
    """Model runner specialised for XPU devices.

    Construction is delegated to ``GPUModelRunner``; afterwards cascade
    attention is switched off. Device synchronization goes through
    ``torch.xpu``.
    """

    def __init__(self, vllm_config: VllmConfig, device: torch.device) -> None:
        """Initialise through the parent runner, then disable cascade attention.

        Args:
            vllm_config: Configuration object, forwarded unchanged to the
                parent constructor.
            device: Torch device, forwarded unchanged to the parent
                constructor.
        """
        super().__init__(vllm_config, device)

        # FIXME: To be verified. Until then cascade attention stays off.
        self.cascade_attn_enabled = False

    def _init_device_properties(self) -> None:
        """Do nothing: this runner initialises no device properties here."""

    def _sync_device(self) -> None:
        """Synchronize the device by calling ``torch.xpu.synchronize()``."""
        torch.xpu.synchronize()
cascade_attn_enabled
instance-attribute
cascade_attn_enabled = False
__init__
__init__(vllm_config: VllmConfig, device: torch.device)
Source code in vllm/v1/worker/xpu_model_runner.py
def __init__(self, vllm_config: VllmConfig, device: torch.device) -> None:
    """Initialise through the parent runner, then disable cascade attention.

    Args:
        vllm_config: Configuration object, forwarded unchanged to the
            parent constructor.
        device: Torch device, forwarded unchanged to the parent
            constructor.
    """
    super().__init__(vllm_config, device)

    # FIXME: To be verified. Until then cascade attention stays off.
    self.cascade_attn_enabled = False
_init_device_properties
_init_device_properties() -> None
Source code in vllm/v1/worker/xpu_model_runner.py
def _init_device_properties(self) -> None:
    """Do nothing: this runner initialises no device properties here."""
_sync_device
_sync_device() -> None
Source code in vllm/v1/worker/xpu_model_runner.py
def _sync_device(self) -> None:
    """Synchronize the device by calling ``torch.xpu.synchronize()``."""
    torch.xpu.synchronize()