Skip to content

vllm.v1.worker.xpu_model_runner

XPUModelRunner

Bases: GPUModelRunner

A model runner for XPU devices.

Source code in vllm/v1/worker/xpu_model_runner.py
class XPUModelRunner(GPUModelRunner):
    """GPUModelRunner specialization used when running on XPU devices."""

    def __init__(self, vllm_config: VllmConfig, device: torch.device) -> None:
        """Run the base initializer, then switch cascade attention off.

        Args:
            vllm_config: Configuration passed through unchanged to
                ``GPUModelRunner.__init__``.
            device: Torch device passed through unchanged to
                ``GPUModelRunner.__init__``.
        """
        # The base initializer executes inside _torch_cuda_wrapper().
        # NOTE(review): presumably this adapts CUDA-specific torch calls so
        # the GPU runner's setup works on XPU -- confirm against the helper.
        with _torch_cuda_wrapper():
            super().__init__(vllm_config, device)

        # Assigned after the base initializer so this value takes precedence
        # over whatever the parent set.
        # FIXME: To be verified.
        self.cascade_attn_enabled = False

XPUModelRunnerV2

Bases: GPUModelRunner

A model runner for XPU devices.

Source code in vllm/v1/worker/xpu_model_runner.py
class XPUModelRunnerV2(GPUModelRunnerV2):
    """GPUModelRunnerV2 specialization used when running on XPU devices."""

    def __init__(self, vllm_config: VllmConfig, device: torch.device) -> None:
        """Run the base initializer inside the torch CUDA wrapper context.

        Args:
            vllm_config: Configuration passed through unchanged to
                ``GPUModelRunnerV2.__init__``.
            device: Torch device passed through unchanged to
                ``GPUModelRunnerV2.__init__``.
        """
        # No XPU-specific state is added here; the only difference from the
        # parent is that its initializer runs under _torch_cuda_wrapper().
        # NOTE(review): presumably the wrapper adapts CUDA-specific torch
        # calls for XPU -- confirm against the helper's definition.
        with _torch_cuda_wrapper():
            super().__init__(vllm_config, device)