Skip to content

vllm.entrypoints.serve.instrumentator.health

health async

health(raw_request: Request) -> Response

Health check.

Source code in vllm/entrypoints/serve/instrumentator/health.py
@router.get("/health", response_class=Response)
async def health(raw_request: Request) -> Response:
    """Report whether the server is currently healthy.

    Looks up the engine client for the incoming request and, when one is
    present, awaits its ``check_health()`` call.

    Args:
        raw_request: The incoming request, used to look up the engine client.

    Returns:
        An empty response with status 200 when there is no engine client or
        the health check completes, or status 503 when the health check
        raises ``EngineDeadError``.
    """
    engine = engine_client(raw_request)

    # A missing engine means a render-only server, which is always healthy,
    # so the engine is only probed when one is actually attached.
    if engine is not None:
        try:
            await engine.check_health()
        except EngineDeadError:
            # Only a dead engine maps to 503; any other error propagates.
            return Response(status_code=503)

    return Response(status_code=200)