47 lines
1.4 KiB
Python
47 lines
1.4 KiB
Python
# SPDX-License-Identifier: Apache-2.0
|
|
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
|
|
|
|
|
|
from fastapi import APIRouter, FastAPI, Request
|
|
from fastapi.responses import Response
|
|
|
|
from vllm.config import ProfilerConfig
|
|
from vllm.engine.protocol import EngineClient
|
|
from vllm.logger import init_logger
|
|
|
|
logger = init_logger(__name__)
|
|
|
|
router = APIRouter()
|
|
|
|
|
|
def engine_client(request: Request) -> EngineClient:
|
|
return request.app.state.engine_client
|
|
|
|
|
|
@router.post("/start_profile")
|
|
async def start_profile(raw_request: Request):
|
|
logger.info("Starting profiler...")
|
|
await engine_client(raw_request).start_profile()
|
|
logger.info("Profiler started.")
|
|
return Response(status_code=200)
|
|
|
|
|
|
@router.post("/stop_profile")
|
|
async def stop_profile(raw_request: Request):
|
|
logger.info("Stopping profiler...")
|
|
await engine_client(raw_request).stop_profile()
|
|
logger.info("Profiler stopped.")
|
|
return Response(status_code=200)
|
|
|
|
|
|
def attach_router(app: FastAPI):
|
|
profiler_config = getattr(app.state.args, "profiler_config", None)
|
|
assert profiler_config is None or isinstance(profiler_config, ProfilerConfig)
|
|
if profiler_config is not None and profiler_config.profiler is not None:
|
|
logger.warning_once(
|
|
"Profiler with mode '%s' is enabled in the "
|
|
"API server. This should ONLY be used for local development!",
|
|
profiler_config.profiler,
|
|
)
|
|
app.include_router(router)
|