From 3b08fe2b13ced7fe76abe17c99614dd36e4b4788 Mon Sep 17 00:00:00 2001 From: youkaichao Date: Sun, 7 Jul 2024 15:11:12 -0700 Subject: [PATCH] [misc][frontend] log all available endpoints (#6195) Co-authored-by: Cody Yu --- vllm/entrypoints/api_server.py | 11 +++++++++++ vllm/entrypoints/openai/api_server.py | 8 ++++++++ 2 files changed, 19 insertions(+) diff --git a/vllm/entrypoints/api_server.py b/vllm/entrypoints/api_server.py index feb904c5..66941442 100644 --- a/vllm/entrypoints/api_server.py +++ b/vllm/entrypoints/api_server.py @@ -16,10 +16,13 @@ from fastapi.responses import JSONResponse, Response, StreamingResponse from vllm.engine.arg_utils import AsyncEngineArgs from vllm.engine.async_llm_engine import AsyncLLMEngine +from vllm.logger import init_logger from vllm.sampling_params import SamplingParams from vllm.usage.usage_lib import UsageContext from vllm.utils import FlexibleArgumentParser, random_uuid +logger = init_logger("vllm.entrypoints.api_server") + TIMEOUT_KEEP_ALIVE = 5 # seconds. app = FastAPI() engine = None @@ -107,6 +110,14 @@ if __name__ == "__main__": engine_args, usage_context=UsageContext.API_SERVER) app.root_path = args.root_path + + logger.info("Available routes are:") + for route in app.routes: + if not hasattr(route, 'methods'): + continue + methods = ', '.join(route.methods) + logger.info("Route: %s, Methods: %s", route.path, methods) + uvicorn.run(app, host=args.host, port=args.port, diff --git a/vllm/entrypoints/openai/api_server.py b/vllm/entrypoints/openai/api_server.py index 76879c96..d3ed1ec7 100644 --- a/vllm/entrypoints/openai/api_server.py +++ b/vllm/entrypoints/openai/api_server.py @@ -240,6 +240,14 @@ if __name__ == "__main__": openai_serving_embedding = OpenAIServingEmbedding(engine, model_config, served_model_names) app.root_path = args.root_path + + logger.info("Available routes are:") + for route in app.routes: + if not hasattr(route, 'methods'): + continue + methods = ', '.join(route.methods) + logger.info("Route: %s, Methods: %s", route.path, methods) + uvicorn.run(app, host=args.host, port=args.port,