From be54f8e5c4083831aeaa4a1da9e248ddafcef54b Mon Sep 17 00:00:00 2001
From: Nicolas Frenay
Date: Thu, 6 Jul 2023 20:15:17 -0500
Subject: [PATCH] [Fix] Change /generate response-type to json for non-streaming (#374)

---
 vllm/entrypoints/api_server.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/vllm/entrypoints/api_server.py b/vllm/entrypoints/api_server.py
index e2b709ce..58ea2e22 100644
--- a/vllm/entrypoints/api_server.py
+++ b/vllm/entrypoints/api_server.py
@@ -3,7 +3,7 @@ import json
 from typing import AsyncGenerator
 
 from fastapi import BackgroundTasks, FastAPI, Request
-from fastapi.responses import Response, StreamingResponse
+from fastapi.responses import JSONResponse, Response, StreamingResponse
 import uvicorn
 
 from vllm.engine.arg_utils import AsyncEngineArgs
@@ -64,7 +64,7 @@ async def generate(request: Request) -> Response:
     prompt = final_output.prompt
     text_outputs = [prompt + output.text for output in final_output.outputs]
     ret = {"text": text_outputs}
-    return Response(content=json.dumps(ret))
+    return JSONResponse(ret)
 
 
 if __name__ == "__main__":