[Fix] Change /generate response-type to json for non-streaming (#374)

This commit is contained in:
Nicolas Frenay 2023-07-06 20:15:17 -05:00 committed by GitHub
parent b396cb4998
commit be54f8e5c4
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -3,7 +3,7 @@ import json
from typing import AsyncGenerator
from fastapi import BackgroundTasks, FastAPI, Request
-from fastapi.responses import Response, StreamingResponse
+from fastapi.responses import JSONResponse, Response, StreamingResponse
import uvicorn
from vllm.engine.arg_utils import AsyncEngineArgs
@@ -64,7 +64,7 @@ async def generate(request: Request) -> Response:
prompt = final_output.prompt
text_outputs = [prompt + output.text for output in final_output.outputs]
ret = {"text": text_outputs}
-return Response(content=json.dumps(ret))
+return JSONResponse(ret)
if __name__ == "__main__":