mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 05:25:00 +08:00
fix: only response [DONE] once when streaming response. (#378)
This commit is contained in:
parent
1c395b4eaa
commit
b396cb4998
@ -269,7 +269,7 @@ async def create_chat_completion(raw_request: Request):
|
||||
finish_reason=output.finish_reason,
|
||||
)
|
||||
yield f"data: {response_json}\n\n"
|
||||
yield "data: [DONE]\n\n"
|
||||
yield "data: [DONE]\n\n"
|
||||
|
||||
# Streaming response
|
||||
if request.stream:
|
||||
@ -465,7 +465,7 @@ async def create_completion(raw_request: Request):
|
||||
finish_reason=output.finish_reason,
|
||||
)
|
||||
yield f"data: {response_json}\n\n"
|
||||
yield "data: [DONE]\n\n"
|
||||
yield "data: [DONE]\n\n"
|
||||
|
||||
# Streaming response
|
||||
if stream:
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user