mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 01:55:01 +08:00
[Misc] Fixed the abnormally high TTFT issue in the PD disaggregation example (#18644)
Signed-off-by: zhaohaidao <zhaohaidao2008@hotmail.com>
Signed-off-by: zhaohaiyuan <zhaohaiyuan@xiaohongshu.com>
Co-authored-by: zhaohaiyuan <zhaohaiyuan@xiaohongshu.com>
This commit is contained in:
parent
fba0642704
commit
8820821b59
@@ -135,7 +135,7 @@ async def handle_completions(request: Request):
|
||||
yield chunk
|
||||
|
||||
return StreamingResponse(generate_stream(),
|
||||
media_type="application/json")
|
||||
media_type="text/event-stream")
|
||||
|
||||
except Exception as e:
|
||||
import sys
|
||||
@@ -172,7 +172,7 @@ async def handle_chat_completions(request: Request):
|
||||
yield chunk
|
||||
|
||||
return StreamingResponse(generate_stream(),
|
||||
media_type="application/json")
|
||||
media_type="text/event-stream")
|
||||
|
||||
except Exception as e:
|
||||
import sys
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user