From 8820821b59121192205077d0cdc56490e215b9fb Mon Sep 17 00:00:00 2001 From: AlexZhao Date: Mon, 26 May 2025 13:51:27 +0800 Subject: [PATCH] [Misc] Fixed the abnormally high TTFT issue in the PD disaggregation example (#18644) Signed-off-by: zhaohaidao Signed-off-by: zhaohaiyuan Co-authored-by: zhaohaiyuan --- .../lmcache/disagg_prefill_lmcache_v1/disagg_proxy_server.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/lmcache/disagg_prefill_lmcache_v1/disagg_proxy_server.py b/examples/lmcache/disagg_prefill_lmcache_v1/disagg_proxy_server.py index 8db93bc8931b2..32d36da9f2e86 100644 --- a/examples/lmcache/disagg_prefill_lmcache_v1/disagg_proxy_server.py +++ b/examples/lmcache/disagg_prefill_lmcache_v1/disagg_proxy_server.py @@ -135,7 +135,7 @@ async def handle_completions(request: Request): yield chunk return StreamingResponse(generate_stream(), - media_type="application/json") + media_type="text/event-stream") except Exception as e: import sys @@ -172,7 +172,7 @@ async def handle_chat_completions(request: Request): yield chunk return StreamingResponse(generate_stream(), - media_type="application/json") + media_type="text/event-stream") except Exception as e: import sys