mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-26 19:34:31 +08:00
[gpt-oss] Fix harmony parser in streaming responses (#30205)
Signed-off-by: AlonKejzman <alonkeizman@gmail.com>
This commit is contained in:
parent
256a33ecb4
commit
bd6d5a7475
@ -811,6 +811,11 @@ class OpenAIServingChat(OpenAIServing):
|
|||||||
delta_text += harmony_parser.last_content_delta or ""
|
delta_text += harmony_parser.last_content_delta or ""
|
||||||
cur_channel = harmony_parser.current_channel
|
cur_channel = harmony_parser.current_channel
|
||||||
cur_recipient = harmony_parser.current_recipient
|
cur_recipient = harmony_parser.current_recipient
|
||||||
|
# handle the case where several tokens were generated at once
|
||||||
|
# including the final token, leading to a delta in the text
|
||||||
|
# while the current channel is still empty (start state)
|
||||||
|
if not cur_channel and delta_text:
|
||||||
|
cur_channel = "final"
|
||||||
else:
|
else:
|
||||||
delta_text = output.text
|
delta_text = output.text
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user