mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-05 06:30:52 +08:00
[Model] Fixed stream generator for gpt-oss + spec-decoding (#26027)
Signed-off-by: Aleksandr Samarin <astrlrd@nebius.com>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
d8b1f9ccc3
commit
c40c0d9c82
@@ -691,11 +691,13 @@ class OpenAIServingChat(OpenAIServing):
 if self.use_harmony:
     harmony_parser = harmony_parsers[i]
     prev_recipient = harmony_parser.current_recipient
+    delta_text = ""
     for token_id in output.token_ids:
         harmony_parser.process(token_id)
+        delta_text += (harmony_parser.last_content_delta
+                       or "")
     cur_channel = harmony_parser.current_channel
     cur_recipient = harmony_parser.current_recipient
-    delta_text = harmony_parser.last_content_delta or ""
 else:
     delta_text = output.text
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user