We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent adae0c1, commit 73a99cc (Copy full SHA for 73a99cc)
vllm/entrypoints/openai/serving_chat.py
@@ -691,11 +691,13 @@ async def chat_completion_stream_generator(
691
if self.use_harmony:
692
harmony_parser = harmony_parsers[i]
693
prev_recipient = harmony_parser.current_recipient
694
+ delta_text = ""
695
for token_id in output.token_ids:
696
harmony_parser.process(token_id)
697
+ delta_text += (harmony_parser.last_content_delta
698
+ or "")
699
cur_channel = harmony_parser.current_channel
700
cur_recipient = harmony_parser.current_recipient
- delta_text = harmony_parser.last_content_delta or ""
701
else:
702
delta_text = output.text
703
0 commit comments