Mirror of https://git.datalinker.icu/vllm-project/vllm.git (synced 2025-12-17 12:26:27 +08:00)
Fix handling of special tokens in decoding. (#418)
parent 51be365143
commit c6dfc3cdbe
@@ -276,6 +276,7 @@ class LLMEngine:
                     seq.get_last_token_id(),
                     skip_special_tokens=True,
                 )
+                if new_token is not None:
                     seq.output_tokens.append(new_token)
                     seq.output_text = new_output_text
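With this hunk, the engine only records a token when `detokenize_incrementally` actually produced one; when the new token id is a special token and `skip_special_tokens=True`, the function now returns `None` (see the hunks below) and the sequence output is left untouched. Below is a minimal, dependency-free sketch of that calling pattern; `Seq` and `decode_step` are illustrative stand-ins, not vLLM's real classes or functions.

# Minimal sketch of the guarded append above; `Seq` and `decode_step` are
# illustrative stand-ins, not vLLM's actual API.
from typing import List, Optional, Tuple


class Seq:
    def __init__(self) -> None:
        self.output_tokens: List[str] = []
        self.output_text: str = ""


def decode_step(prev_text: str, token_id: int,
                special_ids: List[int]) -> Tuple[Optional[str], str]:
    # Mirrors the fixed contract: special ids yield (None, prev_text) so the
    # caller can skip the append; otherwise return the token and the new text.
    if token_id in special_ids:
        return None, prev_text
    token = f"<tok{token_id}>"
    return token, prev_text + token


seq = Seq()
for token_id in (5, 2, 7):                      # pretend 2 is a special (EOS) id
    new_token, new_output_text = decode_step(seq.output_text, token_id, [2])
    if new_token is not None:                   # the guard added in this commit
        seq.output_tokens.append(new_token)
        seq.output_text = new_output_text

print(seq.output_tokens, seq.output_text)       # ['<tok5>', '<tok7>'] <tok5><tok7>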
@@ -80,6 +80,8 @@ def detokenize_incrementally(
         new_token: The new token as a string.
         output_text: The new output text as a string.
     """
+    if skip_special_tokens and (new_token_id in tokenizer.all_special_ids):
+        return None, prev_output_tokens
     new_token = tokenizer.convert_ids_to_tokens(
         new_token_id, skip_special_tokens=skip_special_tokens)
     output_tokens = prev_output_tokens + [new_token]
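The two added lines short-circuit before any id-to-string conversion when the incoming id is a special token and `skip_special_tokens=True`. The sketch below illustrates that control flow against a Hugging Face tokenizer; "gpt2" is only an example model, and `decode_new_token` is a simplified stand-in, not the full vLLM function.

# Sketch of the early return added above; simplified, not vLLM's full function.
from typing import List, Optional, Tuple

from transformers import AutoTokenizer, PreTrainedTokenizerBase


def decode_new_token(
    tokenizer: PreTrainedTokenizerBase,
    prev_output_tokens: List[str],
    new_token_id: int,
    skip_special_tokens: bool,
) -> Tuple[Optional[str], List[str]]:
    # Drop BOS/EOS/PAD and friends before doing any detokenization work.
    if skip_special_tokens and (new_token_id in tokenizer.all_special_ids):
        return None, prev_output_tokens
    new_token = tokenizer.convert_ids_to_tokens(new_token_id)
    return new_token, prev_output_tokens + [new_token]


tokenizer = AutoTokenizer.from_pretrained("gpt2")            # example model only
hello_id = tokenizer.convert_tokens_to_ids("hello")

print(decode_new_token(tokenizer, [], tokenizer.eos_token_id, True))  # (None, [])
print(decode_new_token(tokenizer, [], hello_id, True))       # ('hello', ['hello'])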
@@ -99,7 +101,7 @@ def detokenize_incrementally(
     sub_texts = []
     current_sub_text = []
     for token in output_tokens:
-        if skip_special_tokens and token in tokenizer.all_special_ids:
+        if skip_special_tokens and token in tokenizer.all_special_tokens:
             continue
         if token in tokenizer.added_tokens_encoder:
             if current_sub_text:
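The one-line change in this loop fixes a type mismatch: `token` is a string produced by `convert_ids_to_tokens`, while `all_special_ids` holds integer ids, so the old membership test never matched and special tokens could leak into the joined output text. `all_special_tokens` holds the string forms, which is what the loop actually has in hand. A small illustration with a Hugging Face tokenizer (again, "gpt2" is just an example model):

# Why the membership test changed: comparing a token *string* against integer
# ids never matches, so the special token was silently kept in the output.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("gpt2")            # example model only
token = tokenizer.convert_ids_to_tokens(tokenizer.eos_token_id)

print(token)                                  # <|endoftext|>
print(token in tokenizer.all_special_ids)     # False: str vs. int ids
print(token in tokenizer.all_special_tokens)  # True: string forms match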