From 58eee5f2e05b74eb2cb1a3bbda9c04df4805e4cc Mon Sep 17 00:00:00 2001 From: Vadim Gimpelson <156319763+vadiklyutiy@users.noreply.github.com> Date: Sat, 2 Aug 2025 12:43:52 +0400 Subject: [PATCH] [PERF] Use faster way of decode in tokenizer: avoid useless list-to-list conversion (#20000) Signed-off-by: Vadim Gimpelson --- vllm/transformers_utils/tokenizer.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/vllm/transformers_utils/tokenizer.py b/vllm/transformers_utils/tokenizer.py index 24ddd35abea6..6a31a4198069 100644 --- a/vllm/transformers_utils/tokenizer.py +++ b/vllm/transformers_utils/tokenizer.py @@ -50,11 +50,12 @@ def decode_tokens( `skip_special_tokens=None` means to use the backend's default settings. """ + decode_method = getattr(tokenizer, "_decode", tokenizer.decode) if skip_special_tokens is not None: - return tokenizer.decode(token_ids, - skip_special_tokens=skip_special_tokens) + return decode_method(token_ids, + skip_special_tokens=skip_special_tokens) - return tokenizer.decode(token_ids) + return decode_method(token_ids) def encode_tokens(