diff --git a/vllm/tokenizers/hf.py b/vllm/tokenizers/hf.py
index a7b565dca5d8f..2a95f9c82fbd3 100644
--- a/vllm/tokenizers/hf.py
+++ b/vllm/tokenizers/hf.py
@@ -58,7 +58,9 @@ def get_cached_tokenizer(tokenizer: HfTokenizer) -> HfTokenizer:
         def __reduce__(self):
             return get_cached_tokenizer, (tokenizer,)
 
-    CachedTokenizer.__name__ = f"Cached{tokenizer.__class__.__name__}"
+    # Preserve original class name for HuggingFace compatibility.
+    # Some processors validate tokenizer type by checking __name__.
+    CachedTokenizer.__name__ = tokenizer.__class__.__name__
 
     cached_tokenizer.__class__ = CachedTokenizer
     return cached_tokenizer