diff --git a/vllm/v1/structured_output/backend_guidance.py b/vllm/v1/structured_output/backend_guidance.py index ec7e627191a5d..9150a28570bdd 100644 --- a/vllm/v1/structured_output/backend_guidance.py +++ b/vllm/v1/structured_output/backend_guidance.py @@ -46,7 +46,8 @@ class GuidanceBackend(StructuredOutputBackend): in vllm_config.decoding_config.guided_decoding_backend) tokenizer = tokenizer_group.get_lora_tokenizer(None) - self.ll_tokenizer = llguidance_hf.from_tokenizer(tokenizer, None) + self.ll_tokenizer = llguidance_hf.from_tokenizer( + tokenizer, self.vocab_size) def compile_grammar(self, request_type: StructuredOutputOptions, grammar_spec: str) -> StructuredOutputGrammar: