[Bugfix] Fix BLIP-2 processing (#12412)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
This commit is contained in:
Cyrus Leung 2025-01-25 11:42:42 +08:00 committed by GitHub
parent 221d388cc5
commit fb30ee92ee
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -481,14 +481,14 @@ class Blip2MultiModalProcessor(BaseMultiModalProcessor[Blip2ProcessingInfo]):
bos_token_id = tokenizer.bos_token_id bos_token_id = tokenizer.bos_token_id
assert isinstance(bos_token_id, int) assert isinstance(bos_token_id, int)
image_token_id = vocab["image"] image_token_id = vocab["<image>"]
num_image_tokens = self.info.get_num_image_tokens() num_image_tokens = self.info.get_num_image_tokens()
image_tokens = [image_token_id] * num_image_tokens image_tokens = [image_token_id] * num_image_tokens
return [ return [
PromptReplacement( PromptReplacement(
modality="image", modality="image",
target="</s>", target=[bos_token_id],
replacement=PromptReplacementDetails( replacement=PromptReplacementDetails(
full=image_tokens + [bos_token_id], full=image_tokens + [bos_token_id],
features=image_tokens, features=image_tokens,