[Bugfix] Update InternVL input mapper to support image embeds (#9351)
This commit is contained in:
parent
8e836d982a
commit
55e081fbad
@@ -342,6 +342,8 @@ class InternVLInputPipeline:
|
|||||||
elif is_list_of(data, Image.Image):
|
elif is_list_of(data, Image.Image):
|
||||||
# we can't stack here because images may have different num_patches
|
# we can't stack here because images may have different num_patches
|
||||||
data = [image_pixel_values_mapper(img) for img in data]
|
data = [image_pixel_values_mapper(img) for img in data]
|
||||||
|
else:
|
||||||
|
return MultiModalInputs({"image_embeds": data})
|
||||||
model_config = ctx.model_config
|
model_config = ctx.model_config
|
||||||
tokenizer = cached_get_tokenizer(
|
tokenizer = cached_get_tokenizer(
|
||||||
model_config.tokenizer,
|
model_config.tokenizer,
|
||||||
|
Loading…
x
Reference in New Issue
Block a user