[Bugfix] Validate and concatenate image embeddings in MiniCPMVBaseModel (#11631)

This commit is contained in:
whyiug 2024-12-31 02:51:04 +08:00 committed by GitHub
parent 5886aa496e
commit 36e7670045
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -487,6 +487,12 @@ class MiniCPMVBaseModel(nn.Module, SupportsMultiModal, SupportsPP):
image_embeds = kwargs.pop("image_embeds", None)
if image_embeds is not None:
if not isinstance(image_embeds, (torch.Tensor, list)):
raise ValueError(f"Incorrect type of image embeds. "
f"Got type: {type(image_embeds)}")
if isinstance(image_embeds, list):
image_embeds = torch.concat(image_embeds)
return MiniCPMVImageEmbeddingInputs(
image_bounds=self._get_image_bounds(input_ids, im_start_id,
im_end_id, slice_start_id,