refactor: unify names of the feature field of MultimodalDataItem (#8075)

This commit is contained in:
Mick
2025-07-17 08:52:38 +08:00
committed by GitHub
parent c28ad1990d
commit 4395c87a9b
33 changed files with 66 additions and 83 deletions

View File

@@ -510,7 +510,7 @@ class InternVLChatModel(nn.Module):
Returns:
image_features (`torch.Tensor`): Image feature tensor of shape `(num_images, image_length, embed_dim)`.
"""
-pixel_values = torch.cat([item.pixel_values for item in items])
+pixel_values = torch.cat([item.feature for item in items])
image_features = self.extract_feature(pixel_values)
return image_features