File tree Expand file tree Collapse file tree 3 files changed +5
-2
lines changed
Expand file tree Collapse file tree 3 files changed +5
-2
lines changed Original file line number Diff line number Diff line change @@ -21,6 +21,8 @@ class MediaWithBytes(Generic[_T]):
2121
2222 The wrapper delegates attribute access to the underlying media object,
2323 making it behave transparently like the wrapped type (e.g., PIL.Image).
24+
25+ NOTE: Currently, this wrapper is used only for the image modality.
2426 """
2527
2628 media : _T
Original file line number Diff line number Diff line change 3232 from PIL .Image import Image
3333 from transformers .feature_extraction_utils import BatchFeature
3434
35+ from .base import MediaWithBytes
3536 from .processing import MultiModalHashes
3637
3738else :
5960item, which can be passed to a HuggingFace `AudioProcessor`.
6061"""
6162
62- ImageItem : TypeAlias = Union [HfImageItem , "torch.Tensor" ]
63+ ImageItem : TypeAlias = Union [HfImageItem , "torch.Tensor" , "MediaWithBytes[HfImageItem]" ]
6364"""
6465A `transformers.image_utils.ImageInput` representing a single image
6566item, which can be passed to a HuggingFace `ImageProcessor`.
Original file line number Diff line number Diff line change @@ -484,7 +484,7 @@ def _parse_image_data(
484484 return ImageEmbeddingItems (data )
485485
486486 if (
487- isinstance (data , PILImage .Image )
487+ isinstance (data , ( PILImage .Image , MediaWithBytes ) )
488488 or isinstance (data , (np .ndarray , torch .Tensor ))
489489 and data .ndim == 3
490490 ):
You can’t perform that action at this time.
0 commit comments