Include video support in conversion_utils.

The TensorFlow Datasets Authors · The TensorFlow Datasets Authors · commit fbeaf63e7dba · 2025-07-29T02:23:23.000-07:00
PiperOrigin-RevId: 788365222
diff --git a/tensorflow_datasets/core/utils/conversion_utils.py b/tensorflow_datasets/core/utils/conversion_utils.py
@@ -128,6 +128,18 @@ def to_tfds_value(value: Any, feature: feature_lib.FeatureConnector) -> Any:
   match feature:
     case feature_lib.ClassLabel() | feature_lib.Scalar():
       return value
+    case feature_lib.Video():
+      match value:
+        case dict():
+          if 'path' in value and value['path']:
+            return value['path']
+          elif 'bytes' in value and value['bytes']:
+            return value['bytes']
+          else:
+            raise ValueError(
+                'Dictionary-like video features must have either a `path` or'
+                ' `bytes` key.'
+            )
     case feature_lib.FeaturesDict():
       return {
           name: to_tfds_value(value.get(name), inner_feature)
diff --git a/tensorflow_datasets/core/utils/conversion_utils_test.py b/tensorflow_datasets/core/utils/conversion_utils_test.py
@@ -81,7 +81,7 @@ def test_convert_value_raises(value, feature):
 @pytest.mark.parametrize(
     'value,feature,expected_value',
     [
-        # datetime
+        # Datetime.
         (
             datetime.datetime(1970, 1, 1, tzinfo=datetime.timezone.utc),
             feature_lib.Scalar(dtype=np.int64),
@@ -92,14 +92,14 @@ def test_convert_value_raises(value, feature):
             feature_lib.Scalar(dtype=np.int64),
             86400,
         ),
-        # scalar
+        # Scalar.
         (42, feature_lib.Scalar(dtype=np.int64), 42),
         (42, feature_lib.Scalar(dtype=np.int32), 42),
         ('abc', feature_lib.Scalar(dtype=np.object_), 'abc'),
         (True, feature_lib.Scalar(dtype=np.bool_), True),
         (False, feature_lib.Scalar(dtype=np.bool_), False),
         (42.0, feature_lib.Scalar(dtype=np.float32), 42.0),
-        # sequence
+        # Sequence.
         ([42], feature_lib.Sequence(feature=tf.int64), [42]),
         (42, feature_lib.Sequence(feature=tf.int64), [42]),
         (None, feature_lib.Sequence(feature=tf.int64), []),
@@ -111,15 +111,15 @@ def test_convert_value_raises(value, feature):
             ),
             {'someint': [b'', 'string', b'']},
         ),
-        # image
+        # Image.
         (
             lazy_imports_lib.lazy_imports.PIL_Image.new(mode='L', size=(4, 4)),
             feature_lib.Image(),
             lazy_imports_lib.lazy_imports.PIL_Image.new(
                 mode='RGB', size=(4, 4)
             ),
         ),
-        # dict
+        # Dict.
         (
             {
                 'de': b'Hallo Welt',
@@ -148,7 +148,18 @@ def test_convert_value_raises(value, feature):
             }),
             {'name': b'Name', 'age': 100},
         ),
-        # nan, but the feature type is not float
+        # Video.
+        (
+            {'path': 'path/to/video.avi', 'bytes': None},
+            feature_lib.Video(),
+            'path/to/video.avi',
+        ),
+        (
+            {'path': None, 'bytes': b'video_bytes'},
+            feature_lib.Video(),
+            b'video_bytes',
+        ),
+        # NaN, but the feature type is not float.
         (
             np.nan,
             feature_lib.Text(),