Skip to content

Commit f3cf375

Browse files
author
The TensorFlow Datasets Authors
committed
Add audio support for croissant builder.
PiperOrigin-RevId: 783663338
1 parent 37a607d commit f3cf375

File tree

2 files changed, with 14 additions and 0 deletions.

tensorflow_datasets/core/dataset_builders/croissant_builder.py

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -48,6 +48,7 @@
48 48
from tensorflow_datasets.core import download
49 49
from tensorflow_datasets.core import split_builder as split_builder_lib
50 50
from tensorflow_datasets.core import splits as splits_lib
51+
from tensorflow_datasets.core.features import audio_feature
51 52
from tensorflow_datasets.core.features import bounding_boxes
52 53
from tensorflow_datasets.core.features import feature as feature_lib
53 54
from tensorflow_datasets.core.features import features_dict
@@ -177,6 +178,10 @@ def datatype_converter(
177 178
feature = bounding_boxes.BBoxFeature(
178 179
doc=field.description, bbox_format=None
179 180
)
181+
elif field_data_type == mlc.DataType.AUDIO_OBJECT:
182+
feature = audio_feature.Audio(
183+
doc=field.description, sample_rate=field.source.sampling_rate
184+
)
180 185
else:
181 186
raise ValueError(f'Unknown data type: {field_data_type}.')
182 187

tensorflow_datasets/core/dataset_builders/croissant_builder_test.py

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@
20 20
from tensorflow_datasets import testing
21 21
from tensorflow_datasets.core import file_adapters
22 22
from tensorflow_datasets.core.dataset_builders import croissant_builder
23+
from tensorflow_datasets.core.features import audio_feature
23 24
from tensorflow_datasets.core.features import bounding_boxes
24 25
from tensorflow_datasets.core.features import features_dict
25 26
from tensorflow_datasets.core.features import image_feature
@@ -150,6 +151,14 @@ def test_simple_datatype_converter(
150 151
image_feature.Image,
151 152
None,
152 153
),
154+
(
155+
mlc.Field(
156+
data_types=mlc.DataType.AUDIO_OBJECT,
157+
description="Audio feature",
158+
),
159+
audio_feature.Audio,
160+
None,
161+
),
153 162
(
154 163
mlc.Field(
155 164
data_types=mlc.DataType.BOUNDING_BOX,

0 commit comments

Comments
 (0)