Skip to content

Commit 1b8b37a

Browse files
author
The TensorFlow Datasets Authors
committed
Add progress bar to convert_format_utils.py
PiperOrigin-RevId: 672955580
1 parent 7d81c6b commit 1b8b37a

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

tensorflow_datasets/scripts/cli/convert_format_utils.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -27,6 +27,7 @@
2727
with epy.lazy_imports():
2828
# pylint: disable=g-import-not-at-top
2929
import concurrent.futures
30+
import tqdm
3031

3132
from absl import logging
3233
import apache_beam as beam
@@ -59,9 +60,10 @@ class ShardInstruction:
5960
convert_fn: ConvertFn | None = None
6061

6162
def convert(self) -> None:
63+
"""Converts the shard to the desired file format."""
6264
def read_in() -> Iterator[type_utils.KeySerializedExample]:
6365
in_dataset = self.in_file_adapter.make_tf_data(filename=self.in_path)
64-
for i, row in enumerate(in_dataset):
66+
for i, row in tqdm.tqdm(enumerate(in_dataset)):
6567
if self.convert_fn is not None:
6668
yield i, self.convert_fn(row)
6769
else:
@@ -364,7 +366,7 @@ def _convert_dataset_dirs(
364366
)
365367

366368
logging.info('All shards have been converted. Now converting metadata.')
367-
for dataset_dir, info in found_dataset_versions.items():
369+
for dataset_dir, info in tqdm.tqdm(found_dataset_versions.items()):
368370
out_dir = from_to_dirs[dataset_dir]
369371
logging.info('Converting metadata in %s.', dataset_dir)
370372
convert_metadata(

0 commit comments

Comments
 (0)