We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 50aab94 commit 8c776b8 (Copy full SHA for 8c776b8)
nemo_asr/run_eval.py
@@ -52,6 +52,14 @@ def download_audio_files(batch):
52
durations = []
53
54
for id, sample in zip(batch["id"], batch["audio"]):
55
+
56
+ # first step added here to make ID and wav filenames unique
57
+ # several datasets like earnings22 have a hierarchical structure
58
+ # e.g. earnings22/test/4432298/281.wav, earnings22/test/4450488/281.wav
59
+ # lhotse uses the filename (281.wav) here as the unique ID to create and name cuts
60
+ # ref: https://github.com/lhotse-speech/lhotse/blob/master/lhotse/dataset/collation.py#L186
61
+ id = id.replace('/', '_').removesuffix('.wav')
62
63
audio_path = os.path.join(CACHE_DIR, f"{id}.wav")
64
65
if "array" in sample:
0 commit comments