diff --git a/dataset_configs/multilingual/granary/config.yaml b/dataset_configs/multilingual/granary/config.yaml index 78e778b0..2a476b88 100644 --- a/dataset_configs/multilingual/granary/config.yaml +++ b/dataset_configs/multilingual/granary/config.yaml @@ -71,7 +71,7 @@ documentation: | ``ConvertToTarredAudioDataset`` *(optional, only if tar-sharding is enabled)*:: - pip install lhotse "nemo-toolkit[common]==2.2.1" + pip install lhotse "nemo-toolkit[common]==2.3.2" Quick start ----------- diff --git a/docker/Dockerfile.tts_sdp b/docker/Dockerfile.tts_sdp index f174c7b1..849c145d 100644 --- a/docker/Dockerfile.tts_sdp +++ b/docker/Dockerfile.tts_sdp @@ -41,6 +41,6 @@ RUN pip install -r requirements/tts.txt RUN pip install flash-attn --no-build-isolation RUN pip install https://github.com/LahiLuk/YouTokenToMe/archive/master.zip RUN pip install megatron-core transformer_engine[pytorch]==2.4.0 -RUN pip install nemo_toolkit['all']==2.1.0 +RUN pip install nemo_toolkit['all']==2.3.2 WORKDIR /src/NeMo-speech-data-processor \ No newline at end of file