|
77 | 77 | logger.warn("Flash attention 2 is not installed")
|
78 | 78 |
|
79 | 79 | _CONFIG_FOR_DOC = "ParlerTTSConfig"
|
80 |
| -_CHECKPOINT_FOR_DOC = "facebook/parler_tts-small" |
| 80 | +_CHECKPOINT_FOR_DOC = "parler-tts/parler-tts-mini-v1" |
81 | 81 |
|
82 | 82 | MUSICGEN_PRETRAINED_MODEL_ARCHIVE_LIST = [
|
83 |
| - "facebook/parler_tts-small", |
| 83 | + "parler-tts/parler-tts-mini-v1", |
84 | 84 | # See all ParlerTTS models at https://huggingface.co/models?filter=parler_tts
|
85 | 85 | ]
|
86 | 86 |
|
@@ -2357,7 +2357,7 @@ def from_pretrained(cls, pretrained_model_name_or_path, *model_args, **kwargs):
|
2357 | 2357 | ```python
|
2358 | 2358 | >>> from parler_tts import ParlerTTSForConditionalGeneration
|
2359 | 2359 |
|
2360 |
| - >>> model = ParlerTTSForConditionalGeneration.from_pretrained("facebook/parler_tts-small") |
| 2360 | + >>> model = ParlerTTSForConditionalGeneration.from_pretrained("parler-tts/parler-tts-mini-v1") |
2361 | 2361 | ```"""
|
2362 | 2362 |
|
2363 | 2363 | # At the moment fast initialization is not supported for composite models
|
@@ -2411,7 +2411,7 @@ def from_sub_models_pretrained(
|
2411 | 2411 |
|
2412 | 2412 | - A string, the *model id* of a pretrained model hosted inside a model repo on huggingface.co.
|
2413 | 2413 | Valid model ids can be located at the root-level, like `gpt2`, or namespaced under a user or
|
2414 |
| - organization name, like `facebook/parler_tts-small`. |
| 2414 | + organization name, like `parler-tts/parler-tts-mini-v1`. |
2415 | 2415 | - A path to a *directory* containing model weights saved using
|
2416 | 2416 | [`~PreTrainedModel.save_pretrained`], e.g., `./my_model_directory/`.
|
2417 | 2417 |
|
@@ -2440,7 +2440,7 @@ def from_sub_models_pretrained(
|
2440 | 2440 | >>> model = ParlerTTSForConditionalGeneration.from_sub_models_pretrained(
|
2441 | 2441 | ... text_encoder_pretrained_model_name_or_path="t5-base",
|
2442 | 2442 | ... audio_encoder_pretrained_model_name_or_path="facebook/encodec_24khz",
|
2443 |
| - ... decoder_pretrained_model_name_or_path="facebook/parler_tts-small", |
| 2443 | + ... decoder_pretrained_model_name_or_path="parler-tts/parler-tts-mini-v1", |
2444 | 2444 | ... )
|
2445 | 2445 | >>> # saving model after fine-tuning
|
2446 | 2446 | >>> model.save_pretrained("./parler_tts-ft")
|
@@ -2607,8 +2607,8 @@ def forward(
|
2607 | 2607 | >>> from transformers import AutoProcessor, ParlerTTSForConditionalGeneration
|
2608 | 2608 | >>> import torch
|
2609 | 2609 |
|
2610 |
| - >>> processor = AutoProcessor.from_pretrained("facebook/parler_tts-small") |
2611 |
| - >>> model = ParlerTTSForConditionalGeneration.from_pretrained("facebook/parler_tts-small") |
| 2610 | + >>> processor = AutoProcessor.from_pretrained("parler-tts/parler-tts-mini-v1") |
| 2611 | + >>> model = ParlerTTSForConditionalGeneration.from_pretrained("parler-tts/parler-tts-mini-v1") |
2612 | 2612 |
|
2613 | 2613 | >>> inputs = processor(
|
2614 | 2614 | ... text=["80s pop track with bassy drums and synth", "90s rock song with loud guitars and heavy drums"],
|
|
0 commit comments