Skip to content

Commit cabca9f

Browse files
committed
🚀 Enhance the tacotron2 dataset to adapt to any reduction factor; apply black formatting.
1 parent 7258ba0 commit cabca9f

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

47 files changed

+3531
-2139
lines changed

‎examples/fastspeech/decode_fastspeech.py‎

Lines changed: 61 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -33,32 +33,60 @@ def main():
3333
"""Run fastspeech decoding from folder."""
3434
parser = argparse.ArgumentParser(
3535
description="Decode soft-mel features from charactor with trained FastSpeech "
36-
"(See detail in examples/fastspeech/decode_fastspeech.py).")
37-
parser.add_argument("--rootdir", default=None, type=str, required=True,
38-
help="directory including ids/durations files.")
39-
parser.add_argument("--outdir", type=str, required=True,
40-
help="directory to save generated speech.")
41-
parser.add_argument("--checkpoint", type=str, required=True,
42-
help="checkpoint file to be loaded.")
43-
parser.add_argument("--config", default=None, type=str, required=True,
44-
help="yaml format configuration file. if not explicitly provided, "
45-
"it will be searched in the checkpoint directory. (default=None)")
46-
parser.add_argument("--batch-size", default=8, type=int, required=False,
47-
help="Batch size for inference.")
48-
parser.add_argument("--verbose", type=int, default=1,
49-
help="logging level. higher is more logging. (default=1)")
36+
"(See detail in examples/fastspeech/decode_fastspeech.py)."
37+
)
38+
parser.add_argument(
39+
"--rootdir",
40+
default=None,
41+
type=str,
42+
required=True,
43+
help="directory including ids/durations files.",
44+
)
45+
parser.add_argument(
46+
"--outdir", type=str, required=True, help="directory to save generated speech."
47+
)
48+
parser.add_argument(
49+
"--checkpoint", type=str, required=True, help="checkpoint file to be loaded."
50+
)
51+
parser.add_argument(
52+
"--config",
53+
default=None,
54+
type=str,
55+
required=True,
56+
help="yaml format configuration file. if not explicitly provided, "
57+
"it will be searched in the checkpoint directory. (default=None)",
58+
)
59+
parser.add_argument(
60+
"--batch-size",
61+
default=8,
62+
type=int,
63+
required=False,
64+
help="Batch size for inference.",
65+
)
66+
parser.add_argument(
67+
"--verbose",
68+
type=int,
69+
default=1,
70+
help="logging level. higher is more logging. (default=1)",
71+
)
5072
args = parser.parse_args()
5173

5274
# set logger
5375
if args.verbose > 1:
5476
logging.basicConfig(
55-
level=logging.DEBUG, format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s")
77+
level=logging.DEBUG,
78+
format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s",
79+
)
5680
elif args.verbose > 0:
5781
logging.basicConfig(
58-
level=logging.INFO, format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s")
82+
level=logging.INFO,
83+
format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s",
84+
)
5985
else:
6086
logging.basicConfig(
61-
level=logging.WARN, format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s")
87+
level=logging.WARN,
88+
format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s",
89+
)
6290
logging.warning("Skip DEBUG/INFO messages")
6391

6492
# check directory existence
@@ -81,12 +109,14 @@ def main():
81109
root_dir=args.rootdir,
82110
charactor_query=char_query,
83111
charactor_load_fn=char_load_fn,
84-
return_utt_id=True
112+
return_utt_id=True,
85113
)
86114
dataset = dataset.create(batch_size=args.batch_size)
87115

88116
# define model and load checkpoint
89-
fastspeech = TFFastSpeech(config=FastSpeechConfig(**config["fastspeech_params"]), name='fastspeech')
117+
fastspeech = TFFastSpeech(
118+
config=FastSpeechConfig(**config["fastspeech_params"]), name="fastspeech"
119+
)
90120
fastspeech._build()
91121
fastspeech.load_weights(args.checkpoint)
92122

@@ -107,15 +137,22 @@ def main():
107137
masked_mel_afters = masked_mel_after.numpy()
108138

109139
for (utt_id, mel_before, mel_after, durations) in zip(
110-
utt_ids, masked_mel_befores, masked_mel_afters, duration_outputs):
140+
utt_ids, masked_mel_befores, masked_mel_afters, duration_outputs
141+
):
111142
# real len of mel predicted
112143
real_length = durations.numpy().sum()
113144
utt_id = utt_id.numpy().decode("utf-8")
114145
# save to folder.
115-
np.save(os.path.join(args.outdir, f"{utt_id}-fs-before-feats.npy"),
116-
mel_before[:real_length, :].astype(np.float32), allow_pickle=False)
117-
np.save(os.path.join(args.outdir, f"{utt_id}-fs-after-feats.npy"),
118-
mel_after[:real_length, :].astype(np.float32), allow_pickle=False)
146+
np.save(
147+
os.path.join(args.outdir, f"{utt_id}-fs-before-feats.npy"),
148+
mel_before[:real_length, :].astype(np.float32),
149+
allow_pickle=False,
150+
)
151+
np.save(
152+
os.path.join(args.outdir, f"{utt_id}-fs-after-feats.npy"),
153+
mel_after[:real_length, :].astype(np.float32),
154+
allow_pickle=False,
155+
)
119156

120157

121158
if __name__ == "__main__":

0 commit comments

Comments
 (0)