@@ -33,32 +33,60 @@ def main():
3333 """Run fastspeech decoding from folder."""
3434 parser = argparse .ArgumentParser (
3535 description = "Decode soft-mel features from charactor with trained FastSpeech "
36- "(See detail in examples/fastspeech/decode_fastspeech.py)." )
37- parser .add_argument ("--rootdir" , default = None , type = str , required = True ,
38- help = "directory including ids/durations files." )
39- parser .add_argument ("--outdir" , type = str , required = True ,
40- help = "directory to save generated speech." )
41- parser .add_argument ("--checkpoint" , type = str , required = True ,
42- help = "checkpoint file to be loaded." )
43- parser .add_argument ("--config" , default = None , type = str , required = True ,
44- help = "yaml format configuration file. if not explicitly provided, "
45- "it will be searched in the checkpoint directory. (default=None)" )
46- parser .add_argument ("--batch-size" , default = 8 , type = int , required = False ,
47- help = "Batch size for inference." )
48- parser .add_argument ("--verbose" , type = int , default = 1 ,
49- help = "logging level. higher is more logging. (default=1)" )
36+ "(See detail in examples/fastspeech/decode_fastspeech.py)."
37+ )
38+ parser .add_argument (
39+ "--rootdir" ,
40+ default = None ,
41+ type = str ,
42+ required = True ,
43+ help = "directory including ids/durations files." ,
44+ )
45+ parser .add_argument (
46+ "--outdir" , type = str , required = True , help = "directory to save generated speech."
47+ )
48+ parser .add_argument (
49+ "--checkpoint" , type = str , required = True , help = "checkpoint file to be loaded."
50+ )
51+ parser .add_argument (
52+ "--config" ,
53+ default = None ,
54+ type = str ,
55+ required = True ,
56+ help = "yaml format configuration file. if not explicitly provided, "
57+ "it will be searched in the checkpoint directory. (default=None)" ,
58+ )
59+ parser .add_argument (
60+ "--batch-size" ,
61+ default = 8 ,
62+ type = int ,
63+ required = False ,
64+ help = "Batch size for inference." ,
65+ )
66+ parser .add_argument (
67+ "--verbose" ,
68+ type = int ,
69+ default = 1 ,
70+ help = "logging level. higher is more logging. (default=1)" ,
71+ )
5072 args = parser .parse_args ()
5173
5274 # set logger
5375 if args .verbose > 1 :
5476 logging .basicConfig (
55- level = logging .DEBUG , format = "%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s" )
77+ level = logging .DEBUG ,
78+ format = "%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s" ,
79+ )
5680 elif args .verbose > 0 :
5781 logging .basicConfig (
58- level = logging .INFO , format = "%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s" )
82+ level = logging .INFO ,
83+ format = "%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s" ,
84+ )
5985 else :
6086 logging .basicConfig (
61- level = logging .WARN , format = "%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s" )
87+ level = logging .WARN ,
88+ format = "%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s" ,
89+ )
6290 logging .warning ("Skip DEBUG/INFO messages" )
6391
6492 # check directory existence
@@ -81,12 +109,14 @@ def main():
81109 root_dir = args .rootdir ,
82110 charactor_query = char_query ,
83111 charactor_load_fn = char_load_fn ,
84- return_utt_id = True
112+ return_utt_id = True ,
85113 )
86114 dataset = dataset .create (batch_size = args .batch_size )
87115
88116 # define model and load checkpoint
89- fastspeech = TFFastSpeech (config = FastSpeechConfig (** config ["fastspeech_params" ]), name = 'fastspeech' )
117+ fastspeech = TFFastSpeech (
118+ config = FastSpeechConfig (** config ["fastspeech_params" ]), name = "fastspeech"
119+ )
90120 fastspeech ._build ()
91121 fastspeech .load_weights (args .checkpoint )
92122
@@ -107,15 +137,22 @@ def main():
107137 masked_mel_afters = masked_mel_after .numpy ()
108138
109139 for (utt_id , mel_before , mel_after , durations ) in zip (
110- utt_ids , masked_mel_befores , masked_mel_afters , duration_outputs ):
140+ utt_ids , masked_mel_befores , masked_mel_afters , duration_outputs
141+ ):
111142 # real len of mel predicted
112143 real_length = durations .numpy ().sum ()
113144 utt_id = utt_id .numpy ().decode ("utf-8" )
114145 # save to folder.
115- np .save (os .path .join (args .outdir , f"{ utt_id } -fs-before-feats.npy" ),
116- mel_before [:real_length , :].astype (np .float32 ), allow_pickle = False )
117- np .save (os .path .join (args .outdir , f"{ utt_id } -fs-after-feats.npy" ),
118- mel_after [:real_length , :].astype (np .float32 ), allow_pickle = False )
146+ np .save (
147+ os .path .join (args .outdir , f"{ utt_id } -fs-before-feats.npy" ),
148+ mel_before [:real_length , :].astype (np .float32 ),
149+ allow_pickle = False ,
150+ )
151+ np .save (
152+ os .path .join (args .outdir , f"{ utt_id } -fs-after-feats.npy" ),
153+ mel_after [:real_length , :].astype (np .float32 ),
154+ allow_pickle = False ,
155+ )
119156
120157
121158if __name__ == "__main__" :
0 commit comments