Skip to content

Commit c1395e3

Browse files
committed
add synthesize for ernie_sat aishell3 and aishell3_vctk, test=tts
1 parent 72fa817 commit c1395e3

File tree

3 files changed

+85
-3
lines changed

3 files changed

+85
-3
lines changed
Lines changed: 42 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1 +1,42 @@
1-
#!/bin/bash
1+
#!/bin/bash
2+
3+
config_path=$1
4+
train_output_path=$2
5+
ckpt_name=$3
6+
7+
stage=1
8+
stop_stage=1
9+
10+
# pwgan
11+
if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then
12+
FLAGS_allocator_strategy=naive_best_fit \
13+
FLAGS_fraction_of_gpu_memory_to_use=0.01 \
14+
python3 ${BIN_DIR}/synthesize.py \
15+
--erniesat_config=${config_path} \
16+
--erniesat_ckpt=${train_output_path}/checkpoints/${ckpt_name} \
17+
--erniesat_stat=dump/train/speech_stats.npy \
18+
--voc=pwgan_aishell3 \
19+
--voc_config=pwg_aishell3_ckpt_0.5/default.yaml \
20+
--voc_ckpt=pwg_aishell3_ckpt_0.5/snapshot_iter_1000000.pdz \
21+
--voc_stat=pwg_aishell3_ckpt_0.5/feats_stats.npy \
22+
--test_metadata=dump/test/norm/metadata.jsonl \
23+
--output_dir=${train_output_path}/test \
24+
--phones_dict=dump/phone_id_map.txt
25+
fi
26+
27+
# hifigan
28+
if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
29+
FLAGS_allocator_strategy=naive_best_fit \
30+
FLAGS_fraction_of_gpu_memory_to_use=0.01 \
31+
python3 ${BIN_DIR}/synthesize.py \
32+
--erniesat_config=${config_path} \
33+
--erniesat_ckpt=${train_output_path}/checkpoints/${ckpt_name} \
34+
--erniesat_stat=dump/train/speech_stats.npy \
35+
--voc=hifigan_aishell3 \
36+
--voc_config=hifigan_aishell3_ckpt_0.2.0/default.yaml \
37+
--voc_ckpt=hifigan_aishell3_ckpt_0.2.0/snapshot_iter_2500000.pdz \
38+
--voc_stat=hifigan_aishell3_ckpt_0.2.0/feats_stats.npy \
39+
--test_metadata=dump/test/norm/metadata.jsonl \
40+
--output_dir=${train_output_path}/test \
41+
--phones_dict=dump/phone_id_map.txt
42+
fi

examples/aishell3/tts3/local/synthesize.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
37 37
--am_stat=dump/train/speech_stats.npy \
38 38
--voc=hifigan_aishell3 \
39 39
--voc_config=hifigan_aishell3_ckpt_0.2.0/default.yaml \
40-
--voc_ckpt=hifigan_aishell3_ckpt_0.2.0/snapshot_iter_2500000.pd \
40+
--voc_ckpt=hifigan_aishell3_ckpt_0.2.0/snapshot_iter_2500000.pdz \
41 41
--voc_stat=hifigan_aishell3_ckpt_0.2.0/feats_stats.npy \
42 42
--test_metadata=dump/test/norm/metadata.jsonl \
43 43
--output_dir=${train_output_path}/test \
Lines changed: 42 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1 +1,42 @@
1-
#!/bin/bash
1+
#!/bin/bash
2+
3+
config_path=$1
4+
train_output_path=$2
5+
ckpt_name=$3
6+
7+
stage=1
8+
stop_stage=1
9+
10+
# pwgan
11+
if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then
12+
FLAGS_allocator_strategy=naive_best_fit \
13+
FLAGS_fraction_of_gpu_memory_to_use=0.01 \
14+
python3 ${BIN_DIR}/synthesize.py \
15+
--erniesat_config=${config_path} \
16+
--erniesat_ckpt=${train_output_path}/checkpoints/${ckpt_name} \
17+
--erniesat_stat=dump/train/speech_stats.npy \
18+
--voc=pwgan_aishell3 \
19+
--voc_config=pwg_aishell3_ckpt_0.5/default.yaml \
20+
--voc_ckpt=pwg_aishell3_ckpt_0.5/snapshot_iter_1000000.pdz \
21+
--voc_stat=pwg_aishell3_ckpt_0.5/feats_stats.npy \
22+
--test_metadata=dump/test/norm/metadata.jsonl \
23+
--output_dir=${train_output_path}/test \
24+
--phones_dict=dump/phone_id_map.txt
25+
fi
26+
27+
# hifigan
28+
if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
29+
FLAGS_allocator_strategy=naive_best_fit \
30+
FLAGS_fraction_of_gpu_memory_to_use=0.01 \
31+
python3 ${BIN_DIR}/synthesize.py \
32+
--erniesat_config=${config_path} \
33+
--erniesat_ckpt=${train_output_path}/checkpoints/${ckpt_name} \
34+
--erniesat_stat=dump/train/speech_stats.npy \
35+
--voc=hifigan_aishell3 \
36+
--voc_config=hifigan_aishell3_ckpt_0.2.0/default.yaml \
37+
--voc_ckpt=hifigan_aishell3_ckpt_0.2.0/snapshot_iter_2500000.pdz \
38+
--voc_stat=hifigan_aishell3_ckpt_0.2.0/feats_stats.npy \
39+
--test_metadata=dump/test/norm/metadata.jsonl \
40+
--output_dir=${train_output_path}/test \
41+
--phones_dict=dump/phone_id_map.txt
42+
fi

0 commit comments

Comments
 (0)