update csmsc/tts3_rhy

pull/4008/head
nyx-c-language 6 months ago
parent 39cead0bfe
commit 6077fa59d9

@ -20,7 +20,7 @@ Run the command below to
3. train the model.
4. synthesize wavs.
- synthesize waveform from `metadata.jsonl`.
- select vocoder type via `--stage` (0 = pwgan, 1 = hifigan)
- select vocoder type via `--stage` (0 = pwgan, 1 = multi-band melgan, 3 = hifigan, 4 = wavernn)
- synthesize waveform from a text file.
5. inference using the static model.
```bash

@ -33,6 +33,9 @@ if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
fi
if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
# synthesize_e2e, vocoder is pwgan by default stage 0, stage 1 will use hifigan as vocoder
# synthesize_e2e, vocoder is pwgan by default stage 0
# stage 1 will use multi-band melgan as vocoder
# stage 3 will use hifigan as vocoder
# stage 4 will use wavernn as vocoder
CUDA_VISIBLE_DEVICES=${gpus} ./local/synthesize_e2e.sh --stage 0 ${conf_path} ${train_output_path} ${ckpt_name} || exit -1
fi

Loading…
Cancel
Save