You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
89 lines
2.9 KiB
89 lines
2.9 KiB
# This is the parameter configuration file for PaddleSpeech Serving.
|
|
|
|
#################################################################################
|
|
# SERVER SETTING #
|
|
#################################################################################
|
|
host: 127.0.0.1
|
|
port: 8092
|
|
|
|
# The task format in the engin_list is: <speech task>_<engine type>
|
|
# task choices = ['tts_online', 'tts_online-onnx']
|
|
# protocol = ['websocket', 'http'] (only one can be selected).
|
|
protocol: 'http'
|
|
engine_list: ['tts_online']
|
|
|
|
|
|
#################################################################################
|
|
# ENGINE CONFIG #
|
|
#################################################################################
|
|
|
|
################################### TTS #########################################
|
|
################### speech task: tts; engine_type: online #######################
|
|
tts_online:
|
|
# am (acoustic model) choices=['fastspeech2_csmsc', 'fastspeech2_cnndecoder_csmsc']
|
|
am: 'fastspeech2_cnndecoder_csmsc'
|
|
am_config:
|
|
am_ckpt:
|
|
am_stat:
|
|
phones_dict:
|
|
tones_dict:
|
|
speaker_dict:
|
|
spk_id: 0
|
|
|
|
# voc (vocoder) choices=['mb_melgan_csmsc, hifigan_csmsc']
|
|
voc: 'mb_melgan_csmsc'
|
|
voc_config:
|
|
voc_ckpt:
|
|
voc_stat:
|
|
|
|
# others
|
|
lang: 'zh'
|
|
device: 'cpu' # set 'gpu:id' or 'cpu'
|
|
am_block: 42
|
|
am_pad: 12
|
|
voc_block: 14
|
|
voc_pad: 14
|
|
|
|
|
|
|
|
#################################################################################
|
|
# ENGINE CONFIG #
|
|
#################################################################################
|
|
|
|
################################### TTS #########################################
|
|
################### speech task: tts; engine_type: online-onnx #######################
|
|
tts_online-onnx:
|
|
# am (acoustic model) choices=['fastspeech2_csmsc_onnx', 'fastspeech2_cnndecoder_csmsc_onnx']
|
|
am: 'fastspeech2_cnndecoder_csmsc_onnx'
|
|
# am_ckpt is a list, if am is fastspeech2_cnndecoder_csmsc_onnx, am_ckpt = [encoder model, decoder model, postnet model];
|
|
# if am is fastspeech2_csmsc_onnx, am_ckpt = [ckpt model];
|
|
am_ckpt: # list
|
|
am_stat:
|
|
phones_dict:
|
|
tones_dict:
|
|
speaker_dict:
|
|
spk_id: 0
|
|
am_sample_rate: 24000
|
|
am_sess_conf:
|
|
device: "cpu" # set 'gpu:id' or 'cpu'
|
|
use_trt: False
|
|
cpu_threads: 1
|
|
|
|
# voc (vocoder) choices=['mb_melgan_csmsc_onnx, hifigan_csmsc_onnx']
|
|
voc: 'mb_melgan_csmsc_onnx'
|
|
voc_ckpt:
|
|
voc_sample_rate: 24000
|
|
voc_sess_conf:
|
|
device: "cpu" # set 'gpu:id' or 'cpu'
|
|
use_trt: False
|
|
cpu_threads: 1
|
|
|
|
# others
|
|
lang: 'zh'
|
|
am_block: 42
|
|
am_pad: 12
|
|
voc_block: 14
|
|
voc_pad: 14
|
|
voc_upsample: 300
|
|
|