Canton CLI, test=tts

pull/2977/head
WongLaw 3 years ago
parent ff8c56b08b
commit 3c85fe8a1a

@ -13,3 +13,7 @@
# limitations under the License.
# Replace the private `_locale._getdefaultlocale` hook with a stub that
# ignores its arguments and always reports the locale as en_US / utf8.
# NOTE(review): presumably a workaround for hosts where default-locale
# detection fails or returns an unusable value — confirm before removing.
import _locale
_locale._getdefaultlocale = (lambda *args: ['en_US', 'utf8'])
# Package version string.
# NOTE(review): '0.0.0' looks like a placeholder — confirm whether it is
# overwritten at build/release time.
__version__ = '0.0.0'
# Git commit hash recorded for this package.
# NOTE(review): presumably stamped by build tooling rather than edited by
# hand — verify.
__commit__ = 'ff8c56b08bcbbe9bea6f3eadd52921d3981b37ee'

@ -82,6 +82,7 @@ class TTSExecutor(BaseExecutor):
'tacotron2_csmsc',
'tacotron2_ljspeech',
'fastspeech2_male',
'fastspeech2_canton',
],
help='Choose acoustic model type of tts task.')
self.parser.add_argument(
@ -273,7 +274,7 @@ class TTSExecutor(BaseExecutor):
use_pretrained_voc = False
voc_lang = lang
# When the speaker is 174 (csmsc), csmsc's vocoder works better than aishell3's.
if lang == 'mix':
if lang == 'mix' or lang == 'canton':
voc_dataset = voc[voc.rindex('_') + 1:]
if voc_dataset in {"ljspeech", "vctk"}:
voc_lang = 'en'
@ -487,7 +488,7 @@ class TTSExecutor(BaseExecutor):
# fastspeech2
else:
# multi speaker
if am_dataset in {'aishell3', 'vctk', 'mix'}:
if am_dataset in {'aishell3', 'vctk', 'mix', 'canton'}:
mel = self.am_inference(
part_phone_ids, spk_id=paddle.to_tensor(spk_id))
else:

@ -889,6 +889,24 @@ tts_dynamic_pretrained_models = {
'phone_id_map.txt',
},
},
"fastspeech2_canton-canton": {
'1.0': {
'url':
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_canton_ckpt_1.4.0.zip',
'md5':
'504560c082deba82120927627c900374',
'config':
'default.yaml',
'ckpt':
'snapshot_iter_140000.pdz',
'speech_stats':
'speech_stats.npy',
'phones_dict':
'phone_id_map.txt',
'speaker_dict':
'speaker_id_map.txt',
},
},
"fastspeech2_ljspeech-en": {
'1.0': {
'url':

Loading…
Cancel
Save