Merge pull request #1917 from KPatr1ck/resource
[Resource][CLI][Server] Add paddlespeech.resource module. (pull/1998/head)
commit
0fa32e4aae
@ -1,151 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry of the ASR checkpoints, keyed by model tag.
# Every entry carries 'url', 'md5', 'cfg_path' and 'ckpt_path'; the DeepSpeech2
# entries additionally carry 'lm_url' and 'lm_md5'.
# NOTE(review): presumably 'md5' is the checksum of the archive behind 'url' and
# the *_path values are relative to the unpacked archive -- confirm with the loader.
pretrained_models = {
    # The tags for pretrained_models should be "{model_name}[_{dataset}][-{lang}][-...]".
    # e.g. "conformer_wenetspeech-zh-16k" and "panns_cnn6-32k".
    # Command line and python api use "{model_name}[_{dataset}]" as --model, usage:
    # "paddlespeech asr --model conformer_wenetspeech --lang zh --sr 16000 --input ./input.wav"
    "conformer_wenetspeech-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr1_conformer_wenetspeech_ckpt_0.1.1.model.tar.gz',
        'md5':
        '76cb19ed857e6623856b7cd7ebbfeda4',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/conformer/checkpoints/wenetspeech',
    },
    "conformer_online_wenetspeech-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr1/asr1_chunk_conformer_wenetspeech_ckpt_1.0.0a.model.tar.gz',
        'md5':
        'b8c02632b04da34aca88459835be54a6',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/chunk_conformer/checkpoints/avg_10',
    },
    "conformer_online_multicn-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/multi_cn/asr1/asr1_chunk_conformer_multi_cn_ckpt_0.2.0.model.tar.gz',
        'md5':
        '7989b3248c898070904cf042fd656003',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/chunk_conformer/checkpoints/multi_cn',
    },
    "conformer_aishell-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr1/asr1_conformer_aishell_ckpt_0.1.2.model.tar.gz',
        'md5':
        '3f073eccfa7bb14e0c6867d65fc0dc3a',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/conformer/checkpoints/avg_30',
    },
    "conformer_online_aishell-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr1/asr1_chunk_conformer_aishell_ckpt_0.2.0.model.tar.gz',
        'md5':
        'b374cfb93537761270b6224fb0bfc26a',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/chunk_conformer/checkpoints/avg_30',
    },
    "transformer_librispeech-en-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/librispeech/asr1/asr1_transformer_librispeech_ckpt_0.1.1.model.tar.gz',
        'md5':
        '2c667da24922aad391eacafe37bc1660',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/transformer/checkpoints/avg_10',
    },
    "deepspeech2online_wenetspeech-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr0/asr0_deepspeech2_online_wenetspeech_ckpt_1.0.0a.model.tar.gz',
        'md5':
        'e393d4d274af0f6967db24fc146e8074',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/deepspeech2_online/checkpoints/avg_10',
        'lm_url':
        'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
        'lm_md5':
        '29e02312deb2e59b3c8686c7966d4fe3'
    },
    "deepspeech2offline_aishell-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_aishell_ckpt_0.1.1.model.tar.gz',
        'md5':
        '932c3593d62fe5c741b59b31318aa314',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/deepspeech2/checkpoints/avg_1',
        'lm_url':
        'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
        'lm_md5':
        '29e02312deb2e59b3c8686c7966d4fe3'
    },
    "deepspeech2online_aishell-zh-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_online_aishell_fbank161_ckpt_0.2.1.model.tar.gz',
        'md5':
        '98b87b171b7240b7cae6e07d8d0bc9be',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/deepspeech2_online/checkpoints/avg_1',
        'lm_url':
        'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
        'lm_md5':
        '29e02312deb2e59b3c8686c7966d4fe3'
    },
    "deepspeech2offline_librispeech-en-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/s2t/librispeech/asr0/asr0_deepspeech2_librispeech_ckpt_0.1.1.model.tar.gz',
        'md5':
        'f5666c81ad015c8de03aac2bc92e5762',
        'cfg_path':
        'model.yaml',
        'ckpt_path':
        'exp/deepspeech2/checkpoints/avg_1',
        'lm_url':
        'https://deepspeech.bj.bcebos.com/en_lm/common_crawl_00.prune01111.trie.klm',
        'lm_md5':
        '099a601759d467cd0a8523ff939819c5'
    },
}

# Maps a model-name prefix to a "module.path:ClassName" string.
# NOTE(review): presumably resolved by a dynamic importer elsewhere -- confirm.
model_alias = {
    "deepspeech2offline":
    "paddlespeech.s2t.models.ds2:DeepSpeech2Model",
    "deepspeech2online":
    "paddlespeech.s2t.models.ds2_online:DeepSpeech2ModelOnline",
    "conformer":
    "paddlespeech.s2t.models.u2:U2Model",
    "conformer_online":
    "paddlespeech.s2t.models.u2:U2Model",
    "transformer":
    "paddlespeech.s2t.models.u2:U2Model",
    "wenetspeech":
    "paddlespeech.s2t.models.u2:U2Model",
}
|
@ -1,47 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry of the audio-classification (PANNs) checkpoints, keyed by model tag.
# Each entry carries 'url', 'md5', 'cfg_path', 'ckpt_path' and 'label_file'.
pretrained_models = {
    # The tags for pretrained_models should be "{model_name}[_{dataset}][-{lang}][-...]".
    # e.g. "conformer_wenetspeech-zh-16k", "transformer_aishell-zh-16k" and "panns_cnn6-32k".
    # Command line and python api use "{model_name}[_{dataset}]" as --model, usage:
    # "paddlespeech asr --model conformer_wenetspeech --lang zh --sr 16000 --input ./input.wav"
    "panns_cnn6-32k": {
        'url': 'https://paddlespeech.bj.bcebos.com/cls/panns_cnn6.tar.gz',
        'md5': '4cf09194a95df024fd12f84712cf0f9c',
        'cfg_path': 'panns.yaml',
        'ckpt_path': 'cnn6.pdparams',
        'label_file': 'audioset_labels.txt',
    },
    "panns_cnn10-32k": {
        'url': 'https://paddlespeech.bj.bcebos.com/cls/panns_cnn10.tar.gz',
        'md5': 'cb8427b22176cc2116367d14847f5413',
        'cfg_path': 'panns.yaml',
        'ckpt_path': 'cnn10.pdparams',
        'label_file': 'audioset_labels.txt',
    },
    "panns_cnn14-32k": {
        'url': 'https://paddlespeech.bj.bcebos.com/cls/panns_cnn14.tar.gz',
        'md5': 'e3b9b5614a1595001161d0ab95edee97',
        'cfg_path': 'panns.yaml',
        'ckpt_path': 'cnn14.pdparams',
        'label_file': 'audioset_labels.txt',
    },
}

# Maps a model name to a "module.path:ClassName" string.
model_alias = {
    "panns_cnn6": "paddlespeech.cls.models.panns:CNN6",
    "panns_cnn10": "paddlespeech.cls.models.panns:CNN10",
    "panns_cnn14": "paddlespeech.cls.models.panns:CNN14",
}
|
@ -1,35 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry of the speech-translation checkpoints, keyed by model tag.
pretrained_models = {
    "fat_st_ted-en-zh": {
        "url":
        "https://paddlespeech.bj.bcebos.com/s2t/ted_en_zh/st1/st1_transformer_mtl_noam_ted-en-zh_ckpt_0.1.1.model.tar.gz",
        "md5":
        "d62063f35a16d91210a71081bd2dd557",
        "cfg_path":
        "model.yaml",
        "ckpt_path":
        "exp/transformer_mtl_noam/checkpoints/fat_st_ted-en-zh.pdparams",
    }
}

# Maps a model name to a "module.path:ClassName" string.
model_alias = {"fat_st": "paddlespeech.s2t.models.u2_st:U2STModel"}

# Download record ('url' + 'md5') for the Kaldi binaries archive.
kaldi_bins = {
    "url":
    "https://paddlespeech.bj.bcebos.com/s2t/ted_en_zh/st1/kaldi_bins.tar.gz",
    "md5":
    "c0682303b3f3393dbf6ed4c4e35a53eb",
}
|
@ -1,146 +0,0 @@
|
||||
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
import argparse
|
||||
from typing import List
|
||||
|
||||
from prettytable import PrettyTable
|
||||
|
||||
from ..utils import cli_register
|
||||
from ..utils import stats_wrapper
|
||||
|
||||
__all__ = ['StatsExecutor']
|
||||
|
||||
# Per-task column headers for the model table, encoded as one "-"-joined string.
# The string is split on "-" to build the header row, and each model tag is
# split on "-" the same way to build its row, so the field count here must
# match the number of "-"-separated parts in that task's tags.
model_name_format = {
    'asr': 'Model-Language-Sample Rate',
    'cls': 'Model-Sample Rate',
    'st': 'Model-Source language-Target language',
    'text': 'Model-Task-Language',
    'tts': 'Model-Language',
    'vector': 'Model-Sample Rate'
}
|
||||
|
||||
|
||||
@cli_register(
    name='paddlespeech.stats',
    description='Get speech tasks support models list.')
class StatsExecutor():
    """Print the table of pretrained models available for one speech task.

    Usable from the command line through ``execute(argv)`` or from Python by
    calling the instance with a task name.
    """

    def __init__(self):
        super().__init__()

        self.parser = argparse.ArgumentParser(
            prog='paddlespeech.stats', add_help=True)
        self.task_choices = ['asr', 'cls', 'st', 'text', 'tts', 'vector']
        # `--task` is mandatory; argparse never consults a default for a
        # required option, so none is declared.
        self.parser.add_argument(
            '--task',
            type=str,
            choices=self.task_choices,
            help='Choose speech task.',
            required=True)

    def show_support_models(self, pretrained_models: dict):
        """Print one table row per key of ``pretrained_models``.

        The header comes from ``model_name_format[self.task]`` split on "-";
        every key is split on "-" the same way to form its row. ``self.task``
        must already be set (``__call__`` does this).
        """
        fields = model_name_format[self.task].split("-")
        table = PrettyTable(fields)
        for key in pretrained_models:
            table.add_row(key.split("-"))
        print(table)

    def execute(self, argv: List[str]) -> bool:
        """
            Command line entry.

            Returns:
                bool: False when listing raised or reported a failure, True otherwise.
        """
        parser_args = self.parser.parse_args(argv)
        try:
            outcome = self(parser_args.task)
        except Exception as e:
            # Report the problem instead of discarding it silently.
            print("Failed to list models for task '{}': {}".format(
                parser_args.task, e))
            return False
        # `stats_wrapper` is defined elsewhere; if it does not forward the
        # return value we receive None and keep the historical meaning
        # "no exception == success".
        return outcome is not False

    @stats_wrapper
    def __call__(
            self,
            task: str=None, ):
        """
            Python API to call an executor.

            Args:
                task: one of ``self.task_choices``.

            Returns:
                bool: True when the table was printed, False when the task is
                unknown or its model list could not be loaded or shown.
        """
        import importlib

        self.task = task
        if self.task not in self.task_choices:
            print("Please input correct speech task, choices = " + str(
                self.task_choices))
            return False

        # Only the 'vector' task has a display name that differs from its
        # upper-cased task id.
        label = 'Speaker Recognition' if self.task == 'vector' else self.task.upper(
        )
        try:
            # Same target as `from ..<task>.pretrained_models import
            # pretrained_models`, resolved lazily for the requested task only.
            module = importlib.import_module(
                '..' + self.task + '.pretrained_models', package=__package__)
            print("Here is the list of " + label +
                  " pretrained models released by PaddleSpeech that can be used by command line and python API"
                  )
            self.show_support_models(module.pretrained_models)
        except Exception:
            # Exception rather than BaseException, so Ctrl-C and SystemExit
            # are no longer swallowed.
            print("Failed to get the list of " + label +
                  " pretrained models.")
            return False
        return True
|
@ -1,54 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry of the text (punctuation restoration) checkpoints, keyed by model tag.
# Each entry carries 'url', 'md5', 'cfg_path', 'ckpt_path' and 'vocab_file'.
pretrained_models = {
    # The tags for pretrained_models should be "{model_name}[_{dataset}][-{lang}][-...]".
    # e.g. "conformer_wenetspeech-zh-16k", "transformer_aishell-zh-16k" and "panns_cnn6-32k".
    # Command line and python api use "{model_name}[_{dataset}]" as --model, usage:
    # "paddlespeech asr --model conformer_wenetspeech --lang zh --sr 16000 --input ./input.wav"
    "ernie_linear_p7_wudao-punc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/text/ernie_linear_p7_wudao-punc-zh.tar.gz',
        'md5':
        '12283e2ddde1797c5d1e57036b512746',
        'cfg_path':
        'ckpt/model_config.json',
        'ckpt_path':
        'ckpt/model_state.pdparams',
        'vocab_file':
        'punc_vocab.txt',
    },
    "ernie_linear_p3_wudao-punc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/text/ernie_linear_p3_wudao-punc-zh.tar.gz',
        'md5':
        '448eb2fdf85b6a997e7e652e80c51dd2',
        'cfg_path':
        'ckpt/model_config.json',
        'ckpt_path':
        'ckpt/model_state.pdparams',
        'vocab_file':
        'punc_vocab.txt',
    },
}

# Maps a model name to the "module.path:ClassName" of its model class.
model_alias = {
    "ernie_linear_p7": "paddlespeech.text.models:ErnieLinear",
    "ernie_linear_p3": "paddlespeech.text.models:ErnieLinear",
}

# Maps a model name to the "module.path:ClassName" of its tokenizer class.
tokenizer_alias = {
    "ernie_linear_p7": "paddlenlp.transformers:ErnieTokenizer",
    "ernie_linear_p3": "paddlenlp.transformers:ErnieTokenizer",
}
|
@ -1,300 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry of the TTS checkpoints (acoustic models and vocoders), keyed by
# model tag. Every entry carries 'url', 'md5', 'config', 'ckpt' and
# 'speech_stats'; acoustic models add 'phones_dict' and, where present,
# 'tones_dict' or 'speaker_dict'.
pretrained_models = {
    # speedyspeech
    "speedyspeech_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/speedyspeech/speedyspeech_csmsc_ckpt_0.2.0.zip',
        'md5':
        '6f6fa967b408454b6662c8c00c0027cb',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_30600.pdz',
        'speech_stats':
        'feats_stats.npy',
        'phones_dict':
        'phone_id_map.txt',
        'tones_dict':
        'tone_id_map.txt',
    },

    # fastspeech2
    "fastspeech2_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_baker_ckpt_0.4.zip',
        'md5':
        '637d28a5e53aa60275612ba4393d5f22',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_76000.pdz',
        'speech_stats':
        'speech_stats.npy',
        'phones_dict':
        'phone_id_map.txt',
    },
    "fastspeech2_ljspeech-en": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_ljspeech_ckpt_0.5.zip',
        'md5':
        'ffed800c93deaf16ca9b3af89bfcd747',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_100000.pdz',
        'speech_stats':
        'speech_stats.npy',
        'phones_dict':
        'phone_id_map.txt',
    },
    "fastspeech2_aishell3-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_aishell3_ckpt_0.4.zip',
        'md5':
        'f4dd4a5f49a4552b77981f544ab3392e',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_96400.pdz',
        'speech_stats':
        'speech_stats.npy',
        'phones_dict':
        'phone_id_map.txt',
        'speaker_dict':
        'speaker_id_map.txt',
    },
    "fastspeech2_vctk-en": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_vctk_ckpt_0.5.zip',
        'md5':
        '743e5024ca1e17a88c5c271db9779ba4',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_66200.pdz',
        'speech_stats':
        'speech_stats.npy',
        'phones_dict':
        'phone_id_map.txt',
        'speaker_dict':
        'speaker_id_map.txt',
    },
    # tacotron2
    "tacotron2_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/tacotron2/tacotron2_csmsc_ckpt_0.2.0.zip',
        'md5':
        '0df4b6f0bcbe0d73c5ed6df8867ab91a',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_30600.pdz',
        'speech_stats':
        'speech_stats.npy',
        'phones_dict':
        'phone_id_map.txt',
    },
    "tacotron2_ljspeech-en": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/tacotron2/tacotron2_ljspeech_ckpt_0.2.0.zip',
        'md5':
        '6a5eddd81ae0e81d16959b97481135f3',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_60300.pdz',
        'speech_stats':
        'speech_stats.npy',
        'phones_dict':
        'phone_id_map.txt',
    },

    # pwgan
    "pwgan_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_baker_ckpt_0.4.zip',
        'md5':
        '2e481633325b5bdf0a3823c714d2c117',
        'config':
        'pwg_default.yaml',
        'ckpt':
        'pwg_snapshot_iter_400000.pdz',
        'speech_stats':
        'pwg_stats.npy',
    },
    "pwgan_ljspeech-en": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_ljspeech_ckpt_0.5.zip',
        'md5':
        '53610ba9708fd3008ccaf8e99dacbaf0',
        'config':
        'pwg_default.yaml',
        'ckpt':
        'pwg_snapshot_iter_400000.pdz',
        'speech_stats':
        'pwg_stats.npy',
    },
    "pwgan_aishell3-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_aishell3_ckpt_0.5.zip',
        'md5':
        'd7598fa41ad362d62f85ffc0f07e3d84',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_1000000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },
    "pwgan_vctk-en": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_vctk_ckpt_0.1.1.zip',
        'md5':
        'b3da1defcde3e578be71eb284cb89f2c',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_1500000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },
    # mb_melgan
    "mb_melgan_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/mb_melgan/mb_melgan_csmsc_ckpt_0.1.1.zip',
        'md5':
        'ee5f0604e20091f0d495b6ec4618b90d',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_1000000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },
    # style_melgan
    "style_melgan_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/style_melgan/style_melgan_csmsc_ckpt_0.1.1.zip',
        'md5':
        '5de2d5348f396de0c966926b8c462755',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_1500000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },
    # hifigan
    "hifigan_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_csmsc_ckpt_0.1.1.zip',
        'md5':
        'dd40a3d88dfcf64513fba2f0f961ada6',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_2500000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },
    "hifigan_ljspeech-en": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_ljspeech_ckpt_0.2.0.zip',
        'md5':
        '70e9131695decbca06a65fe51ed38a72',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_2500000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },
    "hifigan_aishell3-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_aishell3_ckpt_0.2.0.zip',
        'md5':
        '3bb49bc75032ed12f79c00c8cc79a09a',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_2500000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },
    "hifigan_vctk-en": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_vctk_ckpt_0.2.0.zip',
        'md5':
        '7da8f88359bca2457e705d924cf27bd4',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_2500000.pdz',
        'speech_stats':
        'feats_stats.npy',
    },

    # wavernn
    "wavernn_csmsc-zh": {
        'url':
        'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/wavernn/wavernn_csmsc_ckpt_0.2.0.zip',
        'md5':
        'ee37b752f09bcba8f2af3b777ca38e13',
        'config':
        'default.yaml',
        'ckpt':
        'snapshot_iter_400000.pdz',
        'speech_stats':
        'feats_stats.npy',
    }
}

# Maps a model name (and its "<name>_inference" variant) to a
# "module.path:ClassName" string.
model_alias = {
    # acoustic model
    "speedyspeech":
    "paddlespeech.t2s.models.speedyspeech:SpeedySpeech",
    "speedyspeech_inference":
    "paddlespeech.t2s.models.speedyspeech:SpeedySpeechInference",
    "fastspeech2":
    "paddlespeech.t2s.models.fastspeech2:FastSpeech2",
    "fastspeech2_inference":
    "paddlespeech.t2s.models.fastspeech2:FastSpeech2Inference",
    "tacotron2":
    "paddlespeech.t2s.models.tacotron2:Tacotron2",
    "tacotron2_inference":
    "paddlespeech.t2s.models.tacotron2:Tacotron2Inference",
    # voc
    "pwgan":
    "paddlespeech.t2s.models.parallel_wavegan:PWGGenerator",
    "pwgan_inference":
    "paddlespeech.t2s.models.parallel_wavegan:PWGInference",
    "mb_melgan":
    "paddlespeech.t2s.models.melgan:MelGANGenerator",
    "mb_melgan_inference":
    "paddlespeech.t2s.models.melgan:MelGANInference",
    "style_melgan":
    "paddlespeech.t2s.models.melgan:StyleMelGANGenerator",
    "style_melgan_inference":
    "paddlespeech.t2s.models.melgan:StyleMelGANInference",
    "hifigan":
    "paddlespeech.t2s.models.hifigan:HiFiGANGenerator",
    "hifigan_inference":
    "paddlespeech.t2s.models.hifigan:HiFiGANInference",
    "wavernn":
    "paddlespeech.t2s.models.wavernn:WaveRNN",
    "wavernn_inference":
    "paddlespeech.t2s.models.wavernn:WaveRNNInference",
}
|
@ -1,36 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry of the speaker-embedding checkpoints, keyed by model tag.
pretrained_models = {
    # The tags for pretrained_models should be "{model_name}[_{dataset}][-{sr}][-...]".
    # e.g. "ecapatdnn_voxceleb12-16k".
    # Command line and python api use "{model_name}[_{dataset}]" as --model, usage:
    # "paddlespeech vector --task spk --model ecapatdnn_voxceleb12 --sr 16000 --input ./input.wav"
    "ecapatdnn_voxceleb12-16k": {
        'url':
        'https://paddlespeech.bj.bcebos.com/vector/voxceleb/sv0_ecapa_tdnn_voxceleb12_ckpt_0_2_1.tar.gz',
        'md5':
        '67c7ff8885d5246bd16e0f5ac1cba99f',
        'cfg_path':
        'conf/model.yaml',  # the yaml config path
        'ckpt_path':
        'model/model',  # the format is ${dir}/{model_name},
        # so the first 'model' is dir, the second 'model' is the name
        # this means we have a model stored as model/model.pdparams
    },
}

# Maps a model name to a "module.path:ClassName" string.
model_alias = {
    "ecapatdnn": "paddlespeech.vector.models.ecapa_tdnn:EcapaTdnn",
}
|
@ -0,0 +1,87 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
__all__ = [
|
||||
'model_alias',
|
||||
]
|
||||
|
||||
# Records of model name to import class
|
||||
model_alias = {
|
||||
# ---------------------------------
|
||||
# -------------- ASR --------------
|
||||
# ---------------------------------
|
||||
"deepspeech2offline": ["paddlespeech.s2t.models.ds2:DeepSpeech2Model"],
|
||||
"deepspeech2online":
|
||||
["paddlespeech.s2t.models.ds2_online:DeepSpeech2ModelOnline"],
|
||||
"conformer": ["paddlespeech.s2t.models.u2:U2Model"],
|
||||
"conformer_online": ["paddlespeech.s2t.models.u2:U2Model"],
|
||||
"transformer": ["paddlespeech.s2t.models.u2:U2Model"],
|
||||
"wenetspeech": ["paddlespeech.s2t.models.u2:U2Model"],
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- CLS --------------
|
||||
# ---------------------------------
|
||||
"panns_cnn6": ["paddlespeech.cls.models.panns:CNN6"],
|
||||
"panns_cnn10": ["paddlespeech.cls.models.panns:CNN10"],
|
||||
"panns_cnn14": ["paddlespeech.cls.models.panns:CNN14"],
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- ST ---------------
|
||||
# ---------------------------------
|
||||
"fat_st": ["paddlespeech.s2t.models.u2_st:U2STModel"],
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- TEXT -------------
|
||||
# ---------------------------------
|
||||
"ernie_linear_p7": [
|
||||
"paddlespeech.text.models:ErnieLinear",
|
||||
"paddlenlp.transformers:ErnieTokenizer"
|
||||
],
|
||||
"ernie_linear_p3": [
|
||||
"paddlespeech.text.models:ErnieLinear",
|
||||
"paddlenlp.transformers:ErnieTokenizer"
|
||||
],
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- TTS --------------
|
||||
# ---------------------------------
|
||||
# acoustic model
|
||||
"speedyspeech": ["paddlespeech.t2s.models.speedyspeech:SpeedySpeech"],
|
||||
"speedyspeech_inference":
|
||||
["paddlespeech.t2s.models.speedyspeech:SpeedySpeechInference"],
|
||||
"fastspeech2": ["paddlespeech.t2s.models.fastspeech2:FastSpeech2"],
|
||||
"fastspeech2_inference":
|
||||
["paddlespeech.t2s.models.fastspeech2:FastSpeech2Inference"],
|
||||
"tacotron2": ["paddlespeech.t2s.models.tacotron2:Tacotron2"],
|
||||
"tacotron2_inference":
|
||||
["paddlespeech.t2s.models.tacotron2:Tacotron2Inference"],
|
||||
# voc
|
||||
"pwgan": ["paddlespeech.t2s.models.parallel_wavegan:PWGGenerator"],
|
||||
"pwgan_inference":
|
||||
["paddlespeech.t2s.models.parallel_wavegan:PWGInference"],
|
||||
"mb_melgan": ["paddlespeech.t2s.models.melgan:MelGANGenerator"],
|
||||
"mb_melgan_inference": ["paddlespeech.t2s.models.melgan:MelGANInference"],
|
||||
"style_melgan": ["paddlespeech.t2s.models.melgan:StyleMelGANGenerator"],
|
||||
"style_melgan_inference":
|
||||
["paddlespeech.t2s.models.melgan:StyleMelGANInference"],
|
||||
"hifigan": ["paddlespeech.t2s.models.hifigan:HiFiGANGenerator"],
|
||||
"hifigan_inference": ["paddlespeech.t2s.models.hifigan:HiFiGANInference"],
|
||||
"wavernn": ["paddlespeech.t2s.models.wavernn:WaveRNN"],
|
||||
"wavernn_inference": ["paddlespeech.t2s.models.wavernn:WaveRNNInference"],
|
||||
|
||||
# ---------------------------------
|
||||
# ------------ Vector -------------
|
||||
# ---------------------------------
|
||||
"ecapatdnn": ["paddlespeech.vector.models.ecapa_tdnn:EcapaTdnn"],
|
||||
}
|
@ -0,0 +1,838 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
__all__ = [
|
||||
'asr_dynamic_pretrained_models',
|
||||
'asr_static_pretrained_models',
|
||||
'cls_dynamic_pretrained_models',
|
||||
'cls_static_pretrained_models',
|
||||
'st_dynamic_pretrained_models',
|
||||
'st_kaldi_bins',
|
||||
'text_dynamic_pretrained_models',
|
||||
'tts_dynamic_pretrained_models',
|
||||
'tts_static_pretrained_models',
|
||||
'tts_onnx_pretrained_models',
|
||||
'vector_dynamic_pretrained_models',
|
||||
]
|
||||
|
||||
# The tags for pretrained_models should be "{model_name}[_{dataset}][-{lang}][-...]".
|
||||
# e.g. "conformer_wenetspeech-zh-16k" and "panns_cnn6-32k".
|
||||
# Command line and python api use "{model_name}[_{dataset}]" as --model, usage:
|
||||
# "paddlespeech asr --model conformer_wenetspeech --lang zh --sr 16000 --input ./input.wav"
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- ASR --------------
|
||||
# ---------------------------------
|
||||
asr_dynamic_pretrained_models = {
|
||||
"conformer_wenetspeech-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr1_conformer_wenetspeech_ckpt_0.1.1.model.tar.gz',
|
||||
'md5':
|
||||
'76cb19ed857e6623856b7cd7ebbfeda4',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/conformer/checkpoints/wenetspeech',
|
||||
},
|
||||
},
|
||||
"conformer_online_wenetspeech-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr1/asr1_chunk_conformer_wenetspeech_ckpt_1.0.0a.model.tar.gz',
|
||||
'md5':
|
||||
'b8c02632b04da34aca88459835be54a6',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/chunk_conformer/checkpoints/avg_10',
|
||||
'model':
|
||||
'exp/chunk_conformer/checkpoints/avg_10.pdparams',
|
||||
'params':
|
||||
'exp/chunk_conformer/checkpoints/avg_10.pdparams',
|
||||
'lm_url':
|
||||
'',
|
||||
'lm_md5':
|
||||
'',
|
||||
},
|
||||
},
|
||||
"conformer_online_multicn-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/multi_cn/asr1/asr1_chunk_conformer_multi_cn_ckpt_0.2.0.model.tar.gz',
|
||||
'md5':
|
||||
'7989b3248c898070904cf042fd656003',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/chunk_conformer/checkpoints/multi_cn',
|
||||
},
|
||||
'2.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/multi_cn/asr1/asr1_chunk_conformer_multi_cn_ckpt_0.2.3.model.tar.gz',
|
||||
'md5':
|
||||
'0ac93d390552336f2a906aec9e33c5fa',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/chunk_conformer/checkpoints/multi_cn',
|
||||
'model':
|
||||
'exp/chunk_conformer/checkpoints/multi_cn.pdparams',
|
||||
'params':
|
||||
'exp/chunk_conformer/checkpoints/multi_cn.pdparams',
|
||||
'lm_url':
|
||||
'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
|
||||
'lm_md5':
|
||||
'29e02312deb2e59b3c8686c7966d4fe3',
|
||||
},
|
||||
},
|
||||
"conformer_aishell-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr1/asr1_conformer_aishell_ckpt_0.1.2.model.tar.gz',
|
||||
'md5':
|
||||
'3f073eccfa7bb14e0c6867d65fc0dc3a',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/conformer/checkpoints/avg_30',
|
||||
},
|
||||
},
|
||||
"conformer_online_aishell-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr1/asr1_chunk_conformer_aishell_ckpt_0.2.0.model.tar.gz',
|
||||
'md5':
|
||||
'b374cfb93537761270b6224fb0bfc26a',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/chunk_conformer/checkpoints/avg_30',
|
||||
},
|
||||
},
|
||||
"transformer_librispeech-en-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/librispeech/asr1/asr1_transformer_librispeech_ckpt_0.1.1.model.tar.gz',
|
||||
'md5':
|
||||
'2c667da24922aad391eacafe37bc1660',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/transformer/checkpoints/avg_10',
|
||||
},
|
||||
},
|
||||
"deepspeech2online_wenetspeech-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr0/asr0_deepspeech2_online_wenetspeech_ckpt_1.0.0a.model.tar.gz',
|
||||
'md5':
|
||||
'e393d4d274af0f6967db24fc146e8074',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/deepspeech2_online/checkpoints/avg_10',
|
||||
'lm_url':
|
||||
'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
|
||||
'lm_md5':
|
||||
'29e02312deb2e59b3c8686c7966d4fe3'
|
||||
},
|
||||
},
|
||||
"deepspeech2offline_aishell-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_aishell_ckpt_0.1.1.model.tar.gz',
|
||||
'md5':
|
||||
'932c3593d62fe5c741b59b31318aa314',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/deepspeech2/checkpoints/avg_1',
|
||||
'lm_url':
|
||||
'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
|
||||
'lm_md5':
|
||||
'29e02312deb2e59b3c8686c7966d4fe3'
|
||||
},
|
||||
},
|
||||
"deepspeech2online_aishell-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_online_aishell_fbank161_ckpt_0.2.1.model.tar.gz',
|
||||
'md5':
|
||||
'98b87b171b7240b7cae6e07d8d0bc9be',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/deepspeech2_online/checkpoints/avg_1',
|
||||
'model':
|
||||
'exp/deepspeech2_online/checkpoints/avg_1.jit.pdmodel',
|
||||
'params':
|
||||
'exp/deepspeech2_online/checkpoints/avg_1.jit.pdiparams',
|
||||
'lm_url':
|
||||
'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
|
||||
'lm_md5':
|
||||
'29e02312deb2e59b3c8686c7966d4fe3'
|
||||
},
|
||||
},
|
||||
"deepspeech2offline_librispeech-en-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/librispeech/asr0/asr0_deepspeech2_librispeech_ckpt_0.1.1.model.tar.gz',
|
||||
'md5':
|
||||
'f5666c81ad015c8de03aac2bc92e5762',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/deepspeech2/checkpoints/avg_1',
|
||||
'lm_url':
|
||||
'https://deepspeech.bj.bcebos.com/en_lm/common_crawl_00.prune01111.trie.klm',
|
||||
'lm_md5':
|
||||
'099a601759d467cd0a8523ff939819c5'
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
asr_static_pretrained_models = {
|
||||
"deepspeech2offline_aishell-zh-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_aishell_ckpt_0.1.1.model.tar.gz',
|
||||
'md5':
|
||||
'932c3593d62fe5c741b59b31318aa314',
|
||||
'cfg_path':
|
||||
'model.yaml',
|
||||
'ckpt_path':
|
||||
'exp/deepspeech2/checkpoints/avg_1',
|
||||
'model':
|
||||
'exp/deepspeech2/checkpoints/avg_1.jit.pdmodel',
|
||||
'params':
|
||||
'exp/deepspeech2/checkpoints/avg_1.jit.pdiparams',
|
||||
'lm_url':
|
||||
'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
|
||||
'lm_md5':
|
||||
'29e02312deb2e59b3c8686c7966d4fe3'
|
||||
}
|
||||
},
|
||||
}
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- CLS --------------
|
||||
# ---------------------------------
|
||||
cls_dynamic_pretrained_models = {
|
||||
"panns_cnn6-32k": {
|
||||
'1.0': {
|
||||
'url': 'https://paddlespeech.bj.bcebos.com/cls/panns_cnn6.tar.gz',
|
||||
'md5': '4cf09194a95df024fd12f84712cf0f9c',
|
||||
'cfg_path': 'panns.yaml',
|
||||
'ckpt_path': 'cnn6.pdparams',
|
||||
'label_file': 'audioset_labels.txt',
|
||||
},
|
||||
},
|
||||
"panns_cnn10-32k": {
|
||||
'1.0': {
|
||||
'url': 'https://paddlespeech.bj.bcebos.com/cls/panns_cnn10.tar.gz',
|
||||
'md5': 'cb8427b22176cc2116367d14847f5413',
|
||||
'cfg_path': 'panns.yaml',
|
||||
'ckpt_path': 'cnn10.pdparams',
|
||||
'label_file': 'audioset_labels.txt',
|
||||
},
|
||||
},
|
||||
"panns_cnn14-32k": {
|
||||
'1.0': {
|
||||
'url': 'https://paddlespeech.bj.bcebos.com/cls/panns_cnn14.tar.gz',
|
||||
'md5': 'e3b9b5614a1595001161d0ab95edee97',
|
||||
'cfg_path': 'panns.yaml',
|
||||
'ckpt_path': 'cnn14.pdparams',
|
||||
'label_file': 'audioset_labels.txt',
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
cls_static_pretrained_models = {
|
||||
"panns_cnn6-32k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/cls/inference_model/panns_cnn6_static.tar.gz',
|
||||
'md5':
|
||||
'da087c31046d23281d8ec5188c1967da',
|
||||
'cfg_path':
|
||||
'panns.yaml',
|
||||
'model_path':
|
||||
'inference.pdmodel',
|
||||
'params_path':
|
||||
'inference.pdiparams',
|
||||
'label_file':
|
||||
'audioset_labels.txt',
|
||||
},
|
||||
},
|
||||
"panns_cnn10-32k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/cls/inference_model/panns_cnn10_static.tar.gz',
|
||||
'md5':
|
||||
'5460cc6eafbfaf0f261cc75b90284ae1',
|
||||
'cfg_path':
|
||||
'panns.yaml',
|
||||
'model_path':
|
||||
'inference.pdmodel',
|
||||
'params_path':
|
||||
'inference.pdiparams',
|
||||
'label_file':
|
||||
'audioset_labels.txt',
|
||||
},
|
||||
},
|
||||
"panns_cnn14-32k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/cls/inference_model/panns_cnn14_static.tar.gz',
|
||||
'md5':
|
||||
'ccc80b194821274da79466862b2ab00f',
|
||||
'cfg_path':
|
||||
'panns.yaml',
|
||||
'model_path':
|
||||
'inference.pdmodel',
|
||||
'params_path':
|
||||
'inference.pdiparams',
|
||||
'label_file':
|
||||
'audioset_labels.txt',
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- ST ---------------
|
||||
# ---------------------------------
|
||||
st_dynamic_pretrained_models = {
|
||||
"fat_st_ted-en-zh": {
|
||||
'1.0': {
|
||||
"url":
|
||||
"https://paddlespeech.bj.bcebos.com/s2t/ted_en_zh/st1/st1_transformer_mtl_noam_ted-en-zh_ckpt_0.1.1.model.tar.gz",
|
||||
"md5":
|
||||
"d62063f35a16d91210a71081bd2dd557",
|
||||
"cfg_path":
|
||||
"model.yaml",
|
||||
"ckpt_path":
|
||||
"exp/transformer_mtl_noam/checkpoints/fat_st_ted-en-zh.pdparams",
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
st_kaldi_bins = {
|
||||
"url":
|
||||
"https://paddlespeech.bj.bcebos.com/s2t/ted_en_zh/st1/kaldi_bins.tar.gz",
|
||||
"md5":
|
||||
"c0682303b3f3393dbf6ed4c4e35a53eb",
|
||||
}
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- TEXT -------------
|
||||
# ---------------------------------
|
||||
text_dynamic_pretrained_models = {
|
||||
"ernie_linear_p7_wudao-punc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/text/ernie_linear_p7_wudao-punc-zh.tar.gz',
|
||||
'md5':
|
||||
'12283e2ddde1797c5d1e57036b512746',
|
||||
'cfg_path':
|
||||
'ckpt/model_config.json',
|
||||
'ckpt_path':
|
||||
'ckpt/model_state.pdparams',
|
||||
'vocab_file':
|
||||
'punc_vocab.txt',
|
||||
},
|
||||
},
|
||||
"ernie_linear_p3_wudao-punc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/text/ernie_linear_p3_wudao-punc-zh.tar.gz',
|
||||
'md5':
|
||||
'448eb2fdf85b6a997e7e652e80c51dd2',
|
||||
'cfg_path':
|
||||
'ckpt/model_config.json',
|
||||
'ckpt_path':
|
||||
'ckpt/model_state.pdparams',
|
||||
'vocab_file':
|
||||
'punc_vocab.txt',
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
# ---------------------------------
|
||||
# -------------- TTS --------------
|
||||
# ---------------------------------
|
||||
tts_dynamic_pretrained_models = {
|
||||
# speedyspeech
|
||||
"speedyspeech_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/speedyspeech/speedyspeech_csmsc_ckpt_0.2.0.zip',
|
||||
'md5':
|
||||
'6f6fa967b408454b6662c8c00c0027cb',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_30600.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
'tones_dict':
|
||||
'tone_id_map.txt',
|
||||
},
|
||||
},
|
||||
# fastspeech2
|
||||
"fastspeech2_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_baker_ckpt_0.4.zip',
|
||||
'md5':
|
||||
'637d28a5e53aa60275612ba4393d5f22',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_76000.pdz',
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
},
|
||||
},
|
||||
"fastspeech2_ljspeech-en": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_ljspeech_ckpt_0.5.zip',
|
||||
'md5':
|
||||
'ffed800c93deaf16ca9b3af89bfcd747',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_100000.pdz',
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
},
|
||||
},
|
||||
"fastspeech2_aishell3-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_aishell3_ckpt_0.4.zip',
|
||||
'md5':
|
||||
'f4dd4a5f49a4552b77981f544ab3392e',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_96400.pdz',
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
'speaker_dict':
|
||||
'speaker_id_map.txt',
|
||||
},
|
||||
},
|
||||
"fastspeech2_vctk-en": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_vctk_ckpt_0.5.zip',
|
||||
'md5':
|
||||
'743e5024ca1e17a88c5c271db9779ba4',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_66200.pdz',
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
'speaker_dict':
|
||||
'speaker_id_map.txt',
|
||||
},
|
||||
},
|
||||
# tacotron2
|
||||
"tacotron2_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/tacotron2/tacotron2_csmsc_ckpt_0.2.0.zip',
|
||||
'md5':
|
||||
'0df4b6f0bcbe0d73c5ed6df8867ab91a',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_30600.pdz',
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
},
|
||||
},
|
||||
"tacotron2_ljspeech-en": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/tacotron2/tacotron2_ljspeech_ckpt_0.2.0.zip',
|
||||
'md5':
|
||||
'6a5eddd81ae0e81d16959b97481135f3',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_60300.pdz',
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
},
|
||||
},
|
||||
# pwgan
|
||||
"pwgan_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_baker_ckpt_0.4.zip',
|
||||
'md5':
|
||||
'2e481633325b5bdf0a3823c714d2c117',
|
||||
'config':
|
||||
'pwg_default.yaml',
|
||||
'ckpt':
|
||||
'pwg_snapshot_iter_400000.pdz',
|
||||
'speech_stats':
|
||||
'pwg_stats.npy',
|
||||
},
|
||||
},
|
||||
"pwgan_ljspeech-en": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_ljspeech_ckpt_0.5.zip',
|
||||
'md5':
|
||||
'53610ba9708fd3008ccaf8e99dacbaf0',
|
||||
'config':
|
||||
'pwg_default.yaml',
|
||||
'ckpt':
|
||||
'pwg_snapshot_iter_400000.pdz',
|
||||
'speech_stats':
|
||||
'pwg_stats.npy',
|
||||
},
|
||||
},
|
||||
"pwgan_aishell3-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_aishell3_ckpt_0.5.zip',
|
||||
'md5':
|
||||
'd7598fa41ad362d62f85ffc0f07e3d84',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_1000000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
"pwgan_vctk-en": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_vctk_ckpt_0.1.1.zip',
|
||||
'md5':
|
||||
'b3da1defcde3e578be71eb284cb89f2c',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_1500000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
# mb_melgan
|
||||
"mb_melgan_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/mb_melgan/mb_melgan_csmsc_ckpt_0.1.1.zip',
|
||||
'md5':
|
||||
'ee5f0604e20091f0d495b6ec4618b90d',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_1000000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
# style_melgan
|
||||
"style_melgan_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/style_melgan/style_melgan_csmsc_ckpt_0.1.1.zip',
|
||||
'md5':
|
||||
'5de2d5348f396de0c966926b8c462755',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_1500000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
# hifigan
|
||||
"hifigan_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_csmsc_ckpt_0.1.1.zip',
|
||||
'md5':
|
||||
'dd40a3d88dfcf64513fba2f0f961ada6',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_2500000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
"hifigan_ljspeech-en": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_ljspeech_ckpt_0.2.0.zip',
|
||||
'md5':
|
||||
'70e9131695decbca06a65fe51ed38a72',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_2500000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
"hifigan_aishell3-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_aishell3_ckpt_0.2.0.zip',
|
||||
'md5':
|
||||
'3bb49bc75032ed12f79c00c8cc79a09a',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_2500000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
"hifigan_vctk-en": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_vctk_ckpt_0.2.0.zip',
|
||||
'md5':
|
||||
'7da8f88359bca2457e705d924cf27bd4',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_2500000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
# wavernn
|
||||
"wavernn_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/wavernn/wavernn_csmsc_ckpt_0.2.0.zip',
|
||||
'md5':
|
||||
'ee37b752f09bcba8f2af3b777ca38e13',
|
||||
'config':
|
||||
'default.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_400000.pdz',
|
||||
'speech_stats':
|
||||
'feats_stats.npy',
|
||||
},
|
||||
},
|
||||
"fastspeech2_cnndecoder_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_cnndecoder_csmsc_ckpt_1.0.0.zip',
|
||||
'md5':
|
||||
'6eb28e22ace73e0ebe7845f86478f89f',
|
||||
'config':
|
||||
'cnndecoder.yaml',
|
||||
'ckpt':
|
||||
'snapshot_iter_153000.pdz',
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
tts_static_pretrained_models = {
|
||||
# speedyspeech
|
||||
"speedyspeech_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/speedyspeech/speedyspeech_nosil_baker_static_0.5.zip',
|
||||
'md5':
|
||||
'f10cbdedf47dc7a9668d2264494e1823',
|
||||
'model':
|
||||
'speedyspeech_csmsc.pdmodel',
|
||||
'params':
|
||||
'speedyspeech_csmsc.pdiparams',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
'tones_dict':
|
||||
'tone_id_map.txt',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
# fastspeech2
|
||||
"fastspeech2_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_baker_static_0.4.zip',
|
||||
'md5':
|
||||
'9788cd9745e14c7a5d12d32670b2a5a7',
|
||||
'model':
|
||||
'fastspeech2_csmsc.pdmodel',
|
||||
'params':
|
||||
'fastspeech2_csmsc.pdiparams',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
# pwgan
|
||||
"pwgan_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_baker_static_0.4.zip',
|
||||
'md5':
|
||||
'e3504aed9c5a290be12d1347836d2742',
|
||||
'model':
|
||||
'pwgan_csmsc.pdmodel',
|
||||
'params':
|
||||
'pwgan_csmsc.pdiparams',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
# mb_melgan
|
||||
"mb_melgan_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/mb_melgan/mb_melgan_csmsc_static_0.1.1.zip',
|
||||
'md5':
|
||||
'ac6eee94ba483421d750433f4c3b8d36',
|
||||
'model':
|
||||
'mb_melgan_csmsc.pdmodel',
|
||||
'params':
|
||||
'mb_melgan_csmsc.pdiparams',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
# hifigan
|
||||
"hifigan_csmsc-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_csmsc_static_0.1.1.zip',
|
||||
'md5':
|
||||
'7edd8c436b3a5546b3a7cb8cff9d5a0c',
|
||||
'model':
|
||||
'hifigan_csmsc.pdmodel',
|
||||
'params':
|
||||
'hifigan_csmsc.pdiparams',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
tts_onnx_pretrained_models = {
|
||||
# fastspeech2
|
||||
"fastspeech2_csmsc_onnx-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_csmsc_onnx_0.2.0.zip',
|
||||
'md5':
|
||||
'fd3ad38d83273ad51f0ea4f4abf3ab4e',
|
||||
'ckpt': ['fastspeech2_csmsc.onnx'],
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
"fastspeech2_cnndecoder_csmsc_onnx-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_cnndecoder_csmsc_streaming_onnx_1.0.0.zip',
|
||||
'md5':
|
||||
'5f70e1a6bcd29d72d54e7931aa86f266',
|
||||
'ckpt': [
|
||||
'fastspeech2_csmsc_am_encoder_infer.onnx',
|
||||
'fastspeech2_csmsc_am_decoder.onnx',
|
||||
'fastspeech2_csmsc_am_postnet.onnx',
|
||||
],
|
||||
'speech_stats':
|
||||
'speech_stats.npy',
|
||||
'phones_dict':
|
||||
'phone_id_map.txt',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
# mb_melgan
|
||||
"mb_melgan_csmsc_onnx-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/mb_melgan/mb_melgan_csmsc_onnx_0.2.0.zip',
|
||||
'md5':
|
||||
'5b83ec746e8414bc29032d954ffd07ec',
|
||||
'ckpt':
|
||||
'mb_melgan_csmsc.onnx',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
# hifigan
|
||||
"hifigan_csmsc_onnx-zh": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_csmsc_onnx_0.2.0.zip',
|
||||
'md5':
|
||||
'1a7dc0385875889e46952e50c0994a6b',
|
||||
'ckpt':
|
||||
'hifigan_csmsc.onnx',
|
||||
'sample_rate':
|
||||
24000,
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
# ---------------------------------
|
||||
# ------------ Vector -------------
|
||||
# ---------------------------------
|
||||
vector_dynamic_pretrained_models = {
|
||||
"ecapatdnn_voxceleb12-16k": {
|
||||
'1.0': {
|
||||
'url':
|
||||
'https://paddlespeech.bj.bcebos.com/vector/voxceleb/sv0_ecapa_tdnn_voxceleb12_ckpt_0_2_0.tar.gz',
|
||||
'md5':
|
||||
'cc33023c54ab346cd318408f43fcaf95',
|
||||
'cfg_path':
|
||||
'conf/model.yaml', # the yaml config path
|
||||
'ckpt_path':
|
||||
'model/model', # the format is ${dir}/{model_name},
|
||||
# so the first 'model' is dir, the second 'model' is the name
|
||||
# this means we have a model stored as model/model.pdparams
|
||||
},
|
||||
},
|
||||
}
|
@ -0,0 +1,222 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
import os
|
||||
from collections import OrderedDict
|
||||
from typing import Dict
|
||||
from typing import List
|
||||
from typing import Optional
|
||||
|
||||
from ..cli.utils import download_and_decompress
|
||||
from ..cli.utils import MODEL_HOME
|
||||
from ..utils.dynamic_import import dynamic_import
|
||||
from .model_alias import model_alias
|
||||
|
||||
task_supported = ['asr', 'cls', 'st', 'text', 'tts', 'vector']
|
||||
model_format_supported = ['dynamic', 'static', 'onnx']
|
||||
inference_mode_supported = ['online', 'offline']
|
||||
|
||||
|
||||
class CommonTaskResource:
|
||||
def __init__(self, task: str, model_format: str='dynamic', **kwargs):
|
||||
assert task in task_supported, 'Arg "task" must be one of {}.'.format(
|
||||
task_supported)
|
||||
assert model_format in model_format_supported, 'Arg "model_format" must be one of {}.'.format(
|
||||
model_format_supported)
|
||||
|
||||
self.task = task
|
||||
self.model_format = model_format
|
||||
self.pretrained_models = self._get_pretrained_models()
|
||||
|
||||
if 'inference_mode' in kwargs:
|
||||
assert kwargs[
|
||||
'inference_mode'] in inference_mode_supported, 'Arg "inference_mode" must be one of {}.'.format(
|
||||
inference_mode_supported)
|
||||
self._inference_mode_filter(kwargs['inference_mode'])
|
||||
|
||||
# Initialize after model and version had been set.
|
||||
self.model_tag = None
|
||||
self.version = None
|
||||
self.res_dict = None
|
||||
self.res_dir = None
|
||||
|
||||
if self.task == 'tts':
|
||||
# For vocoder
|
||||
self.voc_model_tag = None
|
||||
self.voc_version = None
|
||||
self.voc_res_dict = None
|
||||
self.voc_res_dir = None
|
||||
|
||||
def set_task_model(self,
|
||||
model_tag: str,
|
||||
model_type: int=0,
|
||||
version: Optional[str]=None):
|
||||
"""Set model tag and version of current task.
|
||||
|
||||
Args:
|
||||
model_tag (str): Model tag.
|
||||
model_type (int): 0 for acoustic model otherwise vocoder in tts task.
|
||||
version (Optional[str], optional): Version of pretrained model. Defaults to None.
|
||||
"""
|
||||
assert model_tag in self.pretrained_models, \
|
||||
"Can't find \"{}\" in resource. Model name must be one of {}".format(model_tag, list(self.pretrained_models.keys()))
|
||||
|
||||
if version is None:
|
||||
version = self._get_default_version(model_tag)
|
||||
|
||||
assert version in self.pretrained_models[model_tag], \
|
||||
"Can't find version \"{}\" in \"{}\". Model name must be one of {}".format(
|
||||
version, model_tag, list(self.pretrained_models[model_tag].keys()))
|
||||
|
||||
if model_type == 0:
|
||||
self.model_tag = model_tag
|
||||
self.version = version
|
||||
self.res_dict = self.pretrained_models[model_tag][version]
|
||||
self.res_dir = self._fetch(self.res_dict,
|
||||
self._get_model_dir(model_type))
|
||||
else:
|
||||
assert self.task == 'tts', 'Vocoder will only be used in tts task.'
|
||||
self.voc_model_tag = model_tag
|
||||
self.voc_version = version
|
||||
self.voc_res_dict = self.pretrained_models[model_tag][version]
|
||||
self.voc_res_dir = self._fetch(self.voc_res_dict,
|
||||
self._get_model_dir(model_type))
|
||||
|
||||
@staticmethod
|
||||
def get_model_class(model_name) -> List[object]:
|
||||
"""Dynamic import model class.
|
||||
Args:
|
||||
model_name (str): Model name.
|
||||
|
||||
Returns:
|
||||
List[object]: Return a list of model class.
|
||||
"""
|
||||
assert model_name in model_alias, 'No model classes found for "{}"'.format(
|
||||
model_name)
|
||||
|
||||
ret = []
|
||||
for import_path in model_alias[model_name]:
|
||||
ret.append(dynamic_import(import_path))
|
||||
|
||||
if len(ret) == 1:
|
||||
return ret[0]
|
||||
else:
|
||||
return ret
|
||||
|
||||
def get_versions(self, model_tag: str) -> List[str]:
|
||||
"""List all available versions.
|
||||
|
||||
Args:
|
||||
model_tag (str): Model tag.
|
||||
|
||||
Returns:
|
||||
List[str]: Version list of model.
|
||||
"""
|
||||
return list(self.pretrained_models[model_tag].keys())
|
||||
|
||||
def _get_default_version(self, model_tag: str) -> str:
|
||||
"""Get default version of model.
|
||||
|
||||
Args:
|
||||
model_tag (str): Model tag.
|
||||
|
||||
Returns:
|
||||
str: Default version.
|
||||
"""
|
||||
return self.get_versions(model_tag)[-1] # get latest version
|
||||
|
||||
def _get_model_dir(self, model_type: int=0) -> os.PathLike:
|
||||
"""Get resource directory.
|
||||
|
||||
Args:
|
||||
model_type (int): 0 for acoustic model otherwise vocoder in tts task.
|
||||
|
||||
Returns:
|
||||
os.PathLike: Directory of model resource.
|
||||
"""
|
||||
if model_type == 0:
|
||||
model_tag = self.model_tag
|
||||
version = self.version
|
||||
else:
|
||||
model_tag = self.voc_model_tag
|
||||
version = self.voc_version
|
||||
|
||||
return os.path.join(MODEL_HOME, model_tag, version)
|
||||
|
||||
def _get_pretrained_models(self) -> Dict[str, str]:
|
||||
"""Get all available models for current task.
|
||||
|
||||
Returns:
|
||||
Dict[str, str]: A dictionary with model tag and resources info.
|
||||
"""
|
||||
try:
|
||||
import_models = '{}_{}_pretrained_models'.format(self.task,
|
||||
self.model_format)
|
||||
exec('from .pretrained_models import {}'.format(import_models))
|
||||
models = OrderedDict(locals()[import_models])
|
||||
except ImportError:
|
||||
models = OrderedDict({}) # no models.
|
||||
finally:
|
||||
return models
|
||||
|
||||
def _inference_mode_filter(self, inference_mode: Optional[str]):
|
||||
"""Filter models dict based on inference_mode.
|
||||
|
||||
Args:
|
||||
inference_mode (Optional[str]): 'online', 'offline' or None.
|
||||
"""
|
||||
if inference_mode is None:
|
||||
return
|
||||
|
||||
if self.task == 'asr':
|
||||
online_flags = [
|
||||
'online' in model_tag
|
||||
for model_tag in self.pretrained_models.keys()
|
||||
]
|
||||
for online_flag, model_tag in zip(
|
||||
online_flags, list(self.pretrained_models.keys())):
|
||||
if inference_mode == 'online' and online_flag:
|
||||
continue
|
||||
elif inference_mode == 'offline' and not online_flag:
|
||||
continue
|
||||
else:
|
||||
del self.pretrained_models[model_tag]
|
||||
elif self.task == 'tts':
|
||||
# Hardcode for tts online models.
|
||||
tts_online_models = [
|
||||
'fastspeech2_csmsc-zh', 'fastspeech2_cnndecoder_csmsc-zh',
|
||||
'mb_melgan_csmsc-zh', 'hifigan_csmsc-zh'
|
||||
]
|
||||
for model_tag in list(self.pretrained_models.keys()):
|
||||
if inference_mode == 'online' and model_tag in tts_online_models:
|
||||
continue
|
||||
elif inference_mode == 'offline':
|
||||
continue
|
||||
else:
|
||||
del self.pretrained_models[model_tag]
|
||||
else:
|
||||
raise NotImplementedError('Only supports asr and tts task.')
|
||||
|
||||
@staticmethod
def _fetch(res_dict: Dict[str, str],
           target_dir: os.PathLike) -> os.PathLike:
    """Fetch the archive of a resource and return where it ends up.

    The work is delegated entirely to ``download_and_decompress``.

    Args:
        res_dict (Dict[str, str]): Info dict of a resource.
        target_dir (os.PathLike): Directory to save archives.

    Returns:
        os.PathLike: Directory of model resource.
    """
    resource_dir = download_and_decompress(res_dict, target_dir)
    return resource_dir
|
@ -1,70 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry mapping each model tag to its resource info (one key/value pair
# per line).
pretrained_models = {
    'deepspeech2online_aishell-zh-16k': {
        'url': 'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_online_aishell_fbank161_ckpt_0.2.1.model.tar.gz',
        'md5': '98b87b171b7240b7cae6e07d8d0bc9be',
        'cfg_path': 'model.yaml',
        'ckpt_path': 'exp/deepspeech2_online/checkpoints/avg_1',
        'model': 'exp/deepspeech2_online/checkpoints/avg_1.jit.pdmodel',
        'params': 'exp/deepspeech2_online/checkpoints/avg_1.jit.pdiparams',
        'lm_url': 'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
        'lm_md5': '29e02312deb2e59b3c8686c7966d4fe3',
    },
    'conformer_online_multicn-zh-16k': {
        'url': 'https://paddlespeech.bj.bcebos.com/s2t/multi_cn/asr1/asr1_chunk_conformer_multi_cn_ckpt_0.2.3.model.tar.gz',
        'md5': '0ac93d390552336f2a906aec9e33c5fa',
        'cfg_path': 'model.yaml',
        'ckpt_path': 'exp/chunk_conformer/checkpoints/multi_cn',
        'model': 'exp/chunk_conformer/checkpoints/multi_cn.pdparams',
        'params': 'exp/chunk_conformer/checkpoints/multi_cn.pdparams',
        'lm_url': 'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
        'lm_md5': '29e02312deb2e59b3c8686c7966d4fe3',
    },
    'conformer_online_wenetspeech-zh-16k': {
        'url': 'https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr1/asr1_chunk_conformer_wenetspeech_ckpt_1.0.0a.model.tar.gz',
        'md5': 'b8c02632b04da34aca88459835be54a6',
        'cfg_path': 'model.yaml',
        'ckpt_path': 'exp/chunk_conformer/checkpoints/avg_10',
        'model': 'exp/chunk_conformer/checkpoints/avg_10.pdparams',
        'params': 'exp/chunk_conformer/checkpoints/avg_10.pdparams',
        # This entry carries empty language-model fields.
        'lm_url': '',
        'lm_md5': '',
    },
}
|
@ -1,34 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry mapping each model tag to its resource info (one key/value pair
# per line).
pretrained_models = {
    'deepspeech2offline_aishell-zh-16k': {
        'url': 'https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_aishell_ckpt_0.1.1.model.tar.gz',
        'md5': '932c3593d62fe5c741b59b31318aa314',
        'cfg_path': 'model.yaml',
        'ckpt_path': 'exp/deepspeech2/checkpoints/avg_1',
        'model': 'exp/deepspeech2/checkpoints/avg_1.jit.pdmodel',
        'params': 'exp/deepspeech2/checkpoints/avg_1.jit.pdiparams',
        'lm_url': 'https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm',
        'lm_md5': '29e02312deb2e59b3c8686c7966d4fe3',
    },
}
|
@ -1,58 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
# Registry mapping each model tag to its resource info. The three entries
# differ only in archive url and md5.
pretrained_models = {
    'panns_cnn6-32k': {
        'url': 'https://paddlespeech.bj.bcebos.com/cls/inference_model/panns_cnn6_static.tar.gz',
        'md5': 'da087c31046d23281d8ec5188c1967da',
        'cfg_path': 'panns.yaml',
        'model_path': 'inference.pdmodel',
        'params_path': 'inference.pdiparams',
        'label_file': 'audioset_labels.txt',
    },
    'panns_cnn10-32k': {
        'url': 'https://paddlespeech.bj.bcebos.com/cls/inference_model/panns_cnn10_static.tar.gz',
        'md5': '5460cc6eafbfaf0f261cc75b90284ae1',
        'cfg_path': 'panns.yaml',
        'model_path': 'inference.pdmodel',
        'params_path': 'inference.pdiparams',
        'label_file': 'audioset_labels.txt',
    },
    'panns_cnn14-32k': {
        'url': 'https://paddlespeech.bj.bcebos.com/cls/inference_model/panns_cnn14_static.tar.gz',
        'md5': 'ccc80b194821274da79466862b2ab00f',
        'cfg_path': 'panns.yaml',
        'model_path': 'inference.pdmodel',
        'params_path': 'inference.pdiparams',
        'label_file': 'audioset_labels.txt',
    },
}
|
@ -1,69 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
# Models that support online inference.
pretrained_models = {
    # fastspeech2 entries
    'fastspeech2_csmsc_onnx-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_csmsc_onnx_0.2.0.zip',
        'md5': 'fd3ad38d83273ad51f0ea4f4abf3ab4e',
        'ckpt': ['fastspeech2_csmsc.onnx'],
        'phones_dict': 'phone_id_map.txt',
        'sample_rate': 24000,
    },
    'fastspeech2_cnndecoder_csmsc_onnx-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_cnndecoder_csmsc_streaming_onnx_1.0.0.zip',
        'md5': '5f70e1a6bcd29d72d54e7931aa86f266',
        'ckpt': [
            'fastspeech2_csmsc_am_encoder_infer.onnx',
            'fastspeech2_csmsc_am_decoder.onnx',
            'fastspeech2_csmsc_am_postnet.onnx',
        ],
        'speech_stats': 'speech_stats.npy',
        'phones_dict': 'phone_id_map.txt',
        'sample_rate': 24000,
    },

    # mb_melgan entry ('ckpt' is a plain string here, not a list)
    'mb_melgan_csmsc_onnx-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/mb_melgan/mb_melgan_csmsc_onnx_0.2.0.zip',
        'md5': '5b83ec746e8414bc29032d954ffd07ec',
        'ckpt': 'mb_melgan_csmsc.onnx',
        'sample_rate': 24000,
    },

    # hifigan entry ('ckpt' is a plain string here, not a list)
    'hifigan_csmsc_onnx-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_csmsc_onnx_0.2.0.zip',
        'md5': '1a7dc0385875889e46952e50c0994a6b',
        'ckpt': 'hifigan_csmsc.onnx',
        'sample_rate': 24000,
    },
}
|
@ -1,73 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
# Models that support online inference.
pretrained_models = {
    # fastspeech2 entries
    'fastspeech2_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_baker_ckpt_0.4.zip',
        'md5': '637d28a5e53aa60275612ba4393d5f22',
        'config': 'default.yaml',
        'ckpt': 'snapshot_iter_76000.pdz',
        'speech_stats': 'speech_stats.npy',
        'phones_dict': 'phone_id_map.txt',
    },
    'fastspeech2_cnndecoder_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_cnndecoder_csmsc_ckpt_1.0.0.zip',
        'md5': '6eb28e22ace73e0ebe7845f86478f89f',
        'config': 'cnndecoder.yaml',
        'ckpt': 'snapshot_iter_153000.pdz',
        'speech_stats': 'speech_stats.npy',
        'phones_dict': 'phone_id_map.txt',
    },

    # mb_melgan entry
    'mb_melgan_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/mb_melgan/mb_melgan_csmsc_ckpt_0.1.1.zip',
        'md5': 'ee5f0604e20091f0d495b6ec4618b90d',
        'config': 'default.yaml',
        'ckpt': 'snapshot_iter_1000000.pdz',
        'speech_stats': 'feats_stats.npy',
    },

    # hifigan entry
    'hifigan_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_csmsc_ckpt_0.1.1.zip',
        'md5': 'dd40a3d88dfcf64513fba2f0f961ada6',
        'config': 'default.yaml',
        'ckpt': 'snapshot_iter_2500000.pdz',
        'speech_stats': 'feats_stats.npy',
    },
}
|
@ -1,87 +0,0 @@
|
||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
# Static models applied on paddle inference.
pretrained_models = {
    # speedyspeech entry
    'speedyspeech_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/speedyspeech/speedyspeech_nosil_baker_static_0.5.zip',
        'md5': 'f10cbdedf47dc7a9668d2264494e1823',
        'model': 'speedyspeech_csmsc.pdmodel',
        'params': 'speedyspeech_csmsc.pdiparams',
        'phones_dict': 'phone_id_map.txt',
        'tones_dict': 'tone_id_map.txt',
        'sample_rate': 24000,
    },
    # fastspeech2 entry
    'fastspeech2_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/fastspeech2/fastspeech2_nosil_baker_static_0.4.zip',
        'md5': '9788cd9745e14c7a5d12d32670b2a5a7',
        'model': 'fastspeech2_csmsc.pdmodel',
        'params': 'fastspeech2_csmsc.pdiparams',
        'phones_dict': 'phone_id_map.txt',
        'sample_rate': 24000,
    },
    # pwgan entry
    'pwgan_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/pwgan/pwg_baker_static_0.4.zip',
        'md5': 'e3504aed9c5a290be12d1347836d2742',
        'model': 'pwgan_csmsc.pdmodel',
        'params': 'pwgan_csmsc.pdiparams',
        'sample_rate': 24000,
    },
    # mb_melgan entry
    'mb_melgan_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/mb_melgan/mb_melgan_csmsc_static_0.1.1.zip',
        'md5': 'ac6eee94ba483421d750433f4c3b8d36',
        'model': 'mb_melgan_csmsc.pdmodel',
        'params': 'mb_melgan_csmsc.pdiparams',
        'sample_rate': 24000,
    },
    # hifigan entry
    'hifigan_csmsc-zh': {
        'url': 'https://paddlespeech.bj.bcebos.com/Parakeet/released_models/hifigan/hifigan_csmsc_static_0.1.1.zip',
        'md5': '7edd8c436b3a5546b3a7cb8cff9d5a0c',
        'model': 'hifigan_csmsc.pdmodel',
        'params': 'hifigan_csmsc.pdiparams',
        'sample_rate': 24000,
    },
}
|
Loading…
Reference in new issue