parent
a1f5db8d7f
commit
98f0806353
@ -0,0 +1,9 @@
|
|||||||
|
# PaddleSpeech Command Line
|
||||||
|
|
||||||
|
The simplest approach to use PaddleSpeech models.
|
||||||
|
|
||||||
|
## Help
|
||||||
|
`paddlespeech help`
|
||||||
|
|
||||||
|
## S2T
|
||||||
|
`paddlespeech s2t --config ./s2t.yaml --input ./zh.wav --device gpu`
|
@ -0,0 +1,16 @@
|
|||||||
|
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
from .base_commands import BaseCommand
|
||||||
|
from .base_commands import HelpCommand
|
||||||
|
from .s2t import S2TExecutor
|
@ -0,0 +1,49 @@
|
|||||||
|
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
from typing import List
|
||||||
|
|
||||||
|
from .entry import commands
|
||||||
|
from .utils import cli_register
|
||||||
|
from .utils import get_command
|
||||||
|
|
||||||
|
__all__ = [
|
||||||
|
'BaseCommand',
|
||||||
|
'HelpCommand',
|
||||||
|
]
|
||||||
|
|
||||||
|
|
||||||
|
@cli_register(name='paddlespeech')
|
||||||
|
class BaseCommand:
|
||||||
|
def execute(self, argv: List[str]) -> bool:
|
||||||
|
help = get_command('paddlespeech.help')
|
||||||
|
return help().execute(argv)
|
||||||
|
|
||||||
|
|
||||||
|
@cli_register(name='paddlespeech.help', description='Show help for commands.')
|
||||||
|
class HelpCommand:
|
||||||
|
def execute(self, argv: List[str]) -> bool:
|
||||||
|
msg = 'Usage:\n'
|
||||||
|
msg += ' paddlespeech <command> <options>\n\n'
|
||||||
|
msg += 'Commands:\n'
|
||||||
|
for command, detail in commands['paddlespeech'].items():
|
||||||
|
if command.startswith('_'):
|
||||||
|
continue
|
||||||
|
|
||||||
|
if '_description' not in detail:
|
||||||
|
continue
|
||||||
|
msg += ' {:<15} {}\n'.format(command,
|
||||||
|
detail['_description'])
|
||||||
|
|
||||||
|
print(msg)
|
||||||
|
return True
|
@ -0,0 +1,38 @@
|
|||||||
|
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
import sys
|
||||||
|
from collections import defaultdict
|
||||||
|
|
||||||
|
__all__ = ['commands']
|
||||||
|
|
||||||
|
|
||||||
|
def _CommandDict():
|
||||||
|
return defaultdict(_CommandDict)
|
||||||
|
|
||||||
|
|
||||||
|
def _execute():
|
||||||
|
com = commands
|
||||||
|
for idx, _argv in enumerate(['paddlespeech'] + sys.argv[1:]):
|
||||||
|
if _argv not in com:
|
||||||
|
break
|
||||||
|
com = com[_argv]
|
||||||
|
|
||||||
|
# The method 'execute' of a command instance returns 'True' for a success
|
||||||
|
# while 'False' for a failure. Here converts this result into a exit status
|
||||||
|
# in bash: 0 for a success and 1 for a failure.
|
||||||
|
status = 0 if com['_entry']().execute(sys.argv[idx:]) else 1
|
||||||
|
return status
|
||||||
|
|
||||||
|
|
||||||
|
commands = _CommandDict()
|
@ -0,0 +1,67 @@
|
|||||||
|
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
import os
|
||||||
|
from abc import ABC
|
||||||
|
from abc import abstractmethod
|
||||||
|
from typing import Optional
|
||||||
|
from typing import Union
|
||||||
|
|
||||||
|
import paddle
|
||||||
|
|
||||||
|
|
||||||
|
class BaseExecutor(ABC):
|
||||||
|
"""
|
||||||
|
An abstract executor of paddlespeech tasks.
|
||||||
|
"""
|
||||||
|
|
||||||
|
def __init__(self):
|
||||||
|
self.input = None
|
||||||
|
self.output = None
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def _get_default_cfg_path(self):
|
||||||
|
"""
|
||||||
|
Returns a default config file path of current task.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def _init_from_cfg(self, cfg_path: Optional[os.PathLike]=None):
|
||||||
|
"""
|
||||||
|
Init model from a specific config file.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def preprocess(self, input: Union[str, os.PathLike]):
|
||||||
|
"""
|
||||||
|
Input preprocess and return paddle.Tensor stored in self.input.
|
||||||
|
Input content can be a text(t2s), a file(s2t, cls) or a streaming(not supported yet).
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
@paddle.no_grad()
|
||||||
|
@abstractmethod
|
||||||
|
def infer(self, device: str):
|
||||||
|
"""
|
||||||
|
Model inference and result stored in self.output.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def postprocess(self) -> Union[str, os.PathLike]:
|
||||||
|
"""
|
||||||
|
Output postprocess and return human-readable results such as texts and audio files.
|
||||||
|
"""
|
||||||
|
pass
|
@ -0,0 +1,14 @@
|
|||||||
|
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
from .infer import S2TExecutor
|
@ -0,0 +1,102 @@
|
|||||||
|
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
import argparse
|
||||||
|
import os
|
||||||
|
from typing import List
|
||||||
|
from typing import Optional
|
||||||
|
from typing import Union
|
||||||
|
|
||||||
|
import paddle
|
||||||
|
|
||||||
|
from ..executor import BaseExecutor
|
||||||
|
from ..utils import cli_register
|
||||||
|
|
||||||
|
__all__ = ['S2TExecutor']
|
||||||
|
|
||||||
|
|
||||||
|
@cli_register(name='paddlespeech.s2t', description='Asr infer command.')
|
||||||
|
class S2TExecutor(BaseExecutor):
|
||||||
|
def __init__(self):
|
||||||
|
super(S2TExecutor, self).__init__()
|
||||||
|
|
||||||
|
self.parser = argparse.ArgumentParser(
|
||||||
|
prog='paddlespeech.s2t', add_help=True)
|
||||||
|
self.parser.add_argument(
|
||||||
|
'--config',
|
||||||
|
type=str,
|
||||||
|
default=None,
|
||||||
|
help='Config of s2t task. Use deault config when it is None.')
|
||||||
|
self.parser.add_argument(
|
||||||
|
'--input', type=str, help='Audio file to recognize.')
|
||||||
|
self.parser.add_argument(
|
||||||
|
'--device',
|
||||||
|
type=str,
|
||||||
|
default='cpu',
|
||||||
|
help='Choose device to execute model inference.')
|
||||||
|
|
||||||
|
def _get_default_cfg_path(self):
|
||||||
|
"""
|
||||||
|
Returns a default config file path of current task.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
def _init_from_cfg(self, cfg_path: Optional[os.PathLike]=None):
|
||||||
|
"""
|
||||||
|
Init model from a specific config file.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
def preprocess(self, input: Union[str, os.PathLike]):
|
||||||
|
"""
|
||||||
|
Input preprocess and return paddle.Tensor stored in self.input.
|
||||||
|
Input content can be a text(t2s), a file(s2t, cls) or a streaming(not supported yet).
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
@paddle.no_grad()
|
||||||
|
def infer(self):
|
||||||
|
"""
|
||||||
|
Model inference and result stored in self.output.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
def postprocess(self) -> Union[str, os.PathLike]:
|
||||||
|
"""
|
||||||
|
Output postprocess and return human-readable results such as texts and audio files.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
def execute(self, argv: List[str]) -> bool:
|
||||||
|
parser_args = self.parser.parse_args(argv)
|
||||||
|
print(parser_args)
|
||||||
|
|
||||||
|
config = parser_args.config
|
||||||
|
audio_file = parser_args.input
|
||||||
|
device = parser_args.device
|
||||||
|
|
||||||
|
if config is not None:
|
||||||
|
assert os.path.isfile(config), 'Config file is not valid.'
|
||||||
|
else:
|
||||||
|
config = self._get_default_cfg_path()
|
||||||
|
|
||||||
|
try:
|
||||||
|
self._init_from_cfg(config)
|
||||||
|
self.preprocess(audio_file)
|
||||||
|
self.infer()
|
||||||
|
res = self.postprocess() # Retrieve result of s2t.
|
||||||
|
print(res)
|
||||||
|
return True
|
||||||
|
except Exception as e:
|
||||||
|
print(e)
|
||||||
|
return False
|
@ -0,0 +1,86 @@
|
|||||||
|
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
import os
|
||||||
|
from typing import Any
|
||||||
|
from typing import Dict
|
||||||
|
from typing import List
|
||||||
|
|
||||||
|
from paddle.framework import load
|
||||||
|
from paddle.utils import download
|
||||||
|
|
||||||
|
from .entry import commands
|
||||||
|
|
||||||
|
__all__ = [
|
||||||
|
'cli_register',
|
||||||
|
'get_command',
|
||||||
|
'download_and_decompress',
|
||||||
|
'load_state_dict_from_url',
|
||||||
|
]
|
||||||
|
|
||||||
|
|
||||||
|
def cli_register(name: str, description: str='') -> Any:
|
||||||
|
def _warpper(command):
|
||||||
|
items = name.split('.')
|
||||||
|
|
||||||
|
com = commands
|
||||||
|
for item in items:
|
||||||
|
com = com[item]
|
||||||
|
com['_entry'] = command
|
||||||
|
if description:
|
||||||
|
com['_description'] = description
|
||||||
|
return command
|
||||||
|
|
||||||
|
return _warpper
|
||||||
|
|
||||||
|
|
||||||
|
def get_command(name: str) -> Any:
|
||||||
|
items = name.split('.')
|
||||||
|
com = commands
|
||||||
|
for item in items:
|
||||||
|
com = com[item]
|
||||||
|
|
||||||
|
return com['_entry']
|
||||||
|
|
||||||
|
|
||||||
|
def decompress(file: str):
|
||||||
|
"""
|
||||||
|
Extracts all files from a compressed file.
|
||||||
|
"""
|
||||||
|
assert os.path.isfile(file), "File: {} not exists.".format(file)
|
||||||
|
download._decompress(file)
|
||||||
|
|
||||||
|
|
||||||
|
def download_and_decompress(archives: List[Dict[str, str]], path: str):
|
||||||
|
"""
|
||||||
|
Download archieves and decompress to specific path.
|
||||||
|
"""
|
||||||
|
if not os.path.isdir(path):
|
||||||
|
os.makedirs(path)
|
||||||
|
|
||||||
|
for archive in archives:
|
||||||
|
assert 'url' in archive and 'md5' in archive, \
|
||||||
|
'Dictionary keys of "url" and "md5" are required in the archive, but got: {list(archieve.keys())}'
|
||||||
|
|
||||||
|
download.get_path_from_url(archive['url'], path, archive['md5'])
|
||||||
|
|
||||||
|
|
||||||
|
def load_state_dict_from_url(url: str, path: str, md5: str=None):
|
||||||
|
"""
|
||||||
|
Download and load a state dict from url
|
||||||
|
"""
|
||||||
|
if not os.path.isdir(path):
|
||||||
|
os.makedirs(path)
|
||||||
|
|
||||||
|
download.get_path_from_url(url, path, md5)
|
||||||
|
return load(os.path.join(path, os.path.basename(url)))
|
Loading…
Reference in new issue