# PaddleSpeech/paddlespeech/server/bin/paddlespeech_client.py

# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import argparse
import asyncio
import base64
import io
import json
import os
import random
import time
from typing import List

import numpy as np
import requests
import soundfile

from ..executor import BaseExecutor
from ..util import cli_client_register
from ..util import stats_wrapper
from paddlespeech.cli.log import logger
from paddlespeech.server.utils.audio_handler import ASRWsAudioHandler
from paddlespeech.server.utils.audio_process import wav2pcm
from paddlespeech.server.utils.util import wav2base64

# Names exported by a star-import of this module.
# NOTE(review): TextClientExecutor is defined further down in this module but
# is not listed here — confirm whether that omission is intentional.
__all__ = [
    'TTSClientExecutor', 'TTSOnlineClientExecutor', 'ASRClientExecutor',
    'CLSClientExecutor'
]


@cli_client_register(
    name='paddlespeech_client.tts', description='visit tts service')
class TTSClientExecutor(BaseExecutor):
    """Client for the HTTP text-to-speech endpoint ``/paddlespeech/tts``.

    Usable from the command line (via ``execute``) or as a Python callable
    (via ``__call__``).
    """

    def __init__(self):
        super(TTSClientExecutor, self).__init__()
        self.parser = argparse.ArgumentParser(
            prog='paddlespeech_client.tts', add_help=True)
        self.parser.add_argument(
            '--server_ip', type=str, default='127.0.0.1', help='server ip')
        self.parser.add_argument(
            '--port', type=int, default=8090, help='server port')
        self.parser.add_argument(
            '--input',
            type=str,
            default=None,
            help='Text to be synthesized.',
            required=True)
        self.parser.add_argument(
            '--spk_id', type=int, default=0, help='Speaker id')
        self.parser.add_argument(
            '--speed',
            type=float,
            default=1.0,
            help='Audio speed, the value should be set between 0 and 3')
        self.parser.add_argument(
            '--volume',
            type=float,
            default=1.0,
            help='Audio volume, the value should be set between 0 and 3')
        self.parser.add_argument(
            '--sample_rate',
            type=int,
            default=0,
            choices=[0, 8000, 16000],
            help='Sampling rate, the default is the same as the model')
        self.parser.add_argument(
            '--output', type=str, default=None, help='Synthesized audio file')

    def postprocess(self, wav_base64: str, outfile: str) -> None:
        """Decode base64 audio and save it as a ``.wav`` or ``.pcm`` file.

        Args:
            wav_base64 (str): base64 encoded audio as returned by the server.
            outfile (str): destination path; the suffix selects the format.
                Any suffix other than ``.wav`` / ``.pcm`` only logs an error.
        """
        audio_data_byte = base64.b64decode(wav_base64)
        # from byte
        samples, sample_rate = soundfile.read(
            io.BytesIO(audio_data_byte), dtype='float32')

        # transform audio
        if outfile.endswith(".wav"):
            soundfile.write(outfile, samples, sample_rate)
        elif outfile.endswith(".pcm"):
            # wav2pcm works on files, so go through a temporary wav file.
            temp_wav = str(random.getrandbits(128)) + ".wav"
            try:
                soundfile.write(temp_wav, samples, sample_rate)
                wav2pcm(temp_wav, outfile, data_type=np.int16)
            finally:
                # Remove the temporary file without spawning a shell; this is
                # portable and also runs when the conversion fails.
                if os.path.exists(temp_wav):
                    os.remove(temp_wav)
        else:
            logger.error("The format for saving audio only supports wav or pcm")

    def execute(self, argv: List[str]) -> bool:
        """Command-line entry point.

        Args:
            argv (List[str]): command-line arguments (without program name).

        Returns:
            bool: True when the request succeeded, False otherwise.
        """
        args = self.parser.parse_args(argv)
        input_ = args.input
        server_ip = args.server_ip
        port = args.port
        spk_id = args.spk_id
        speed = args.speed
        volume = args.volume
        sample_rate = args.sample_rate
        output = args.output

        try:
            time_start = time.time()
            res = self(
                input=input_,
                server_ip=server_ip,
                port=port,
                spk_id=spk_id,
                speed=speed,
                volume=volume,
                sample_rate=sample_rate,
                output=output)
            time_end = time.time()
            time_consume = time_end - time_start
            response_dict = res.json()
            logger.info(response_dict["message"])
            # Nothing is written locally when no output path was requested.
            if output is not None:
                logger.info(
                    "Save synthesized audio successfully on %s." % (output))
            logger.info("Audio duration: %f s." %
                        (response_dict['result']['duration']))
            logger.info("Response time: %f s." % (time_consume))
            return True
        except Exception as e:
            logger.error("Failed to synthesized audio.")
            # Surface the cause instead of swallowing it silently.
            logger.error(e)
            return False

    @stats_wrapper
    def __call__(self,
                 input: str,
                 server_ip: str="127.0.0.1",
                 port: int=8090,
                 spk_id: int=0,
                 speed: float=1.0,
                 volume: float=1.0,
                 sample_rate: int=0,
                 output: str=None):
        """Python API: send a synthesis request to the TTS server.

        Args:
            input (str): text to be synthesized.
            server_ip (str, optional): server ip. Defaults to "127.0.0.1".
            port (int, optional): server port. Defaults to 8090.
            spk_id (int, optional): speaker id. Defaults to 0.
            speed (float, optional): audio speed. Defaults to 1.0.
            volume (float, optional): audio volume. Defaults to 1.0.
            sample_rate (int, optional): sampling rate. Defaults to 0.
            output (str, optional): path of the audio file to write locally;
                it is also sent to the server as ``save_path``. Nothing is
                written locally when it is None. Defaults to None.

        Returns:
            The response object returned by ``requests.post``.
        """

        url = 'http://' + server_ip + ":" + str(port) + '/paddlespeech/tts'
        request = {
            "text": input,
            "spk_id": spk_id,
            "speed": speed,
            "volume": volume,
            "sample_rate": sample_rate,
            "save_path": output
        }

        res = requests.post(url, json.dumps(request))
        response_dict = res.json()
        if output is not None:
            self.postprocess(response_dict["result"]["audio"], output)
        return res


@cli_client_register(
    name='paddlespeech_client.tts_online',
    description='visit tts online service')
class TTSOnlineClientExecutor(BaseExecutor):
    """Client for the streaming TTS service over http or websocket."""

    def __init__(self):
        super(TTSOnlineClientExecutor, self).__init__()
        self.parser = argparse.ArgumentParser(
            prog='paddlespeech_client.tts_online', add_help=True)
        self.parser.add_argument(
            '--server_ip', type=str, default='127.0.0.1', help='server ip')
        self.parser.add_argument(
            '--port', type=int, default=8092, help='server port')
        self.parser.add_argument(
            '--protocol',
            type=str,
            default="http",
            choices=["http", "websocket"],
            help='server protocol')
        self.parser.add_argument(
            '--input',
            type=str,
            default=None,
            help='Text to be synthesized.',
            required=True)
        self.parser.add_argument(
            '--spk_id', type=int, default=0, help='Speaker id')
        self.parser.add_argument(
            '--speed',
            type=float,
            default=1.0,
            help='Audio speed, the value should be set between 0 and 3')
        self.parser.add_argument(
            '--volume',
            type=float,
            default=1.0,
            help='Audio volume, the value should be set between 0 and 3')
        self.parser.add_argument(
            '--sample_rate',
            type=int,
            default=0,
            choices=[0, 8000, 16000],
            help='Sampling rate, the default is the same as the model')
        self.parser.add_argument(
            '--output', type=str, default=None, help='Synthesized audio file')
        # `type=bool` would turn every non-empty string (including "False")
        # into True, so parse the textual value explicitly.
        self.parser.add_argument(
            "--play",
            type=self._str2bool,
            help="whether to play audio",
            default=False)

    @staticmethod
    def _str2bool(value: str) -> bool:
        """Convert a command-line string such as "True"/"false"/"1" to bool.

        Raises:
            argparse.ArgumentTypeError: if the text is not a boolean word.
        """
        lowered = value.strip().lower()
        if lowered in ("true", "t", "yes", "y", "1"):
            return True
        if lowered in ("false", "f", "no", "n", "0", ""):
            return False
        raise argparse.ArgumentTypeError(
            "Boolean value expected, got %r" % (value))

    def execute(self, argv: List[str]) -> bool:
        """Command-line entry point.

        Args:
            argv (List[str]): command-line arguments (without program name).

        Returns:
            bool: True when the call finished without raising, else False.
        """
        args = self.parser.parse_args(argv)
        input_ = args.input
        server_ip = args.server_ip
        port = args.port
        protocol = args.protocol
        spk_id = args.spk_id
        speed = args.speed
        volume = args.volume
        sample_rate = args.sample_rate
        output = args.output
        play = args.play

        try:
            self(
                input=input_,
                server_ip=server_ip,
                port=port,
                protocol=protocol,
                spk_id=spk_id,
                speed=speed,
                volume=volume,
                sample_rate=sample_rate,
                output=output,
                play=play)
            return True
        except Exception as e:
            logger.error("Failed to synthesized audio.")
            # Surface the cause instead of swallowing it silently.
            logger.error(e)
            return False

    @stats_wrapper
    def __call__(self,
                 input: str,
                 server_ip: str="127.0.0.1",
                 port: int=8092,
                 protocol: str="http",
                 spk_id: int=0,
                 speed: float=1.0,
                 volume: float=1.0,
                 sample_rate: int=0,
                 output: str=None,
                 play: bool=False):
        """Python API: run a streaming synthesis request.

        Args:
            input (str): text to be synthesized.
            server_ip (str, optional): server ip. Defaults to "127.0.0.1".
            port (int, optional): server port. Defaults to 8092.
            protocol (str, optional): "http" or "websocket"; any other value
                only logs an error. Defaults to "http".
            spk_id (int, optional): speaker id (passed to the http handler
                only). Defaults to 0.
            speed (float, optional): audio speed (http only). Defaults to 1.0.
            volume (float, optional): audio volume (http only).
                Defaults to 1.0.
            sample_rate (int, optional): sampling rate (http only).
                Defaults to 0.
            output (str, optional): output audio file, forwarded to the
                handler. Defaults to None.
            play (bool, optional): forwarded to the handler constructor.
                Defaults to False.
        """

        if protocol == "http":
            logger.info("tts http client start")
            from paddlespeech.server.utils.audio_handler import TTSHttpHandler
            handler = TTSHttpHandler(server_ip, port, play)
            handler.run(input, spk_id, speed, volume, sample_rate, output)

        elif protocol == "websocket":
            from paddlespeech.server.utils.audio_handler import TTSWsHandler
            logger.info("tts websocket client start")
            handler = TTSWsHandler(server_ip, port, play)
            # handler.run is awaited to completion on the event loop.
            loop = asyncio.get_event_loop()
            loop.run_until_complete(handler.run(input, output))

        else:
            logger.error("Please set correct protocol, http or websocket")


@cli_client_register(
    name='paddlespeech_client.asr', description='visit asr service')
class ASRClientExecutor(BaseExecutor):
    """Client for the ASR service over http or websocket."""

    def __init__(self):
        super(ASRClientExecutor, self).__init__()
        self.parser = argparse.ArgumentParser(
            prog='paddlespeech_client.asr', add_help=True)
        self.parser.add_argument(
            '--server_ip', type=str, default='127.0.0.1', help='server ip')
        self.parser.add_argument(
            '--port', type=int, default=8090, help='server port')
        self.parser.add_argument(
            '--input',
            type=str,
            default=None,
            help='Audio file to be recognized',
            required=True)
        self.parser.add_argument(
            '--protocol',
            type=str,
            default="http",
            choices=["http", "websocket"],
            help='server protocol')
        self.parser.add_argument(
            '--sample_rate', type=int, default=16000, help='audio sample rate')
        self.parser.add_argument(
            '--lang', type=str, default="zh_cn", help='language')
        self.parser.add_argument(
            '--audio_format', type=str, default="wav", help='audio format')

        # Dotted option names are stored under explicit `dest` attributes.
        self.parser.add_argument(
            '--punc.server_ip',
            type=str,
            default=None,
            dest="punc_server_ip",
            help='Punctuation server ip')
        self.parser.add_argument(
            '--punc.port',
            type=int,
            default=8091,
            dest="punc_server_port",
            help='Punctuation server port')

    def execute(self, argv: List[str]) -> bool:
        """Command-line entry point.

        Args:
            argv (List[str]): command-line arguments (without program name).

        Returns:
            bool: True when recognition succeeded, False otherwise.
        """
        args = self.parser.parse_args(argv)
        input_ = args.input
        server_ip = args.server_ip
        port = args.port
        sample_rate = args.sample_rate
        lang = args.lang
        audio_format = args.audio_format
        protocol = args.protocol

        try:
            time_start = time.time()
            res = self(
                input=input_,
                server_ip=server_ip,
                port=port,
                sample_rate=sample_rate,
                lang=lang,
                audio_format=audio_format,
                protocol=protocol,
                punc_server_ip=args.punc_server_ip,
                punc_server_port=args.punc_server_port)
            time_end = time.time()
            logger.info(f"ASR result: {res}")
            logger.info("Response time %f s." % (time_end - time_start))
            return True
        except Exception as e:
            logger.error("Failed to speech recognition.")
            logger.error(e)
            return False

    @stats_wrapper
    def __call__(self,
                 input: str,
                 server_ip: str="127.0.0.1",
                 port: int=8090,
                 sample_rate: int=16000,
                 lang: str="zh_cn",
                 audio_format: str="wav",
                 protocol: str="http",
                 punc_server_ip: str="127.0.0.1",
                 punc_server_port: int=8091):
        """Python API to call an executor.

        Args:
            input (str): The input audio file path
            server_ip (str, optional): The ASR server ip. Defaults to "127.0.0.1".
            port (int, optional): The ASR server port. Defaults to 8090.
            sample_rate (int, optional): The audio sample rate. Defaults to 16000.
            lang (str, optional): The audio language type. Defaults to "zh_cn".
            audio_format (str, optional): The audio format information. Defaults to "wav".
            protocol (str, optional): The ASR server protocol, "http" or
                "websocket" (case-insensitive). Defaults to "http".
            punc_server_ip (str, optional): The punctuation server ip, passed
                to the websocket handler only. Defaults to "127.0.0.1".
            punc_server_port (int, optional): The punctuation server port,
                passed to the websocket handler only. Defaults to 8091.

        Returns:
            The ASR result: ``res['result']['transcription']`` for http,
            ``res['result']`` for websocket.

        Raises:
            SystemExit: if ``protocol`` is neither "http" nor "websocket".
        """
        # we use the asr server to recognize the audio text content
        if protocol.lower() == "http":
            from paddlespeech.server.utils.audio_handler import ASRHttpHandler
            logger.info("asr http client start")
            handler = ASRHttpHandler(server_ip=server_ip, port=port)
            res = handler.run(input, audio_format, sample_rate, lang)
            res = res['result']['transcription']
            logger.info("asr http client finished")

        elif protocol.lower() == "websocket":
            logger.info("asr websocket client start")
            handler = ASRWsAudioHandler(
                server_ip,
                port,
                punc_server_ip=punc_server_ip,
                punc_server_port=punc_server_port)
            loop = asyncio.get_event_loop()
            res = loop.run_until_complete(handler.run(input))
            res = res['result']
            logger.info("asr websocket client finished")
        else:
            # `sys` is not among the module-level imports, so import it here;
            # without this the exit call fails with NameError.
            import sys
            logger.error(f"Sorry, we have not support protocol: {protocol},"
                         "please use http or websocket protocol")
            sys.exit(-1)

        return res


@cli_client_register(
    name='paddlespeech_client.cls', description='visit cls service')
class CLSClientExecutor(BaseExecutor):
    """Client for the HTTP audio classification endpoint ``/paddlespeech/cls``."""

    def __init__(self):
        super(CLSClientExecutor, self).__init__()
        self.parser = argparse.ArgumentParser(
            prog='paddlespeech_client.cls', add_help=True)
        self.parser.add_argument(
            '--server_ip', type=str, default='127.0.0.1', help='server ip')
        self.parser.add_argument(
            '--port', type=int, default=8090, help='server port')
        self.parser.add_argument(
            '--input',
            type=str,
            default=None,
            help='Audio file to classify.',
            required=True)
        self.parser.add_argument(
            '--topk',
            type=int,
            default=1,
            help='Return topk scores of classification result.')

    def execute(self, argv: List[str]) -> bool:
        """Command-line entry point.

        Args:
            argv (List[str]): command-line arguments (without program name).

        Returns:
            bool: True when the request succeeded, False otherwise.
        """
        args = self.parser.parse_args(argv)
        input_ = args.input
        server_ip = args.server_ip
        port = args.port
        topk = args.topk

        try:
            time_start = time.time()
            res = self(input=input_, server_ip=server_ip, port=port, topk=topk)
            time_end = time.time()
            logger.info(res.json())
            logger.info("Response time %f s." % (time_end - time_start))
            return True
        except Exception as e:
            logger.error("Failed to speech classification.")
            # Surface the cause instead of swallowing it silently.
            logger.error(e)
            return False

    @stats_wrapper
    def __call__(self,
                 input: str,
                 server_ip: str="127.0.0.1",
                 port: int=8090,
                 topk: int=1):
        """Python API: send an audio file to the classification server.

        Args:
            input (str): path of the audio file to classify.
            server_ip (str, optional): server ip. Defaults to "127.0.0.1".
            port (int, optional): server port. Defaults to 8090.
            topk (int, optional): number of top scores requested.
                Defaults to 1.

        Returns:
            The response object returned by ``requests.post``.
        """

        url = 'http://' + server_ip + ":" + str(port) + '/paddlespeech/cls'
        # The audio file is sent base64-encoded inside the JSON payload.
        audio = wav2base64(input)
        data = {"audio": audio, "topk": topk}

        res = requests.post(url=url, data=json.dumps(data))
        return res


@cli_client_register(
    name='paddlespeech_client.text', description='visit the text service')
class TextClientExecutor(BaseExecutor):
    """Client for the HTTP text (punctuation) endpoint ``/paddlespeech/text``."""

    def __init__(self):
        super(TextClientExecutor, self).__init__()
        self.parser = argparse.ArgumentParser(
            prog='paddlespeech_client.text', add_help=True)
        self.parser.add_argument(
            '--server_ip', type=str, default='127.0.0.1', help='server ip')
        self.parser.add_argument(
            '--port', type=int, default=8090, help='server port')
        self.parser.add_argument(
            '--input',
            type=str,
            default=None,
            help='sentence to be process by text server.',
            required=True)

    def execute(self, argv: List[str]) -> bool:
        """Execute the request from the argv.

        Args:
            argv (List): the request arguments

        Returns:
            bool: True when the request succeeded, False otherwise
        """
        args = self.parser.parse_args(argv)
        input_ = args.input
        server_ip = args.server_ip
        port = args.port
        # No `--output` option is registered on the parser, so it must not be
        # read from `args` (doing so raises AttributeError on every call).

        try:
            time_start = time.time()
            res = self(input=input_, server_ip=server_ip, port=port)
            time_end = time.time()
            logger.info(f"The punc text: {res}")
            logger.info("Response time %f s." % (time_end - time_start))
            return True
        except Exception as e:
            logger.error("Failed to Text punctuation.")
            # Surface the cause instead of swallowing it silently.
            logger.error(e)
            return False

    @stats_wrapper
    def __call__(self, input: str, server_ip: str="127.0.0.1", port: int=8090):
        """
        Python API to call text executor.

        Args:
            input (str): the request sentence text
            server_ip (str, optional): the server ip. Defaults to "127.0.0.1".
            port (int, optional): the server port. Defaults to 8090.

        Returns:
            str: the punctuation text
        """

        url = 'http://' + server_ip + ":" + str(port) + '/paddlespeech/text'
        request = {
            "text": input,
        }

        res = requests.post(url=url, data=json.dumps(request))
        response_dict = res.json()
        # The punctuated sentence is read from result.punc_text of the reply.
        punc_text = response_dict["result"]["punc_text"]
        return punc_text
added engine type and asr inference , test=doc 3 years ago			`# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`
			`import argparse`
format 2 years ago			`import asyncio`
added engine type and asr inference , test=doc 3 years ago			`import base64`
			`import io`
			`import json`
			`import os`
			`import random`
			`import time`
			`from typing import List`

			`import numpy as np`
			`import requests`
			`import soundfile`

add readme, test=doc 3 years ago			`from ..executor import BaseExecutor`
added engine type and asr inference , test=doc 3 years ago			`from ..util import cli_client_register`
add server demo, test=doc 3 years ago			`from ..util import stats_wrapper`
			`from paddlespeech.cli.log import logger`
update the asr server api, test=doc 2 years ago			`from paddlespeech.server.utils.audio_handler import ASRWsAudioHandler`
added engine type and asr inference , test=doc 3 years ago			`from paddlespeech.server.utils.audio_process import wav2pcm`
			`from paddlespeech.server.utils.util import wav2base64`

add streaming asr demo, test=doc 2 years ago			`__all__ = [`
add streaming tts demos, test=doc 2 years ago			`'TTSClientExecutor', 'TTSOnlineClientExecutor', 'ASRClientExecutor',`
asr client add punctuatjion server, test=doc 2 years ago			`'CLSClientExecutor'`
add streaming asr demo, test=doc 2 years ago			`]`
added engine type and asr inference , test=doc 3 years ago

			`@cli_client_register(`
			`name='paddlespeech_client.tts', description='visit tts service')`
add readme, test=doc 3 years ago			`class TTSClientExecutor(BaseExecutor):`
added engine type and asr inference , test=doc 3 years ago			`def __init__(self):`
add server demo, test=doc 3 years ago			`super(TTSClientExecutor, self).__init__()`
			`self.parser = argparse.ArgumentParser(`
			`prog='paddlespeech_client.tts', add_help=True)`
added engine type and asr inference , test=doc 3 years ago			`self.parser.add_argument(`
			`'--server_ip', type=str, default='127.0.0.1', help='server ip')`
			`self.parser.add_argument(`
			`'--port', type=int, default=8090, help='server port')`
			`self.parser.add_argument(`
add readme, test=doc 3 years ago			`'--input',`
added engine type and asr inference , test=doc 3 years ago			`type=str,`
paras required, test=doc 3 years ago			`default=None,`
			`help='Text to be synthesized.',`
			`required=True)`
added engine type and asr inference , test=doc 3 years ago			`self.parser.add_argument(`
			`'--spk_id', type=int, default=0, help='Speaker id')`
			`self.parser.add_argument(`
add server demo, test=doc 3 years ago			`'--speed',`
			`type=float,`
			`default=1.0,`
			`help='Audio speed, the value should be set between 0 and 3')`
added engine type and asr inference , test=doc 3 years ago			`self.parser.add_argument(`
add server demo, test=doc 3 years ago			`'--volume',`
			`type=float,`
			`default=1.0,`
			`help='Audio volume, the value should be set between 0 and 3')`
added engine type and asr inference , test=doc 3 years ago			`self.parser.add_argument(`
			`'--sample_rate',`
			`type=int,`
			`default=0,`
add server demo, test=doc 3 years ago			`choices=[0, 8000, 16000],`
added engine type and asr inference , test=doc 3 years ago			`help='Sampling rate, the default is the same as the model')`
			`self.parser.add_argument(`
modify, test=doc 3 years ago			`'--output', type=str, default=None, help='Synthesized audio file')`
added engine type and asr inference , test=doc 3 years ago
modify, test=doc 3 years ago			`def postprocess(self, wav_base64: str, outfile: str) -> float:`
added engine type and asr inference , test=doc 3 years ago			`audio_data_byte = base64.b64decode(wav_base64)`
			`# from byte`
			`samples, sample_rate = soundfile.read(`
			`io.BytesIO(audio_data_byte), dtype='float32')`

			`# transform audio`
			`if outfile.endswith(".wav"):`
			`soundfile.write(outfile, samples, sample_rate)`
			`elif outfile.endswith(".pcm"):`
			`temp_wav = str(random.getrandbits(128)) + ".wav"`
			`soundfile.write(temp_wav, samples, sample_rate)`
			`wav2pcm(temp_wav, outfile, data_type=np.int16)`
			`os.system("rm %s" % (temp_wav))`
			`else:`
add server demo, test=doc 3 years ago			`logger.error("The format for saving audio only supports wav or pcm")`
added engine type and asr inference , test=doc 3 years ago
			`def execute(self, argv: List[str]) -> bool:`
			`args = self.parser.parse_args(argv)`
modify, test=doc 3 years ago			`input_ = args.input`
			`server_ip = args.server_ip`
			`port = args.port`
			`spk_id = args.spk_id`
			`speed = args.speed`
			`volume = args.volume`
			`sample_rate = args.sample_rate`
			`output = args.output`
add server demo, test=doc 3 years ago
modify, test=doc 3 years ago			`try:`
			`time_start = time.time()`
			`res = self(`
			`input=input_,`
			`server_ip=server_ip,`
			`port=port,`
			`spk_id=spk_id,`
			`speed=speed,`
			`volume=volume,`
			`sample_rate=sample_rate,`
			`output=output)`
			`time_end = time.time()`
			`time_consume = time_end - time_start`
			`response_dict = res.json()`
add server demo, test=doc 3 years ago			`logger.info(response_dict["message"])`
modify, test=doc 3 years ago			`logger.info("Save synthesized audio successfully on %s." % (output))`
			`logger.info("Audio duration: %f s." %`
			`(response_dict['result']['duration']))`
add server demo, test=doc 3 years ago			`logger.info("Response time: %f s." % (time_consume))`
			`return True`
modify, test=doc 3 years ago			`except Exception as e:`
add server demo, test=doc 3 years ago			`logger.error("Failed to synthesized audio.")`
			`return False`

			`@stats_wrapper`
			`def __call__(self,`
			`input: str,`
			`server_ip: str="127.0.0.1",`
			`port: int=8090,`
			`spk_id: int=0,`
			`speed: float=1.0,`
			`volume: float=1.0,`
			`sample_rate: int=0,`
modify, test=doc 3 years ago			`output: str=None):`
add server demo, test=doc 3 years ago			`"""`
			`Python API to call an executor.`
			`"""`

			`url = 'http://' + server_ip + ":" + str(port) + '/paddlespeech/tts'`
			`request = {`
			`"text": input,`
			`"spk_id": spk_id,`
			`"speed": speed,`
			`"volume": volume,`
			`"sample_rate": sample_rate,`
			`"save_path": output`
			`}`

modify, test=doc 3 years ago			`res = requests.post(url, json.dumps(request))`
			`response_dict = res.json()`
Update paddlespeech_client.py 3 years ago			`if output is not None:`
modify, test=doc 3 years ago			`self.postprocess(response_dict["result"]["audio"], output)`
			`return res`
added engine type and asr inference , test=doc 3 years ago

add streaming tts demos, test=doc 2 years ago			`@cli_client_register(`
			`name='paddlespeech_client.tts_online',`
			`description='visit tts online service')`
			`class TTSOnlineClientExecutor(BaseExecutor):`
			`def __init__(self):`
			`super(TTSOnlineClientExecutor, self).__init__()`
			`self.parser = argparse.ArgumentParser(`
			`prog='paddlespeech_client.tts_online', add_help=True)`
			`self.parser.add_argument(`
			`'--server_ip', type=str, default='127.0.0.1', help='server ip')`
			`self.parser.add_argument(`
			`'--port', type=int, default=8092, help='server port')`
			`self.parser.add_argument(`
			`'--protocol',`
			`type=str,`
			`default="http",`
			`choices=["http", "websocket"],`
			`help='server protocol')`
			`self.parser.add_argument(`
			`'--input',`
			`type=str,`
			`default=None,`
			`help='Text to be synthesized.',`
			`required=True)`
			`self.parser.add_argument(`
			`'--spk_id', type=int, default=0, help='Speaker id')`
			`self.parser.add_argument(`
			`'--speed',`
			`type=float,`
			`default=1.0,`
			`help='Audio speed, the value should be set between 0 and 3')`
			`self.parser.add_argument(`
			`'--volume',`
			`type=float,`
			`default=1.0,`
			`help='Audio volume, the value should be set between 0 and 3')`
			`self.parser.add_argument(`
			`'--sample_rate',`
			`type=int,`
			`default=0,`
			`choices=[0, 8000, 16000],`
			`help='Sampling rate, the default is the same as the model')`
			`self.parser.add_argument(`
			`'--output', type=str, default=None, help='Synthesized audio file')`
			`self.parser.add_argument(`
			`"--play", type=bool, help="whether to play audio", default=False)`

			`def execute(self, argv: List[str]) -> bool:`
			`args = self.parser.parse_args(argv)`
			`input_ = args.input`
			`server_ip = args.server_ip`
			`port = args.port`
			`protocol = args.protocol`
			`spk_id = args.spk_id`
			`speed = args.speed`
			`volume = args.volume`
			`sample_rate = args.sample_rate`
			`output = args.output`
			`play = args.play`

			`try:`
			`res = self(`
			`input=input_,`
			`server_ip=server_ip,`
			`port=port,`
			`protocol=protocol,`
			`spk_id=spk_id,`
			`speed=speed,`
			`volume=volume,`
			`sample_rate=sample_rate,`
			`output=output,`
			`play=play)`
			`return True`
			`except Exception as e:`
			`logger.error("Failed to synthesized audio.")`
			`return False`

			`@stats_wrapper`
			`def __call__(self,`
			`input: str,`
			`server_ip: str="127.0.0.1",`
			`port: int=8092,`
			`protocol: str="http",`
			`spk_id: int=0,`
			`speed: float=1.0,`
			`volume: float=1.0,`
			`sample_rate: int=0,`
			`output: str=None,`
			`play: bool=False):`
			`"""`
			`Python API to call an executor.`
			`"""`

			`if protocol == "http":`
			`logger.info("tts http client start")`
			`from paddlespeech.server.utils.audio_handler import TTSHttpHandler`
			`handler = TTSHttpHandler(server_ip, port, play)`
			`handler.run(input, spk_id, speed, volume, sample_rate, output)`

			`elif protocol == "websocket":`
			`from paddlespeech.server.utils.audio_handler import TTSWsHandler`
			`logger.info("tts websocket client start")`
			`handler = TTSWsHandler(server_ip, port, play)`
			`loop = asyncio.get_event_loop()`
			`loop.run_until_complete(handler.run(input, output))`

			`else:`
			`logger.error("Please set correct protocol, http or websocket")`


added engine type and asr inference , test=doc 3 years ago			`@cli_client_register(`
			`name='paddlespeech_client.asr', description='visit asr service')`
add readme, test=doc 3 years ago			`class ASRClientExecutor(BaseExecutor):`
added engine type and asr inference , test=doc 3 years ago			`def __init__(self):`
add server demo, test=doc 3 years ago			`super(ASRClientExecutor, self).__init__()`
			`self.parser = argparse.ArgumentParser(`
			`prog='paddlespeech_client.asr', add_help=True)`
added engine type and asr inference , test=doc 3 years ago			`self.parser.add_argument(`
			`'--server_ip', type=str, default='127.0.0.1', help='server ip')`
			`self.parser.add_argument(`
			`'--port', type=int, default=8090, help='server port')`
			`self.parser.add_argument(`
add readme, test=doc 3 years ago			`'--input',`
added engine type and asr inference , test=doc 3 years ago			`type=str,`
paras required, test=doc 3 years ago			`default=None,`
			`help='Audio file to be recognized',`
			`required=True)`
asr client add punctuatjion server, test=doc 2 years ago			`self.parser.add_argument(`
			`'--protocol',`
			`type=str,`
			`default="http",`
			`choices=["http", "websocket"],`
			`help='server protocol')`
added engine type and asr inference , test=doc 3 years ago			`self.parser.add_argument(`
			`'--sample_rate', type=int, default=16000, help='audio sample rate')`
add readme, test=doc 3 years ago			`self.parser.add_argument(`
			`'--lang', type=str, default="zh_cn", help='language')`
			`self.parser.add_argument(`
			`'--audio_format', type=str, default="wav", help='audio format')`
added engine type and asr inference , test=doc 3 years ago
added online asr doc and online asr command line, test=doc 2 years ago			`self.parser.add_argument(`
asr client add punctuatjion server, test=doc 2 years ago			`'--punc.server_ip',`
added online asr doc and online asr command line, test=doc 2 years ago			`type=str,`
			`default=None,`
asr client add punctuatjion server, test=doc 2 years ago			`dest="punc_server_ip",`
			`help='Punctuation server ip')`
added online asr doc and online asr command line, test=doc 2 years ago			`self.parser.add_argument(`
asr client add punctuatjion server, test=doc 2 years ago			`'--punc.port',`
			`type=int,`
			`default=8091,`
			`dest="punc_server_port",`
			`help='Punctuation server port')`
added online asr doc and online asr command line, test=doc 2 years ago
			`def execute(self, argv: List[str]) -> bool:`
			`args = self.parser.parse_args(argv)`
			`input_ = args.input`
			`server_ip = args.server_ip`
			`port = args.port`
			`sample_rate = args.sample_rate`
			`lang = args.lang`
			`audio_format = args.audio_format`
asr client add punctuatjion server, test=doc 2 years ago			`protocol = args.protocol`
added online asr doc and online asr command line, test=doc 2 years ago
			`try:`
			`time_start = time.time()`
			`res = self(`
			`input=input_,`
			`server_ip=server_ip,`
			`port=port,`
			`sample_rate=sample_rate,`
			`lang=lang,`
asr client add punctuatjion server, test=doc 2 years ago			`audio_format=audio_format,`
			`protocol=protocol,`
			`punc_server_ip=args.punc_server_ip,`
			`punc_server_port=args.punc_server_port)`
added online asr doc and online asr command line, test=doc 2 years ago			`time_end = time.time()`
asr client add punctuatjion server, test=doc 2 years ago			`logger.info(f"ASR result: {res}")`
added online asr doc and online asr command line, test=doc 2 years ago			`logger.info("Response time %f s." % (time_end - time_start))`
			`return True`
			`except Exception as e:`
			`logger.error("Failed to speech recognition.")`
fix the asr online client bug, return None, test=doc 2 years ago			`logger.error(e)`
added online asr doc and online asr command line, test=doc 2 years ago			`return False`

			`@stats_wrapper`
			`def __call__(self,`
			`input: str,`
			`server_ip: str="127.0.0.1",`
asr client add punctuatjion server, test=doc 2 years ago			`port: int=8090,`
added online asr doc and online asr command line, test=doc 2 years ago			`sample_rate: int=16000,`
			`lang: str="zh_cn",`
asr client add punctuatjion server, test=doc 2 years ago			`audio_format: str="wav",`
			`protocol: str="http",`
			`punc_server_ip: str="127.0.0.1",`
			`punc_server_port: int=8091):`
			`"""Python API to call an executor.`

			`Args:`
			`input (str): The input audio file path`
			`server_ip (str, optional): The ASR server ip. Defaults to "127.0.0.1".`
			`port (int, optional): The ASR server port. Defaults to 8090.`
			`sample_rate (int, optional): The audio sample rate. Defaults to 16000.`
			`lang (str, optional): The audio language type. Defaults to "zh_cn".`
			`audio_format (str, optional): The audio format information. Defaults to "wav".`
			`protocol (str, optional): The ASR server. Defaults to "http".`

			`Returns:`
			`str: The ASR results`
added online asr doc and online asr command line, test=doc 2 years ago			`"""`
update the asr server api, test=doc 2 years ago			`# we use the asr server to recognize the audio text content`
asr client add punctuatjion server, test=doc 2 years ago			`if protocol.lower() == "http":`
			`from paddlespeech.server.utils.audio_handler import ASRHttpHandler`
			`logger.info("asr http client start")`
			`handler = ASRHttpHandler(server_ip=server_ip, port=port)`
			`res = handler.run(input, audio_format, sample_rate, lang)`
			`res = res['result']['transcription']`
			`logger.info("asr http client finished")`

			`elif protocol.lower() == "websocket":`
			`logger.info("asr websocket client start")`
update the asr server api, test=doc 2 years ago			`handler = ASRWsAudioHandler(`
asr client add punctuatjion server, test=doc 2 years ago			`server_ip,`
			`port,`
			`punc_server_ip=punc_server_ip,`
			`punc_server_port=punc_server_port)`
			`loop = asyncio.get_event_loop()`
			`res = loop.run_until_complete(handler.run(input))`
update the ws asr response, final_result to result, test=doc 2 years ago			`res = res['result']`
asr client add punctuatjion server, test=doc 2 years ago			`logger.info("asr websocket client finished")`
			`else:`
			`logger.error(f"Sorry, we have not support protocol: {protocol},"`
			`"please use http or websocket protocol")`
			`sys.exit(-1)`

			`return res`
added online asr doc and online asr command line, test=doc 2 years ago
add streaming asr demo, test=doc 2 years ago
@cli_client_register(
    name='paddlespeech_client.cls', description='visit cls service')
class CLSClientExecutor(BaseExecutor):
    """Client for the audio classification (cls) service.

    Usable from the command line through ``execute`` or from Python by calling
    the instance directly.
    """

    def __init__(self):
        super(CLSClientExecutor, self).__init__()
        self.parser = argparse.ArgumentParser(
            prog='paddlespeech_client.cls', add_help=True)
        self.parser.add_argument(
            '--server_ip', type=str, default='127.0.0.1', help='server ip')
        self.parser.add_argument(
            '--port', type=int, default=8090, help='server port')
        self.parser.add_argument(
            '--input',
            type=str,
            default=None,
            help='Audio file to classify.',
            required=True)
        self.parser.add_argument(
            '--topk',
            type=int,
            default=1,
            help='Return topk scores of classification result.')

    def execute(self, argv: List[str]) -> bool:
        """Run one classification request from command-line arguments.

        Args:
            argv (List[str]): The command-line arguments to parse.

        Returns:
            bool: True if the request finished without raising, False otherwise.
        """
        args = self.parser.parse_args(argv)
        input_ = args.input
        server_ip = args.server_ip
        port = args.port
        topk = args.topk

        try:
            time_start = time.time()
            res = self(input=input_, server_ip=server_ip, port=port, topk=topk)
            time_end = time.time()
            logger.info(res.json())
            logger.info("Response time %f s." % (time_end - time_start))
            return True
        except Exception as e:
            logger.error("Failed to speech classification.")
            # Log the cause as well, as the ASR client's execute does, so a
            # failure is diagnosable from the log.
            logger.error(e)
            return False

    @stats_wrapper
    def __call__(self,
                 input: str,
                 server_ip: str="127.0.0.1",
                 port: int=8090,
                 topk: int=1):
        """Python API to call the cls executor.

        Args:
            input (str): The audio file passed to ``wav2base64``.
            server_ip (str, optional): The server ip. Defaults to "127.0.0.1".
            port (int, optional): The server port. Defaults to 8090.
            topk (int, optional): The ``topk`` value sent in the request.
                Defaults to 1.

        Returns:
            The response object returned by ``requests.post``.
        """

        url = 'http://' + server_ip + ":" + str(port) + '/paddlespeech/cls'
        audio = wav2base64(input)
        data = {"audio": audio, "topk": topk}

        # The payload is sent as a JSON-encoded request body.
        res = requests.post(url=url, data=json.dumps(data))
        return res
add text punc server, test=doc 2 years ago

			`@cli_client_register(`
			`name='paddlespeech_client.text', description='visit the text service')`
			`class TextClientExecutor(BaseExecutor):`
			`def __init__(self):`
			`super(TextClientExecutor, self).__init__()`
			`self.parser = argparse.ArgumentParser(`
			`prog='paddlespeech_client.text', add_help=True)`
			`self.parser.add_argument(`
			`'--server_ip', type=str, default='127.0.0.1', help='server ip')`
			`self.parser.add_argument(`
			`'--port', type=int, default=8090, help='server port')`
			`self.parser.add_argument(`
			`'--input',`
			`type=str,`
			`default=None,`
			`help='sentence to be process by text server.',`
			`required=True)`

			`def execute(self, argv: List[str]) -> bool:`
			`"""Execute the request from the argv.`

			`Args:`
			`argv (List): the request arguments`

			`Returns:`
			`str: the request flag`
			`"""`
			`args = self.parser.parse_args(argv)`
			`input_ = args.input`
			`server_ip = args.server_ip`
			`port = args.port`
			`output = args.output`

			`try:`
			`time_start = time.time()`
			`res = self(input=input_, server_ip=server_ip, port=port)`
			`time_end = time.time()`
			`logger.info(f"The punc text: {res}")`
			`logger.info("Response time %f s." % (time_end - time_start))`
			`return True`
			`except Exception as e:`
			`logger.error("Failed to Text punctuation.")`
			`return False`

			`@stats_wrapper`
			`def __call__(self, input: str, server_ip: str="127.0.0.1", port: int=8090):`
			`"""`
			`Python API to call text executor.`

			`Args:`
			`input (str): the request sentence text`
			`server_ip (str, optional): the server ip. Defaults to "127.0.0.1".`
			`port (int, optional): the server port. Defaults to 8090.`

			`Returns:`
			`str: the punctuation text`
			`"""`

			`url = 'http://' + server_ip + ":" + str(port) + '/paddlespeech/text'`
			`request = {`
			`"text": input,`
			`}`

			`res = requests.post(url=url, data=json.dumps(request))`
			`response_dict = res.json()`
			`punc_text = response_dict["result"]["punc_text"]`
			`return punc_text`