PaddleSpeech/paddlespeech/server/restful/request.py

# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from typing import Optional

from pydantic import BaseModel

# Names exported by a star-import of this module. TextRequest and
# VectorScoreRequest are public request models defined below and are
# listed alongside the others so the export list matches the module.
__all__ = [
    'ASRRequest',
    'TTSRequest',
    'CLSRequest',
    'TextRequest',
    'VectorRequest',
    'VectorScoreRequest',
]


#****************************************************************************************/
#************************************ ASR request ***************************************/
#****************************************************************************************/
class ASRRequest(BaseModel):
    """Request body model for ASR requests.

    ``audio``, ``audio_format``, ``sample_rate`` and ``lang`` are required;
    ``punc`` is optional and defaults to ``None``.

    request body example
    {
        "audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",
        "audio_format": "wav",
        "sample_rate": 16000,
        "lang": "zh_cn",
        "punc":false
    }
    """
    # Audio payload carried as a string.
    # NOTE(review): the example value looks base64-encoded — confirm with the handler.
    audio: str
    # Audio container/format name, e.g. "wav" in the example above.
    audio_format: str
    # Sample rate as an integer, e.g. 16000 in the example above.
    sample_rate: int
    # Language tag, e.g. "zh_cn" in the example above.
    lang: str
    # Optional boolean flag; None when the client omits it.
    # NOTE(review): presumably toggles punctuation — confirm with the handler.
    punc: Optional[bool] = None


#****************************************************************************************/
#************************************ TTS request ***************************************/
#****************************************************************************************/
class TTSRequest(BaseModel):
    """TTS request

    Only ``text`` is required; every other field has a default and may be
    omitted from the request body.

    request body example
    {
        "text": "你好，欢迎使用百度飞桨语音合成服务。",
        "spk_id": 0,
        "speed": 1.0,
        "volume": 1.0,
        "sample_rate": 0,
        "save_path": "./tts.wav"
    }

    The sample ``text`` value means "Hello, welcome to the Baidu PaddlePaddle
    speech synthesis service."
    """

    # Text to process (required).
    text: str
    # Integer speaker id; defaults to 0.
    spk_id: int = 0
    # Floating-point speed value; defaults to 1.0.
    speed: float = 1.0
    # Floating-point volume value; defaults to 1.0.
    volume: float = 1.0
    # Integer sample rate; defaults to 0.
    # NOTE(review): the meaning of 0 is not visible here — confirm with the handler.
    sample_rate: int = 0
    # Declared Optional because the default is None, so an explicit null in
    # the request body validates the same way as omitting the field.
    save_path: Optional[str] = None


#****************************************************************************************/
#************************************ CLS request ***************************************/
#****************************************************************************************/
class CLSRequest(BaseModel):
    """Request body model for CLS requests.

    ``audio`` is required; ``topk`` defaults to 1.

    request body example
    {
        "audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",
        "topk": 1
    }
    """
    # Audio payload carried as a string.
    # NOTE(review): the example value looks base64-encoded — confirm with the handler.
    audio: str
    # Integer defaulting to 1.
    # NOTE(review): presumably the number of top results to return — confirm.
    topk: int = 1


#****************************************************************************************/
#************************************ Text request **************************************/
#****************************************************************************************/
class TextRequest(BaseModel):
    """Request body model carrying a single required ``text`` string."""
    # Input text (required).
    text: str


#****************************************************************************************/
#************************************ Vector request ************************************/
#****************************************************************************************/
class VectorRequest(BaseModel):
    """Request body model for vector requests on a single audio input.

    All four fields are required.

    request body example
    {
        "audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",
        "task": "spk",
        "audio_format": "wav",
        "sample_rate": 16000
    }
    """
    # Audio payload carried as a string.
    # NOTE(review): the example value looks base64-encoded — confirm with the handler.
    audio: str
    # Task name, e.g. "spk" in the example above.
    task: str
    # Audio container/format name, e.g. "wav" in the example above.
    audio_format: str
    # Sample rate as an integer, e.g. 16000 in the example above.
    sample_rate: int


class VectorScoreRequest(BaseModel):
    """Request body model for vector requests on a pair of audio inputs.

    All five fields are required.

    request body example
    {
        "enroll_audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",
        "test_audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",
        "task": "spk",
        "audio_format": "wav",
        "sample_rate": 16000
    }
    """
    # First audio payload carried as a string.
    # NOTE(review): presumably the enrollment/reference audio — confirm with the handler.
    enroll_audio: str
    # Second audio payload carried as a string.
    # NOTE(review): presumably the audio compared against enroll_audio — confirm.
    test_audio: str
    # Task name, e.g. "spk" in the example above.
    task: str
    # Audio container/format name, e.g. "wav" in the example above.
    audio_format: str
    # Sample rate as an integer, e.g. 16000 in the example above.
    sample_rate: int
servert dir arch 3 years ago			`# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`
add tts server, test=tts 3 years ago			`from typing import Optional`
servert dir arch 3 years ago
			`from pydantic import BaseModel`

add vector server, test=doc 3 years ago			`__all__ = ['ASRRequest', 'TTSRequest', 'CLSRequest', 'VectorRequest']`
servert dir arch 3 years ago

			`#****************************************************************************************/`
			`#********************************** ASR request *************************************/`
			`#****************************************************************************************/`
			`class ASRRequest(BaseModel):`
			`"""`
			`request body example`
			`{`
			`"audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",`
			`"audio_format": "wav",`
			`"sample_rate": 16000,`
added engine framework (#1383) 3 years ago			`"lang": "zh_cn",`
added asr engine and fixed bugs, test=doc 3 years ago			`"punc":false`
servert dir arch 3 years ago			`}`
			`"""`
			`audio: str`
			`audio_format: str`
			`sample_rate: int`
			`lang: str`
added asr engine and fixed bugs, test=doc 3 years ago			`punc: Optional[bool] = None`
servert dir arch 3 years ago

			`#****************************************************************************************/`
			`#********************************** TTS request *************************************/`
			`#****************************************************************************************/`
			`class TTSRequest(BaseModel):`
add tts server, test=tts 3 years ago			`"""TTS request`

servert dir arch 3 years ago			`request body example`
			`{`
add tts server, test=tts 3 years ago			`"text": "你好，欢迎使用百度飞桨语音合成服务。",`
			`"spk_id": 0,`
			`"speed": 1.0,`
			`"volume": 1.0,`
			`"sample_rate": 0,`
add postproces, test=doc 3 years ago			`"tts_audio_path": "./tts.wav"`
servert dir arch 3 years ago			`}`
add tts server, test=tts 3 years ago
			`"""`

			`text: str`
			`spk_id: int = 0`
			`speed: float = 1.0`
			`volume: float = 1.0`
			`sample_rate: int = 0`
			`save_path: str = None`
add server cls, test=doc 3 years ago

			`#****************************************************************************************/`
			`#********************************** CLS request *************************************/`
			`#****************************************************************************************/`
			`class CLSRequest(BaseModel):`
			`"""`
			`request body example`
			`{`
			`"audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",`
			`"topk": 1`
			`}`
			`"""`
			`audio: str`
			`topk: int = 1`
add text punc server, test=doc 3 years ago

			`#****************************************************************************************/`
			`#********************************** Text request ************************************/`
			`#****************************************************************************************/`
			`class TextRequest(BaseModel):`
			`text: str`
add vector server, test=doc 3 years ago

			`#****************************************************************************************/`
			`#********************************** Vector request **********************************/`
			`#****************************************************************************************/`
			`class VectorRequest(BaseModel):`
			`"""`
			`request body example`
			`{`
			`"audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",`
			`"task": "spk",`
			`"audio_format": "wav",`
			`"sample_rate": 16000,`
			`}`
			`"""`
			`audio: str`
			`task: str`
			`audio_format: str`
			`sample_rate: int`


			`class VectorScoreRequest(BaseModel):`
			`"""`
			`request body example`
			`{`
			`"enroll_audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",`
			`"test_audio": "exSI6ICJlbiIsCgkgICAgInBvc2l0aW9uIjogImZhbHNlIgoJf...",`
			`"task": "spk",`
			`"audio_format": "wav",`
			`"sample_rate": 16000,`
			`}`
			`"""`
			`enroll_audio: str`
			`test_audio: str`
			`task: str`
			`audio_format: str`
			`sample_rate: int`