parent
15b25199c2
commit
7be6b0e8cf
@ -1,77 +0,0 @@
|
|||||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
|
||||||
#
|
|
||||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
||||||
# you may not use this file except in compliance with the License.
|
|
||||||
# You may obtain a copy of the License at
|
|
||||||
#
|
|
||||||
# http://www.apache.org/licenses/LICENSE-2.0
|
|
||||||
#
|
|
||||||
# Unless required by applicable law or agreed to in writing, software
|
|
||||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
||||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
||||||
# See the License for the specific language governing permissions and
|
|
||||||
# limitations under the License.
|
|
||||||
import argparse
|
|
||||||
|
|
||||||
import uvicorn
|
|
||||||
from fastapi import FastAPI
|
|
||||||
|
|
||||||
from paddlespeech.server.engine.engine_pool import init_engine_pool
|
|
||||||
from paddlespeech.server.restful.api import setup_router as setup_http_router
|
|
||||||
from paddlespeech.server.utils.config import get_config
|
|
||||||
from paddlespeech.server.ws.api import setup_router as setup_ws_router
|
|
||||||
|
|
||||||
# Module-level FastAPI application object; init() attaches the protocol
# router to it and main() hands it to uvicorn.
app = FastAPI(
    title="PaddleSpeech Serving API",
    description="Api",
    version="0.0.1",
)
|
|
||||||
|
|
||||||
|
|
||||||
def init(config):
    """Initialize the serving application.

    Builds the API router that matches ``config.protocol``, registers it on
    the module-level ``app``, and then initializes the engine pool.

    Args:
        config (CfgNode): config object. ``config.engine_list`` and
            ``config.protocol`` are read here; the whole object is passed
            on to ``init_engine_pool``.

    Returns:
        bool: True when ``init_engine_pool`` reports success, False otherwise.

    Raises:
        ValueError: if ``config.protocol`` is neither "websocket" nor "http".
    """
    # Only the part of each engine name before the first underscore is used
    # to select the API routes.
    api_list = [engine.split("_")[0] for engine in config.engine_list]

    if config.protocol == "websocket":
        api_router = setup_ws_router(api_list)
    elif config.protocol == "http":
        api_router = setup_http_router(api_list)
    else:
        # ValueError is still an Exception, so existing broad handlers keep
        # working; the offending value is included to ease diagnosis.
        raise ValueError(f"unsupported protocol: {config.protocol}")
    app.include_router(api_router)

    return bool(init_engine_pool(config))
|
|
||||||
|
|
||||||
|
|
||||||
def main(args):
    """Load the configuration and start the server.

    Args:
        args (argparse.Namespace): parsed command-line options; only
            ``args.config_file`` is read here.

    The server is started only when ``init`` returns True; otherwise the
    function returns without running uvicorn.
    """
    config = get_config(args.config_file)

    if init(config):
        # The ``debug`` option is intentionally not passed: newer uvicorn
        # releases no longer accept it and raise TypeError on start-up.
        uvicorn.run(app, host=config.host, port=config.port)
|
|
||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
    # Script entry point: collect the command-line options and hand them
    # to main().
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "--config_file",
        default="./conf/application.yaml",
        help="yaml file of the app",
        action="store")
    # NOTE(review): --log_file is accepted, but nothing in the visible code
    # reads args.log_file.
    parser.add_argument(
        "--log_file",
        default="./log/paddlespeech.log",
        help="log file",
        action="store")
    args = parser.parse_args()

    main(args)
|
|
@ -1,110 +0,0 @@
|
|||||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
|
||||||
#
|
|
||||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
||||||
# you may not use this file except in compliance with the License.
|
|
||||||
# You may obtain a copy of the License at
|
|
||||||
#
|
|
||||||
# http://www.apache.org/licenses/LICENSE-2.0
|
|
||||||
#
|
|
||||||
# Unless required by applicable law or agreed to in writing, software
|
|
||||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
||||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
||||||
# See the License for the specific language governing permissions and
|
|
||||||
# limitations under the License.
|
|
||||||
import json
|
|
||||||
|
|
||||||
from fastapi import APIRouter
|
|
||||||
from fastapi import WebSocket
|
|
||||||
from fastapi import WebSocketDisconnect
|
|
||||||
from starlette.websockets import WebSocketState as WebSocketState
|
|
||||||
|
|
||||||
from paddlespeech.server.engine.asr.online.asr_engine import PaddleASRConnectionHanddler
|
|
||||||
from paddlespeech.server.engine.engine_pool import get_engine_pool
|
|
||||||
|
|
||||||
# Router on which the streaming ASR websocket endpoint below is registered.
router = APIRouter()
|
|
||||||
|
|
||||||
|
|
||||||
@router.websocket('/paddlespeech/asr/streaming')
async def websocket_endpoint(websocket: WebSocket):
    """PaddleSpeech online (streaming) ASR websocket endpoint.

    Protocol, as implemented below:

    * A text frame carries a JSON object with a ``signal`` key.
      ``"start"`` creates the per-connection handler and is answered with
      ``server_ready``. ``"end"`` finalizes decoding, sends the final result
      together with the word time stamps, and ends the session loop.
      Anything else is answered with a "no valid json data" message.
    * A binary frame carries audio data. It is fed to the handler and the
      current result is sent back.

    Frames that need the handler before ``start`` was received are answered
    with an error message instead of crashing the connection.

    Args:
        websocket (WebSocket): the websocket instance
    """
    # 1. Accept the websocket handshake to establish the connection.
    await websocket.accept()

    # 2. Fetch the online ASR engine from the engine pool.
    engine_pool = get_engine_pool()
    asr_engine = engine_pool['asr']

    # 3. Each connection gets its own PaddleASRConnectionHanddler, created
    #    only once the client sends the start signal.
    connection_handler = None

    invalid_resp = {"status": "ok", "message": "no valid json data"}
    not_started_resp = {
        "status": "failed",
        "message": "the start signal must be sent first"
    }

    try:
        # 4. Process the stream frame by frame until the client sends the
        #    end signal.
        while True:
            # Mirrors what starlette's receive helpers do internally, so
            # text and binary frames can both be handled in one loop.
            assert websocket.application_state == WebSocketState.CONNECTED
            message = await websocket.receive()
            websocket._raise_on_disconnect(message)

            # 4.1 Text frames carry commands, binary frames carry audio.
            #     A key may be present with a None value, so test the value
            #     rather than the key.
            if message.get("text") is not None:
                try:
                    command = json.loads(message["text"])
                except json.JSONDecodeError:
                    command = None

                # Reject anything that is not a JSON object with a signal,
                # then keep waiting for the next frame.
                if not isinstance(command, dict) or 'signal' not in command:
                    await websocket.send_json(invalid_resp)
                    continue

                signal = command['signal']
                if signal == 'start':
                    resp = {"status": "ok", "signal": "server_ready"}
                    # Create the instance that processes this connection's
                    # audio.
                    connection_handler = PaddleASRConnectionHanddler(
                        asr_engine)
                    await websocket.send_json(resp)
                elif signal == 'end':
                    if connection_handler is None:
                        # Nothing to finalize: no session was started.
                        await websocket.send_json(not_started_resp)
                        continue

                    # Flush the remaining audio, collect the final result,
                    # then reset the handler before leaving the loop.
                    connection_handler.decode(is_finished=True)
                    connection_handler.rescoring()
                    asr_results = connection_handler.get_result()
                    word_time_stamp = connection_handler.get_word_time_stamp()
                    connection_handler.reset()

                    resp = {
                        "status": "ok",
                        "signal": "finished",
                        'result': asr_results,
                        'times': word_time_stamp
                    }
                    await websocket.send_json(resp)
                    break
                else:
                    await websocket.send_json(invalid_resp)
            elif message.get("bytes") is not None:
                if connection_handler is None:
                    # Audio arrived before the start signal.
                    await websocket.send_json(not_started_resp)
                    continue

                # Feed this package to the handler and decode it.
                connection_handler.extract_feat(message["bytes"])
                connection_handler.decode(is_finished=False)
                asr_results = connection_handler.get_result()

                # Return the result for the current period; one connection
                # may produce many of these.
                resp = {'result': asr_results}
                await websocket.send_json(resp)
    except WebSocketDisconnect:
        # The client went away; there is nobody left to answer.
        pass
|
|
@ -1,61 +0,0 @@
|
|||||||
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
|
|
||||||
#
|
|
||||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
||||||
# you may not use this file except in compliance with the License.
|
|
||||||
# You may obtain a copy of the License at
|
|
||||||
#
|
|
||||||
# http://www.apache.org/licenses/LICENSE-2.0
|
|
||||||
#
|
|
||||||
# Unless required by applicable law or agreed to in writing, software
|
|
||||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
||||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
||||||
# See the License for the specific language governing permissions and
|
|
||||||
# limitations under the License.
|
|
||||||
import json
|
|
||||||
|
|
||||||
from fastapi import APIRouter
|
|
||||||
from fastapi import WebSocket
|
|
||||||
from fastapi import WebSocketDisconnect
|
|
||||||
from starlette.websockets import WebSocketState as WebSocketState
|
|
||||||
|
|
||||||
from paddlespeech.cli.log import logger
|
|
||||||
from paddlespeech.server.engine.engine_pool import get_engine_pool
|
|
||||||
|
|
||||||
# Router on which the streaming TTS websocket endpoint below is registered.
router = APIRouter()
|
|
||||||
|
|
||||||
|
|
||||||
@router.websocket('/paddlespeech/tts/streaming')
async def websocket_endpoint(websocket: WebSocket):
    """PaddleSpeech streaming TTS websocket endpoint.

    Reads a single request frame whose text payload is a JSON object with a
    ``text`` field, passes that field to the TTS engine, and streams every
    item the engine yields as ``{"status": 1, "audio": item}``. A final
    ``{"status": 2, "audio": ''}`` message marks the end of the stream.

    Args:
        websocket (WebSocket): the websocket instance
    """
    await websocket.accept()

    try:
        # Mirrors what starlette's receive helpers do internally.
        assert websocket.application_state == WebSocketState.CONNECTED
        message = await websocket.receive()
        websocket._raise_on_disconnect(message)

        # Get the TTS engine from the engine pool.
        engine_pool = get_engine_pool()
        tts_engine = engine_pool['tts']

        # Parse the request and convert its payload to the sentence to
        # synthesize (presumably base64-encoded text, judging by the
        # keyword name expected by the engine).
        request = json.loads(message["text"])
        sentence = tts_engine.preprocess(text_bese64=request["text"])

        # Stream each synthesized chunk as soon as the engine yields it.
        for tts_results in tts_engine.run(sentence):
            resp = {"status": 1, "audio": tts_results}
            await websocket.send_json(resp)

        # Tell the client that no more audio will follow.
        resp = {"status": 2, "audio": ''}
        await websocket.send_json(resp)
        logger.info("Complete the transmission of audio streams")

    except WebSocketDisconnect:
        # The client went away; there is nobody left to answer.
        pass
|
|
Loading…
Reference in new issue