From 73aa29062673d9a20cf9a4d1fa0601f61641bc7f Mon Sep 17 00:00:00 2001 From: Hui Zhang Date: Thu, 21 Apr 2022 08:04:57 +0000 Subject: [PATCH] update speechx install doc,test=doc --- speechx/README.md | 5 +++-- speechx/build.sh | 2 +- speechx/examples/ds2_ol/websocket/websocket_client_main.cc | 2 +- speechx/examples/ds2_ol/websocket/websocket_server_main.cc | 2 +- 4 files changed, 6 insertions(+), 5 deletions(-) diff --git a/speechx/README.md b/speechx/README.md index 610b88a8..34a66278 100644 --- a/speechx/README.md +++ b/speechx/README.md @@ -3,7 +3,7 @@ ## Environment We develop under: -* docker - registry.baidubce.com/paddlepaddle/paddle:2.1.1-gpu-cuda10.2-cudnn7 +* docker - `registry.baidubce.com/paddlepaddle/paddle:2.2.2-gpu-cuda10.2-cudnn7` * os - Ubuntu 16.04.7 LTS * gcc/g++/gfortran - 8.2.0 * cmake - 3.16.0 @@ -19,7 +19,7 @@ We develop under: 1. First to launch docker container. ``` -nvidia-docker run --privileged --net=host --ipc=host -it --rm -v $PWD:/workspace --name=dev registry.baidubce.com/paddlepaddle/paddle:2.1.1-gpu-cuda10.2-cudnn7 /bin/bash +docker run --privileged --net=host --ipc=host -it --rm -v $PWD:/workspace --name=dev registry.baidubce.com/paddlepaddle/paddle:2.2.2-gpu-cuda10.2-cudnn7 /bin/bash ``` * More `Paddle` docker images you can see [here](https://www.paddlepaddle.org.cn/install/quick?docurl=/documentation/docs/zh/install/docker/linux-docker.html). @@ -60,4 +60,5 @@ popd ## TODO +### Deepspeech2 with linear feature * DecibelNormalizer: there is a little bit difference between offline and online db norm. The computation of online db norm read feature chunk by chunk, which causes the feature size is different with offline db norm. In normalizer.cc:73, the samples.size() is different, which causes the difference of result. diff --git a/speechx/build.sh b/speechx/build.sh index 8e36d233..a6eef656 100755 --- a/speechx/build.sh +++ b/speechx/build.sh @@ -22,6 +22,6 @@ cd build cmake .. -DBOOST_ROOT:STRING=${boost_SOURCE_DIR} #cmake .. -make -j10 +make -j cd - diff --git a/speechx/examples/ds2_ol/websocket/websocket_client_main.cc b/speechx/examples/ds2_ol/websocket/websocket_client_main.cc index 68ea898a..d6f0d480 100644 --- a/speechx/examples/ds2_ol/websocket/websocket_client_main.cc +++ b/speechx/examples/ds2_ol/websocket/websocket_client_main.cc @@ -18,7 +18,7 @@ #include "kaldi/util/table-types.h" DEFINE_string(host, "127.0.0.1", "host of websocket server"); -DEFINE_int32(port, 201314, "port of websocket server"); +DEFINE_int32(port, 8082, "port of websocket server"); DEFINE_string(wav_rspecifier, "", "test wav scp path"); DEFINE_double(streaming_chunk, 0.1, "streaming feature chunk size"); diff --git a/speechx/examples/ds2_ol/websocket/websocket_server_main.cc b/speechx/examples/ds2_ol/websocket/websocket_server_main.cc index 43cbd6bb..109da96b 100644 --- a/speechx/examples/ds2_ol/websocket/websocket_server_main.cc +++ b/speechx/examples/ds2_ol/websocket/websocket_server_main.cc @@ -15,7 +15,7 @@ #include "websocket/websocket_server.h" #include "decoder/param.h" -DEFINE_int32(port, 201314, "websocket listening port"); +DEFINE_int32(port, 8082, "websocket listening port"); int main(int argc, char *argv[]) { gflags::ParseCommandLineFlags(&argc, &argv, false);