[engine] add wfst recognizer in example (#3173)
* update wfst script * add skip blank
pull/3198/head
parent
5e2251afda
commit
8c2196ea0c
@ -0,0 +1,36 @@
|
||||
#!/bin/bash
# Run recognizer_main (fbank features, ONNX model, no decoding graph) over the
# wav list aishell_test.scp in $nj parallel jobs, merge the per-job results
# and score them against $data/test/text with compute-wer.py.
#
# Outputs:
#   $data/split${nj}/JOB/recognizer.fd.log      per-job log
#   $data/split${nj}/JOB/recognizer.fd.rsl.ark  per-job recognition result
#   $exp/aishell.recognizer.fd.rsl              merged recognition result
#   $exp/aishell.recognizer.fd.err              compute-wer.py report
set -e

# Defaults. They are set before parse_options.sh is sourced; presumably they
# can be overridden with --data/--exp/--nj (Kaldi-style option parsing —
# confirm against utils/parse_options.sh).
data=data
exp=exp
nj=20

. utils/parse_options.sh

mkdir -p -- "$exp"

# NOTE(review): the checkpoint directory is hard-coded and does not follow
# $data. The trailing slash on model_dir is kept as-is because the value is
# passed verbatim to --model_path.
ckpt_dir=./data/model
model_dir=$ckpt_dir/onnx_model/
aishell_wav_scp=aishell_test.scp
text=$data/test/text

# The per-job wav lists read below live in $data/split${nj}/JOB/; presumably
# split_data.sh is what creates them — confirm against local/split_data.sh.
./local/split_data.sh "$data" "$data/$aishell_wav_scp" "$aishell_wav_scp" "$nj"

# All expansions are quoted so that overridden paths containing whitespace or
# glob characters reach run.pl as single arguments.
utils/run.pl "JOB=1:$nj" "$data/split${nj}/JOB/recognizer.fd.log" \
  recognizer_main \
  --use_fbank=true \
  --num_bins=80 \
  --model_path="$model_dir" \
  --word_symbol_table="$model_dir/unit.txt" \
  --nnet_decoder_chunk=16 \
  --receptive_field_length=7 \
  --subsampling_rate=4 \
  --with_onnx_model=true \
  --wav_rspecifier="scp:$data/split${nj}/JOB/${aishell_wav_scp}" \
  --result_wspecifier="ark,t:$data/split${nj}/JOB/recognizer.fd.rsl.ark"

# Merge every job's result; the glob is left outside the quotes on purpose so
# it still expands over the job directories.
cat -- "$data/split${nj}"/*/recognizer.fd.rsl.ark > "$exp/aishell.recognizer.fd.rsl"
utils/compute-wer.py --char=1 --v=1 "$text" "$exp/aishell.recognizer.fd.rsl" > "$exp/aishell.recognizer.fd.err"

echo "recognizer fd test have finished!!!"
echo "please checkout in $exp/aishell.recognizer.fd.err"
# Show the last lines of the report.
tail -n 7 -- "$exp/aishell.recognizer.fd.err"
|
@ -0,0 +1,51 @@
|
||||
#!/bin/bash
# Run recognizer_main with a TLG decoding graph over the wav list
# aishell_test.scp in $nj parallel jobs, merge the per-job results and score
# them against $data/test/text with compute-wer.py. If the graph file is
# missing, a prebuilt tlg.zip is downloaded and unpacked into the lang dir.
#
# Outputs:
#   $data/split${nj}/JOB/recognizer_wfst_fd.log         per-job log
#   $data/split${nj}/JOB/result_recognizer_wfst_fd.ark  per-job result
#   $exp/aishell_recognizer_wfst_fd                     merged result
#   $exp/aishell.recognizer_wfst_fd.err                 compute-wer.py report
set -e

# Defaults. They are set before parse_options.sh is sourced; presumably they
# can be overridden with --data/--exp/--nj (Kaldi-style option parsing —
# confirm against utils/parse_options.sh).
data=data
exp=exp
nj=20

. utils/parse_options.sh

mkdir -p -- "$exp"

# NOTE(review): the checkpoint and lang directories are hard-coded and do not
# follow $data. Trailing slashes are kept as-is because the values are passed
# verbatim to recognizer_main.
ckpt_dir=./data/model
model_dir=$ckpt_dir/onnx_model/
aishell_wav_scp=aishell_test.scp
text=$data/test/text

# The per-job wav lists read below live in $data/split${nj}/JOB/; presumably
# split_data.sh is what creates them — confirm against local/split_data.sh.
./local/split_data.sh "$data" "$data/$aishell_wav_scp" "$aishell_wav_scp" "$nj"

lang_dir=./data/lang_test/
graph=$lang_dir/TLG.fst
word_table=$lang_dir/words.txt

if [[ ! -f "$graph" ]]; then
  # download ngram, if you want to make graph by yourself, please refer local/run_build_tlg.sh
  mkdir -p -- "$lang_dir"
  pushd "$lang_dir"
  # -c resumes a partially downloaded archive instead of starting over.
  wget -c https://paddlespeech.bj.bcebos.com/speechx/examples/ngram/zh/tlg.zip
  unzip tlg.zip
  popd
fi

# All expansions are quoted so that overridden paths containing whitespace or
# glob characters reach run.pl as single arguments. --graph_path uses $graph,
# which expands to the same path the existence check above tested.
# NOTE(review): unlike the non-WFST recognizer script, --with_onnx_model=true
# is not passed here although model_dir points at onnx_model/ — confirm this
# is intended.
utils/run.pl "JOB=1:$nj" "$data/split${nj}/JOB/recognizer_wfst_fd.log" \
  recognizer_main \
  --use_fbank=true \
  --num_bins=80 \
  --model_path="$model_dir" \
  --graph_path="$graph" \
  --word_symbol_table="$word_table" \
  --nnet_decoder_chunk=16 \
  --receptive_field_length=7 \
  --subsampling_rate=4 \
  --wav_rspecifier="scp:$data/split${nj}/JOB/${aishell_wav_scp}" \
  --rescoring_weight=0.0 \
  --acoustic_scale=2 \
  --result_wspecifier="ark,t:$data/split${nj}/JOB/result_recognizer_wfst_fd.ark"

# Merge every job's result; the glob is left outside the quotes on purpose so
# it still expands over the job directories.
cat -- "$data/split${nj}"/*/result_recognizer_wfst_fd.ark > "$exp/aishell_recognizer_wfst_fd"
utils/compute-wer.py --char=1 --v=1 "$text" "$exp/aishell_recognizer_wfst_fd" > "$exp/aishell.recognizer_wfst_fd.err"

echo "recognizer test have finished!!!"
echo "please checkout in $exp/aishell.recognizer_wfst_fd.err"
# Show the last lines of the report.
tail -n 7 -- "$exp/aishell.recognizer_wfst_fd.err"
|
Loading…
Reference in new issue