diff --git a/speechx/examples/ds2_ol/README.md b/speechx/examples/ds2_ol/README.md
deleted file mode 100644
index d1da96cc9..000000000
--- a/speechx/examples/ds2_ol/README.md
+++ /dev/null
@@ -1,7 +0,0 @@
-# Deepspeech2 Streaming ASR
-
-## Examples
-
-* `websocket` - Streaming ASR with websocket for deepspeech2_aishell.
-* `aishell` - Streaming decoding on the aishell dataset, for local WER tests.
-* `onnx` - Example of converting deepspeech2 to ONNX format.
diff --git a/speechx/examples/ds2_ol/aishell/.gitignore b/speechx/examples/ds2_ol/aishell/.gitignore
deleted file mode 100644
index 68f993b47..000000000
--- a/speechx/examples/ds2_ol/aishell/.gitignore
+++ /dev/null
@@ -1,3 +0,0 @@
-data
-exp
-aishell_*
diff --git a/speechx/examples/ds2_ol/aishell/README.md b/speechx/examples/ds2_ol/aishell/README.md
deleted file mode 100644
index 2ee0bbca9..000000000
--- a/speechx/examples/ds2_ol/aishell/README.md
+++ /dev/null
@@ -1,133 +0,0 @@
-# Aishell - Deepspeech2 Streaming
-
-> We recommend using the U2/U2++ model instead of DS2; please see [here](../../u2pp_ol/wenetspeech/).
-
-A C++ deployment example that uses the deepspeech2 model to recognize `wav` files and compute the `CER`. We use AISHELL-1 as the test data.
-
-## Source path.sh
-
-```bash
-. path.sh
-```
-
-The SpeechX binaries are under `$SPEECHX_BUILD` (run `echo $SPEECHX_BUILD` to see the path); for more info please see `path.sh`.
-
-## Recognize with linear feature
-
-```bash
-bash run.sh
-```
-
-`run.sh` has multiple stages; for details please see `run.sh`:
-
-1. download dataset, model and lm
-2. convert cmvn format and compute feature
-3. decode w/o lm by feature
-4. decode w/ ngram lm by feature
-5. decode w/ TLG graph by feature
-6. recognize w/ TLG graph by wav input
-
-### Recognize with `.scp` file for wav
-
-This script uses `recognizer_main` to recognize wav files.
-
-The input is an `scp` file which looks like this:
-```text
-# head data/split1/1/aishell_test.scp
-BAC009S0764W0121 /workspace/PaddleSpeech/speechx/examples/u2pp_ol/wenetspeech/data/test/S0764/BAC009S0764W0121.wav
-BAC009S0764W0122 /workspace/PaddleSpeech/speechx/examples/u2pp_ol/wenetspeech/data/test/S0764/BAC009S0764W0122.wav
-...
-BAC009S0764W0125 /workspace/PaddleSpeech/speechx/examples/u2pp_ol/wenetspeech/data/test/S0764/BAC009S0764W0125.wav
-```
-
-If you want to recognize one wav, you can make an `scp` file like this:
-```text
-key path/to/wav/file
-```
-
-Then pass it to `recognizer_main` via the `--wav_rspecifier=` flag. For the meaning of the other flags, please see the help:
-```bash
-recognizer_main --help
-```
-
-For an example of using `recognizer_main`, please see `run.sh`; a minimal single-wav sketch follows.
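For quick reference, below is a minimal sketch of recognizing a single wav. The utterance key, wav path, and model/graph locations are placeholders; the real flag values should be copied from stage 5 of `run.sh`:

```bash
# A minimal sketch, assuming the model, CMVN file and TLG graph from run.sh
# have already been downloaded; every path below is a placeholder.
echo "my_utt /path/to/my_utt.wav" > one.scp

recognizer_main \
    --wav_rspecifier=scp:one.scp \
    --cmvn_file=./data/cmvn.ark \
    --model_path=./data/model/avg_1.jit.pdmodel \
    --param_path=./data/model/avg_1.jit.pdiparams \
    --word_symbol_table=./data/wfst/words.txt \
    --graph_path=./data/wfst/TLG.fst \
    --acoustic_scale=1.2 \
    --result_wspecifier=ark,t:./result.txt
```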
-
-
-### CTC Prefix Beam Search w/o LM
-
-```
-Overall -> 16.14 % N=104612 C=88190 S=16110 D=312 I=465
-Mandarin -> 16.14 % N=104612 C=88190 S=16110 D=312 I=465
-Other -> 0.00 % N=0 C=0 S=0 D=0 I=0
-```
-
-### CTC Prefix Beam Search w/ LM
-
-LM: zh_giga.no_cna_cmn.prune01244.klm
-```
-Overall -> 7.86 % N=104768 C=96865 S=7573 D=330 I=327
-Mandarin -> 7.86 % N=104768 C=96865 S=7573 D=330 I=327
-Other -> 0.00 % N=0 C=0 S=0 D=0 I=0
-```
-
-### CTC TLG WFST
-
-LM: [aishell train](http://paddlespeech.bj.bcebos.com/speechx/examples/ds2_ol/aishell/aishell_graph.zip)
---acoustic_scale=1.2
-```
-Overall -> 11.14 % N=103017 C=93363 S=9583 D=71 I=1819
-Mandarin -> 11.14 % N=103017 C=93363 S=9583 D=71 I=1818
-Other -> 0.00 % N=0 C=0 S=0 D=0 I=1
-```
-
-LM: [wenetspeech](http://paddlespeech.bj.bcebos.com/speechx/examples/ds2_ol/aishell/wenetspeech_graph.zip)
---acoustic_scale=1.5
-```
-Overall -> 10.93 % N=104765 C=93410 S=9780 D=1575 I=95
-Mandarin -> 10.93 % N=104762 C=93410 S=9779 D=1573 I=95
-Other -> 100.00 % N=3 C=0 S=1 D=2 I=0
-```
-
-## Recognize with fbank feature
-
-This script is the same as `run.sh`, but uses the fbank feature.
-
-```bash
-bash run_fbank.sh
-```
-
-### CTC Prefix Beam Search w/o LM
-
-```
-Overall -> 10.44 % N=104765 C=94194 S=10174 D=397 I=369
-Mandarin -> 10.44 % N=104762 C=94194 S=10171 D=397 I=369
-Other -> 100.00 % N=3 C=0 S=3 D=0 I=0
-```
-
-### CTC Prefix Beam Search w/ LM
-
-LM: zh_giga.no_cna_cmn.prune01244.klm
-
-```
-Overall -> 5.82 % N=104765 C=99386 S=4944 D=435 I=720
-Mandarin -> 5.82 % N=104762 C=99386 S=4941 D=435 I=720
-English -> 0.00 % N=0 C=0 S=0 D=0 I=0
-```
-
-### CTC TLG WFST
-
-LM: [aishell train](https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_graph2.zip)
-```
-Overall -> 9.58 % N=104765 C=94817 S=4326 D=5622 I=84
-Mandarin -> 9.57 % N=104762 C=94817 S=4325 D=5620 I=84
-Other -> 100.00 % N=3 C=0 S=1 D=2 I=0
-```
-
-## Build TLG WFST graph
-
-The script below builds the TLG WFST graph. It depends on `srilm`, so please make sure srilm is installed.
-For more information please see the script itself.
-
-```bash
- bash ./local/run_build_tlg.sh
-```
diff --git a/speechx/examples/ds2_ol/aishell/local/aishell_train_lms.sh b/speechx/examples/ds2_ol/aishell/local/aishell_train_lms.sh
deleted file mode 100755
index 544a1f59a..000000000
--- a/speechx/examples/ds2_ol/aishell/local/aishell_train_lms.sh
+++ /dev/null
@@ -1,71 +0,0 @@
-#!/bin/bash
-
-# To be run from one directory above this script.
-. ./path.sh
-
-nj=40
-text=data/local/lm/text
-lexicon=data/local/dict/lexicon.txt
-
-for f in "$text" "$lexicon"; do
-  [ ! -f $f ] && echo "$0: No such file $f" && exit 1;
-done
-
-# Check SRILM tools
-if ! which ngram-count > /dev/null; then
-  echo "SRILM tools were not found; please download and install them from: "
-  echo "http://www.speech.sri.com/projects/srilm/download.html"
-  echo "Then add the tools to your PATH"
-  exit 1
-fi
-
-# This script takes no arguments. It assumes you have already run
-# aishell_data_prep.sh.
-# It takes as input the files
-# data/local/lm/text
-# data/local/dict/lexicon.txt
-dir=data/local/lm
-mkdir -p $dir
-
-cleantext=$dir/text.no_oov
-
-# oov to <SPOKEN_NOISE>
-# lexicon line: word char0 ... charn
-# text line: utt word0 ... wordn -> line: word0 ... wordn
-text_dir=$(dirname $text)
-split_name=$(basename $text)
-./local/split_data.sh $text_dir $text $split_name $nj
-
-utils/run.pl JOB=1:$nj $text_dir/split${nj}/JOB/${split_name}.no_oov.log \
-  cat ${text_dir}/split${nj}/JOB/${split_name} \| awk -v lex=$lexicon 'BEGIN{while((getline<lex) >0){ seen[$1]=1; } }
-  {for(n=1; n<=NF;n++) { if (seen[$n]) { printf("%s ", $n); } else {printf("<SPOKEN_NOISE> ");} } printf("\n");}' \
-  \> ${text_dir}/split${nj}/JOB/${split_name}.no_oov || exit 1;
-cat ${text_dir}/split${nj}/*/${split_name}.no_oov > $cleantext
-
-# compute word counts, sort in descending order
-# line: count word
-cat $cleantext | awk '{for(n=2;n<=NF;n++) print $n; }' | sort --parallel=`nproc` | uniq -c | \
-  sort --parallel=`nproc` -nr > $dir/word.counts || exit 1;
-
-# Get counts from acoustic training transcripts, and add one-count
-# for each word in the lexicon (but not silence, we don't want it
-# in the LM-- we'll add it optionally later).
-cat $cleantext | awk '{for(n=2;n<=NF;n++) print $n; }' | \
-  cat - <(grep -w -v '!SIL' $lexicon | awk '{print $1}') | \
-  sort --parallel=`nproc` | uniq -c | sort --parallel=`nproc` -nr > $dir/unigram.counts || exit 1;
-
-# word list with <s> </s>
-cat $dir/unigram.counts | awk '{print $2}' | cat - <(echo "<s>"; echo "</s>" ) > $dir/wordlist
-
-# hold out to compute ppl
-heldout_sent=10000 # Don't change this if you want result to be comparable with kaldi_lm results
-
-mkdir -p $dir
-cat $cleantext | awk '{for(n=2;n<=NF;n++){ printf $n; if(n<NF) printf " "; else print ""; }}' | head -$heldout_sent > $dir/heldout
-cat $cleantext | awk '{for(n=2;n<=NF;n++){ printf $n; if(n<NF) printf " "; else print ""; }}' | tail -n +$heldout_sent > $dir/train
-
-ngram-count -text $dir/train -order 3 -limit-vocab -vocab $dir/wordlist -unk \
-  -map-unk "<UNK>" -kndiscount -interpolate -lm $dir/lm.arpa
-ngram -lm $dir/lm.arpa -ppl $dir/heldout
\ No newline at end of file
diff --git a/speechx/examples/ds2_ol/aishell/local/run_build_tlg.sh b/speechx/examples/ds2_ol/aishell/local/run_build_tlg.sh
deleted file mode 100755
index 07f47c7ea..000000000
--- a/speechx/examples/ds2_ol/aishell/local/run_build_tlg.sh
+++ /dev/null
@@ -1,145 +0,0 @@
-#!/bin/bash
-set -eo pipefail
-
-. path.sh
-
-# Attention: please replace the vocab; the one below is only for this script.
-# Different acoustic models have different vocabs.
-ckpt_dir=data/fbank_model
-unit=$ckpt_dir/data/lang_char/vocab.txt  # vocab file, line: char/spm_piece
-model_dir=$ckpt_dir/exp/deepspeech2_online/checkpoints/
-
-stage=-1
-stop_stage=100
-corpus=aishell
-lexicon=data/lexicon.txt  # line: word ph0 ... phn, aishell/resource_aishell/lexicon.txt
-text=data/text  # line: utt text, aishell/data_aishell/transcript/aishell_transcript_v0.8.txt
-
-. utils/parse_options.sh
-
-data=$PWD/data
-mkdir -p $data
-
-if [ $stage -le -1 ] && [ $stop_stage -ge -1 ]; then
-  if [ ! -f $data/speech.ngram.zh.tar.gz ];then
-    # download ngram
-    pushd $data
-    wget -c http://paddlespeech.bj.bcebos.com/speechx/examples/ngram/zh/speech.ngram.zh.tar.gz
-    tar xvzf speech.ngram.zh.tar.gz
-    popd
-  fi
-
-  if [ ! -f $ckpt_dir/data/mean_std.json ]; then
-    # download model
-    mkdir -p $ckpt_dir
-    pushd $ckpt_dir
-    wget -c https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr0/WIP1_asr0_deepspeech2_online_wenetspeech_ckpt_1.0.0a.model.tar.gz
-    tar xzfv WIP1_asr0_deepspeech2_online_wenetspeech_ckpt_1.0.0a.model.tar.gz
-    popd
-  fi
-fi
-
-if [ ! -f $unit ]; then
-  echo "$0: No such file $unit"
-  exit 1;
-fi
-
-if ! which ngram-count; then
-  # srilm needs to be installed
-  pushd $MAIN_ROOT/tools
-  make srilm.done
-  popd
-fi
-
-mkdir -p data/local/dict
-if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then
-  # Prepare dict
-  # line: char/spm_piece
-  cp $unit data/local/dict/units.txt
-
-  if [ ! -f $lexicon ];then
-    utils/text_to_lexicon.py --has_key true --text $text --lexicon $lexicon
-    echo "Generated $lexicon from $text"
-  fi
-
-  # filter by vocab
-  # line: word ph0 ... phn -> line: word char0 ... charn
-  utils/fst/prepare_dict.py \
-    --unit_file $unit \
-    --in_lexicon ${lexicon} \
-    --out_lexicon data/local/dict/lexicon.txt
-fi
-
-lm=data/local/lm
-mkdir -p $lm
-
-if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
-  # Train ngram lm
-  cp $text $lm/text
-  local/aishell_train_lms.sh
-  echo "build LM done."
-fi
-
-# build TLG
-if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
-  # build T & L
-  utils/fst/compile_lexicon_token_fst.sh \
-    data/local/dict data/local/tmp data/local/lang
-
-  # build G & TLG
-  utils/fst/make_tlg.sh data/local/lm data/local/lang data/lang_test || exit 1;
-
-fi
-
-aishell_wav_scp=aishell_test.scp
-nj=40
-cmvn=$data/cmvn_fbank.ark
-wfst=$data/lang_test
-
-if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
-  if [ ! -d $data/test ]; then
-    # download test dataset
-    pushd $data
-    wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_test.zip
-    unzip aishell_test.zip
-    popd
-
-    realpath $data/test/*/*.wav > $data/wavlist
-    awk -F '/' '{ print $(NF) }' $data/wavlist | awk -F '.' '{ print $1 }' > $data/utt_id
-    paste $data/utt_id $data/wavlist > $data/$aishell_wav_scp
-  fi
-
-  ./local/split_data.sh $data $data/$aishell_wav_scp $aishell_wav_scp $nj
-
-  # convert cmvn format
-  cmvn_json2kaldi_main --json_file=$ckpt_dir/data/mean_std.json --cmvn_write_path=$cmvn
-fi
-
-wer=aishell_wer
-label_file=aishell_result
-# output
-exp=$PWD/exp
-mkdir -p $exp
-export GLOG_logtostderr=1
-
-if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
-  # recognize w/ TLG graph
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/check_tlg.log \
-    recognizer_main \
-      --wav_rspecifier=scp:$data/split${nj}/JOB/${aishell_wav_scp} \
-      --cmvn_file=$cmvn \
-      --model_path=$model_dir/avg_5.jit.pdmodel \
-      --streaming_chunk=30 \
-      --use_fbank=true \
-      --param_path=$model_dir/avg_5.jit.pdiparams \
-      --word_symbol_table=$wfst/words.txt \
-      --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
-      --model_cache_shapes="5-1-2048,5-1-2048" \
-      --graph_path=$wfst/TLG.fst --max_active=7500 \
-      --acoustic_scale=1.2 \
-      --result_wspecifier=ark,t:$data/split${nj}/JOB/result_check_tlg
-
-  cat $data/split${nj}/*/result_check_tlg > $exp/${label_file}_check_tlg
-  utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file}_check_tlg > $exp/${wer}.check_tlg
-  echo "recognizer test has finished!!!"
-  echo "please check the result in ${exp}/${wer}.check_tlg"
-fi
-
-exit 0
diff --git a/speechx/examples/ds2_ol/aishell/local/split_data.sh b/speechx/examples/ds2_ol/aishell/local/split_data.sh
deleted file mode 100755
index 2af6fc5ab..000000000
--- a/speechx/examples/ds2_ol/aishell/local/split_data.sh
+++ /dev/null
@@ -1,30 +0,0 @@
-#!/usr/bin/env bash
-
-set -eo pipefail
-
-data=$1
-scp=$2
-split_name=$3
-numsplit=$4
-
-# save in $data/split{n}
-# $scp to split
-#
-
-if [[ ! $numsplit -gt 0 ]]; then
-  echo "Invalid num-split argument";
-  exit 1;
-fi
-
-directories=$(for n in `seq $numsplit`; do echo $data/split${numsplit}/$n; done)
-scp_splits=$(for n in `seq $numsplit`; do echo $data/split${numsplit}/$n/${split_name}; done)
-
-# if this mkdir fails due to argument-list being too long, iterate.
-if ! mkdir -p $directories >&/dev/null; then
-  for n in `seq $numsplit`; do
-    mkdir -p $data/split${numsplit}/$n
-  done
-fi
-
-echo "utils/split_scp.pl $scp $scp_splits"
-utils/split_scp.pl $scp $scp_splits
diff --git a/speechx/examples/ds2_ol/aishell/path.sh b/speechx/examples/ds2_ol/aishell/path.sh
deleted file mode 100755
index 6e8039350..000000000
--- a/speechx/examples/ds2_ol/aishell/path.sh
+++ /dev/null
@@ -1,24 +0,0 @@
-# This contains the locations of the binaries built for running the examples.
-
-MAIN_ROOT=`realpath $PWD/../../../../`
-SPEECHX_ROOT=$PWD/../../../
-SPEECHX_BUILD=$SPEECHX_ROOT/build/speechx
-
-SPEECHX_TOOLS=$SPEECHX_ROOT/tools
-TOOLS_BIN=$SPEECHX_TOOLS/valgrind/install/bin
-
-[ -d $SPEECHX_BUILD ] || { echo "Error: 'build/speechx' directory not found. Please ensure that the project was built successfully"; }
-
-export LC_ALL=C
-
-# openfst bin & kaldi bin
-KALDI_DIR=$SPEECHX_ROOT/build/speechx/kaldi/
-OPENFST_DIR=$SPEECHX_ROOT/fc_patch/openfst-build/src
-
-# srilm
-export LIBLBFGS=${MAIN_ROOT}/tools/liblbfgs-1.10
-export LD_LIBRARY_PATH=${LD_LIBRARY_PATH:-}:${LIBLBFGS}/lib/.libs
-export SRILM=${MAIN_ROOT}/tools/srilm
-
-SPEECHX_BIN=$SPEECHX_BUILD/decoder:$SPEECHX_BUILD/frontend/audio
-export PATH=$PATH:$SPEECHX_BIN:$TOOLS_BIN:${SRILM}/bin:${SRILM}/bin/i686-m64:$KALDI_DIR/lmbin:$KALDI_DIR/fstbin:$OPENFST_DIR/bin
diff --git a/speechx/examples/ds2_ol/aishell/run.sh b/speechx/examples/ds2_ol/aishell/run.sh
deleted file mode 100755
index 49438cb25..000000000
--- a/speechx/examples/ds2_ol/aishell/run.sh
+++ /dev/null
@@ -1,180 +0,0 @@
-#!/bin/bash
-set -x
-set -e
-
-. path.sh
-
-nj=40
-stage=0
-stop_stage=100
-
-. utils/parse_options.sh
-
-# 1. compile
-if [ ! -d ${SPEECHX_BUILD} ]; then
-  pushd ${SPEECHX_ROOT}
-  bash build.sh
-  popd
-fi
-
-# input
-mkdir -p data
-data=$PWD/data
-
-ckpt_dir=$data/model
-model_dir=$ckpt_dir/exp/deepspeech2_online/checkpoints/
-vocb_dir=$ckpt_dir/data/lang_char/
-
-# output
-mkdir -p exp
-exp=$PWD/exp
-
-lm=$data/zh_giga.no_cna_cmn.prune01244.klm
-aishell_wav_scp=aishell_test.scp
-if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ];then
-  if [ ! -d $data/test ]; then
-    # download dataset
-    pushd $data
-    wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_test.zip
-    unzip aishell_test.zip
-    popd
-
-    realpath $data/test/*/*.wav > $data/wavlist
-    awk -F '/' '{ print $(NF) }' $data/wavlist | awk -F '.' '{ print $1 }' > $data/utt_id
-    paste $data/utt_id $data/wavlist > $data/$aishell_wav_scp
-  fi
-
-  if [ ! -f $ckpt_dir/data/mean_std.json ]; then
-    # download model
-    mkdir -p $ckpt_dir
-    pushd $ckpt_dir
-    wget -c https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_online_aishell_ckpt_0.2.0.model.tar.gz
-    tar xzfv asr0_deepspeech2_online_aishell_ckpt_0.2.0.model.tar.gz
-    popd
-  fi
-
-  if [ ! -f $lm ]; then
-    # download kenlm bin
-    pushd $data
-    wget -c https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm
-    popd
-  fi
-fi
-
-# 3. make feature
-text=$data/test/text
-label_file=./aishell_result
-wer=./aishell_wer
-
-export GLOG_logtostderr=1
-
-
-cmvn=$data/cmvn.ark
-if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then
-  # 3. convert cmvn format and compute linear feat
-  cmvn_json2kaldi_main --json_file=$ckpt_dir/data/mean_std.json --cmvn_write_path=$cmvn
-
-  ./local/split_data.sh $data $data/$aishell_wav_scp $aishell_wav_scp $nj
-
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/feat.log \
-    compute_linear_spectrogram_main \
-      --wav_rspecifier=scp:$data/split${nj}/JOB/${aishell_wav_scp} \
-      --feature_wspecifier=ark,scp:$data/split${nj}/JOB/feat.ark,$data/split${nj}/JOB/feat.scp \
-      --cmvn_file=$cmvn
-  echo "feature extraction has finished!!!"
-fi
-
-if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
-  # decode w/o lm
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recog.wolm.log \
-    ctc_beam_search_decoder_main \
-      --feature_rspecifier=scp:$data/split${nj}/JOB/feat.scp \
-      --model_path=$model_dir/avg_1.jit.pdmodel \
-      --param_path=$model_dir/avg_1.jit.pdiparams \
-      --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
-      --nnet_decoder_chunk=8 \
-      --dict_file=$vocb_dir/vocab.txt \
-      --result_wspecifier=ark,t:$data/split${nj}/JOB/result
-
-  cat $data/split${nj}/*/result > $exp/${label_file}
-  utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file} > $exp/${wer}
-  echo "ctc-prefix-beam-search-decoder-ol without lm has finished!!!"
-  echo "please check the result in ${exp}/${wer}"
-  tail -n 7 $exp/${wer}
-fi
-
-if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
-  # decode w/ ngram lm with feature input
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recog.lm.log \
-    ctc_beam_search_decoder_main \
-      --feature_rspecifier=scp:$data/split${nj}/JOB/feat.scp \
-      --model_path=$model_dir/avg_1.jit.pdmodel \
-      --param_path=$model_dir/avg_1.jit.pdiparams \
-      --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
-      --nnet_decoder_chunk=8 \
-      --dict_file=$vocb_dir/vocab.txt \
-      --lm_path=$lm \
-      --result_wspecifier=ark,t:$data/split${nj}/JOB/result_lm
-
-  cat $data/split${nj}/*/result_lm > $exp/${label_file}_lm
-  utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file}_lm > $exp/${wer}.lm
-  echo "ctc-prefix-beam-search-decoder-ol with lm test has finished!!!"
-  echo "please check the result in ${exp}/${wer}.lm"
-  tail -n 7 $exp/${wer}.lm
-fi
-
-wfst=$data/wfst/
-if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
-  mkdir -p $wfst
-  if [ ! -f $wfst/aishell_graph.zip ]; then
-    # download TLG graph
-    pushd $wfst
-    wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_graph.zip
-    unzip aishell_graph.zip
-    mv aishell_graph/* $wfst
-    popd
-  fi
-fi
-
-if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
-  # decode w/ TLG graph with feature input
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recog.wfst.log \
-    ctc_tlg_decoder_main \
-      --feature_rspecifier=scp:$data/split${nj}/JOB/feat.scp \
-      --model_path=$model_dir/avg_1.jit.pdmodel \
-      --param_path=$model_dir/avg_1.jit.pdiparams \
-      --word_symbol_table=$wfst/words.txt \
-      --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
-      --graph_path=$wfst/TLG.fst --max_active=7500 \
-      --nnet_decoder_chunk=8 \
-      --acoustic_scale=1.2 \
-      --result_wspecifier=ark,t:$data/split${nj}/JOB/result_tlg
-
-  cat $data/split${nj}/*/result_tlg > $exp/${label_file}_tlg
-  utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file}_tlg > $exp/${wer}.tlg
-  echo "wfst-decoder-ol has finished!!!"
- echo "please checkout in ${exp}/${wer}.tlg" - tail -n 7 $exp/${wer}.tlg -fi - -if [ ${stage} -le 5 ] && [ ${stop_stage} -ge 5 ]; then - # recognize from wav file w/ TLG graph - utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recognizer.log \ - recognizer_main \ - --wav_rspecifier=scp:$data/split${nj}/JOB/${aishell_wav_scp} \ - --cmvn_file=$cmvn \ - --model_path=$model_dir/avg_1.jit.pdmodel \ - --param_path=$model_dir/avg_1.jit.pdiparams \ - --word_symbol_table=$wfst/words.txt \ - --nnet_decoder_chunk=8 \ - --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \ - --graph_path=$wfst/TLG.fst --max_active=7500 \ - --acoustic_scale=1.2 \ - --result_wspecifier=ark,t:$data/split${nj}/JOB/result_recognizer - - cat $data/split${nj}/*/result_recognizer > $exp/${label_file}_recognizer - utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file}_recognizer > $exp/${wer}.recognizer - echo "recognizer test have finished!!!" - echo "please checkout in ${exp}/${wer}.recognizer" - tail -n 7 $exp/${wer}.recognizer -fi \ No newline at end of file diff --git a/speechx/examples/ds2_ol/aishell/run_fbank.sh b/speechx/examples/ds2_ol/aishell/run_fbank.sh deleted file mode 100755 index b93d6944d..000000000 --- a/speechx/examples/ds2_ol/aishell/run_fbank.sh +++ /dev/null @@ -1,177 +0,0 @@ -#!/bin/bash -set +x -set -e - -. path.sh - -nj=40 -stage=0 -stop_stage=5 - -. utils/parse_options.sh - -# 1. compile -if [ ! -d ${SPEECHX_EXAMPLES} ]; then - pushd ${SPEECHX_ROOT} - bash build.sh - popd -fi - -# input -mkdir -p data -data=$PWD/data - -ckpt_dir=$data/fbank_model -model_dir=$ckpt_dir/exp/deepspeech2_online/checkpoints/ -vocb_dir=$ckpt_dir/data/lang_char/ - -# output -mkdir -p exp -exp=$PWD/exp - -lm=$data/zh_giga.no_cna_cmn.prune01244.klm -aishell_wav_scp=aishell_test.scp -if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ];then - if [ ! -d $data/test ]; then - pushd $data - wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_test.zip - unzip aishell_test.zip - popd - - realpath $data/test/*/*.wav > $data/wavlist - awk -F '/' '{ print $(NF) }' $data/wavlist | awk -F '.' '{ print $1 }' > $data/utt_id - paste $data/utt_id $data/wavlist > $data/$aishell_wav_scp - fi - - if [ ! -f $ckpt_dir/data/mean_std.json ]; then - mkdir -p $ckpt_dir - pushd $ckpt_dir - wget -c https://paddlespeech.bj.bcebos.com/s2t/wenetspeech/asr0/WIP1_asr0_deepspeech2_online_wenetspeech_ckpt_1.0.0a.model.tar.gz - tar xzfv WIP1_asr0_deepspeech2_online_wenetspeech_ckpt_1.0.0a.model.tar.gz - popd - fi - - if [ ! -f $lm ]; then - pushd $data - wget -c https://deepspeech.bj.bcebos.com/zh_lm/zh_giga.no_cna_cmn.prune01244.klm - popd - fi -fi - -# 3. make feature -text=$data/test/text -label_file=./aishell_result_fbank -wer=./aishell_wer_fbank - -export GLOG_logtostderr=1 - - -cmvn=$data/cmvn_fbank.ark -if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ]; then - # 3. 
-  # 3. convert cmvn format and compute fbank feat
-  cmvn_json2kaldi_main --json_file=$ckpt_dir/data/mean_std.json --cmvn_write_path=$cmvn --binary=false
-
-  ./local/split_data.sh $data $data/$aishell_wav_scp $aishell_wav_scp $nj
-
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/feat.log \
-    compute_fbank_main \
-      --wav_rspecifier=scp:$data/split${nj}/JOB/${aishell_wav_scp} \
-      --feature_wspecifier=ark,scp:$data/split${nj}/JOB/fbank_feat.ark,$data/split${nj}/JOB/fbank_feat.scp \
-      --cmvn_file=$cmvn \
-      --streaming_chunk=36
-fi
-
-if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ]; then
-  # decode w/o lm by feature
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recog.fbank.wolm.log \
-    ctc_beam_search_decoder_main \
-      --feature_rspecifier=scp:$data/split${nj}/JOB/fbank_feat.scp \
-      --model_path=$model_dir/avg_5.jit.pdmodel \
-      --param_path=$model_dir/avg_5.jit.pdiparams \
-      --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
-      --model_cache_shapes="5-1-2048,5-1-2048" \
-      --nnet_decoder_chunk=8 \
-      --dict_file=$vocb_dir/vocab.txt \
-      --result_wspecifier=ark,t:$data/split${nj}/JOB/result_fbank
-
-  cat $data/split${nj}/*/result_fbank > $exp/${label_file}
-  utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file} > $exp/${wer}
-  tail -n 7 $exp/${wer}
-fi
-
-if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then
-  # decode w/ ngram lm by feature
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recog.fbank.lm.log \
-    ctc_beam_search_decoder_main \
-      --feature_rspecifier=scp:$data/split${nj}/JOB/fbank_feat.scp \
-      --model_path=$model_dir/avg_5.jit.pdmodel \
-      --param_path=$model_dir/avg_5.jit.pdiparams \
-      --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
-      --model_cache_shapes="5-1-2048,5-1-2048" \
-      --nnet_decoder_chunk=8 \
-      --dict_file=$vocb_dir/vocab.txt \
-      --lm_path=$lm \
-      --result_wspecifier=ark,t:$data/split${nj}/JOB/fbank_result_lm
-
-  cat $data/split${nj}/*/fbank_result_lm > $exp/${label_file}_lm
-  utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file}_lm > $exp/${wer}.lm
-  tail -n 7 $exp/${wer}.lm
-fi
-
-wfst=$data/wfst_fbank/
-if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
-  mkdir -p $wfst
-  if [ ! -f $wfst/aishell_graph2.zip ]; then
-    pushd $wfst
-    wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_graph2.zip
-    unzip aishell_graph2.zip
-    mv aishell_graph2/* $wfst
-    popd
-  fi
-fi
-
-if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then
-  # decode w/ TLG graph by feature
-  utils/run.pl JOB=1:$nj $data/split${nj}/JOB/recog.fbank.wfst.log \
-    ctc_tlg_decoder_main \
-      --feature_rspecifier=scp:$data/split${nj}/JOB/fbank_feat.scp \
-      --model_path=$model_dir/avg_5.jit.pdmodel \
-      --param_path=$model_dir/avg_5.jit.pdiparams \
-      --word_symbol_table=$wfst/words.txt \
-      --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \
-      --model_cache_shapes="5-1-2048,5-1-2048" \
-      --nnet_decoder_chunk=8 \
-      --graph_path=$wfst/TLG.fst --max_active=7500 \
-      --acoustic_scale=1.2 \
-      --result_wspecifier=ark,t:$data/split${nj}/JOB/result_tlg
-
-  cat $data/split${nj}/*/result_tlg > $exp/${label_file}_tlg
-  utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file}_tlg > $exp/${wer}.tlg
-  echo "wfst-decoder-ol has finished!!!"
- echo "please checkout in ${exp}/${wer}.tlg" - tail -n 7 $exp/${wer}.tlg -fi - -if [ ${stage} -le 5 ] && [ ${stop_stage} -ge 5 ]; then - # recgonize w/ TLG graph by wav - utils/run.pl JOB=1:$nj $data/split${nj}/JOB/fbank_recognizer.log \ - recognizer_main \ - --wav_rspecifier=scp:$data/split${nj}/JOB/${aishell_wav_scp} \ - --cmvn_file=$cmvn \ - --model_path=$model_dir/avg_5.jit.pdmodel \ - --use_fbank=true \ - --param_path=$model_dir/avg_5.jit.pdiparams \ - --word_symbol_table=$wfst/words.txt \ - --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \ - --model_cache_shapes="5-1-2048,5-1-2048" \ - --nnet_decoder_chunk=8 \ - --graph_path=$wfst/TLG.fst --max_active=7500 \ - --acoustic_scale=1.2 \ - --result_wspecifier=ark,t:$data/split${nj}/JOB/result_fbank_recognizer - - cat $data/split${nj}/*/result_fbank_recognizer > $exp/${label_file}_recognizer - utils/compute-wer.py --char=1 --v=1 $text $exp/${label_file}_recognizer > $exp/${wer}.recognizer - echo "recognizer test have finished!!!" - echo "please checkout in ${exp}/${wer}.recognizer" - tail -n 7 $exp/${wer}.recognizer -fi diff --git a/speechx/examples/ds2_ol/aishell/utils b/speechx/examples/ds2_ol/aishell/utils deleted file mode 120000 index c2519a9dd..000000000 --- a/speechx/examples/ds2_ol/aishell/utils +++ /dev/null @@ -1 +0,0 @@ -../../../../utils/ \ No newline at end of file diff --git a/speechx/examples/ds2_ol/onnx/.gitignore b/speechx/examples/ds2_ol/onnx/.gitignore deleted file mode 100644 index f862f73e2..000000000 --- a/speechx/examples/ds2_ol/onnx/.gitignore +++ /dev/null @@ -1,3 +0,0 @@ -data -log -exp diff --git a/speechx/examples/ds2_ol/onnx/README.md b/speechx/examples/ds2_ol/onnx/README.md deleted file mode 100644 index b98b74b6f..000000000 --- a/speechx/examples/ds2_ol/onnx/README.md +++ /dev/null @@ -1,57 +0,0 @@ -# Convert DeepSpeech2 model to ONNX format - -> We recommend using U2/U2++ model instead of DS2, please see [here](../../u2pp_ol/wenetspeech/). - -This example demonstrate converting ds2 model to ONNX fromat. - -Please make sure [Paddle2ONNX](https://github.com/PaddlePaddle/Paddle2ONNX) and [onnx-simplifier](https://github.com/zh794390558/onnx-simplifier/tree/dyn_time_shape) version is correct. - -The example test with these packages installed: -``` -paddle2onnx 0.9.8 # develop 62c5424e22cd93968dc831216fc9e0f0fce3d819 -paddleaudio 0.2.1 -paddlefsl 1.1.0 -paddlenlp 2.2.6 -paddlepaddle-gpu 2.2.2 -paddlespeech 0.0.0 # develop -paddlespeech-ctcdecoders 0.2.0 -paddlespeech-feat 0.1.0 -onnx 1.11.0 -onnx-simplifier 0.0.0 # https://github.com/zh794390558/onnx-simplifier/tree/dyn_time_shape -onnxoptimizer 0.2.7 -onnxruntime 1.11.0 -``` - - -## Using - -``` -bash run.sh --stage 0 --stop_stage 5 -``` - -1. convert deepspeech2 model to ONNX, using Paddle2ONNX. -2. check paddleinference and onnxruntime output equal. -3. optimize onnx model -4. check paddleinference and optimized onnxruntime output equal. -5. quantize onnx model -6. check paddleinference and optimized onnxruntime output equal. - -For more details please see `run.sh`. - -## Outputs -The optimized onnx model is `exp/model.opt.onnx`, quanted model is `exp/model.optset11.quant.onnx`. 
-
-
-## [Results](https://github.com/PaddlePaddle/PaddleSpeech/wiki/ASR-Benchmark#streaming-asr)
-
-Machine hardware: `CPU:Intel(R) Xeon(R) Gold 6271C CPU @ 2.60GHz`
-Test script: `Streaming Server`
-
-| Acoustic Model | Model Size | engine | decoding_method | ctc_weight | decoding_chunk_size | num_decoding_left_chunk | RTF |
-|:-------------:| :-----: | :-----: | :------------:| :-----: | :-----: | :-----: |:-----:|
-| deepspeech2online_wenetspeech | 659MB | inference | ctc_prefix_beam_search | - | 1 | - | 1.9108175171428279 (utts=80) |
-| deepspeech2online_wenetspeech | 659MB | onnx | ctc_prefix_beam_search | - | 1 | - | 0.5617182449999291 (utts=80) |
-| deepspeech2online_wenetspeech | 166MB | onnx quant | ctc_prefix_beam_search | - | 1 | - | 0.44507715475808385 (utts=80) |
-
-> Quantization is machine-dependent; not all machines support it. The instruction sets supported by the ONNX quant test machine:
-> Flags: fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc arch_perfmon rep_good nopl xtopology eagerfpu pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single ssbd ibrs ibpb fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 arat umip pku ospke avx512_vnni spec_ctrl
diff --git a/speechx/examples/ds2_ol/onnx/local/infer_check.py b/speechx/examples/ds2_ol/onnx/local/infer_check.py
deleted file mode 100755
index f821baa12..000000000
--- a/speechx/examples/ds2_ol/onnx/local/infer_check.py
+++ /dev/null
@@ -1,100 +0,0 @@
-#!/usr/bin/env python3
-# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import argparse
-import os
-import pickle
-
-import numpy as np
-import onnxruntime
-import paddle
-
-
-def parse_args():
-    parser = argparse.ArgumentParser(description=__doc__)
-    parser.add_argument(
-        '--input_file',
-        type=str,
-        default="static_ds2online_inputs.pickle",
-        help="aishell ds2 input data file. For wenetspeech, it is only used to feed the infer model.", )
For wenetspeech, we only feed for infer model", - ) - parser.add_argument( - '--model_type', - type=str, - default="aishell", - help="aishell(1024) or wenetspeech(2048)", ) - parser.add_argument( - '--model_dir', type=str, default=".", help="paddle model dir.") - parser.add_argument( - '--model_prefix', - type=str, - default="avg_1.jit", - help="paddle model prefix.") - parser.add_argument( - '--onnx_model', - type=str, - default='./model.old.onnx', - help="onnx model.") - - return parser.parse_args() - - -if __name__ == '__main__': - FLAGS = parse_args() - - # input and output - with open(FLAGS.input_file, 'rb') as f: - iodict = pickle.load(f) - print(iodict.keys()) - - audio_chunk = iodict['audio_chunk'] - audio_chunk_lens = iodict['audio_chunk_lens'] - chunk_state_h_box = iodict['chunk_state_h_box'] - chunk_state_c_box = iodict['chunk_state_c_bos'] - print("raw state shape: ", chunk_state_c_box.shape) - - if FLAGS.model_type == 'wenetspeech': - chunk_state_h_box = np.repeat(chunk_state_h_box, 2, axis=-1) - chunk_state_c_box = np.repeat(chunk_state_c_box, 2, axis=-1) - print("state shape: ", chunk_state_c_box.shape) - - # paddle - model = paddle.jit.load(os.path.join(FLAGS.model_dir, FLAGS.model_prefix)) - res_chunk, res_lens, chunk_state_h, chunk_state_c = model( - paddle.to_tensor(audio_chunk), - paddle.to_tensor(audio_chunk_lens), - paddle.to_tensor(chunk_state_h_box), - paddle.to_tensor(chunk_state_c_box), ) - - # onnxruntime - options = onnxruntime.SessionOptions() - options.enable_profiling = True - sess = onnxruntime.InferenceSession(FLAGS.onnx_model, sess_options=options) - ort_res_chunk, ort_res_lens, ort_chunk_state_h, ort_chunk_state_c = sess.run( - ['softmax_0.tmp_0', 'tmp_5', 'concat_0.tmp_0', 'concat_1.tmp_0'], { - "audio_chunk": audio_chunk, - "audio_chunk_lens": audio_chunk_lens, - "chunk_state_h_box": chunk_state_h_box, - "chunk_state_c_box": chunk_state_c_box - }) - - print(sess.end_profiling()) - - # assert paddle equal ort - print(np.allclose(ort_res_chunk, res_chunk, atol=1e-6)) - print(np.allclose(ort_res_lens, res_lens, atol=1e-6)) - - if FLAGS.model_type == 'aishell': - print(np.allclose(ort_chunk_state_h, chunk_state_h, atol=1e-6)) - print(np.allclose(ort_chunk_state_c, chunk_state_c, atol=1e-6)) diff --git a/speechx/examples/ds2_ol/onnx/local/netron.sh b/speechx/examples/ds2_ol/onnx/local/netron.sh deleted file mode 100755 index 6dd9a39c9..000000000 --- a/speechx/examples/ds2_ol/onnx/local/netron.sh +++ /dev/null @@ -1,14 +0,0 @@ -#!/bin/bash - -# show model - -if [ $# != 1 ];then - echo "usage: $0 model_path" - exit 1 -fi - - -file=$1 - -pip install netron -netron -p 8082 --host $(hostname -i) $file \ No newline at end of file diff --git a/speechx/examples/ds2_ol/onnx/local/onnx_clone.sh b/speechx/examples/ds2_ol/onnx/local/onnx_clone.sh deleted file mode 100755 index bce22dbc8..000000000 --- a/speechx/examples/ds2_ol/onnx/local/onnx_clone.sh +++ /dev/null @@ -1,7 +0,0 @@ - -#!/bin/bash - -# clone onnx repos -git clone https://github.com/onnx/onnx.git -git clone https://github.com/microsoft/onnxruntime.git -git clone https://github.com/PaddlePaddle/Paddle2ONNX.git \ No newline at end of file diff --git a/speechx/examples/ds2_ol/onnx/local/onnx_convert_opset.py b/speechx/examples/ds2_ol/onnx/local/onnx_convert_opset.py deleted file mode 100755 index 00b5cf775..000000000 --- a/speechx/examples/ds2_ol/onnx/local/onnx_convert_opset.py +++ /dev/null @@ -1,37 +0,0 @@ -#!/usr/bin/env python3 -import argparse - -import onnx -from onnx import version_converter - -if 
-if __name__ == '__main__':
-    parser = argparse.ArgumentParser(prog=__doc__)
-    parser.add_argument(
-        "--model-file", type=str, required=True, help='path/to/the/model.onnx.')
-    parser.add_argument(
-        "--save-model",
-        type=str,
-        required=True,
-        help='path/to/saved/model.onnx.')
-    # Models must be opset10 or higher to be quantized.
-    parser.add_argument(
-        "--target-opset", type=int, default=11, help='target opset version.')
-
-    args = parser.parse_args()
-
-    print(f"to opset: {args.target_opset}")
-
-    # Preprocessing: load the model to be converted.
-    model_path = args.model_file
-    original_model = onnx.load(model_path)
-
-    # print('The model before conversion:\n{}'.format(original_model))
-
-    # A full list of supported adapters can be found here:
-    # https://github.com/onnx/onnx/blob/main/onnx/version_converter.py#L21
-    # Apply the version conversion on the original model
-    converted_model = version_converter.convert_version(original_model,
-                                                        args.target_opset)
-
-    # print('The model after conversion:\n{}'.format(converted_model))
-    onnx.save(converted_model, args.save_model)
diff --git a/speechx/examples/ds2_ol/onnx/local/onnx_infer_shape.py b/speechx/examples/ds2_ol/onnx/local/onnx_infer_shape.py
deleted file mode 100755
index c53e9ec92..000000000
--- a/speechx/examples/ds2_ol/onnx/local/onnx_infer_shape.py
+++ /dev/null
@@ -1,2514 +0,0 @@
-# Copyright (c) Microsoft Corporation. All rights reserved.
-# Licensed under the MIT License.
-# flake8: noqa
-import argparse
-import logging
-
-import numpy as np
-import onnx
-import sympy
-from onnx import helper
-from onnx import numpy_helper
-from onnx import shape_inference
-from packaging import version
-assert version.parse(onnx.__version__) >= version.parse("1.8.0")
-
-logger = logging.getLogger(__name__)
-
-
-def get_attribute(node, attr_name, default_value=None):
-    found = [attr for attr in node.attribute if attr.name == attr_name]
-    if found:
-        return helper.get_attribute_value(found[0])
-    return default_value
-
-
-def get_dim_from_proto(dim):
-    return getattr(dim, dim.WhichOneof('value')) if type(
-        dim.WhichOneof('value')) == str else None
-
-
-def is_sequence(type_proto):
-    cls_type = type_proto.WhichOneof('value')
-    assert cls_type in ['tensor_type', 'sequence_type']
-    return cls_type == 'sequence_type'
-
-
-def get_shape_from_type_proto(type_proto):
-    assert not is_sequence(type_proto)
-    if type_proto.tensor_type.HasField('shape'):
-        return [get_dim_from_proto(d) for d in type_proto.tensor_type.shape.dim]
-    else:
-        return None  # note no shape is different from shape without dim (scalar)
-
-
-def get_shape_from_value_info(vi):
-    cls_type = vi.type.WhichOneof('value')
-    if cls_type is None:
-        return None
-    if is_sequence(vi.type):
-        if 'tensor_type' == vi.type.sequence_type.elem_type.WhichOneof('value'):
-            return get_shape_from_type_proto(vi.type.sequence_type.elem_type)
-        else:
-            return None
-    else:
-        return get_shape_from_type_proto(vi.type)
-
-
-def make_named_value_info(name):
-    vi = onnx.ValueInfoProto()
-    vi.name = name
-    return vi
-
-
-def get_shape_from_sympy_shape(sympy_shape):
-    return [
-        None if i is None else (int(i) if is_literal(i) else str(i))
-        for i in sympy_shape
-    ]
-
-
-def is_literal(dim):
-    return type(dim) in [int, np.int64, np.int32, sympy.Integer] or (hasattr(
-        dim, 'is_number') and dim.is_number)
-
-
-def handle_negative_axis(axis, rank):
-    assert axis < rank and axis >= -rank
-    return axis if axis >= 0 else rank + axis
-
-
-def get_opset(mp, domain=None):
-    domain = domain or ['', 'onnx', 'ai.onnx']
-    if
type(domain) != list: - domain = [domain] - for opset in mp.opset_import: - if opset.domain in domain: - return opset.version - - return None - - -def as_scalar(x): - if type(x) == list: - assert len(x) == 1 - return x[0] - elif type(x) == np.ndarray: - return x.item() - else: - return x - - -def as_list(x, keep_none): - if type(x) == list: - return x - elif type(x) == np.ndarray: - return list(x) - elif keep_none and x is None: - return None - else: - return [x] - - -def sympy_reduce_product(x): - if type(x) == list: - value = sympy.Integer(1) - for v in x: - value = value * v - else: - value = x - return value - - -class SymbolicShapeInference: - def __init__(self, - int_max, - auto_merge, - guess_output_rank, - verbose, - prefix=''): - self.dispatcher_ = { - 'Add': - self._infer_symbolic_compute_ops, - 'ArrayFeatureExtractor': - self._infer_ArrayFeatureExtractor, - 'AveragePool': - self._infer_Pool, - 'BatchNormalization': - self._infer_BatchNormalization, - 'Cast': - self._infer_Cast, - 'CategoryMapper': - self._infer_CategoryMapper, - 'Compress': - self._infer_Compress, - 'Concat': - self._infer_Concat, - 'ConcatFromSequence': - self._infer_ConcatFromSequence, - 'Constant': - self._infer_Constant, - 'ConstantOfShape': - self._infer_ConstantOfShape, - 'Conv': - self._infer_Conv, - 'CumSum': - self._pass_on_shape_and_type, - 'Div': - self._infer_symbolic_compute_ops, - 'Einsum': - self._infer_Einsum, - 'Expand': - self._infer_Expand, - 'Equal': - self._infer_symbolic_compute_ops, - 'Floor': - self._infer_symbolic_compute_ops, - 'Gather': - self._infer_Gather, - 'GatherElements': - self._infer_GatherElements, - 'GatherND': - self._infer_GatherND, - 'Gelu': - self._pass_on_shape_and_type, - 'If': - self._infer_If, - 'Loop': - self._infer_Loop, - 'MatMul': - self._infer_MatMul, - 'MatMulInteger16': - self._infer_MatMulInteger, - 'MaxPool': - self._infer_Pool, - 'Max': - self._infer_symbolic_compute_ops, - 'Min': - self._infer_symbolic_compute_ops, - 'Mul': - self._infer_symbolic_compute_ops, - 'NonMaxSuppression': - self._infer_NonMaxSuppression, - 'NonZero': - self._infer_NonZero, - 'OneHot': - self._infer_OneHot, - 'Pad': - self._infer_Pad, - 'Range': - self._infer_Range, - 'Reciprocal': - self._pass_on_shape_and_type, - 'ReduceSum': - self._infer_ReduceSum, - 'ReduceProd': - self._infer_ReduceProd, - 'Reshape': - self._infer_Reshape, - 'Resize': - self._infer_Resize, - 'Round': - self._pass_on_shape_and_type, - 'Scan': - self._infer_Scan, - 'ScatterElements': - self._infer_ScatterElements, - 'SequenceAt': - self._infer_SequenceAt, - 'SequenceInsert': - self._infer_SequenceInsert, - 'Shape': - self._infer_Shape, - 'Size': - self._infer_Size, - 'Slice': - self._infer_Slice, - 'SoftmaxCrossEntropyLoss': - self._infer_SoftmaxCrossEntropyLoss, - 'SoftmaxCrossEntropyLossInternal': - self._infer_SoftmaxCrossEntropyLoss, - 'NegativeLogLikelihoodLossInternal': - self._infer_SoftmaxCrossEntropyLoss, - 'Split': - self._infer_Split, - 'SplitToSequence': - self._infer_SplitToSequence, - 'Squeeze': - self._infer_Squeeze, - 'Sub': - self._infer_symbolic_compute_ops, - 'Tile': - self._infer_Tile, - 'TopK': - self._infer_TopK, - 'Transpose': - self._infer_Transpose, - 'Unsqueeze': - self._infer_Unsqueeze, - 'Where': - self._infer_symbolic_compute_ops, - 'ZipMap': - self._infer_ZipMap, - 'Neg': - self._infer_symbolic_compute_ops, - # contrib ops: - 'Attention': - self._infer_Attention, - 'BiasGelu': - self._infer_BiasGelu, - 'EmbedLayerNormalization': - self._infer_EmbedLayerNormalization, - 'FastGelu': 
- self._infer_FastGelu, - 'Gelu': - self._infer_Gelu, - 'LayerNormalization': - self._infer_LayerNormalization, - 'LongformerAttention': - self._infer_LongformerAttention, - 'PythonOp': - self._infer_PythonOp, - 'SkipLayerNormalization': - self._infer_SkipLayerNormalization - } - self.aten_op_dispatcher_ = { - 'aten::embedding': self._infer_Gather, - 'aten::bitwise_or': self._infer_aten_bitwise_or, - 'aten::diagonal': self._infer_aten_diagonal, - 'aten::max_pool2d_with_indices': self._infer_aten_pool2d, - 'aten::multinomial': self._infer_aten_multinomial, - 'aten::unfold': self._infer_aten_unfold, - 'aten::argmax': self._infer_aten_argmax, - 'aten::avg_pool2d': self._infer_aten_pool2d, - 'aten::_adaptive_avg_pool2d': self._infer_aten_pool2d, - 'aten::binary_cross_entropy_with_logits': self._infer_aten_bce, - 'aten::numpy_T': self._infer_Transpose, - } - self.run_ = True - self.suggested_merge_ = {} - self.symbolic_dims_ = {} - self.input_symbols_ = {} - self.auto_merge_ = auto_merge - self.guess_output_rank_ = guess_output_rank - self.verbose_ = verbose - self.int_max_ = int_max - self.subgraph_id_ = 0 - self.prefix_ = prefix - - def _add_suggested_merge(self, symbols, apply=False): - assert all([(type(s) == str and s in self.symbolic_dims_) or - is_literal(s) for s in symbols]) - symbols = set(symbols) - for k, v in self.suggested_merge_.items(): - if k in symbols: - symbols.remove(k) - symbols.add(v) - map_to = None - # if there is literal, map to it first - for s in symbols: - if is_literal(s): - map_to = s - break - # when no literals, map to input symbolic dims, then existing symbolic dims - if map_to is None: - for s in symbols: - if s in self.input_symbols_: - map_to = s - break - if map_to is None: - for s in symbols: - if type(self.symbolic_dims_[s]) == sympy.Symbol: - map_to = s - break - # when nothing to map to, use the shorter one - if map_to is None: - if self.verbose_ > 0: - logger.warning( - 'Potential unsafe merge between symbolic expressions: ({})'. 
- format(','.join(symbols))) - symbols_list = list(symbols) - lens = [len(s) for s in symbols_list] - map_to = symbols_list[lens.index(min(lens))] - symbols.remove(map_to) - - for s in symbols: - if s == map_to: - continue - if is_literal(map_to) and is_literal(s): - assert int(map_to) == int(s) - self.suggested_merge_[s] = int(map_to) if is_literal( - map_to) else map_to - for k, v in self.suggested_merge_.items(): - if v == s: - self.suggested_merge_[k] = map_to - if apply and self.auto_merge_: - self._apply_suggested_merge() - - def _apply_suggested_merge(self, graph_input_only=False): - if not self.suggested_merge_: - return - for i in list(self.out_mp_.graph.input) + ( - [] if graph_input_only else list(self.out_mp_.graph.value_info)): - for d in i.type.tensor_type.shape.dim: - if d.dim_param in self.suggested_merge_: - v = self.suggested_merge_[d.dim_param] - if is_literal(v): - d.dim_value = int(v) - else: - d.dim_param = v - - def _preprocess(self, in_mp): - self.out_mp_ = onnx.ModelProto() - self.out_mp_.CopyFrom(in_mp) - self.graph_inputs_ = dict( - [(i.name, i) for i in list(self.out_mp_.graph.input)]) - self.initializers_ = dict( - [(i.name, i) for i in self.out_mp_.graph.initializer]) - self.known_vi_ = dict( - [(i.name, i) for i in list(self.out_mp_.graph.input)]) - self.known_vi_.update( - dict([(i.name, helper.make_tensor_value_info(i.name, i.data_type, - list(i.dims))) - for i in self.out_mp_.graph.initializer])) - - def _merge_symbols(self, dims): - if not all([type(d) == str for d in dims]): - if self.auto_merge_: - unique_dims = list(set(dims)) - is_int = [is_literal(d) for d in unique_dims] - assert sum( - is_int - ) <= 1 # if there are more than 1 unique ints, something is wrong - if sum(is_int) == 1: - int_dim = is_int.index(1) - if self.verbose_ > 0: - logger.debug('dim {} has been merged with value {}'. 
- format(unique_dims[:int_dim] + unique_dims[ - int_dim + 1:], unique_dims[int_dim])) - self._check_merged_dims(unique_dims, allow_broadcast=False) - return unique_dims[int_dim] - else: - if self.verbose_ > 0: - logger.debug('dim {} has been merged with dim {}'.format( - unique_dims[1:], unique_dims[0])) - return dims[0] - else: - return None - if all([d == dims[0] for d in dims]): - return dims[0] - merged = [ - self.suggested_merge_[d] if d in self.suggested_merge_ else d - for d in dims - ] - if all([d == merged[0] for d in merged]): - assert merged[0] in self.symbolic_dims_ - return merged[0] - else: - return None - - # broadcast from right to left, and merge symbolic dims if needed - def _broadcast_shapes(self, shape1, shape2): - new_shape = [] - rank1 = len(shape1) - rank2 = len(shape2) - new_rank = max(rank1, rank2) - for i in range(new_rank): - dim1 = shape1[rank1 - 1 - i] if i < rank1 else 1 - dim2 = shape2[rank2 - 1 - i] if i < rank2 else 1 - if dim1 == 1 or dim1 == dim2: - new_dim = dim2 - elif dim2 == 1: - new_dim = dim1 - else: - new_dim = self._merge_symbols([dim1, dim2]) - if not new_dim: - # warning about unsupported broadcast when not auto merge - # note that auto merge has the risk of incorrectly merge symbols while one of them being 1 - # for example, 'a' = 1, 'b' = 5 at runtime is valid broadcasting, but with auto merge 'a' == 'b' - if self.auto_merge_: - self._add_suggested_merge([dim1, dim2], apply=True) - else: - logger.warning('unsupported broadcast between ' + str( - dim1) + ' ' + str(dim2)) - new_shape = [new_dim] + new_shape - return new_shape - - def _get_shape(self, node, idx): - name = node.input[idx] - if name in self.known_vi_: - vi = self.known_vi_[name] - return get_shape_from_value_info(vi) - else: - assert name in self.initializers_ - return list(self.initializers_[name].dims) - - def _get_shape_rank(self, node, idx): - return len(self._get_shape(node, idx)) - - def _get_sympy_shape(self, node, idx): - sympy_shape = [] - for d in self._get_shape(node, idx): - if type(d) == str: - sympy_shape.append(self.symbolic_dims_[d] if d in - self.symbolic_dims_ else sympy.Symbol( - d, integer=True, nonnegative=True)) - else: - assert None != d - sympy_shape.append(d) - return sympy_shape - - def _get_value(self, node, idx): - name = node.input[idx] - assert name in self.sympy_data_ or name in self.initializers_ - return self.sympy_data_[ - name] if name in self.sympy_data_ else numpy_helper.to_array( - self.initializers_[name]) - - def _try_get_value(self, node, idx): - if idx >= len(node.input): - return None - name = node.input[idx] - if name in self.sympy_data_ or name in self.initializers_: - return self._get_value(node, idx) - return None - - def _update_computed_dims(self, new_sympy_shape): - for i, new_dim in enumerate(new_sympy_shape): - if not is_literal(new_dim) and not type(new_dim) == str: - str_dim = str(new_dim) - if str_dim in self.suggested_merge_: - if is_literal(self.suggested_merge_[str_dim]): - continue # no need to create dim for literals - new_sympy_shape[i] = self.symbolic_dims_[ - self.suggested_merge_[str_dim]] - else: - # add new_dim if it's a computational expression - if not str(new_dim) in self.symbolic_dims_: - self.symbolic_dims_[str(new_dim)] = new_dim - - def _onnx_infer_single_node(self, node): - # skip onnx shape inference for some ops, as they are handled in _infer_* - skip_infer = node.op_type in [ - 'If', 'Loop', 'Scan', 'SplitToSequence', 'ZipMap', 'Attention', - 'BiasGelu', 'EmbedLayerNormalization', 'FastGelu', 'Gelu', -
'LayerNormalization', 'LongformerAttention', - 'SkipLayerNormalization', 'PythonOp' - ] - - if not skip_infer: - # Only pass initializers that satisfy the following condition: - # (1) Operator need value of some input for shape inference. - # For example, Unsqueeze in opset 13 uses the axes input to calculate shape of output. - # (2) opset version >= 9. In older version, initializer is required in graph input by onnx spec. - # (3) The initializer is not in graph input. The means the node input is "constant" in inference. - initializers = [] - if (get_opset(self.out_mp_) >= 9) and node.op_type in ['Unsqueeze']: - initializers = [ - self.initializers_[name] for name in node.input - if (name in self.initializers_ and name not in - self.graph_inputs_) - ] - - # run single node inference with self.known_vi_ shapes - tmp_graph = helper.make_graph( - [node], 'tmp', [self.known_vi_[i] for i in node.input if i], - [make_named_value_info(i) for i in node.output], initializers) - - self.tmp_mp_.graph.CopyFrom(tmp_graph) - - self.tmp_mp_ = shape_inference.infer_shapes(self.tmp_mp_) - - for i_o in range(len(node.output)): - o = node.output[i_o] - vi = self.out_mp_.graph.value_info.add() - if not skip_infer: - vi.CopyFrom(self.tmp_mp_.graph.output[i_o]) - else: - vi.name = o - self.known_vi_[o] = vi - - def _onnx_infer_subgraph(self, - node, - subgraph, - use_node_input=True, - inc_subgraph_id=True): - if self.verbose_ > 2: - logger.debug( - 'Inferencing subgraph of node {} with output({}...): {}'.format( - node.name, node.output[0], node.op_type)) - # node inputs are not passed directly to the subgraph - # it's up to the node dispatcher to prepare subgraph input - # for example, with Scan/Loop, subgraph input shape would be trimmed from node input shape - # besides, inputs in subgraph could shadow implicit inputs - subgraph_inputs = set( - [i.name for i in list(subgraph.initializer) + list(subgraph.input)]) - subgraph_implicit_input = set([ - name for name in self.known_vi_.keys() - if not name in subgraph_inputs - ]) - tmp_graph = helper.make_graph( - list(subgraph.node), 'tmp', - list(subgraph.input) + - [self.known_vi_[i] for i in subgraph_implicit_input], - [make_named_value_info(i.name) for i in subgraph.output]) - tmp_graph.initializer.extend([ - i for i in self.out_mp_.graph.initializer - if i.name in subgraph_implicit_input - ]) - tmp_graph.initializer.extend(subgraph.initializer) - self.tmp_mp_.graph.CopyFrom(tmp_graph) - - symbolic_shape_inference = SymbolicShapeInference( - self.int_max_, - self.auto_merge_, - self.guess_output_rank_, - self.verbose_, - prefix=self.prefix_ + '_' + str(self.subgraph_id_)) - if inc_subgraph_id: - self.subgraph_id_ += 1 - - all_shapes_inferred = False - symbolic_shape_inference._preprocess(self.tmp_mp_) - symbolic_shape_inference.suggested_merge_ = self.suggested_merge_.copy() - while symbolic_shape_inference.run_: - all_shapes_inferred = symbolic_shape_inference._infer_impl( - self.sympy_data_.copy()) - symbolic_shape_inference._update_output_from_vi() - if use_node_input: - # if subgraph uses node input, it needs to update to merged dims - subgraph.ClearField('input') - subgraph.input.extend( - symbolic_shape_inference.out_mp_.graph.input[:len(node.input)]) - subgraph.ClearField('output') - subgraph.output.extend(symbolic_shape_inference.out_mp_.graph.output) - subgraph.ClearField('value_info') - subgraph.value_info.extend( - symbolic_shape_inference.out_mp_.graph.value_info) - subgraph.ClearField('node') - 
subgraph.node.extend(symbolic_shape_inference.out_mp_.graph.node) - # for new symbolic dims from subgraph output, add to main graph symbolic dims - subgraph_shapes = [ - get_shape_from_value_info(o) - for o in symbolic_shape_inference.out_mp_.graph.output - ] - subgraph_new_symbolic_dims = set([ - d for s in subgraph_shapes - if s for d in s if type(d) == str and not d in self.symbolic_dims_ - ]) - new_dims = {} - for d in subgraph_new_symbolic_dims: - assert d in symbolic_shape_inference.symbolic_dims_ - new_dims[d] = symbolic_shape_inference.symbolic_dims_[d] - self.symbolic_dims_.update(new_dims) - return symbolic_shape_inference - - def _get_int_values(self, node, broadcast=False): - values = [self._try_get_value(node, i) for i in range(len(node.input))] - if all([v is not None for v in values]): - # some shape compute is in floating point, cast to int for sympy - for i, v in enumerate(values): - if type(v) != np.ndarray: - continue - if len(v.shape) > 1: - new_v = None # ignore value for rank > 1 - elif len(v.shape) == 0: - new_v = int(v.item()) - else: - assert len(v.shape) == 1 - new_v = [int(vv) for vv in v] - values[i] = new_v - values_len = [len(v) if type(v) == list else 0 for v in values] - max_len = max(values_len) - if max_len >= 1 and broadcast: - # broadcast - for i, v in enumerate(values): - if v is None: - continue # don't broadcast if value is unknown - if type(v) == list: - if len(v) < max_len: - values[i] = v * max_len - else: - assert len(v) == max_len - else: - values[i] = [v] * max_len - return values - - def _compute_on_sympy_data(self, node, op_func): - assert len(node.output) == 1 - values = self._get_int_values(node, broadcast=True) - if all([v is not None for v in values]): - is_list = [type(v) == list for v in values] - as_list = any(is_list) - if as_list: - self.sympy_data_[node.output[ - 0]] = [op_func(vs) for vs in zip(*values)] - else: - self.sympy_data_[node.output[0]] = op_func(values) - - def _pass_on_sympy_data(self, node): - assert len( - node. 
- input) == 1 or node.op_type in ['Reshape', 'Unsqueeze', 'Squeeze'] - self._compute_on_sympy_data(node, lambda x: x[0]) - - def _pass_on_shape_and_type(self, node): - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, - self._get_shape(node, 0))) - - def _new_symbolic_dim(self, prefix, dim): - new_dim = '{}_d{}'.format(prefix, dim) - if new_dim in self.suggested_merge_: - v = self.suggested_merge_[new_dim] - new_symbolic_dim = sympy.Integer(int(v)) if is_literal(v) else v - else: - new_symbolic_dim = sympy.Symbol( - new_dim, integer=True, nonnegative=True) - self.symbolic_dims_[new_dim] = new_symbolic_dim - return new_symbolic_dim - - def _new_symbolic_dim_from_output(self, node, out_idx=0, dim=0): - return self._new_symbolic_dim('{}{}_{}_o{}_'.format( - node.op_type, self.prefix_, - list(self.out_mp_.graph.node).index(node), out_idx), dim) - - def _new_symbolic_shape(self, rank, node, out_idx=0): - return [ - self._new_symbolic_dim_from_output(node, out_idx, i) - for i in range(rank) - ] - - def _compute_conv_pool_shape(self, node): - sympy_shape = self._get_sympy_shape(node, 0) - if len(node.input) > 1: - W_shape = self._get_sympy_shape(node, 1) - rank = len(W_shape) - 2 # number of spatial axes - kernel_shape = W_shape[-rank:] - sympy_shape[1] = W_shape[0] - else: - W_shape = None - kernel_shape = get_attribute(node, 'kernel_shape') - rank = len(kernel_shape) - - assert len(sympy_shape) == rank + 2 - - # only need to symbolic shape inference if input has symbolic dims in spatial axes - is_symbolic_dims = [not is_literal(i) for i in sympy_shape[-rank:]] - - if not any(is_symbolic_dims): - shape = get_shape_from_value_info(self.known_vi_[node.output[0]]) - if len(shape) > 0: - assert len(sympy_shape) == len(shape) - sympy_shape[-rank:] = [sympy.Integer(d) for d in shape[-rank:]] - return sympy_shape - - dilations = get_attribute(node, 'dilations', [1] * rank) - strides = get_attribute(node, 'strides', [1] * rank) - effective_kernel_shape = [(k - 1) * d + 1 - for k, d in zip(kernel_shape, dilations)] - pads = get_attribute(node, 'pads') - if pads is None: - pads = [0] * (2 * rank) - auto_pad = get_attribute(node, 'auto_pad', - b'NOTSET').decode('utf-8') - if auto_pad != 'VALID' and auto_pad != 'NOTSET': - try: - residual = [ - sympy.Mod(d, s) - for d, s in zip(sympy_shape[-rank:], strides) - ] - total_pads = [ - max(0, (k - s) if r == 0 else (k - r)) - for k, s, r in zip(effective_kernel_shape, strides, - residual) - ] - except TypeError: # sympy may throw TypeError: cannot determine truth value of Relational - total_pads = [ - max(0, (k - s)) - for k, s in zip(effective_kernel_shape, strides) - ] # assuming no residual if sympy throws error - elif auto_pad == 'VALID': - total_pads = [] - else: - total_pads = [0] * rank - else: - assert len(pads) == 2 * rank - total_pads = [p1 + p2 for p1, p2 in zip(pads[:rank], pads[rank:])] - - ceil_mode = get_attribute(node, 'ceil_mode', 0) - for i in range(rank): - effective_input_size = sympy_shape[-rank + i] - if len(total_pads) > 0: - effective_input_size = effective_input_size + total_pads[i] - if ceil_mode: - strided_kernel_positions = sympy.ceiling( - (effective_input_size - effective_kernel_shape[i]) / - strides[i]) - else: - strided_kernel_positions = ( - effective_input_size - effective_kernel_shape[i] - ) // strides[i] - sympy_shape[-rank + i] = strided_kernel_positions + 1 - return sympy_shape - - def _check_merged_dims(self, dims, 
allow_broadcast=True): - if allow_broadcast: - dims = [d for d in dims if not (is_literal(d) and int(d) <= 1)] - if not all([d == dims[0] for d in dims]): - self._add_suggested_merge(dims, apply=True) - - def _compute_matmul_shape(self, node, output_dtype=None): - lhs_shape = self._get_shape(node, 0) - rhs_shape = self._get_shape(node, 1) - lhs_rank = len(lhs_shape) - rhs_rank = len(rhs_shape) - lhs_reduce_dim = 0 - rhs_reduce_dim = 0 - assert lhs_rank > 0 and rhs_rank > 0 - if lhs_rank == 1 and rhs_rank == 1: - new_shape = [] - elif lhs_rank == 1: - rhs_reduce_dim = -2 - new_shape = rhs_shape[:rhs_reduce_dim] + [rhs_shape[-1]] - elif rhs_rank == 1: - lhs_reduce_dim = -1 - new_shape = lhs_shape[:lhs_reduce_dim] - else: - lhs_reduce_dim = -1 - rhs_reduce_dim = -2 - new_shape = self._broadcast_shapes( - lhs_shape[:-2], - rhs_shape[:-2]) + [lhs_shape[-2]] + [rhs_shape[-1]] - # merge reduce dim - self._check_merged_dims( - [lhs_shape[lhs_reduce_dim], rhs_shape[rhs_reduce_dim]], - allow_broadcast=False) - if output_dtype is None: - # infer output_dtype from input type when not specified - output_dtype = self.known_vi_[node.input[ - 0]].type.tensor_type.elem_type - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], output_dtype, - new_shape)) - - def _fuse_tensor_type(self, node, out_idx, dst_type, src_type): - ''' - update dst_tensor_type to be compatible with src_tensor_type when dimension mismatches - ''' - dst_tensor_type = dst_type.sequence_type.elem_type.tensor_type if is_sequence( - dst_type) else dst_type.tensor_type - src_tensor_type = src_type.sequence_type.elem_type.tensor_type if is_sequence( - src_type) else src_type.tensor_type - if dst_tensor_type.elem_type != src_tensor_type.elem_type: - node_id = node.name if node.name else node.op_type - raise ValueError( - f"For node {node_id}, dst_tensor_type.elem_type != src_tensor_type.elem_type: " - f"{onnx.onnx_pb.TensorProto.DataType.Name(dst_tensor_type.elem_type)} vs " - f"{onnx.onnx_pb.TensorProto.DataType.Name(src_tensor_type.elem_type)}" - ) - if dst_tensor_type.HasField('shape'): - for di, ds in enumerate( - zip(dst_tensor_type.shape.dim, src_tensor_type.shape.dim)): - if ds[0] != ds[1]: - # create a new symbolic dimension for node/out_idx/mismatch dim id in dst_tensor_type for tensor_type - # for sequence_type, clear the dimension - new_dim = onnx.TensorShapeProto.Dimension() - if not is_sequence(dst_type): - new_dim.dim_param = str( - self._new_symbolic_dim_from_output(node, out_idx, - di)) - dst_tensor_type.shape.dim[di].CopyFrom(new_dim) - else: - dst_tensor_type.CopyFrom(src_tensor_type) - - def _infer_ArrayFeatureExtractor(self, node): - data_shape = self._get_shape(node, 0) - indices_shape = self._get_shape(node, 1) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, data_shape[:-1] + - indices_shape)) - - def _infer_symbolic_compute_ops(self, node): - funcs = { - 'Add': - lambda l: l[0] + l[1], - 'Div': - lambda l: l[0] // l[1], # integer div in sympy - 'Equal': - lambda l: l[0] == l[1], - 'Floor': - lambda l: sympy.floor(l[0]), - 'Max': - lambda l: l[1] if is_literal(l[0]) and int(l[0]) < -self.int_max_ else (l[0] if is_literal(l[1]) and int(l[1]) < -self.int_max_ else sympy.Max(l[0], l[1])), - 'Min': - lambda l: l[1] if is_literal(l[0]) and int(l[0]) > self.int_max_ else (l[0] if is_literal(l[1]) and int(l[1]) > self.int_max_ else sympy.Min(l[0], l[1])), - 'Mul': - 
lambda l: l[0] * l[1], - 'Sub': - lambda l: l[0] - l[1], - 'Where': - lambda l: l[1] if l[0] else l[2], - 'Neg': - lambda l: -l[0] - } - assert node.op_type in funcs - self._compute_on_sympy_data(node, funcs[node.op_type]) - - def _infer_Cast(self, node): - self._pass_on_sympy_data(node) - - def _infer_CategoryMapper(self, node): - input_type = self.known_vi_[node.input[0]].type.tensor_type.elem_type - if input_type == onnx.TensorProto.STRING: - output_type = onnx.TensorProto.INT64 - else: - output_type = onnx.TensorProto.STRING - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], output_type, - self._get_shape(node, 0))) - - def _infer_Compress(self, node): - input_shape = self._get_shape(node, 0) - # create a new symbolic dimension for Compress output - compress_len = str(self._new_symbolic_dim_from_output(node)) - axis = get_attribute(node, 'axis') - if axis is None: - # when axis is not specified, input is flattened before compress so output is 1D - output_shape = [compress_len] - else: - output_shape = input_shape - output_shape[handle_negative_axis(axis, len( - input_shape))] = compress_len - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, output_shape)) - - def _infer_Concat(self, node): - if any([ - i in self.sympy_data_ or i in self.initializers_ - for i in node.input - ]): - values = self._get_int_values(node) - logger.debug("Concat values: {} node: {} axis: {}".format( - values, node.name, get_attribute(node, 'axis'))) - if all([v is not None for v in values]): - axis = get_attribute(node, 'axis') - if axis < 0: - axis = axis + len(values[0]) - assert 0 == axis - self.sympy_data_[node.output[0]] = [] - for i in range(len(node.input)): - value = values[i] - if type(value) == list: - self.sympy_data_[node.output[0]].extend(value) - else: - self.sympy_data_[node.output[0]].append(value) - - sympy_shape = self._get_sympy_shape(node, 0) - axis = handle_negative_axis( - get_attribute(node, 'axis'), len(sympy_shape)) - for i_idx in range(1, len(node.input)): - input_shape = self._get_sympy_shape(node, i_idx) - if input_shape: - sympy_shape[axis] = sympy_shape[axis] + input_shape[axis] - self._update_computed_dims(sympy_shape) - # merge symbolic dims for non-concat axes - for d in range(len(sympy_shape)): - if d == axis: - continue - dims = [ - self._get_shape(node, i_idx)[d] - for i_idx in range(len(node.input)) - if self._get_shape(node, i_idx) - ] - if all([d == dims[0] for d in dims]): - continue - merged = self._merge_symbols(dims) - if type(merged) == str: - sympy_shape[d] = self.symbolic_dims_[merged] if merged else None - else: - sympy_shape[d] = merged - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], self.known_vi_[node.input[0]].type.tensor_type.
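The matmul rule implemented in `_compute_matmul_shape` earlier follows numpy's semantics: rank-1 operands are promoted and lose the reduce axis, and leading batch dims broadcast. A simplified sketch, assuming both batch shapes already have equal rank (the real method also broadcasts unequal ranks):

```python
# Toy version of the numpy-style matmul shape rule (lists of ints only).
def matmul_output_shape(lhs, rhs):
    if len(lhs) == 1 and len(rhs) == 1:
        return []                           # dot product -> scalar
    if len(lhs) == 1:
        return rhs[:-2] + [rhs[-1]]         # lhs acts as a row vector
    if len(rhs) == 1:
        return lhs[:-1]                     # rhs acts as a column vector
    batch = [max(a, b) for a, b in zip(lhs[:-2], rhs[:-2])]  # equal-rank assumption
    return batch + [lhs[-2], rhs[-1]]

print(matmul_output_shape([5, 2, 3], [5, 3, 4]))  # [5, 2, 4]
print(matmul_output_shape([3], [5, 3, 4]))        # [5, 4]
```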
- elem_type, get_shape_from_sympy_shape(sympy_shape))) - - def _infer_ConcatFromSequence(self, node): - seq_shape = self._get_shape(node, 0) - new_axis = 1 if get_attribute(node, 'new_axis') else 0 - axis = handle_negative_axis( - get_attribute(node, 'axis'), len(seq_shape) + new_axis) - concat_dim = str(self._new_symbolic_dim_from_output(node, 0, axis)) - new_shape = seq_shape - if new_axis: - new_shape = seq_shape[:axis] + [concat_dim] + seq_shape[axis:] - else: - new_shape[axis] = concat_dim - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], self.known_vi_[node.input[0]] - .type.sequence_type.elem_type.tensor_type.elem_type, new_shape)) - - def _infer_Constant(self, node): - t = get_attribute(node, 'value') - self.sympy_data_[node.output[0]] = numpy_helper.to_array(t) - - def _infer_ConstantOfShape(self, node): - sympy_shape = self._get_int_values(node)[0] - vi = self.known_vi_[node.output[0]] - if sympy_shape is not None: - if type(sympy_shape) != list: - sympy_shape = [sympy_shape] - self._update_computed_dims(sympy_shape) - # update sympy data if output type is int, and shape is known - if vi.type.tensor_type.elem_type == onnx.TensorProto.INT64 and all( - [is_literal(x) for x in sympy_shape]): - self.sympy_data_[node.output[0]] = np.ones( - [int(x) for x in sympy_shape], - dtype=np.int64) * numpy_helper.to_array( - get_attribute(node, 'value', 0)) - else: - # create new dynamic shape - # note input0 is a 1D vector of shape, the new symbolic shape has the rank of the shape vector length - sympy_shape = self._new_symbolic_shape( - self._get_shape(node, 0)[0], node) - - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], vi.type.tensor_type.elem_type, - get_shape_from_sympy_shape(sympy_shape))) - - def _infer_Conv(self, node): - sympy_shape = self._compute_conv_pool_shape(node) - self._update_computed_dims(sympy_shape) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], vi.type.tensor_type.elem_type, - get_shape_from_sympy_shape(sympy_shape))) - - def _infer_Einsum(self, node): - # ref:https://github.com/onnx/onnx/blob/623dfaa0151b2e4ce49779c3ec31cbd78c592b80/onnx/defs/math/defs.cc#L3275 - equation = get_attribute(node, 'equation') - equation = equation.replace(b' ', b'') - mid_index = equation.find(b'->') - left_equation = equation[:mid_index] if mid_index != -1 else equation - - num_operands = 0 - num_ellipsis = 0 - num_ellipsis_indices = 0 - - letter_to_dim = {} - - terms = left_equation.split(b',') - for term in terms: - ellipsis_index = term.find(b'...') - shape = self._get_shape(node, num_operands) - rank = len(shape) - if ellipsis_index != -1: - if num_ellipsis == 0: - num_ellipsis_indices = rank - len(term) + 3 - num_ellipsis = num_ellipsis + 1 - for i in range(1, rank + 1): - letter = term[-i] - if letter != 46: # letter != b'.' - dim = shape[-i] - if letter not in letter_to_dim.keys(): - letter_to_dim[letter] = dim - elif type(dim) != sympy.Symbol: - letter_to_dim[letter] = dim - num_operands = num_operands + 1 - - new_sympy_shape = [] - from collections import OrderedDict - num_letter_occurrences = OrderedDict() - if mid_index != -1: - right_equation = equation[mid_index + 2:] - right_ellipsis_index = right_equation.find(b'...') - if right_ellipsis_index != -1: - for i in range(num_ellipsis_indices): - new_sympy_shape.append(shape[i]) - for c in right_equation: - if c != 46: # c != b'.' 
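The ConstantOfShape fast path above materializes the op's value whenever the target shape is fully literal, so downstream shape computations can keep folding constants. A small sketch under that assumption (names invented):

```python
import numpy as np

shape_value = [2, 3]                 # literal shape produced upstream
fill = np.array(7, dtype=np.int64)   # stand-in for the 'value' attribute tensor
out = np.ones([int(x) for x in shape_value], dtype=np.int64) * fill
print(out.shape, out[0, 0])          # (2, 3) 7
```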
- new_sympy_shape.append(letter_to_dim[c]) - else: - for i in range(num_ellipsis_indices): - new_sympy_shape.append(shape[i]) - for c in left_equation: - if c != 44 and c != 46: # c != b',' and c != b'.': - if c in num_letter_occurrences: - num_letter_occurrences[c] = num_letter_occurrences[ - c] + 1 - else: - num_letter_occurrences[c] = 1 - for key, value in num_letter_occurrences.items(): - if value == 1: - new_sympy_shape.append(letter_to_dim[key]) - - output_dtype = self.known_vi_[node.input[0]].type.tensor_type.elem_type - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], output_dtype, - new_sympy_shape)) - - def _infer_Expand(self, node): - expand_to_shape = as_list(self._try_get_value(node, 1), keep_none=True) - if expand_to_shape is not None: - # new_shape's dim can come from shape value - self._update_computed_dims(expand_to_shape) - shape = self._get_shape(node, 0) - new_shape = self._broadcast_shapes( - shape, get_shape_from_sympy_shape(expand_to_shape)) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, new_shape)) - - def _infer_Gather(self, node): - data_shape = self._get_shape(node, 0) - axis = handle_negative_axis( - get_attribute(node, 'axis', 0), len(data_shape)) - indices_shape = self._get_shape(node, 1) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, data_shape[:axis] + - indices_shape + data_shape[axis + - 1:])) - # for 1D input, do some sympy compute - if node.input[0] in self.sympy_data_ and len( - data_shape) == 1 and 0 == get_attribute(node, 'axis', 0): - idx = self._try_get_value(node, 1) - if idx is not None: - data = self.sympy_data_[node.input[0]] - if type(data) == list: - if type(idx) == np.ndarray and len(idx.shape) == 1: - self.sympy_data_[node.output[ - 0]] = [data[int(i)] for i in idx] - else: - self.sympy_data_[node.output[0]] = data[int(idx)] - else: - assert idx == 0 or idx == -1 - self.sympy_data_[node.output[0]] = data - - def _infer_GatherElements(self, node): - indices_shape = self._get_shape(node, 1) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, indices_shape)) - - def _infer_GatherND(self, node): - data_shape = self._get_shape(node, 0) - data_rank = len(data_shape) - indices_shape = self._get_shape(node, 1) - indices_rank = len(indices_shape) - last_index_dimension = indices_shape[-1] - assert is_literal( - last_index_dimension) and last_index_dimension <= data_rank - new_shape = indices_shape[:-1] + data_shape[last_index_dimension:] - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, new_shape)) - - def _infer_If(self, node): - # special case for constant condition, in case there are mismatching shape from the non-executed branch - subgraphs = [ - get_attribute(node, 'then_branch'), get_attribute(node, - 'else_branch') - ] - cond = self._try_get_value(node, 0) - if cond is not None: - if as_scalar(cond) > 0: - subgraphs[1].CopyFrom(subgraphs[0]) - else: - subgraphs[0].CopyFrom(subgraphs[1]) - - for i_sub, subgraph in enumerate(subgraphs): - subgraph_infer = self._onnx_infer_subgraph( - node, subgraph, use_node_input=False) - for i_out in 
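The Gather rule used above is worth stating on its own: the indices shape replaces the gathered axis of the data shape. A minimal illustration (shapes invented):

```python
def gather_output_shape(data_shape, indices_shape, axis):
    axis = axis % len(data_shape)    # normalize a negative axis
    return data_shape[:axis] + indices_shape + data_shape[axis + 1:]

print(gather_output_shape([4, 10, 8], [2, 3], axis=1))  # [4, 2, 3, 8]
```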
range(len(node.output)): - vi = self.known_vi_[node.output[i_out]] - if i_sub == 0: - vi.CopyFrom(subgraph.output[i_out]) - vi.name = node.output[i_out] - else: - self._fuse_tensor_type(node, i_out, vi.type, - subgraph.output[i_out].type) - - # pass on sympy data from subgraph, if cond is constant - if cond is not None and i_sub == (0 if as_scalar(cond) > 0 else - 1): - if subgraph.output[ - i_out].name in subgraph_infer.sympy_data_: - self.sympy_data_[vi.name] = subgraph_infer.sympy_data_[ - subgraph.output[i_out].name] - - def _infer_Loop(self, node): - subgraph = get_attribute(node, 'body') - assert len(subgraph.input) == len(node.input) - num_loop_carried = len( - node.input) - 2 # minus the length and initial loop condition - # when sequence_type is used as loop carried input - # needs to run subgraph infer twice if the tensor shape in sequence contains None - for i, si in enumerate(subgraph.input): - si_name = si.name - si.CopyFrom(self.known_vi_[node.input[i]]) - si.name = si_name - - self._onnx_infer_subgraph(node, subgraph) - - # check subgraph input/output for shape changes in loop carried variables - # for tensor_type, create new symbolic dim when changing, i.e., output = Concat(input, a) - # for sequence_type, propagate from output to input - need_second_infer = False - for i_out in range(1, num_loop_carried + 1): - so = subgraph.output[i_out] - so_shape = get_shape_from_value_info(so) - if is_sequence(so.type): - if so_shape and None in so_shape: - # copy shape from output to input - # note that loop input is [loop_len, cond, input_0, input_1, ...] - # while loop output is [cond, output_0, output_1, ...] - subgraph.input[i_out + - 1].type.sequence_type.elem_type.CopyFrom( - so.type.sequence_type.elem_type) - need_second_infer = True - else: - si = subgraph.input[i_out + 1] - si_shape = get_shape_from_value_info(si) - for di, dims in enumerate(zip(si_shape, so_shape)): - if dims[0] != dims[1]: - new_dim = onnx.TensorShapeProto.Dimension() - new_dim.dim_param = str( - self._new_symbolic_dim_from_output(node, i_out, di)) - si.type.tensor_type.shape.dim[di].CopyFrom(new_dim) - so.type.tensor_type.shape.dim[di].CopyFrom(new_dim) - need_second_infer = True - - if need_second_infer: - if self.verbose_ > 2: - logger.debug( - "Rerun Loop: {}({}...), because of sequence in loop carried variables". 
- format(node.name, node.output[0])) - self._onnx_infer_subgraph(node, subgraph, inc_subgraph_id=False) - - # create a new symbolic dimension for iteration dependent dimension - loop_iter_dim = str(self._new_symbolic_dim_from_output(node)) - for i in range(len(node.output)): - vi = self.known_vi_[node.output[i]] - vi.CopyFrom(subgraph.output[ - i + - 1]) # first subgraph output is condition, not in node output - if i >= num_loop_carried: - assert not is_sequence( - vi.type) # TODO: handle loop accumulation in sequence_type - subgraph_vi_dim = subgraph.output[i + - 1].type.tensor_type.shape.dim - vi.type.tensor_type.shape.ClearField('dim') - vi_dim = vi.type.tensor_type.shape.dim - vi_dim.add().dim_param = loop_iter_dim - vi_dim.extend(list(subgraph_vi_dim)) - vi.name = node.output[i] - - def _infer_MatMul(self, node): - self._compute_matmul_shape(node) - - def _infer_MatMulInteger(self, node): - self._compute_matmul_shape(node, onnx.TensorProto.INT32) - - def _infer_NonMaxSuppression(self, node): - selected = str(self._new_symbolic_dim_from_output(node)) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[ - 0], onnx.TensorProto.INT64, [selected, 3])) - - def _infer_NonZero(self, node): - input_rank = self._get_shape_rank(node, 0) - # create a new symbolic dimension for NonZero output - nz_len = str(self._new_symbolic_dim_from_output(node, 0, 1)) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[ - 0], vi.type.tensor_type.elem_type, [input_rank, nz_len])) - - def _infer_OneHot(self, node): - sympy_shape = self._get_sympy_shape(node, 0) - depth = self._try_get_value(node, 1) - axis = get_attribute(node, 'axis', -1) - axis = handle_negative_axis(axis, len(sympy_shape) + 1) - new_shape = get_shape_from_sympy_shape(sympy_shape[:axis] + [ - self._new_symbolic_dim_from_output(node) - if not is_literal(depth) else depth - ] + sympy_shape[axis:]) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[2]].type.tensor_type.elem_type, new_shape)) - - def _infer_Pad(self, node): - if get_opset(self.out_mp_) <= 10: - pads = get_attribute(node, 'pads') - else: - pads = self._try_get_value(node, 1) - - sympy_shape = self._get_sympy_shape(node, 0) - rank = len(sympy_shape) - - if pads is not None: - assert len(pads) == 2 * rank - new_sympy_shape = [ - d + pad_up + pad_down - for d, pad_up, pad_down in zip(sympy_shape, pads[:rank], pads[ - rank:]) - ] - self._update_computed_dims(new_sympy_shape) - else: - # dynamic pads, create new symbolic dimensions - new_sympy_shape = self._new_symbolic_shape(rank, node) - output_tp = self.known_vi_[node.input[0]].type.tensor_type.elem_type - - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[ - 0], output_tp, get_shape_from_sympy_shape(new_sympy_shape))) - - def _infer_Pool(self, node): - sympy_shape = self._compute_conv_pool_shape(node) - self._update_computed_dims(sympy_shape) - for o in node.output: - if not o: - continue - vi = self.known_vi_[o] - vi.CopyFrom( - helper.make_tensor_value_info(o, vi.type.tensor_type.elem_type, - get_shape_from_sympy_shape( - sympy_shape))) - - def _infer_aten_bitwise_or(self, node): - shape0 = self._get_shape(node, 0) - shape1 = self._get_shape(node, 1) - new_shape = self._broadcast_shapes(shape0, shape1) - t0 = self.known_vi_[node.input[0]] - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - 
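The static-pads branch of `_infer_Pad` above adds the begin and end padding of each axis, with `pads` laid out as all begin values followed by all end values. A concrete check (numbers invented):

```python
in_shape = [5, 7]
pads = [1, 0, 2, 0]                  # [begin0, begin1, end0, end1]
rank = len(in_shape)
out_shape = [d + b + e for d, b, e in zip(in_shape, pads[:rank], pads[rank:])]
print(out_shape)                     # [8, 7]
```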
helper.make_tensor_value_info(node.output[ - 0], t0.type.tensor_type.elem_type, new_shape)) - - def _infer_aten_diagonal(self, node): - sympy_shape = self._get_sympy_shape(node, 0) - rank = len(sympy_shape) - offset = self._try_get_value(node, 1) - dim1 = self._try_get_value(node, 2) - dim2 = self._try_get_value(node, 3) - - assert offset is not None and dim1 is not None and dim2 is not None - dim1 = handle_negative_axis(dim1, rank) - dim2 = handle_negative_axis(dim2, rank) - - new_shape = [] - for dim, val in enumerate(sympy_shape): - if dim not in [dim1, dim2]: - new_shape.append(val) - - shape1 = sympy_shape[dim1] - shape2 = sympy_shape[dim2] - if offset >= 0: - diag_shape = sympy.Max(0, sympy.Min(shape1, shape2 - offset)) - else: - diag_shape = sympy.Max(0, sympy.Min(shape1 + offset, shape2)) - new_shape.append(diag_shape) - - if node.output[0]: - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, - get_shape_from_sympy_shape( - new_shape))) - - def _infer_aten_multinomial(self, node): - sympy_shape = self._get_sympy_shape(node, 0) - rank = len(sympy_shape) - assert rank in [1, 2] - num_samples = self._try_get_value(node, 1) - di = rank - 1 - last_dim = num_samples if num_samples else str( - self._new_symbolic_dim_from_output(node, 0, di)) - output_shape = sympy_shape[:-1] + [last_dim] - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], onnx.TensorProto.INT64, - get_shape_from_sympy_shape(output_shape))) - - def _infer_aten_pool2d(self, node): - sympy_shape = self._get_sympy_shape(node, 0) - assert len(sympy_shape) == 4 - sympy_shape[-2:] = [ - self._new_symbolic_dim_from_output(node, 0, i) for i in [2, 3] - ] - self._update_computed_dims(sympy_shape) - for i, o in enumerate(node.output): - if not o: - continue - vi = self.known_vi_[o] - elem_type = onnx.TensorProto.INT64 if i == 1 else self.known_vi_[ - node.input[0]].type.tensor_type.elem_type - vi.CopyFrom( - helper.make_tensor_value_info( - o, elem_type, get_shape_from_sympy_shape(sympy_shape))) - - def _infer_aten_unfold(self, node): - sympy_shape = self._get_sympy_shape(node, 0) - dimension = self._try_get_value(node, 1) - size = self._try_get_value(node, 2) - step = self._try_get_value(node, 3) - if dimension is not None and size is not None and step is not None: - assert dimension < len(sympy_shape) - sympy_shape[dimension] = (sympy_shape[dimension] - size) // step + 1 - sympy_shape.append(size) - else: - rank = len(sympy_shape) - sympy_shape = self._new_symbolic_shape(rank + 1, node) - self._update_computed_dims(sympy_shape) - if node.output[0]: - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, - get_shape_from_sympy_shape( - sympy_shape))) - - def _infer_aten_argmax(self, node): - new_shape = None - if node.input[1] == '': - # The argmax of the flattened input is returned. 
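For `_infer_aten_diagonal` above, the non-negative-offset branch gives a diagonal of length `Max(0, Min(shape1, shape2 - offset))` (the negative-offset branch shifts the first dim instead). A quick check on an invented 4x6 case:

```python
import sympy

shape1, shape2, offset = 4, 6, 2     # diagonal of a 4x6 matrix, offset 2
# elements (0,2), (1,3), (2,4), (3,5) -> length 4
print(sympy.Max(0, sympy.Min(shape1, shape2 - offset)))  # 4
```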
- new_shape = [] - else: - dim = self._try_get_value(node, 1) - keepdim = self._try_get_value(node, 2) - if keepdim is not None: - sympy_shape = self._get_sympy_shape(node, 0) - if dim is not None: - dim = handle_negative_axis(dim, len(sympy_shape)) - if keepdim: - sympy_shape[dim] = 1 - else: - del sympy_shape[dim] - else: - rank = len(sympy_shape) - sympy_shape = self._new_symbolic_shape(rank if keepdim else - rank - 1, node) - self._update_computed_dims(sympy_shape) - new_shape = get_shape_from_sympy_shape(sympy_shape) - if node.output[0] and new_shape is not None: - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[ - 0], onnx.TensorProto.INT64, new_shape)) - - def _infer_aten_bce(self, node): - reduction = self._try_get_value(node, 4) - if reduction is None: - reduction = 1 - elem_type = self.known_vi_[node.input[0]].type.tensor_type.elem_type - vi = self.known_vi_[node.output[0]] - if reduction == 0: - vi.type.tensor_type.elem_type = elem_type - vi.type.tensor_type.shape.CopyFrom(onnx.TensorShapeProto()) - else: - vi.CopyFrom( - helper.make_tensor_value_info(vi.name, elem_type, - self._get_shape(node, 0))) - - def _infer_BatchNormalization(self, node): - self._propagate_shape_and_type(node) - - # this works for opsets < 14 and 14 since we check i < len(node.output) in the loop - for i in [1, 2, 3, 4]: - if i < len(node.output) and node.output[i] != "": - # all of these parameters have the same shape as the 1st input - self._propagate_shape_and_type( - node, input_index=1, output_index=i) - - def _infer_Range(self, node): - vi = self.known_vi_[node.output[0]] - input_data = self._get_int_values(node) - if all([i is not None for i in input_data]): - start = as_scalar(input_data[0]) - limit = as_scalar(input_data[1]) - delta = as_scalar(input_data[2]) - new_sympy_shape = [ - sympy.Max(sympy.ceiling((limit - start) / delta), 0) - ] - else: - new_sympy_shape = [self._new_symbolic_dim_from_output(node)] - self._update_computed_dims(new_sympy_shape) - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], self.known_vi_[node.input[0]].type.tensor_type. 
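The Range length above, `Max(ceil((limit - start)/delta), 0)`, stays valid for symbolic operands; with concrete scalars it reduces to the usual element count. An invented example:

```python
import sympy

start, limit, delta = 2, 11, 3
length = sympy.Max(sympy.ceiling((limit - start) / sympy.Integer(delta)), 0)
print(length)                        # 3, i.e. the values 2, 5, 8
```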
- elem_type, get_shape_from_sympy_shape(new_sympy_shape))) - - def _infer_ReduceSum(self, node): - keep_dims = get_attribute(node, 'keepdims', 1) - if get_opset(self.out_mp_) >= 13 and len(node.input) > 1: - # ReduceSum changes axes to input[1] in opset 13 - axes = self._try_get_value(node, 1) - vi = self.known_vi_[node.output[0]] - if axes is None: - assert keep_dims # can only handle keep_dims==True when axes is unknown, by generating new ranks - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], self.known_vi_[node.input[ - 0]].type.tensor_type.elem_type, - get_shape_from_sympy_shape( - self._new_symbolic_shape( - self._get_shape_rank(node, 0), node)))) - else: - shape = self._get_shape(node, 0) - output_shape = [] - axes = [handle_negative_axis(a, len(shape)) for a in axes] - for i, d in enumerate(shape): - if i in axes: - if keep_dims: - output_shape.append(1) - else: - output_shape.append(d) - vi.CopyFrom( - helper.make_tensor_value_info(node.output[ - 0], self.known_vi_[node.input[ - 0]].type.tensor_type.elem_type, output_shape)) - - def _infer_ReduceProd(self, node): - axes = get_attribute(node, 'axes') - keep_dims = get_attribute(node, 'keepdims', 1) - if keep_dims == 0 and axes == [0]: - data = self._get_int_values(node)[0] - if data is not None: - self.sympy_data_[node.output[0]] = sympy_reduce_product(data) - - def _infer_Reshape(self, node): - shape_value = self._try_get_value(node, 1) - vi = self.known_vi_[node.output[0]] - if shape_value is None: - shape_shape = self._get_shape(node, 1) - assert len(shape_shape) == 1 - shape_rank = shape_shape[0] - assert is_literal(shape_rank) - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], vi.type.tensor_type.elem_type, - get_shape_from_sympy_shape( - self._new_symbolic_shape(shape_rank, node)))) - else: - input_sympy_shape = self._get_sympy_shape(node, 0) - total = int(1) - for d in input_sympy_shape: - total = total * d - new_sympy_shape = [] - deferred_dim_idx = -1 - non_deferred_size = int(1) - for i, d in enumerate(shape_value): - if type(d) == sympy.Symbol: - new_sympy_shape.append(d) - elif d == 0: - new_sympy_shape.append(input_sympy_shape[i]) - non_deferred_size = non_deferred_size * input_sympy_shape[i] - else: - new_sympy_shape.append(d) - if d == -1: - deferred_dim_idx = i - elif d != 0: - non_deferred_size = non_deferred_size * d - - assert new_sympy_shape.count(-1) < 2 - if -1 in new_sympy_shape: - new_dim = total // non_deferred_size - new_sympy_shape[deferred_dim_idx] = new_dim - - self._update_computed_dims(new_sympy_shape) - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], vi.type.tensor_type.elem_type, - get_shape_from_sympy_shape(new_sympy_shape))) - - self._pass_on_sympy_data(node) - - def _infer_Resize(self, node): - vi = self.known_vi_[node.output[0]] - input_sympy_shape = self._get_sympy_shape(node, 0) - if get_opset(self.out_mp_) <= 10: - scales = self._try_get_value(node, 1) - if scales is not None: - new_sympy_shape = [ - sympy.simplify(sympy.floor(d * s)) - for d, s in zip(input_sympy_shape, scales) - ] - self._update_computed_dims(new_sympy_shape) - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], self.known_vi_[node.input[ - 0]].type.tensor_type.elem_type, - get_shape_from_sympy_shape(new_sympy_shape))) - else: - roi = self._try_get_value(node, 1) - scales = self._try_get_value(node, 2) - sizes = self._try_get_value(node, 3) - if sizes is not None: - new_sympy_shape = [ - sympy.simplify(sympy.floor(s)) for s in sizes - ] - 
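`_infer_Reshape` above implements ONNX's target-shape conventions: a 0 keeps the corresponding input dim, and a single -1 is inferred from the remaining element count. A standalone integer-only sketch of that bookkeeping:

```python
def reshape_output_shape(in_shape, target):
    total = 1
    for d in in_shape:
        total *= d
    out, known = [], 1
    for i, d in enumerate(target):
        d = in_shape[i] if d == 0 else d     # 0 copies the input dimension
        out.append(d)
        if d != -1:
            known *= d
    if -1 in out:
        out[out.index(-1)] = total // known  # deferred dim from the remainder
    return out

print(reshape_output_shape([2, 3, 4], [0, -1]))  # [2, 12]
```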
self._update_computed_dims(new_sympy_shape) - elif scales is not None: - rank = len(scales) - if get_attribute(node, 'coordinate_transformation_mode' - ) == 'tf_crop_and_resize': - assert len(roi) == 2 * rank - roi_start = list(roi)[:rank] - roi_end = list(roi)[rank:] - else: - roi_start = [0] * rank - roi_end = [1] * rank - scales = list(scales) - new_sympy_shape = [ - sympy.simplify(sympy.floor(d * (end - start) * scale)) - for d, start, end, scale in zip(input_sympy_shape, - roi_start, roi_end, scales) - ] - self._update_computed_dims(new_sympy_shape) - else: - new_sympy_shape = self._new_symbolic_shape( - self._get_shape_rank(node, 0), node) - - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, - get_shape_from_sympy_shape( - new_sympy_shape))) - - def _infer_Scan(self, node): - subgraph = get_attribute(node, 'body') - num_scan_inputs = get_attribute(node, 'num_scan_inputs') - scan_input_axes = get_attribute(node, 'scan_input_axes', - [0] * num_scan_inputs) - num_scan_states = len(node.input) - num_scan_inputs - scan_input_axes = [ - handle_negative_axis( - ax, self._get_shape_rank(node, i + num_scan_states)) - for i, ax in enumerate(scan_input_axes) - ] - # We may have cases where the subgraph has optionial inputs that appear in both subgraph's input and initializer, - # but not in the node's input. In such cases, the input model might be invalid, but let's skip those optional inputs. - assert len(subgraph.input) >= len(node.input) - subgraph_inputs = subgraph.input[:len(node.input)] - for i, si in enumerate(subgraph_inputs): - subgraph_name = si.name - si.CopyFrom(self.known_vi_[node.input[i]]) - if i >= num_scan_states: - scan_input_dim = si.type.tensor_type.shape.dim - scan_input_dim.remove( - scan_input_dim[scan_input_axes[i - num_scan_states]]) - si.name = subgraph_name - self._onnx_infer_subgraph(node, subgraph) - num_scan_outputs = len(node.output) - num_scan_states - scan_output_axes = get_attribute(node, 'scan_output_axes', - [0] * num_scan_outputs) - scan_input_dim = get_shape_from_type_proto( - self.known_vi_[node.input[-1]].type)[scan_input_axes[-1]] - for i, o in enumerate(node.output): - vi = self.known_vi_[o] - if i >= num_scan_states: - shape = get_shape_from_type_proto(subgraph.output[i].type) - new_dim = handle_negative_axis( - scan_output_axes[i - num_scan_states], len(shape) + 1) - shape = shape[:new_dim] + [scan_input_dim] + shape[new_dim:] - vi.CopyFrom( - helper.make_tensor_value_info(o, subgraph.output[ - i].type.tensor_type.elem_type, shape)) - else: - vi.CopyFrom(subgraph.output[i]) - vi.name = o - - def _infer_ScatterElements(self, node): - data_shape = self._get_shape(node, 0) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, data_shape)) - - def _infer_SequenceAt(self, node): - # need to create new symbolic dimension if sequence shape has None: - seq_shape = self._get_shape(node, 0) - vi = self.known_vi_[node.output[0]] - if seq_shape is not None: - for di, d in enumerate(seq_shape): - if d is not None: - continue - new_dim = onnx.TensorShapeProto.Dimension() - new_dim.dim_param = str( - self._new_symbolic_dim_from_output(node, 0, di)) - vi.type.tensor_type.shape.dim[di].CopyFrom(new_dim) - - def _infer_SequenceInsert(self, node): - # workaround bug in onnx's shape inference - vi_seq = self.known_vi_[node.input[0]] - vi_tensor = self.known_vi_[node.input[1]] - vi_out_seq = 
self.known_vi_[node.output[0]] - vi_out_seq.CopyFrom(vi_seq) - vi_out_seq.name = node.output[0] - self._fuse_tensor_type(node, 0, vi_out_seq.type, vi_tensor.type) - - def _infer_Shape(self, node): - self.sympy_data_[node.output[0]] = self._get_sympy_shape(node, 0) - - def _infer_Size(self, node): - sympy_shape = self._get_sympy_shape(node, 0) - self.sympy_data_[node.output[0]] = sympy_reduce_product(sympy_shape) - self.known_vi_[node.output[0]].CopyFrom( - helper.make_tensor_value_info(node.output[0], - onnx.TensorProto.INT64, [])) - - def _infer_Slice(self, node): - def less_equal(x, y): - try: - return bool(x <= y) - except TypeError: - pass - try: - return bool(y >= x) - except TypeError: - pass - try: - return bool(-x >= -y) - except TypeError: - pass - try: - return bool(-y <= -x) - except TypeError: - # the last attempt; this may raise TypeError - return bool(y - x >= 0) - - def handle_negative_index(index, bound): - """ normalizes a negative index to be in [0, bound) """ - try: - if not less_equal(0, index): - if is_literal(index) and index <= -self.int_max_: - # this case is handled separately - return index - return bound + index - except TypeError: - logger.warning("Cannot determine if {} < 0".format(index)) - return index - - if get_opset(self.out_mp_) <= 9: - axes = get_attribute(node, 'axes') - starts = get_attribute(node, 'starts') - ends = get_attribute(node, 'ends') - if not axes: - axes = list(range(len(starts))) - steps = [1] * len(axes) - else: - starts = as_list(self._try_get_value(node, 1), keep_none=True) - ends = as_list(self._try_get_value(node, 2), keep_none=True) - axes = self._try_get_value(node, 3) - steps = self._try_get_value(node, 4) - if axes is None and not (starts is None and ends is None): - axes = list( - range(0, len(starts if starts is not None else ends))) - if steps is None and not (starts is None and ends is None): - steps = [1] * len(starts if starts is not None else ends) - axes = as_list(axes, keep_none=True) - steps = as_list(steps, keep_none=True) - - new_sympy_shape = self._get_sympy_shape(node, 0) - if starts is None or ends is None: - if axes is None: - for i in range(len(new_sympy_shape)): - new_sympy_shape[i] = self._new_symbolic_dim_from_output( - node, 0, i) - else: - new_sympy_shape = get_shape_from_sympy_shape(new_sympy_shape) - for i in axes: - new_sympy_shape[i] = self._new_symbolic_dim_from_output( - node, 0, i) - else: - for i, s, e, t in zip(axes, starts, ends, steps): - e = handle_negative_index(e, new_sympy_shape[i]) - if is_literal(e): - if e >= self.int_max_: - e = new_sympy_shape[i] - elif e <= -self.int_max_: - e = 0 if s > 0 else -1 - elif is_literal(new_sympy_shape[i]): - if e < 0: - e = max(0, e + new_sympy_shape[i]) - e = min(e, new_sympy_shape[i]) - else: - if e > 0: - e = sympy.Min( - e, new_sympy_shape[i] - ) if e > 1 else e #special case for slicing first to make computation easier - else: - if is_literal(new_sympy_shape[i]): - e = sympy.Min(e, new_sympy_shape[i]) - else: - try: - if not less_equal(e, new_sympy_shape[i]): - e = new_sympy_shape[i] - except Exception: - logger.warning( - 'Unable to determine if {} <= {}, treat as equal'. 
- format(e, new_sympy_shape[i])) - e = new_sympy_shape[i] - - s = handle_negative_index(s, new_sympy_shape[i]) - if is_literal(new_sympy_shape[i]) and is_literal(s): - s = max(0, min(s, new_sympy_shape[i])) - - new_sympy_shape[i] = sympy.simplify( - (e - s + t + (-1 if t > 0 else 1)) // t) - - self._update_computed_dims(new_sympy_shape) - - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], vi.type.tensor_type.elem_type, - get_shape_from_sympy_shape(new_sympy_shape))) - - # handle sympy_data if needed, for slice in shape computation - if (node.input[0] in self.sympy_data_ and [0] == axes and - len(starts) == 1 and len(ends) == 1 and len(steps) == 1): - input_sympy_data = self.sympy_data_[node.input[0]] - if type(input_sympy_data) == list or ( - type(input_sympy_data) == np.ndarray and - len(input_sympy_data.shape) == 1): - self.sympy_data_[node.output[0]] = input_sympy_data[starts[ - 0]:ends[0]:steps[0]] - - def _infer_SoftmaxCrossEntropyLoss(self, node): - vi = self.known_vi_[node.output[0]] - elem_type = self.known_vi_[node.input[0]].type.tensor_type.elem_type - vi.type.tensor_type.elem_type = elem_type - vi.type.tensor_type.shape.CopyFrom(onnx.TensorShapeProto()) - - if len(node.output) > 1: - data_shape = self._get_shape(node, 0) - vi = self.known_vi_[node.output[1]] - vi.CopyFrom( - helper.make_tensor_value_info(vi.name, elem_type, data_shape)) - - def _infer_Split_Common(self, node, make_value_info_func): - input_sympy_shape = self._get_sympy_shape(node, 0) - axis = handle_negative_axis( - get_attribute(node, 'axis', 0), len(input_sympy_shape)) - split = get_attribute(node, 'split') - if not split: - num_outputs = len(node.output) - split = [input_sympy_shape[axis] / - sympy.Integer(num_outputs)] * num_outputs - self._update_computed_dims(split) - else: - split = [sympy.Integer(s) for s in split] - - for i_o in range(len(split)): - vi = self.known_vi_[node.output[i_o]] - vi.CopyFrom( - make_value_info_func(node.output[i_o], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, - get_shape_from_sympy_shape( - input_sympy_shape[:axis] + [ - split[i_o] - ] + input_sympy_shape[axis + 1:]))) - self.known_vi_[vi.name] = vi - - def _infer_Split(self, node): - self._infer_Split_Common(node, helper.make_tensor_value_info) - - def _infer_SplitToSequence(self, node): - self._infer_Split_Common(node, helper.make_sequence_value_info) - - def _infer_Squeeze(self, node): - input_shape = self._get_shape(node, 0) - op_set = get_opset(self.out_mp_) - - # Depending on the op-version, 'axes' is provided as an attribute or via the 2nd input - if op_set < 13: - axes = get_attribute(node, 'axes') - assert self._try_get_value(node, 1) is None - else: - axes = self._try_get_value(node, 1) - assert get_attribute(node, 'axes') is None - - if axes is None: - # No axes have been provided (neither via attribute nor via input). - # In this case the 'Squeeze' op should remove all axes with dimension 1. - # For symbolic dimensions we guess they are !=1. - output_shape = [s for s in input_shape if s != 1] - if self.verbose_ > 0: - symbolic_dimensions = [s for s in input_shape if type(s) != int] - if len(symbolic_dimensions) > 0: - logger.debug( - f"Symbolic dimensions in input shape of op: '{node.op_type}' node: '{node.name}'.
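The sliced-dimension formula above, `(end - start + step + (-1 if step > 0 else 1)) // step`, handles both slice directions once the bounds are normalized. Two concrete checks (indices invented):

```python
def slice_dim(start, end, step):
    return (end - start + step + (-1 if step > 0 else 1)) // step

print(slice_dim(1, 7, 2))    # 3 -> indices 1, 3, 5
print(slice_dim(5, 1, -2))   # 2 -> indices 5, 3
```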
" - + - f"Assuming the following dimensions are never equal to 1: {symbolic_dimensions}" - ) - else: - axes = [handle_negative_axis(a, len(input_shape)) for a in axes] - output_shape = [] - for i in range(len(input_shape)): - if i not in axes: - output_shape.append(input_shape[i]) - else: - assert input_shape[i] == 1 or type(input_shape[i]) != int - if self.verbose_ > 0 and type(input_shape[i]) != int: - logger.debug( - f"Symbolic dimensions in input shape of op: '{node.op_type}' node: '{node.name}'. " - + - f"Assuming the dimension '{input_shape[i]}' at index {i} of the input to be equal to 1." - ) - - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - node.input[0]].type.tensor_type.elem_type, output_shape)) - self._pass_on_sympy_data(node) - - def _infer_Tile(self, node): - repeats_value = self._try_get_value(node, 1) - new_sympy_shape = [] - if repeats_value is not None: - input_sympy_shape = self._get_sympy_shape(node, 0) - for i, d in enumerate(input_sympy_shape): - new_dim = d * repeats_value[i] - new_sympy_shape.append(new_dim) - self._update_computed_dims(new_sympy_shape) - else: - new_sympy_shape = self._new_symbolic_shape( - self._get_shape_rank(node, 0), node) - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info( - node.output[0], vi.type.tensor_type.elem_type, - get_shape_from_sympy_shape(new_sympy_shape))) - - def _infer_TopK(self, node): - rank = self._get_shape_rank(node, 0) - axis = handle_negative_axis(get_attribute(node, 'axis', -1), rank) - new_shape = self._get_shape(node, 0) - - if get_opset(self.out_mp_) <= 9: - k = get_attribute(node, 'k') - else: - k = self._get_int_values(node)[1] - - if k == None: - k = self._new_symbolic_dim_from_output(node) - else: - k = as_scalar(k) - - if type(k) in [int, str]: - new_shape[axis] = k - else: - new_sympy_shape = self._get_sympy_shape(node, 0) - new_sympy_shape[axis] = k - self._update_computed_dims( - new_sympy_shape - ) # note that TopK dim could be computed in sympy_data, so need to update computed_dims when it enters shape - new_shape = get_shape_from_sympy_shape(new_sympy_shape) - - for i_o in range(len(node.output)): - vi = self.known_vi_[node.output[i_o]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[ - i_o], vi.type.tensor_type.elem_type, new_shape)) - - def _infer_Transpose(self, node): - if node.input[0] in self.sympy_data_: - data_shape = self._get_shape(node, 0) - perm = get_attribute(node, 'perm', - reversed(list(range(len(data_shape))))) - input_data = self.sympy_data_[node.input[0]] - self.sympy_data_[node.output[0]] = np.transpose( - np.array(input_data).reshape(*data_shape), - axes=tuple(perm)).flatten().tolist() - - def _infer_Unsqueeze(self, node): - input_shape = self._get_shape(node, 0) - op_set = get_opset(self.out_mp_) - - # Depending on op-version 'axes' are provided as attribute or via 2nd input - if op_set < 13: - axes = get_attribute(node, 'axes') - assert self._try_get_value(node, 1) is None - else: - axes = self._try_get_value(node, 1) - assert get_attribute(node, 'axes') is None - - output_rank = len(input_shape) + len(axes) - axes = [handle_negative_axis(a, output_rank) for a in axes] - - input_axis = 0 - output_shape = [] - for i in range(output_rank): - if i in axes: - output_shape.append(1) - else: - output_shape.append(input_shape[input_axis]) - input_axis += 1 - - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], self.known_vi_[ - 
node.input[0]].type.tensor_type.elem_type, output_shape)) - - self._pass_on_sympy_data(node) - - def _infer_ZipMap(self, node): - map_key_type = None - if get_attribute(node, 'classlabels_int64s') is not None: - map_key_type = onnx.TensorProto.INT64 - elif get_attribute(node, 'classlabels_strings') is not None: - map_key_type = onnx.TensorProto.STRING - - assert map_key_type is not None - new_vi = onnx.ValueInfoProto() - new_vi.name = node.output[0] - new_vi.type.sequence_type.elem_type.map_type.value_type.tensor_type.elem_type = onnx.TensorProto.FLOAT - new_vi.type.sequence_type.elem_type.map_type.key_type = map_key_type - vi = self.known_vi_[node.output[0]] - vi.CopyFrom(new_vi) - - def _infer_Attention(self, node): - shape = self._get_shape(node, 0) - shape_bias = self._get_shape(node, 2) - assert len(shape) == 3 and len(shape_bias) == 1 - qkv_hidden_sizes_attr = get_attribute(node, 'qkv_hidden_sizes') - if qkv_hidden_sizes_attr is not None: - assert len(qkv_hidden_sizes_attr) == 3 - shape[2] = int(qkv_hidden_sizes_attr[2]) - else: - shape[2] = int(shape_bias[0] / 3) - output_dtype = self.known_vi_[node.input[0]].type.tensor_type.elem_type - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], output_dtype, shape)) - - if len(node.output) > 1: - # input shape: (batch_size, sequence_length, hidden_size) - # past shape: (2, batch_size, num_heads, past_sequence_length, head_size) - # mask shape: (batch_size, total_sequence_length) or (batch_size, sequence_length, total_sequence_length) or (batch_size, 1, max_seq_len, max_seq_len) - # present shape: (2, batch_size, num_heads, total_sequence_length, head_size), where total_sequence_length=sequence_length+past_sequence_length - input_shape = self._get_shape(node, 0) - past_shape = self._get_shape(node, 4) - mask_shape = self._get_shape(node, 3) - if len(past_shape) == 5: - if len(mask_shape) in [2, 3]: - past_shape[3] = mask_shape[-1] - elif isinstance(input_shape[1], int) and isinstance( - past_shape[3], int): - past_shape[3] = input_shape[1] + past_shape[3] - else: - past_shape[3] = f"{past_shape[3]}+{input_shape[1]}" - vi = self.known_vi_[node.output[1]] - vi.CopyFrom( - helper.make_tensor_value_info(vi.name, output_dtype, - past_shape)) - - def _infer_BiasGelu(self, node): - self._propagate_shape_and_type(node) - - def _infer_FastGelu(self, node): - self._propagate_shape_and_type(node) - - def _infer_Gelu(self, node): - self._propagate_shape_and_type(node) - - def _infer_LayerNormalization(self, node): - self._propagate_shape_and_type(node) - - def _infer_LongformerAttention(self, node): - self._propagate_shape_and_type(node) - - def _infer_EmbedLayerNormalization(self, node): - input_ids_shape = self._get_shape(node, 0) - word_embedding_shape = self._get_shape(node, 2) - assert len(input_ids_shape) == 2 and len(word_embedding_shape) == 2 - output_shape = input_ids_shape + [word_embedding_shape[1]] - - word_embedding_dtype = self.known_vi_[node.input[ - 2]].type.tensor_type.elem_type - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], word_embedding_dtype, - output_shape)) - - mask_index_shape = [input_ids_shape[0]] - vi = self.known_vi_[node.output[1]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[ - 1], onnx.TensorProto.INT32, mask_index_shape)) - - if len(node.output) > 2: - # Optional output of add before layer nomalization is done - # shape is same as the output - vi = self.known_vi_[node.output[2]] - vi.CopyFrom( - 
helper.make_tensor_value_info(node.output[ - 2], word_embedding_dtype, output_shape)) - - def _infer_SkipLayerNormalization(self, node): - self._propagate_shape_and_type(node) - - def _infer_PythonOp(self, node): - output_tensor_types = get_attribute(node, 'output_tensor_types') - assert output_tensor_types - output_tensor_ranks = get_attribute(node, 'output_tensor_ranks') - assert output_tensor_ranks - - # set the context output seperately. - # The first output is autograd's context. - vi = self.known_vi_[node.output[0]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[0], - onnx.TensorProto.INT64, [])) - - # Outputs after autograd's context are tensors. - # We assume their ranks are fixed for different model inputs. - for i in range(len(node.output) - 1): - # Process the i-th tensor outputs. - vi = self.known_vi_[node.output[i + 1]] - sympy_shape = self._new_symbolic_shape(output_tensor_ranks[i], node) - shape = get_shape_from_sympy_shape(sympy_shape) - value_info = helper.make_tensor_value_info( - node.output[i + 1], output_tensor_types[i], shape) - vi.CopyFrom(value_info) - - def _propagate_shape_and_type(self, node, input_index=0, output_index=0): - shape = self._get_shape(node, input_index) - output_dtype = self.known_vi_[node.input[ - input_index]].type.tensor_type.elem_type - vi = self.known_vi_[node.output[output_index]] - vi.CopyFrom( - helper.make_tensor_value_info(node.output[output_index], - output_dtype, shape)) - - def _is_none_dim(self, dim_value): - if type(dim_value) != str: - return False - if "unk__" not in dim_value: - return False - if dim_value in self.symbolic_dims_.keys(): - return False - return True - - def _is_shape_contains_none_dim(self, out_shape): - for out in out_shape: - if self._is_none_dim(out): - return out - return None - - def _infer_impl(self, start_sympy_data=None): - self.sympy_data_ = start_sympy_data or {} - self.out_mp_.graph.ClearField('value_info') - self._apply_suggested_merge(graph_input_only=True) - self.input_symbols_ = set() - for i in self.out_mp_.graph.input: - input_shape = get_shape_from_value_info(i) - if input_shape is None: - continue - - if is_sequence(i.type): - input_dims = i.type.sequence_type.elem_type.tensor_type.shape.dim - else: - input_dims = i.type.tensor_type.shape.dim - - for i_dim, dim in enumerate(input_shape): - if dim is None: - # some models use None for symbolic dim in input, replace it with a string - input_dims[i_dim].dim_param = str( - self._new_symbolic_dim(i.name, i_dim)) - - self.input_symbols_.update( - [d for d in input_shape if type(d) == str]) - - for s in self.input_symbols_: - if s in self.suggested_merge_: - s_merge = self.suggested_merge_[s] - assert s_merge in self.symbolic_dims_ - self.symbolic_dims_[s] = self.symbolic_dims_[s_merge] - else: - # Since inputs are not produced by other ops, we can assume positivity - self.symbolic_dims_[s] = sympy.Symbol( - s, integer=True, positive=True) - # create a temporary ModelProto for single node inference - # note that we remove initializer to have faster inference - # for tensor ops like Reshape/Tile/Expand that read initializer, we need to do sympy computation based inference anyways - self.tmp_mp_ = onnx.ModelProto() - self.tmp_mp_.CopyFrom(self.out_mp_) - self.tmp_mp_.graph.ClearField('initializer') - - # compute prerequesite for node for topological sort - # node with subgraphs may have dependency on implicit inputs, which will affect topological sort - prereq_for_node = { - } # map from node to all its inputs, including implicit ones in 
subgraph - - def get_prereq(node): - names = set(i for i in node.input if i) - subgraphs = [] - if 'If' == node.op_type: - subgraphs = [ - get_attribute(node, 'then_branch'), - get_attribute(node, 'else_branch') - ] - elif node.op_type in ['Loop', 'Scan']: - subgraphs = [get_attribute(node, 'body')] - for g in subgraphs: - g_outputs_and_initializers = {i.name for i in g.initializer} - g_prereq = set() - for n in g.node: - g_outputs_and_initializers.update(n.output) - for n in g.node: - g_prereq.update([ - i for i in get_prereq(n) - if i not in g_outputs_and_initializers - ]) - names.update(g_prereq) - # remove subgraph inputs from g_prereq since those are local-only - for i in g.input: - if i.name in names: - names.remove(i.name) - return names - - for n in self.tmp_mp_.graph.node: - prereq_for_node[n.output[0]] = get_prereq(n) - - # topological sort nodes, note there might be dead nodes so we check if all graph outputs are reached to terminate - sorted_nodes = [] - sorted_known_vi = set([ - i.name - for i in list(self.out_mp_.graph.input) + list( - self.out_mp_.graph.initializer) - ]) - if any([o.name in sorted_known_vi for o in self.out_mp_.graph.output]): - # Loop/Scan will have some graph output in graph inputs, so don't do topological sort - sorted_nodes = self.out_mp_.graph.node - else: - while not all( - [o.name in sorted_known_vi for o in self.out_mp_.graph.output]): - old_sorted_nodes_len = len(sorted_nodes) - for node in self.out_mp_.graph.node: - if (node.output[0] not in sorted_known_vi) and all([ - i in sorted_known_vi - for i in prereq_for_node[node.output[0]] if i - ]): - sorted_known_vi.update(node.output) - sorted_nodes.append(node) - if old_sorted_nodes_len == len(sorted_nodes) and not all([ - o.name in sorted_known_vi - for o in self.out_mp_.graph.output - ]): - raise Exception('Invalid model with cyclic graph') - - for node in sorted_nodes: - assert all([i in self.known_vi_ for i in node.input if i]) - self._onnx_infer_single_node(node) - known_aten_op = False - if node.op_type in self.dispatcher_: - self.dispatcher_[node.op_type](node) - elif node.op_type in ['ConvTranspose']: - # onnx shape inference ops like ConvTranspose may have empty shape for symbolic input - # before adding symbolic compute for them - # mark the output type as UNDEFINED to allow guessing of rank - vi = self.known_vi_[node.output[0]] - if len(vi.type.tensor_type.shape.dim) == 0: - vi.type.tensor_type.elem_type = onnx.TensorProto.UNDEFINED - elif node.op_type == 'ATen' and node.domain == 'org.pytorch.aten': - for attr in node.attribute: - # TODO: Is overload_name needed? - if attr.name == 'operator': - aten_op_name = attr.s.decode('utf-8') if isinstance( - attr.s, bytes) else attr.s - if aten_op_name in self.aten_op_dispatcher_: - known_aten_op = True - self.aten_op_dispatcher_[aten_op_name](node) - break - - if self.verbose_ > 2: - logger.debug(node.op_type + ': ' + node.name) - for i, name in enumerate(node.input): - logger.debug(' Input {}: {} {}'.format( - i, name, 'initializer' - if name in self.initializers_ else '')) - - # onnx automatically merge dims with value, i.e. 
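The sort loop above is a Kahn-style sweep: keep emitting nodes whose prerequisites are already known, and fail if a full pass makes no progress. A toy stand-alone version (graph contents invented):

```python
def topo_sort(node_outputs, prereq, graph_inputs):
    known = set(graph_inputs)   # tensors whose producers are already resolved
    ordered = []
    while len(ordered) < len(node_outputs):
        progressed = False
        for name, outs in node_outputs.items():
            if name not in ordered and all(p in known for p in prereq[name]):
                known.update(outs)
                ordered.append(name)
                progressed = True
        if not progressed:
            raise Exception('Invalid model with cyclic graph')
    return ordered

node_outputs = {'matmul': ['t0'], 'add': ['t1']}
prereq = {'matmul': ['x', 'w'], 'add': ['t0', 'b']}
print(topo_sort(node_outputs, prereq, ['x', 'w', 'b']))  # ['matmul', 'add']
```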
Mul(['aaa', 'bbb'], [1000, 1]) -> [1000, 'bbb'] - # symbolic shape inference needs to apply merge of 'aaa' -> 1000 in this case - if node.op_type in [ - 'Add', 'Sub', 'Mul', 'Div', 'MatMul', 'MatMulInteger', - 'MatMulInteger16', 'Where', 'Sum' - ]: - vi = self.known_vi_[node.output[0]] - out_rank = len(get_shape_from_type_proto(vi.type)) - in_shapes = [ - self._get_shape(node, i) for i in range(len(node.input)) - ] - for d in range(out_rank - (2 if node.op_type in [ - 'MatMul', 'MatMulInteger', 'MatMulInteger16' - ] else 0)): - in_dims = [ - s[len(s) - out_rank + d] for s in in_shapes - if len(s) + d >= out_rank - ] - if len(in_dims) > 1: - self._check_merged_dims(in_dims, allow_broadcast=True) - - for i_o in range(len(node.output)): - vi = self.known_vi_[node.output[i_o]] - out_type = vi.type - out_type_kind = out_type.WhichOneof('value') - - # do not process shape for non-tensors - if out_type_kind not in [ - 'tensor_type', 'sparse_tensor_type', None - ]: - if self.verbose_ > 2: - if out_type_kind == 'sequence_type': - seq_cls_type = out_type.sequence_type.elem_type.WhichOneof( - 'value') - if 'tensor_type' == seq_cls_type: - logger.debug(' {}: sequence of {} {}'.format( - node.output[i_o], - str(get_shape_from_value_info(vi)), - onnx.TensorProto.DataType.Name( - vi.type.sequence_type.elem_type. - tensor_type.elem_type))) - else: - logger.debug(' {}: sequence of {}'.format( - node.output[i_o], seq_cls_type)) - else: - logger.debug(' {}: {}'.format(node.output[i_o], - out_type_kind)) - continue - - out_shape = get_shape_from_value_info(vi) - out_type_undefined = out_type.tensor_type.elem_type == onnx.TensorProto.UNDEFINED - if self.verbose_ > 2: - logger.debug(' {}: {} {}'.format( - node.output[i_o], - str(out_shape), - onnx.TensorProto.DataType.Name( - vi.type.tensor_type.elem_type))) - if node.output[i_o] in self.sympy_data_: - logger.debug(' Sympy Data: ' + str(self.sympy_data_[ - node.output[i_o]])) - - # onnx >= 1.11.0, use unk__#index instead of None when the shape dim is uncertain - if (out_shape is not None and - (None in out_shape or - self._is_shape_contains_none_dim(out_shape)) - ) or out_type_undefined: - if self.auto_merge_: - if node.op_type in [ - 'Add', 'Sub', 'Mul', 'Div', 'MatMul', - 'MatMulInteger', 'MatMulInteger16', 'Concat', - 'Where', 'Sum', 'Equal', 'Less', 'Greater', - 'LessOrEqual', 'GreaterOrEqual' - ]: - shapes = [ - self._get_shape(node, i) - for i in range(len(node.input)) - ] - if node.op_type in [ - 'MatMul', 'MatMulInteger', 'MatMulInteger16' - ]: - if None in out_shape or self._is_shape_contains_none_dim( - out_shape): - if None in out_shape: - idx = out_shape.index(None) - else: - idx = out_shape.index( - self._is_shape_contains_none_dim( - out_shape)) - dim_idx = [ - len(s) - len(out_shape) + idx - for s in shapes - ] - # only support auto merge for MatMul for dim < rank-2 when rank > 2 - assert len( - shapes[0]) > 2 and dim_idx[0] < len( - shapes[0]) - 2 - assert len( - shapes[1]) > 2 and dim_idx[1] < len( - shapes[1]) - 2 - elif node.op_type == 'Expand': - # auto merge for cases like Expand([min(batch, 1), min(seq, 512)], [batch, seq]) - shapes = [ - self._get_shape(node, 0), self._get_value(node, - 1) - ] - else: - shapes = [] - - if shapes: - for idx in range(len(out_shape)): - if out_shape[ - idx] is not None and not self._is_none_dim( - out_shape[idx]): - continue - # note that the broadcasting rule aligns from right to left - # if a tensor has a lower rank (dim_idx[idx] < 0), it would automatically broadcast and need no merge - dim_idx = [ - 
len(s) - len(out_shape) + idx - for s in shapes - ] - if len(dim_idx) > 0: - self._add_suggested_merge([ - s[i] if is_literal(s[i]) else str(s[i]) - for s, i in zip(shapes, dim_idx) - if i >= 0 - ]) - self.run_ = True - else: - self.run_ = False - else: - self.run_ = False - - # create new dynamic dims for ops not handled by symbolic shape inference - if self.run_ == False and not node.op_type in self.dispatcher_ and not known_aten_op: - is_unknown_op = out_type_undefined and ( - out_shape is None or len(out_shape) == 0) - if is_unknown_op: - # unknown op to ONNX, maybe from higher opset or other domain - # only guess the output rank from input 0 when using guess_output_rank option - out_rank = self._get_shape_rank( - node, 0) if self.guess_output_rank_ else -1 - else: - # valid ONNX op, but not handled by symbolic shape inference, just assign dynamic shape - out_rank = len(out_shape) - - if out_rank >= 0: - new_shape = self._new_symbolic_shape(out_rank, node, - i_o) - if out_type_undefined: - # guess output data type from input vi if not defined - out_dtype = self.known_vi_[node.input[ - 0]].type.tensor_type.elem_type - else: - # otherwise, use original data type - out_dtype = vi.type.tensor_type.elem_type - vi.CopyFrom( - helper.make_tensor_value_info( - vi.name, out_dtype, - get_shape_from_sympy_shape(new_shape))) - - if self.verbose_ > 0: - if is_unknown_op: - logger.debug( - "Possible unknown op: {} node: {}, guessing {} shape". - format(node.op_type, node.name, - vi.name)) - if self.verbose_ > 2: - logger.debug(' {}: {} {}'.format( - node.output[i_o], - str(new_shape), - vi.type.tensor_type.elem_type)) - - self.run_ = True - continue # continue the inference after guess, no need to stop as no merge is needed - - if self.verbose_ > 0 or not self.auto_merge_ or out_type_undefined: - logger.debug( - 'Stopping at incomplete shape inference at ' + - node.op_type + ': ' + node.name) - logger.debug('node inputs:') - for i in node.input: - logger.debug(self.known_vi_[i]) - logger.debug('node outputs:') - for o in node.output: - logger.debug(self.known_vi_[o]) - if self.auto_merge_ and not out_type_undefined: - logger.debug('Merging: ' + str( - self.suggested_merge_)) - return False - - self.run_ = False - return True - - def _update_output_from_vi(self): - for output in self.out_mp_.graph.output: - if output.name in self.known_vi_: - output.CopyFrom(self.known_vi_[output.name]) - - @staticmethod - def infer_shapes(in_mp, - int_max=2**31 - 1, - auto_merge=False, - guess_output_rank=False, - verbose=0): - onnx_opset = get_opset(in_mp) - if (not onnx_opset) or onnx_opset < 7: - logger.warning('Only support models of onnx opset 7 and above.') - return None - symbolic_shape_inference = SymbolicShapeInference( - int_max, auto_merge, guess_output_rank, verbose) - all_shapes_inferred = False - symbolic_shape_inference._preprocess(in_mp) - while symbolic_shape_inference.run_: - all_shapes_inferred = symbolic_shape_inference._infer_impl() - symbolic_shape_inference._update_output_from_vi() - if not all_shapes_inferred: - raise Exception("Incomplete symbolic shape inference") - return symbolic_shape_inference.out_mp_ - - -def parse_arguments(): - parser = argparse.ArgumentParser() - parser.add_argument('--input', required=True, help='The input model file') - parser.add_argument('--output', help='The output model file') - parser.add_argument( - '--auto_merge', - help='Automatically merge symbolic dims when confliction happens', - action='store_true', - default=False) - parser.add_argument( - 
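`infer_shapes` above is also convenient as a library call, which is how the pruning script later in this diff uses it. A hypothetical invocation (the .onnx file names are placeholders):

```python
import onnx

model = onnx.load('model.onnx')                   # placeholder path
inferred = SymbolicShapeInference.infer_shapes(
    model, int_max=2**31 - 1, auto_merge=True, guess_output_rank=False,
    verbose=0)
if inferred is not None:                          # None when opset < 7
    onnx.save(inferred, 'model.shaped.onnx')      # placeholder path
```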
'--int_max', - help='maximum value for integer to be treated as boundless for ops like slice', - type=int, - default=2**31 - 1) - parser.add_argument( - '--guess_output_rank', - help='guess output rank to be the same as input 0 for unknown ops', - action='store_true', - default=False) - parser.add_argument( - '--verbose', - help='Prints detailed logs of inference, 0: turn off, 1: warnings, 3: detailed', - type=int, - default=0) - return parser.parse_args() - - -if __name__ == '__main__': - args = parse_arguments() - logger.info('input model: ' + args.input) - if args.output: - logger.info('output model ' + args.output) - logger.info('Doing symbolic shape inference...') - out_mp = SymbolicShapeInference.infer_shapes( - onnx.load(args.input), args.int_max, args.auto_merge, - args.guess_output_rank, args.verbose) - if args.output and out_mp: - onnx.save(out_mp, args.output) - logger.info('Done!') diff --git a/speechx/examples/ds2_ol/onnx/local/onnx_opt.sh b/speechx/examples/ds2_ol/onnx/local/onnx_opt.sh deleted file mode 100755 index ce2f24e58..000000000 --- a/speechx/examples/ds2_ol/onnx/local/onnx_opt.sh +++ /dev/null @@ -1,20 +0,0 @@ -#!/bin/bash - -set -e - -if [ $# != 3 ];then - # ./local/onnx_opt.sh model.old.onnx model.opt.onnx "audio_chunk:1,-1,161 audio_chunk_lens:1 chunk_state_c_box:5,1,1024 chunk_state_h_box:5,1,1024" - echo "usage: $0 onnx.model.in onnx.model.out input_shape " - exit 1 -fi - -# onnx optimizer -pip install onnx-simplifier - -in=$1 -out=$2 -input_shape=$3 - -check_n=3 - -onnxsim $in $out $check_n --dynamic-input-shape --input-shape $input_shape \ No newline at end of file diff --git a/speechx/examples/ds2_ol/onnx/local/onnx_prune_model.py b/speechx/examples/ds2_ol/onnx/local/onnx_prune_model.py deleted file mode 100755 index 5b85eef3e..000000000 --- a/speechx/examples/ds2_ol/onnx/local/onnx_prune_model.py +++ /dev/null @@ -1,128 +0,0 @@ -#!/usr/bin/env python3 -W ignore::DeprecationWarning -# prune model by output names -import argparse -import copy -import sys - -import onnx - - -def parse_arguments(): - parser = argparse.ArgumentParser() - parser.add_argument( - '--model', - required=True, - help='Path of directory saved the input model.') - parser.add_argument( - '--output_names', - required=True, - nargs='+', - help='The outputs of pruned model.') - parser.add_argument( - '--save_file', required=True, help='Path to save the new onnx model.') - return parser.parse_args() - - -if __name__ == '__main__': - args = parse_arguments() - - if len(set(args.output_names)) < len(args.output_names): - print( - "[ERROR] There's dumplicate name in --output_names, which is not allowed." - ) - sys.exit(-1) - - model = onnx.load(args.model) - - # collect all node outputs and graph output - output_tensor_names = set() - for node in model.graph.node: - for out in node.output: - # may contain model output - output_tensor_names.add(out) - - # for out in model.graph.output: - # output_tensor_names.add(out.name) - - for output_name in args.output_names: - if output_name not in output_tensor_names: - print( - "[ERROR] Cannot find output tensor name '{}' in onnx model graph.". 
-            format(output_name))
-            sys.exit(-1)
-
-    output_node_indices = set()  # has output names
-    output_to_node = dict()  # all node outputs
-    for i, node in enumerate(model.graph.node):
-        for out in node.output:
-            output_to_node[out] = i
-            if out in args.output_names:
-                output_node_indices.add(i)
-
-    # from the outputs, find all the ancestors
-    reserved_node_indices = copy.deepcopy(
-        output_node_indices)  # nodes to keep
-    reserved_inputs = set()  # model inputs to keep
-    new_output_node_indices = copy.deepcopy(output_node_indices)
-
-    while len(new_output_node_indices) > 0:
-        output_node_indices = copy.deepcopy(new_output_node_indices)
-
-        new_output_node_indices = set()
-
-        for out_node_idx in output_node_indices:
-            # backtrace to parents
-            for ipt in model.graph.node[out_node_idx].input:
-                if ipt in output_to_node:
-                    reserved_node_indices.add(output_to_node[ipt])
-                    new_output_node_indices.add(output_to_node[ipt])
-                else:
-                    reserved_inputs.add(ipt)
-
-    num_inputs = len(model.graph.input)
-    num_outputs = len(model.graph.output)
-    num_nodes = len(model.graph.node)
-    print(
-        f"old graph has {num_inputs} inputs, {num_outputs} outputs, {num_nodes} nodes"
-    )
-    print(f"{len(reserved_node_indices)} nodes to keep.")
-
-    # delete nodes not to keep
-    for idx in range(num_nodes - 1, -1, -1):
-        if idx not in reserved_node_indices:
-            del model.graph.node[idx]
-
-    # delete graph inputs not to keep
-    for idx in range(num_inputs - 1, -1, -1):
-        if model.graph.input[idx].name not in reserved_inputs:
-            del model.graph.input[idx]
-
-    # delete old graph outputs
-    for i in range(num_outputs):
-        del model.graph.output[0]
-
-    # new graph outputs, as requested by the user
-    for out in args.output_names:
-        model.graph.output.extend([onnx.ValueInfoProto(name=out)])
-
-    # infer shape
-    try:
-        from onnx_infer_shape import SymbolicShapeInference
-        model = SymbolicShapeInference.infer_shapes(
-            model,
-            int_max=2**31 - 1,
-            auto_merge=True,
-            guess_output_rank=False,
-            verbose=1)
-    except Exception as e:
-        print(f"skip infer shape step: {e}")
-
-    # check onnx model
-    onnx.checker.check_model(model)
-    # save onnx model
-    onnx.save(model, args.save_file)
-    print("[Finished] The new model is saved at {}.".format(args.save_file))
-    print("[DEBUG INFO] The inputs of the new model: {}".format(
-        [x.name for x in model.graph.input]))
-    print("[DEBUG INFO] The outputs of the new model: {}".format(
-        [x.name for x in model.graph.output]))
diff --git a/speechx/examples/ds2_ol/onnx/local/onnx_rename_model.py b/speechx/examples/ds2_ol/onnx/local/onnx_rename_model.py
deleted file mode 100755
index fc00a82ec..000000000
--- a/speechx/examples/ds2_ol/onnx/local/onnx_rename_model.py
+++ /dev/null
@@ -1,111 +0,0 @@
-#!/usr/bin/env python3 -W ignore::DeprecationWarning
-# rename nodes to new names
-import argparse
-import sys
-
-import onnx
-
-
-def parse_arguments():
-    parser = argparse.ArgumentParser()
-    parser.add_argument(
-        '--model',
-        required=True,
-        help='Path of the input ONNX model.')
-    parser.add_argument(
-        '--origin_names',
-        required=True,
-        nargs='+',
-        help='The original names you want to modify.')
-    parser.add_argument(
-        '--new_names',
-        required=True,
-        nargs='+',
-        help='The new names to change to; the number of new_names must match the number of origin_names.'
-    )
-    parser.add_argument(
-        '--save_file', required=True, help='Path to save the new onnx model.')
-    return parser.parse_args()
-
-
-if __name__ == '__main__':
-    args = parse_arguments()
-
-    if len(set(args.origin_names)) < len(args.origin_names):
-        print(
-            "[ERROR] There's a duplicate name in --origin_names, which is not allowed."
-        )
-        sys.exit(-1)
-
-    if len(set(args.new_names)) < len(args.new_names):
-        print(
-            "[ERROR] There's a duplicate name in --new_names, which is not allowed."
-        )
-        sys.exit(-1)
-
-    if len(args.new_names) != len(args.origin_names):
-        print(
-            "[ERROR] The number of --new_names must be the same as the number of --origin_names."
-        )
-        sys.exit(-1)
-
-    model = onnx.load(args.model)
-
-    # collect graph inputs and all node outputs
-    output_tensor_names = set()
-    for ipt in model.graph.input:
-        output_tensor_names.add(ipt.name)
-
-    for node in model.graph.node:
-        for out in node.output:
-            output_tensor_names.add(out)
-
-    for origin_name in args.origin_names:
-        if origin_name not in output_tensor_names:
-            print(
-                f"[ERROR] Cannot find tensor name '{origin_name}' in onnx model graph."
-            )
-            sys.exit(-1)
-
-    for new_name in args.new_names:
-        if new_name in output_tensor_names:
-            print(
-                "[ERROR] The defined new_name '{}' already exists in the onnx model, which is not allowed.".
-                format(new_name))
-            sys.exit(-1)
-
-    # rename graph inputs
-    for i, ipt in enumerate(model.graph.input):
-        if ipt.name in args.origin_names:
-            idx = args.origin_names.index(ipt.name)
-            model.graph.input[i].name = args.new_names[idx]
-
-    # rename node inputs and outputs
-    for i, node in enumerate(model.graph.node):
-        for j, ipt in enumerate(node.input):
-            if ipt in args.origin_names:
-                idx = args.origin_names.index(ipt)
-                model.graph.node[i].input[j] = args.new_names[idx]
-
-        for j, out in enumerate(node.output):
-            if out in args.origin_names:
-                idx = args.origin_names.index(out)
-                model.graph.node[i].output[j] = args.new_names[idx]
-
-    # rename graph outputs
-    for i, out in enumerate(model.graph.output):
-        if out.name in args.origin_names:
-            idx = args.origin_names.index(out.name)
-            model.graph.output[i].name = args.new_names[idx]
-
-    # check onnx model
-    onnx.checker.check_model(model)
-
-    # save model
-    onnx.save(model, args.save_file)
-
-    print("[Finished] The new model is saved at {}.".format(args.save_file))
-    print("[DEBUG INFO] The inputs of the new model: {}".format(
-        [x.name for x in model.graph.input]))
-    print("[DEBUG INFO] The outputs of the new model: {}".format(
-        [x.name for x in model.graph.output]))
diff --git a/speechx/examples/ds2_ol/onnx/local/ort_dyanmic_quant.py b/speechx/examples/ds2_ol/onnx/local/ort_dyanmic_quant.py
deleted file mode 100755
index 2c5692369..000000000
--- a/speechx/examples/ds2_ol/onnx/local/ort_dyanmic_quant.py
+++ /dev/null
@@ -1,48 +0,0 @@
-#!/usr/bin/env python3
-import argparse
-
-from onnxruntime.quantization import quantize_dynamic
-from onnxruntime.quantization import QuantType
-
-
-def quantize_onnx_model(onnx_model_path,
-                        quantized_model_path,
-                        nodes_to_exclude=[]):
-    print("Starting quantization...")
-
-    quantize_dynamic(
-        onnx_model_path,
-        quantized_model_path,
-        weight_type=QuantType.QInt8,
-        nodes_to_exclude=nodes_to_exclude)
-
-    print(f"Quantized model saved to: {quantized_model_path}")
-
-
-def main():
-    parser = argparse.ArgumentParser()
-    parser.add_argument(
-        "--model-in",
-        type=str,
-        required=True,
-        help="input ONNX model", )
-    parser.add_argument(
-        "--model-out",
-        type=str,
-        required=True,
-        default='model.quant.onnx',
-        help="output quantized ONNX model", )
-    parser.add_argument(
-        "--nodes-to-exclude",
-        type=str,
-        required=True,
-        help="nodes to exclude. e.g. 
conv,linear.", ) - - args = parser.parse_args() - - nodes_to_exclude = args.nodes_to_exclude.split(',') - quantize_onnx_model(args.model_in, args.model_out, nodes_to_exclude) - - -if __name__ == "__main__": - main() diff --git a/speechx/examples/ds2_ol/onnx/local/ort_opt.py b/speechx/examples/ds2_ol/onnx/local/ort_opt.py deleted file mode 100755 index 8e995bcf0..000000000 --- a/speechx/examples/ds2_ol/onnx/local/ort_opt.py +++ /dev/null @@ -1,45 +0,0 @@ -#!/usr/bin/env python3 -import argparse - -import onnxruntime as ort - -# onnxruntime optimizer. -# https://onnxruntime.ai/docs/performance/graph-optimizations.html -# https://onnxruntime.ai/docs/api/python/api_summary.html#api - - -def parse_arguments(): - parser = argparse.ArgumentParser() - parser.add_argument( - '--model_in', required=True, type=str, help='Path to onnx model.') - parser.add_argument( - '--opt_level', - required=True, - type=int, - default=0, - choices=[0, 1, 2], - help='Path to onnx model.') - parser.add_argument( - '--model_out', required=True, help='path to save the optimized model.') - parser.add_argument('--debug', default=False, help='output debug info.') - return parser.parse_args() - - -if __name__ == '__main__': - args = parse_arguments() - - sess_options = ort.SessionOptions() - - # Set graph optimization level - print(f"opt level: {args.opt_level}") - if args.opt_level == 0: - sess_options.graph_optimization_level = ort.GraphOptimizationLevel.ORT_ENABLE_BASIC - elif args.opt_level == 1: - sess_options.graph_optimization_level = ort.GraphOptimizationLevel.ORT_ENABLE_EXTENDED - else: - sess_options.graph_optimization_level = ort.GraphOptimizationLevel.ORT_ENABLE_ALL - - # To enable model serialization after graph optimization set this - sess_options.optimized_model_filepath = args.model_out - - session = ort.InferenceSession(args.model_in, sess_options) diff --git a/speechx/examples/ds2_ol/onnx/local/tonnx.sh b/speechx/examples/ds2_ol/onnx/local/tonnx.sh deleted file mode 100755 index 104872303..000000000 --- a/speechx/examples/ds2_ol/onnx/local/tonnx.sh +++ /dev/null @@ -1,26 +0,0 @@ -#!/bin/bash - -if [ $# != 4 ];then - # local/tonnx.sh data/exp/deepspeech2_online/checkpoints avg_1.jit.pdmodel avg_1.jit.pdiparams exp/model.onnx - echo "usage: $0 model_dir model_name param_name onnx_output_name" - exit 1 -fi - -dir=$1 -model=$2 -param=$3 -output=$4 - -pip install paddle2onnx -pip install onnx - -# https://github.com/PaddlePaddle/Paddle2ONNX#%E5%91%BD%E4%BB%A4%E8%A1%8C%E8%BD%AC%E6%8D%A2 - # opset10 support quantize -paddle2onnx --model_dir $dir \ - --model_filename $model \ - --params_filename $param \ - --save_file $output \ - --enable_dev_version True \ - --opset_version 11 \ - --enable_onnx_checker True - \ No newline at end of file diff --git a/speechx/examples/ds2_ol/onnx/path.sh b/speechx/examples/ds2_ol/onnx/path.sh deleted file mode 100755 index 97d487379..000000000 --- a/speechx/examples/ds2_ol/onnx/path.sh +++ /dev/null @@ -1,14 +0,0 @@ -# This contains the locations of binarys build required for running the examples. - -MAIN_ROOT=`realpath $PWD/../../../../` -SPEECHX_ROOT=$PWD/../../../ -SPEECHX_BUILD=$SPEECHX_ROOT/build/speechx - -SPEECHX_TOOLS=$SPEECHX_ROOT/tools -TOOLS_BIN=$SPEECHX_TOOLS/valgrind/install/bin - -[ -d $SPEECHX_BUILD ] || { echo "Error: 'build/speechx' directory not found. 
please ensure the project was built successfully"; }
-
-export LC_ALL=C
-
-export PATH=$PATH:$TOOLS_BIN
diff --git a/speechx/examples/ds2_ol/onnx/run.sh b/speechx/examples/ds2_ol/onnx/run.sh
deleted file mode 100755
index 3dc5e9100..000000000
--- a/speechx/examples/ds2_ol/onnx/run.sh
+++ /dev/null
@@ -1,91 +0,0 @@
-#!/bin/bash
-
-set -e
-
-. path.sh
-
-stage=0
-stop_stage=50
-tarfile=asr0_deepspeech2_online_wenetspeech_ckpt_1.0.2.model.tar.gz
-#tarfile=asr0_deepspeech2_online_aishell_fbank161_ckpt_1.0.1.model.tar.gz
-model_prefix=avg_10.jit
-#model_prefix=avg_1.jit
-model=${model_prefix}.pdmodel
-param=${model_prefix}.pdiparams
-
-. utils/parse_options.sh
-
-data=data
-exp=exp
-
-mkdir -p $data $exp
-
-dir=$data/exp/deepspeech2_online/checkpoints
-
-# wenetspeech or aishell
-model_type=$(echo $tarfile | cut -d '_' -f 4)
-
-if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ];then
-    test -f $data/$tarfile || wget -P $data -c https://paddlespeech.bj.bcebos.com/s2t/$model_type/asr0/$tarfile
-
-    # wenetspeech ds2 model
-    pushd $data
-    tar zxvf $tarfile
-    popd
-
-    # ds2 model demo inputs
-    pushd $exp
-    wget -c http://paddlespeech.bj.bcebos.com/speechx/examples/ds2_ol/onnx/static_ds2online_inputs.pickle
-    popd
-fi
-
-input_file=$exp/static_ds2online_inputs.pickle
-test -e $input_file
-
-
-if [ ${stage} -le 1 ] && [ ${stop_stage} -ge 1 ];then
-    # to onnx
-    ./local/tonnx.sh $dir $model $param $exp/model.onnx
-
-    ./local/infer_check.py --input_file $input_file --model_type $model_type --model_dir $dir --model_prefix $model_prefix --onnx_model $exp/model.onnx
-fi
-
-
-if [ ${stage} -le 2 ] && [ ${stop_stage} -ge 2 ] ;then
-    # ort graph optimize
-    ./local/ort_opt.py --model_in $exp/model.onnx --opt_level 0 --model_out $exp/model.ort.opt.onnx
-
-    ./local/infer_check.py --input_file $input_file --model_type $model_type --model_dir $dir --model_prefix $model_prefix --onnx_model $exp/model.ort.opt.onnx
-fi
-
-
-if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ];then
-    # convert opset_num to 11
-    ./local/onnx_convert_opset.py --target-opset 11 --model-file $exp/model.ort.opt.onnx --save-model $exp/model.optset11.onnx
-
-    # quant model
-    nodes_to_exclude='p2o.Conv.0,p2o.Conv.2'
-    ./local/ort_dyanmic_quant.py --model-in $exp/model.optset11.onnx --model-out $exp/model.optset11.quant.onnx --nodes-to-exclude "${nodes_to_exclude}"
-
-    ./local/infer_check.py --input_file $input_file --model_type $model_type --model_dir $dir --model_prefix $model_prefix --onnx_model $exp/model.optset11.quant.onnx
-fi
-
-
-# aishell rnn hidden is 1024
-# wenetspeech rnn hidden is 2048
-if [ $model_type == 'aishell' ];then
-    input_shape="audio_chunk:1,-1,161 audio_chunk_lens:1 chunk_state_c_box:5,1,1024 chunk_state_h_box:5,1,1024"
-elif [ $model_type == 'wenetspeech' ];then
-    input_shape="audio_chunk:1,-1,161 audio_chunk_lens:1 chunk_state_c_box:5,1,2048 chunk_state_h_box:5,1,2048"
-else
-    echo "not support: $model_type"
-    exit -1
-fi
-
-
-if [ ${stage} -le 51 ] && [ ${stop_stage} -ge 51 ] ;then
-    # the wenetspeech ds2 model exceeds the onnx 2GB limit, so this stage will fail for it.
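-    # For reference, local/onnx_opt.sh (shown earlier in this patch) wraps
-    # onnx-simplifier (onnxsim); with the flags pinned in that script, this
-    # stage effectively runs the following (a sketch for illustration only,
-    # using the $input_shape selected above for the current model_type):
-    #
-    #   onnxsim $exp/model.onnx $exp/model.opt.onnx 3 \
-    #       --dynamic-input-shape --input-shape $input_shape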
-    # simplifying onnx model
-    ./local/onnx_opt.sh $exp/model.onnx $exp/model.opt.onnx "$input_shape"
-
-    ./local/infer_check.py --input_file $input_file --model_type $model_type --model_dir $dir --model_prefix $model_prefix --onnx_model $exp/model.opt.onnx
-fi
diff --git a/speechx/examples/ds2_ol/onnx/utils b/speechx/examples/ds2_ol/onnx/utils
deleted file mode 120000
index c2519a9dd..000000000
--- a/speechx/examples/ds2_ol/onnx/utils
+++ /dev/null
@@ -1 +0,0 @@
-../../../../utils/
\ No newline at end of file
diff --git a/speechx/examples/ds2_ol/websocket/.gitignore b/speechx/examples/ds2_ol/websocket/.gitignore
deleted file mode 100644
index bbd86a25b..000000000
--- a/speechx/examples/ds2_ol/websocket/.gitignore
+++ /dev/null
@@ -1,2 +0,0 @@
-data
-exp
diff --git a/speechx/examples/ds2_ol/websocket/README.md b/speechx/examples/ds2_ol/websocket/README.md
deleted file mode 100644
index 3fa84135f..000000000
--- a/speechx/examples/ds2_ol/websocket/README.md
+++ /dev/null
@@ -1,78 +0,0 @@
-# Streaming DeepSpeech2 Server with WebSocket
-
-This example uses `websocket` to build a streaming DeepSpeech2 ASR server. For DeepSpeech2 model training, please see [here](../../../../examples/aishell/asr0/).
-
-The websocket protocol is the same as [PaddleSpeech Server](../../../../demos/streaming_asr_server/);
-for implementation details please see [here](../../../speechx/protocol/websocket/).
-
-
-## Source path.sh
-
-```bash
-. path.sh
-```
-
-SpeechX binaries are under `$SPEECHX_BUILD`; for more info please see `path.sh`.
-
-
-## Start WebSocket Server
-
-```bash
-bash websocket_server.sh
-```
-
-The output looks like this:
-
-```text
-I1130 02:19:32.029882 12856 cmvn_json2kaldi_main.cc:39] cmvn josn path: /workspace/zhanghui/PaddleSpeech/speechx/examples/ds2_ol/websocket/data/model/data/mean_std.json
-I1130 02:19:32.032230 12856 cmvn_json2kaldi_main.cc:73] nframe: 907497
-I1130 02:19:32.032564 12856 cmvn_json2kaldi_main.cc:85] cmvn stats have write into: /workspace/zhanghui/PaddleSpeech/speechx/examples/ds2_ol/websocket/data/cmvn.ark
-I1130 02:19:32.032579 12856 cmvn_json2kaldi_main.cc:86] Binary: 1
-I1130 02:19:32.798342 12937 feature_pipeline.h:53] cmvn file: /workspace/zhanghui/PaddleSpeech/speechx/examples/ds2_ol/websocket/data/cmvn.ark
-I1130 02:19:32.798542 12937 feature_pipeline.h:58] dither: 0
-I1130 02:19:32.798583 12937 feature_pipeline.h:60] frame shift ms: 10
-I1130 02:19:32.798588 12937 feature_pipeline.h:62] feature type: linear
-I1130 02:19:32.798596 12937 feature_pipeline.h:80] frame length ms: 20
-I1130 02:19:32.798601 12937 feature_pipeline.h:88] subsampling rate: 4
-I1130 02:19:32.798606 12937 feature_pipeline.h:90] nnet receptive filed length: 7
-I1130 02:19:32.798611 12937 feature_pipeline.h:92] nnet chunk size: 1
-I1130 02:19:32.798615 12937 feature_pipeline.h:94] frontend fill zeros: 0
-I1130 02:19:32.798630 12937 nnet_itf.h:52] subsampling rate: 4
-I1130 02:19:32.798635 12937 nnet_itf.h:54] model path: /workspace/zhanghui/PaddleSpeech/speechx/examples/ds2_ol/websocket/data/model/exp/deepspeech2_online/checkpoints//avg_1.jit.pdmodel
-I1130 02:19:32.798640 12937 nnet_itf.h:57] param path: /workspace/zhanghui/PaddleSpeech/speechx/examples/ds2_ol/websocket/data/model/exp/deepspeech2_online/checkpoints//avg_1.jit.pdiparams
-I1130 02:19:32.798643 12937 nnet_itf.h:59] DS2 param:
-I1130 02:19:32.798647 12937 nnet_itf.h:61] cache names: chunk_state_h_box,chunk_state_c_box
-I1130 02:19:32.798652 12937 nnet_itf.h:63] cache shape: 5-1-1024,5-1-1024
-I1130 02:19:32.798656 12937 nnet_itf.h:65] input names: audio_chunk,audio_chunk_lens,chunk_state_h_box,chunk_state_c_box
-I1130 02:19:32.798660 12937 nnet_itf.h:67] output names: softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0
-I1130 02:19:32.798664 12937 ctc_tlg_decoder.h:41] fst path: /workspace/zhanghui/PaddleSpeech/speechx/examples/ds2_ol/websocket/data/wfst//TLG.fst
-I1130 02:19:32.798669 12937 ctc_tlg_decoder.h:42] fst symbole table: /workspace/zhanghui/PaddleSpeech/speechx/examples/ds2_ol/websocket/data/wfst//words.txt
-I1130 02:19:32.798673 12937 ctc_tlg_decoder.h:47] LatticeFasterDecoder max active: 7500
-I1130 02:19:32.798677 12937 ctc_tlg_decoder.h:49] LatticeFasterDecoder beam: 15
-I1130 02:19:32.798681 12937 ctc_tlg_decoder.h:50] LatticeFasterDecoder lattice_beam: 7.5
-I1130 02:19:32.798708 12937 websocket_server_main.cc:37] Listening at port 8082
-```
-
-## Start WebSocket Client
-
-```bash
-bash websocket_client.sh
-```
-
-This script uses AISHELL-1 test data to call the websocket server.
-
-The input is specified by `--wav_rspecifier=scp:$data/$aishell_wav_scp`.
-
-The `scp` file looks like this:
-```text
-# head data/split1/1/aishell_test.scp
-BAC009S0764W0121 /workspace/PaddleSpeech/speechx/examples/u2pp_ol/wenetspeech/data/test/S0764/BAC009S0764W0121.wav
-BAC009S0764W0122 /workspace/PaddleSpeech/speechx/examples/u2pp_ol/wenetspeech/data/test/S0764/BAC009S0764W0122.wav
-...
-BAC009S0764W0125 /workspace/PaddleSpeech/speechx/examples/u2pp_ol/wenetspeech/data/test/S0764/BAC009S0764W0125.wav
-```
-
-If you want to recognize a single wav, you can make the `scp` file like this:
-```text
-key path/to/wav/file
-```
diff --git a/speechx/examples/ds2_ol/websocket/path.sh b/speechx/examples/ds2_ol/websocket/path.sh
deleted file mode 100755
index 6dd6bddbf..000000000
--- a/speechx/examples/ds2_ol/websocket/path.sh
+++ /dev/null
@@ -1,14 +0,0 @@
-# This contains the locations of the binaries required for running the examples.
-
-SPEECHX_ROOT=$PWD/../../../
-SPEECHX_BUILD=$SPEECHX_ROOT/build/speechx
-
-SPEECHX_TOOLS=$SPEECHX_ROOT/tools
-TOOLS_BIN=$SPEECHX_TOOLS/valgrind/install/bin
-
-[ -d $SPEECHX_BUILD ] || { echo "Error: 'build/speechx' directory not found. please ensure the project was built successfully"; }
-
-export LC_ALL=C
-
-SPEECHX_BIN=$SPEECHX_BUILD/protocol/websocket:$SPEECHX_BUILD/frontend/audio
-export PATH=$PATH:$SPEECHX_BIN:$TOOLS_BIN
diff --git a/speechx/examples/ds2_ol/websocket/websocket_client.sh b/speechx/examples/ds2_ol/websocket/websocket_client.sh
deleted file mode 100755
index a508adfbc..000000000
--- a/speechx/examples/ds2_ol/websocket/websocket_client.sh
+++ /dev/null
@@ -1,35 +0,0 @@
-#!/bin/bash
-set +x
-set -e
-
-. path.sh
-
-# 1. compile
-if [ ! -d ${SPEECHX_EXAMPLES} ]; then
-    pushd ${SPEECHX_ROOT}
-    bash build.sh
-    popd
-fi
-
-# input
-mkdir -p data
-data=$PWD/data
-
-# output
-aishell_wav_scp=aishell_test.scp
-if [ ! -d $data/test ]; then
-    pushd $data
-    wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_test.zip
-    unzip aishell_test.zip
-    popd
-
-    realpath $data/test/*/*.wav > $data/wavlist
-    awk -F '/' '{ print $(NF) }' $data/wavlist | awk -F '.' 
'{ print $1 }' > $data/utt_id - paste $data/utt_id $data/wavlist > $data/$aishell_wav_scp -fi - -export GLOG_logtostderr=1 - -# websocket client -websocket_client_main \ - --wav_rspecifier=scp:$data/$aishell_wav_scp --streaming_chunk=0.5 diff --git a/speechx/examples/ds2_ol/websocket/websocket_server.sh b/speechx/examples/ds2_ol/websocket/websocket_server.sh deleted file mode 100755 index 18d29857c..000000000 --- a/speechx/examples/ds2_ol/websocket/websocket_server.sh +++ /dev/null @@ -1,55 +0,0 @@ -#!/bin/bash -set +x -set -e - -. path.sh - -# 1. compile -if [ ! -d ${SPEECHX_EXAMPLES} ]; then - pushd ${SPEECHX_ROOT} - bash build.sh - popd -fi - -# input -mkdir -p data -data=$PWD/data -ckpt_dir=$data/model -model_dir=$ckpt_dir/exp/deepspeech2_online/checkpoints/ -vocb_dir=$ckpt_dir/data/lang_char/ - - -if [ ! -f $ckpt_dir/data/mean_std.json ]; then - mkdir -p $ckpt_dir - pushd $ckpt_dir - wget -c https://paddlespeech.bj.bcebos.com/s2t/aishell/asr0/asr0_deepspeech2_online_aishell_ckpt_0.2.0.model.tar.gz - tar xzfv asr0_deepspeech2_online_aishell_ckpt_0.2.0.model.tar.gz - popd -fi - -export GLOG_logtostderr=1 - -# 3. gen cmvn -cmvn=$data/cmvn.ark -cmvn_json2kaldi_main --json_file=$ckpt_dir/data/mean_std.json --cmvn_write_path=$cmvn - - -wfst=$data/wfst/ -mkdir -p $wfst -if [ ! -f $wfst/aishell_graph.zip ]; then - pushd $wfst - wget -c https://paddlespeech.bj.bcebos.com/s2t/paddle_asr_online/aishell_graph.zip - unzip aishell_graph.zip - mv aishell_graph/* $wfst - popd -fi - -# 5. test websocket server -websocket_server_main \ - --cmvn_file=$cmvn \ - --model_path=$model_dir/avg_1.jit.pdmodel \ - --param_path=$model_dir/avg_1.jit.pdiparams \ - --word_symbol_table=$wfst/words.txt \ - --model_output_names=softmax_0.tmp_0,tmp_5,concat_0.tmp_0,concat_1.tmp_0 \ - --graph_path=$wfst/TLG.fst --max_active=7500 \ - --acoustic_scale=1.2 diff --git a/speechx/speechx/codelab/CMakeLists.txt b/speechx/speechx/codelab/CMakeLists.txt index 950432637..c8445fb82 100644 --- a/speechx/speechx/codelab/CMakeLists.txt +++ b/speechx/speechx/codelab/CMakeLists.txt @@ -1,4 +1,3 @@ cmake_minimum_required(VERSION 3.14 FATAL_ERROR) add_subdirectory(glog) -add_subdirectory(nnet) diff --git a/speechx/speechx/codelab/nnet/CMakeLists.txt b/speechx/speechx/codelab/nnet/CMakeLists.txt deleted file mode 100644 index dcad8a9c6..000000000 --- a/speechx/speechx/codelab/nnet/CMakeLists.txt +++ /dev/null @@ -1,6 +0,0 @@ -cmake_minimum_required(VERSION 3.14 FATAL_ERROR) - -set(bin_name ds2_model_test_main) -add_executable(${bin_name} ${CMAKE_CURRENT_SOURCE_DIR}/${bin_name}.cc) -target_include_directories(${bin_name} PRIVATE ${SPEECHX_ROOT} ${SPEECHX_ROOT}/kaldi) -target_link_libraries(${bin_name} PUBLIC nnet gflags glog ${DEPS}) diff --git a/speechx/speechx/codelab/nnet/ds2_model_test_main.cc b/speechx/speechx/codelab/nnet/ds2_model_test_main.cc deleted file mode 100644 index ab7b2cb58..000000000 --- a/speechx/speechx/codelab/nnet/ds2_model_test_main.cc +++ /dev/null @@ -1,207 +0,0 @@ -// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
-// See the License for the specific language governing permissions and
-// limitations under the License.
-
-// deepspeech2 online model info
-
-#include <algorithm>
-#include <functional>
-#include <iostream>
-#include <memory>
-#include <numeric>
-#include <string>
-#include <vector>
-
-#include "base/flags.h"
-#include "base/log.h"
-#include "paddle_inference_api.h"
-
-using std::cout;
-using std::endl;
-
-
-DEFINE_string(model_path, "", "xxx.pdmodel");
-DEFINE_string(param_path, "", "xxx.pdiparams");
-DEFINE_int32(chunk_size, 35, "feature chunk size, unit:frame");
-DEFINE_int32(feat_dim, 161, "feature dim");
-
-
-void produce_data(std::vector<std::vector<float>>* data);
-void model_forward_test();
-
-void produce_data(std::vector<std::vector<float>>* data) {
-    int chunk_size = FLAGS_chunk_size;  // chunk_size in frames
-    int col_size = FLAGS_feat_dim;      // feat dim
-    cout << "chunk size: " << chunk_size << endl;
-    cout << "feat dim: " << col_size << endl;
-
-    data->reserve(chunk_size);
-    for (int row = 0; row < chunk_size; ++row) {
-        data->push_back(std::vector<float>());
-        data->back().reserve(col_size);
-        for (int col_idx = 0; col_idx < col_size; ++col_idx) {
-            data->back().push_back(0.201);
-        }
-    }
-}
-
-void model_forward_test() {
-    std::cout << "1. read the data" << std::endl;
-    std::vector<std::vector<float>> feats;
-    produce_data(&feats);
-
-    std::cout << "2. load the model" << std::endl;
-    std::string model_graph = FLAGS_model_path;
-    std::string model_params = FLAGS_param_path;
-    CHECK_NE(model_graph, "");
-    CHECK_NE(model_params, "");
-    cout << "model path: " << model_graph << endl;
-    cout << "model param path: " << model_params << endl;
-
-    paddle_infer::Config config;
-    config.SetModel(model_graph, model_params);
-    config.SwitchIrOptim(false);
-    cout << "SwitchIrOptim: " << false << endl;
-    config.DisableFCPadding();
-    cout << "DisableFCPadding." << endl;
-    auto predictor = paddle_infer::CreatePredictor(config);
-
-    std::cout << "3. feat shape, row=" << feats.size()
-              << ",col=" << feats[0].size() << std::endl;
-    std::vector<float> pp_input_mat;
-    for (const auto& item : feats) {
-        pp_input_mat.insert(pp_input_mat.end(), item.begin(), item.end());
-    }
-
-    std::cout << "4. feed the data to the model" << std::endl;
-    int row = feats.size();
-    int col = feats[0].size();
-    std::vector<std::string> input_names = predictor->GetInputNames();
-    std::vector<std::string> output_names = predictor->GetOutputNames();
-    for (auto name : input_names) {
-        cout << "model input names: " << name << endl;
-    }
-    for (auto name : output_names) {
-        cout << "model output names: " << name << endl;
-    }
-
-    // input
-    std::unique_ptr<paddle_infer::Tensor> input_tensor =
-        predictor->GetInputHandle(input_names[0]);
-    std::vector<int> INPUT_SHAPE = {1, row, col};
-    input_tensor->Reshape(INPUT_SHAPE);
-    input_tensor->CopyFromCpu(pp_input_mat.data());
-
-    // input length; audio_chunk_lens is an int64 input in the exported model
-    std::unique_ptr<paddle_infer::Tensor> input_len =
-        predictor->GetInputHandle(input_names[1]);
-    std::vector<int> input_len_size = {1};
-    input_len->Reshape(input_len_size);
-    std::vector<int64_t> audio_len;
-    audio_len.push_back(row);
-    input_len->CopyFromCpu(audio_len.data());
-
-    // state_h
-    std::unique_ptr<paddle_infer::Tensor> chunk_state_h_box =
-        predictor->GetInputHandle(input_names[2]);
-    std::vector<int> chunk_state_h_box_shape = {5, 1, 1024};
-    chunk_state_h_box->Reshape(chunk_state_h_box_shape);
-    int chunk_state_h_box_size =
-        std::accumulate(chunk_state_h_box_shape.begin(),
-                        chunk_state_h_box_shape.end(),
-                        1,
-                        std::multiplies<int>());
-    std::vector<float> chunk_state_h_box_data(chunk_state_h_box_size, 0.0f);
-    chunk_state_h_box->CopyFromCpu(chunk_state_h_box_data.data());
-
-    // state_c
-    std::unique_ptr<paddle_infer::Tensor> chunk_state_c_box =
-        predictor->GetInputHandle(input_names[3]);
-    std::vector<int> chunk_state_c_box_shape = {5, 1, 1024};
-    chunk_state_c_box->Reshape(chunk_state_c_box_shape);
-    int chunk_state_c_box_size =
-        std::accumulate(chunk_state_c_box_shape.begin(),
-                        chunk_state_c_box_shape.end(),
-                        1,
-                        std::multiplies<int>());
-    std::vector<float> chunk_state_c_box_data(chunk_state_c_box_size, 0.0f);
-    chunk_state_c_box->CopyFromCpu(chunk_state_c_box_data.data());
-
-    // run
-    bool success = predictor->Run();
-    CHECK(success) << "predictor run failed";
-
-    // state_h out
-    std::unique_ptr<paddle_infer::Tensor> h_out =
-        predictor->GetOutputHandle(output_names[2]);
-    std::vector<int> h_out_shape = h_out->shape();
-    int h_out_size = std::accumulate(
-        h_out_shape.begin(), h_out_shape.end(), 1, std::multiplies<int>());
-    std::vector<float> h_out_data(h_out_size);
-    h_out->CopyToCpu(h_out_data.data());
-
-    // state_c out
-    std::unique_ptr<paddle_infer::Tensor> c_out =
-        predictor->GetOutputHandle(output_names[3]);
-    std::vector<int> c_out_shape = c_out->shape();
-    int c_out_size = std::accumulate(
-        c_out_shape.begin(), c_out_shape.end(), 1, std::multiplies<int>());
-    std::vector<float> c_out_data(c_out_size);
-    c_out->CopyToCpu(c_out_data.data());
-
-    // output tensor
-    std::unique_ptr<paddle_infer::Tensor> output_tensor =
-        predictor->GetOutputHandle(output_names[0]);
-    std::vector<int> output_shape = output_tensor->shape();
-    std::vector<float> output_probs;
-    int output_size = std::accumulate(
-        output_shape.begin(), output_shape.end(), 1, std::multiplies<int>());
-    output_probs.resize(output_size);
-    output_tensor->CopyToCpu(output_probs.data());
-    row = output_shape[1];
-    col = output_shape[2];
-
-    // probs
-    std::vector<std::vector<float>> probs;
-    probs.reserve(row);
-    for (int i = 0; i < row; i++) {
-        probs.push_back(std::vector<float>());
-        probs.back().reserve(col);
-
-        for (int j = 0; j < col; j++) {
-            probs.back().push_back(output_probs[i * col + j]);
-        }
-    }
-
-    std::vector<std::vector<float>> log_feat = probs;
-    std::cout << "probs, row: " << log_feat.size()
-              << " col: " << log_feat[0].size() << std::endl;
-    for (size_t row_idx = 0; row_idx < log_feat.size(); ++row_idx) {
-        for (size_t col_idx = 0; col_idx < log_feat[row_idx].size();
-             ++col_idx) {
-            std::cout << log_feat[row_idx][col_idx] << " ";
-        }
-        std::cout << std::endl;
-    }
-}
-
-int main(int argc, char* argv[]) {
-    gflags::SetUsageMessage("Usage:");
-    gflags::ParseCommandLineFlags(&argc, &argv, false);
-    google::InitGoogleLogging(argv[0]);
-    google::InstallFailureSignalHandler();
-    FLAGS_logtostderr = 1;
-
-    model_forward_test();
-    return 0;
-}
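
For reference, the symbolic shape inference utility removed above (`onnx_infer_shape.py`) can also be used as a library, which is how `onnx_prune_model.py` calls it in its optional shape-inference step. A minimal usage sketch of the `SymbolicShapeInference.infer_shapes` entry point, with the keyword defaults taken from the script itself (the model paths here are illustrative, not from the scripts above):

```python
import onnx
from onnx_infer_shape import SymbolicShapeInference

model = onnx.load("exp/model.onnx")  # illustrative path
# Per the implementation above: returns None for opset < 7 and raises
# an Exception if shape inference cannot be completed.
inferred = SymbolicShapeInference.infer_shapes(
    model,
    int_max=2**31 - 1,       # ints >= int_max are treated as boundless (e.g. Slice ends)
    auto_merge=True,         # merge conflicting symbolic dims instead of stopping
    guess_output_rank=False,
    verbose=1)
if inferred is not None:
    onnx.save(inferred, "exp/model.shaped.onnx")  # illustrative path
```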
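The backtracking loop in `onnx_prune_model.py` above is a reverse reachability walk from the requested outputs: keep every node whose outputs transitively feed `--output_names`, and record graph inputs reached along the way. The same idea in compact form, as a sketch rather than a drop-in replacement for the script (the helper name is made up for illustration):

```python
from typing import List, Set

def reachable_node_indices(nodes, wanted_outputs: List[str]) -> Set[int]:
    """Indices of nodes whose outputs transitively feed `wanted_outputs`."""
    # map each tensor name to the index of the node that produces it
    producer = {out: i for i, node in enumerate(nodes) for out in node.output}
    frontier = {producer[name] for name in wanted_outputs if name in producer}
    keep = set(frontier)
    while frontier:
        nxt = set()
        for idx in frontier:
            for ipt in nodes[idx].input:
                src = producer.get(ipt)  # None => graph input or initializer
                if src is not None and src not in keep:
                    keep.add(src)
                    nxt.add(src)
        frontier = nxt
    return keep

# e.g. keep = reachable_node_indices(model.graph.node, args.output_names)
```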