From af76e60bc418c66204db2ac81741e20feab9092f Mon Sep 17 00:00:00 2001 From: zxcd <228587199@qq.com> Date: Thu, 2 Feb 2023 12:56:02 +0000 Subject: [PATCH] add wav2vec2_zh recipe. --- examples/aishell/asr3/cmd.sh | 89 ++ examples/aishell/asr3/conf/conformer.yaml | 91 ++ examples/aishell/asr3/conf/preprocess.yaml | 3 + .../aishell/asr3/conf/train_with_wav2vec.yaml | 103 +++ .../asr3/conf/tuning/chunk_decode.yaml | 11 + examples/aishell/asr3/conf/tuning/decode.yaml | 4 + examples/aishell/asr3/conf/wav2vec2ASR.yaml | 165 ++++ examples/aishell/asr3/local/data.sh | 95 ++ examples/aishell/asr3/local/test.sh | 84 ++ examples/aishell/asr3/local/test_wav.sh | 58 ++ examples/aishell/asr3/local/train.sh | 59 ++ examples/aishell/asr3/path.sh | 15 + examples/aishell/asr3/run.sh | 48 + examples/aishell/asr3/utils | 1 + paddlespeech/s2t/exps/wav2vec2/model.py | 417 +++++++-- paddlespeech/s2t/models/wav2vec2/__init__.py | 2 +- paddlespeech/s2t/models/wav2vec2/io/batch.py | 107 +++ .../s2t/models/wav2vec2/io/data_pipeline.py | 511 +++++++++++ .../s2t/models/wav2vec2/io/data_utils.py | 177 ++++ paddlespeech/s2t/models/wav2vec2/io/dataio.py | 845 ++++++++++++++++++ .../s2t/models/wav2vec2/io/dataloader.py | 172 ++++ .../s2t/models/wav2vec2/io/dataset.py | 371 ++++++++ .../s2t/models/wav2vec2/io/depgraph.py | 237 +++++ .../s2t/models/wav2vec2/io/make_dataloader.py | 118 +++ .../s2t/models/wav2vec2/io/sampler.py | 505 +++++++++++ .../s2t/models/wav2vec2/io/sb_pipeline.py | 156 ++++ .../wav2vec2/processing/signal_processing.py | 20 +- .../processing/speech_augmentation.py | 46 +- .../s2t/models/wav2vec2/wav2vec2_ASR.py | 58 +- 29 files changed, 4456 insertions(+), 112 deletions(-) create mode 100755 examples/aishell/asr3/cmd.sh create mode 100755 examples/aishell/asr3/conf/conformer.yaml create mode 100755 examples/aishell/asr3/conf/preprocess.yaml create mode 100755 examples/aishell/asr3/conf/train_with_wav2vec.yaml create mode 100755 examples/aishell/asr3/conf/tuning/chunk_decode.yaml 
create mode 100755 examples/aishell/asr3/conf/tuning/decode.yaml create mode 100755 examples/aishell/asr3/conf/wav2vec2ASR.yaml create mode 100755 examples/aishell/asr3/local/data.sh create mode 100755 examples/aishell/asr3/local/test.sh create mode 100755 examples/aishell/asr3/local/test_wav.sh create mode 100755 examples/aishell/asr3/local/train.sh create mode 100755 examples/aishell/asr3/path.sh create mode 100755 examples/aishell/asr3/run.sh create mode 120000 examples/aishell/asr3/utils mode change 100644 => 100755 paddlespeech/s2t/exps/wav2vec2/model.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/batch.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/data_pipeline.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/data_utils.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/dataio.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/dataloader.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/dataset.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/depgraph.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/make_dataloader.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/sampler.py create mode 100755 paddlespeech/s2t/models/wav2vec2/io/sb_pipeline.py mode change 100644 => 100755 paddlespeech/s2t/models/wav2vec2/wav2vec2_ASR.py diff --git a/examples/aishell/asr3/cmd.sh b/examples/aishell/asr3/cmd.sh new file mode 100755 index 000000000..7b70ef5e0 --- /dev/null +++ b/examples/aishell/asr3/cmd.sh @@ -0,0 +1,89 @@ +# ====== About run.pl, queue.pl, slurm.pl, and ssh.pl ====== +# Usage: <cmd>.pl [options] JOB=1:<nj> <log> <commands...> +# e.g. +# run.pl --mem 4G JOB=1:10 echo.JOB.log echo JOB +# +# Options: +# --time