From d103cb8f9ec9be6004f2ef1693bb2ebc85ec24a0 Mon Sep 17 00:00:00 2001 From: zxcd <228587199@qq.com> Date: Wed, 15 Mar 2023 14:29:17 +0800 Subject: [PATCH] [ASR]cherrypick change optimizer and fix import error, test=asr (#3049) * optional tokenizer and fix some doc * cherry pick with pr:3040 --- examples/aishell/asr3/RESULT.md | 1 + examples/aishell/asr3/conf/train_with_wav2vec.yaml | 2 +- examples/aishell/asr3/local/aishell_prepare.py | 2 +- examples/aishell/asr3/local/data.sh | 2 +- 4 files changed, 4 insertions(+), 3 deletions(-) diff --git a/examples/aishell/asr3/RESULT.md b/examples/aishell/asr3/RESULT.md index 1291ef15..da76fc74 100644 --- a/examples/aishell/asr3/RESULT.md +++ b/examples/aishell/asr3/RESULT.md @@ -4,6 +4,7 @@ * paddle version: develop (commit id: daea892c67e85da91906864de40ce9f6f1b893ae) * paddlespeech version: develop (commit id: c14b4238b256693281e59605abff7c9435b3e2b2) +* paddlenlp version: 2.5.2 ## Device * python: 3.7 diff --git a/examples/aishell/asr3/conf/train_with_wav2vec.yaml b/examples/aishell/asr3/conf/train_with_wav2vec.yaml index 77b3762e..273175d2 100755 --- a/examples/aishell/asr3/conf/train_with_wav2vec.yaml +++ b/examples/aishell/asr3/conf/train_with_wav2vec.yaml @@ -83,7 +83,7 @@ dnn_neurons: 1024 freeze_wav2vec: False dropout: 0.15 -tokenizer: !apply:transformers.BertTokenizer.from_pretrained +tokenizer: !apply:paddlenlp.transformers.AutoTokenizer.from_pretrained pretrained_model_name_or_path: bert-base-chinese # bert-base-chinese tokens length output_neurons: 21128 diff --git a/examples/aishell/asr3/local/aishell_prepare.py b/examples/aishell/asr3/local/aishell_prepare.py index a2573579..2a7ba5c6 100644 --- a/examples/aishell/asr3/local/aishell_prepare.py +++ b/examples/aishell/asr3/local/aishell_prepare.py @@ -21,7 +21,7 @@ import glob import logging import os -from paddlespeech.s2t.models.wav2vec2.io.dataio import read_audio +from paddlespeech.s2t.io.speechbrain.dataio import read_audio logger = logging.getLogger(__name__) diff --git a/examples/aishell/asr3/local/data.sh b/examples/aishell/asr3/local/data.sh index 1a468f54..bd26c1e7 100755 --- a/examples/aishell/asr3/local/data.sh +++ b/examples/aishell/asr3/local/data.sh @@ -1,7 +1,7 @@ #!/bin/bash stage=-1 -stop_stage=-1 +stop_stage=3 dict_dir=data/lang_char . ${MAIN_ROOT}/utils/parse_options.sh || exit -1;