From e520077652fb43ba91518aea048d46885a4320d9 Mon Sep 17 00:00:00 2001 From: Hui Zhang Date: Thu, 18 Mar 2021 07:08:39 +0000 Subject: [PATCH] When the loss is divided by batch size, change the lr and train for more epochs; the loss decreases further and the CER is lower than before --- examples/aishell/README.md | 8 ++++---- examples/aishell/conf/deepspeech2.yaml | 4 ++-- examples/aishell/local/train.sh | 2 +- 3 files changed, 7 insertions(+), 7 deletions(-) diff --git a/examples/aishell/README.md b/examples/aishell/README.md index 6d67d19a9..5c3db546a 100644 --- a/examples/aishell/README.md +++ b/examples/aishell/README.md @@ -1,7 +1,7 @@ # Aishell-1 ## CTC -| Model | Config | Test set | CER | -| --- | --- | --- | --- | -| DeepSpeech2 | conf/deepspeech2.yaml | test | 0.078977 | -| DeepSpeech2 | release 1.8.5 | test | 0.080447 | +| Model | Config | Test Set | CER | Valid Loss | +| --- | --- | --- | --- | --- | +| DeepSpeech2 | conf/deepspeech2.yaml | test | 0.078786 | 7.036566 | +| DeepSpeech2 | release 1.8.5 | test | 0.080447 | - | diff --git a/examples/aishell/conf/deepspeech2.yaml b/examples/aishell/conf/deepspeech2.yaml index 821c183e5..9a840186b 100644 --- a/examples/aishell/conf/deepspeech2.yaml +++ b/examples/aishell/conf/deepspeech2.yaml @@ -29,8 +29,8 @@ model: use_gru: True share_rnn_weights: False training: - n_epoch: 30 - lr: 5e-4 + n_epoch: 50 + lr: 2e-3 lr_decay: 0.83 weight_decay: 1e-06 global_grad_clip: 5.0 diff --git a/examples/aishell/local/train.sh b/examples/aishell/local/train.sh index c286566a8..245ed2172 100644 --- a/examples/aishell/local/train.sh +++ b/examples/aishell/local/train.sh @@ -2,7 +2,7 @@ # train model # if you wish to resume from an exists model, uncomment --init_from_pretrained_model -export FLAGS_sync_nccl_allreduce=0 +#export FLAGS_sync_nccl_allreduce=0 ngpu=$(echo ${CUDA_VISIBLE_DEVICES} | python -c 'import sys; a = sys.stdin.read(); print(len(a.split(",")));') echo "using $ngpu gpus..."