pull/522/head
Hui Zhang 5 years ago
parent 4292e50622
commit e80c741131

@@ -9,31 +9,12 @@ if [ $? -ne 0 ]; then
 fi
 cd - > /dev/null

 # infer
-CUDA_VISIBLE_DEVICES=0 \
 python3 -u ${MAIN_ROOT}/infer.py \
---num_samples=10 \
---beam_size=300 \
---num_proc_bsearch=8 \
---num_conv_layers=2 \
---num_rnn_layers=3 \
---rnn_layer_size=1024 \
---alpha=2.6 \
---beta=5.0 \
---cutoff_prob=0.99 \
---cutoff_top_n=40 \
---use_gru=True \
---use_gpu=True \
---share_rnn_weights=False \
---infer_manifest="data/manifest.test" \
---mean_std_path="data/mean_std.npz" \
---vocab_path="data/vocab.txt" \
---model_path="checkpoints/step_final" \
---lang_model_path="${MAIN_ROOT}/models/lm/zh_giga.no_cna_cmn.prune01244.klm" \
---decoding_method="ctc_beam_search" \
---error_rate_type="cer" \
---specgram_type="linear"
+--device 'gpu' \
+--nproc 1 \
+--config conf/deepspeech2.yaml \
+--checkpoint_path ckpt/checkpoints/step-3283

 if [ $? -ne 0 ]; then
     echo "Failed in inference!"

@@ -4,39 +4,11 @@
 # if you wish to resume from an exists model, uncomment --init_from_pretrained_model
 export FLAGS_sync_nccl_allreduce=0

-#CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 \
-#python3 -u ${MAIN_ROOT}/train.py \
-#--batch_size=64 \
-#--num_epoch=50 \
-#--num_conv_layers=2 \
-#--num_rnn_layers=3 \
-#--rnn_layer_size=1024 \
-#--num_iter_print=100 \
-#--save_epoch=1 \
-#--num_samples=120000 \
-#--learning_rate=5e-4 \
-#--max_duration=27.0 \
-#--min_duration=0.0 \
-#--test_off=False \
-#--use_sortagrad=True \
-#--use_gru=True \
-#--use_gpu=True \
-#--is_local=True \
-#--share_rnn_weights=False \
-#--train_manifest="data/manifest.train" \
-#--dev_manifest="data/manifest.dev" \
-#--mean_std_path="data/mean_std.npz" \
-#--vocab_path="data/vocab.txt" \
-#--output_model_dir="./checkpoints" \
-#--augment_conf_path="${MAIN_ROOT}/conf/augmentation.config" \
-#--specgram_type="linear" \
-#--shuffle_method="batch_shuffle_clipped" \
 python3 -u ${MAIN_ROOT}/train.py \
 --device 'gpu' \
 --nproc 4 \
 --config conf/deepspeech2.yaml \
---output ckpt
+--output ckpt-${1}

 if [ $? -ne 0 ]; then
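With --output ckpt-${1}, the checkpoint directory is keyed by the script's first positional argument (passing 0 writes under ckpt-0), so concurrent runs no longer collide. A --nproc greater than 1 typically maps to paddle.distributed.spawn; a minimal sketch of that launch pattern, where main_sp, config, and args are placeholders rather than the repo's actual symbols:

    # Sketch of a multi-process launch keyed on args.nproc.
    from paddle import distributed as dist

    def main_sp(config, args):
        # One training worker (placeholder body).
        print("worker rank:", dist.get_rank())

    def main(config, args):
        if args.nproc > 1:
            # Spawn args.nproc workers, each running main_sp.
            dist.spawn(main_sp, args=(config, args), nprocs=args.nproc)
        else:
            main_sp(config, args)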

@@ -21,6 +21,7 @@ import logging
 import numpy as np
 from collections import defaultdict
 from functools import partial
+from pathlib import Path

 import paddle
 from paddle import distributed as dist
@@ -449,6 +450,30 @@ class DeepSpeech2Tester(DeepSpeech2Trainer):
             error_rate_type, num_ins, num_ins, errors_sum / len_refs)
         self.logger.info(msg)

+    def setup_output_dir(self):
+        """Create a directory used for output."""
+        # output dir
+        if self.args.output:
+            output_dir = Path(self.args.output).expanduser() / "infer"
+            output_dir.mkdir(parents=True, exist_ok=True)
+        else:
+            output_dir = Path(
+                self.args.checkpoint_path).expanduser().parent / "infer"
+            output_dir.mkdir(parents=True, exist_ok=True)
+        self.output_dir = output_dir
+
+    # def setup_checkpointer(self):
+    #     """Create a directory used to save checkpoints into.
+    #     It is "checkpoints" inside the output directory.
+    #     """
+    #     # checkpoint dir
+    #     checkpoint_dir = self.output_dir / "checkpoints"
+    #     checkpoint_dir.mkdir(exist_ok=True)
+    #     self.checkpoint_dir = checkpoint_dir
+
     def setup(self):
         """Setup the experiment.
         """
@@ -458,7 +483,6 @@ class DeepSpeech2Tester(DeepSpeech2Trainer):
         self.setup_output_dir()
         self.setup_logger()
-        self.setup_checkpointer()
         self.setup_dataloader()
         self.setup_model()
@@ -482,7 +506,7 @@ class DeepSpeech2Tester(DeepSpeech2Trainer):
             num_rnn_layers=config.model.num_rnn_layers,
             rnn_size=config.model.rnn_layer_size,
             share_rnn_weights=config.model.share_rnn_weights)

         if self.parallel:
             model = paddle.DataParallel(model)
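The new setup_output_dir derives the inference output directory from --output when given, and otherwise nests infer/ beside the checkpoint. The same fallback pattern, isolated as a standalone sketch (resolve_infer_dir is a hypothetical helper, not the repo's code):

    from pathlib import Path

    def resolve_infer_dir(output, checkpoint_path):
        # Prefer an explicit --output; otherwise nest "infer" beside the checkpoint.
        if output:
            base = Path(output).expanduser()
        else:
            base = Path(checkpoint_path).expanduser().parent
        infer_dir = base / "infer"
        infer_dir.mkdir(parents=True, exist_ok=True)
        return infer_dir

    # e.g. resolve_infer_dir("", "ckpt/checkpoints/step-3283")
    # yields ckpt/checkpoints/infer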

@@ -688,6 +688,24 @@ class DeepSpeech2(nn.Layer):
             probs, vocab_list, decoding_method, lang_model_path, beam_alpha,
             beam_beta, beam_size, cutoff_prob, cutoff_top_n, num_processes)

+    def from_pretrained(self, checkpoint_path):
+        """Load parameters from a pretrained checkpoint into this model.
+
+        Parameters
+        ----------
+        checkpoint_path: Path or str
+            The path of the pretrained model checkpoint, without extension name.
+
+        Returns
+        -------
+        DeepSpeech2
+            The model with the pretrained parameters loaded.
+        """
+        checkpoint.load_parameters(self, checkpoint_path=checkpoint_path)
+        return self
+

 def ctc_loss(logits,
              labels,
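A hedged usage sketch for the new from_pretrained method; the DeepSpeech2 constructor arguments below are placeholders (the real signature lives in the repo), and the checkpoint prefix is taken from the old infer.sh:

    # Build a model, then load pretrained weights in place (sketch only).
    model = DeepSpeech2(feat_size=161, dict_size=4300)   # placeholder args
    model = model.from_pretrained("checkpoints/step_final")
    model.eval()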

@@ -91,6 +91,9 @@ class Trainer():
         self.args = args
         self.optimizer = None
         self.visualizer = None
+        self.output_dir = None
+        self.checkpoint_dir = None
+        self.logger = None

     def setup(self):
         """Setup the experiment.
@@ -258,6 +261,10 @@ class Trainer():
         stream_handler.setFormatter(formatter)
         logger.addHandler(stream_handler)

+        if self.output_dir is None:
+            self.logger = logger
+            return
+
         log_file = self.output_dir / 'worker_{}.log'.format(dist.get_rank())
         # file_handler = logging.FileHandler(str(log_file))
         # file_handler.setFormatter(formatter)
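The new guard lets setup_logger fall back to console-only logging before an output directory has been set. The pattern in isolation, as a standalone sketch (make_logger is a hypothetical helper):

    import logging
    from pathlib import Path

    def make_logger(output_dir=None, rank=0):
        # Console handler is always attached.
        logger = logging.getLogger("worker_{}".format(rank))
        logger.setLevel(logging.INFO)
        formatter = logging.Formatter("%(asctime)s %(levelname)s %(message)s")
        stream_handler = logging.StreamHandler()
        stream_handler.setFormatter(formatter)
        logger.addHandler(stream_handler)
        if output_dir is None:
            return logger  # no output dir yet: console-only logging
        # Otherwise also log to a per-rank file under output_dir.
        log_file = Path(output_dir) / "worker_{}.log".format(rank)
        file_handler = logging.FileHandler(str(log_file))
        file_handler.setFormatter(formatter)
        logger.addHandler(file_handler)
        return logger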
