diff --git a/examples/timit/s1/README.md b/examples/timit/s1/README.md index d516040d..11aa19f1 100644 --- a/examples/timit/s1/README.md +++ b/examples/timit/s1/README.md @@ -2,8 +2,8 @@ ### Transformer | Model | Params | Config | Decode method | Loss | PER | -| --- | --- | --- | --- | --- | -| transformer | 5.17M | conf/transformer.yaml | attention | 49.25688171386719 | 0.510742 | -| transformer | 5.17M | conf/transformer.yaml | ctc_greedy_search | 49.25688171386719 | 0.382398 | -| transformer | 5.17M | conf/transformer.yaml | ctc_prefix_beam_search | 49.25688171386719 | 0.367429 | -| transformer | 5.17M | conf/transformer.yaml | attention_rescore | 49.25688171386719 | 0.357173 | +| --- | --- | --- | --- | --- | --- | +| transformer | 5.17M | conf/transformer.yaml | attention | 46.41119385 | 0.469993 | +| transformer | 5.17M | conf/transformer.yaml | ctc_greedy_search | 46.41119385 | 0.297713 | +| transformer | 5.17M | conf/transformer.yaml | ctc_prefix_beam_search | 46.41119385 | 0.293555 | +| transformer | 5.17M | conf/transformer.yaml | attention_rescore | 46.41119385 | 0.281081 | diff --git a/examples/timit/s1/conf/transformer.yaml b/examples/timit/s1/conf/transformer.yaml index a55dcc43..e138fbbe 100644 --- a/examples/timit/s1/conf/transformer.yaml +++ b/examples/timit/s1/conf/transformer.yaml @@ -67,14 +67,14 @@ model: model_conf: ctc_weight: 0.5 ctc_dropoutrate: 0.0 - ctc_grad_norm_type: batch + ctc_grad_norm_type: instance lsm_weight: 0.1 # label smoothing option length_normalized_loss: false training: n_epoch: 200 - accum_grad: 2 + accum_grad: 1 global_grad_clip: 5.0 optim: adam optim_conf: @@ -82,7 +82,7 @@ training: weight_decay: 1e-06 scheduler: warmuplr # pytorch v1.1.0+ required scheduler_conf: - warmup_steps: 2000 + warmup_steps: 1200 lr_decay: 1.0 log_interval: 10 checkpoint: