diff --git a/examples/aishell/s1/local/download_lm_ch.sh b/examples/aishell/s1/local/download_lm_ch.sh deleted file mode 120000 index 6541d91c..00000000 --- a/examples/aishell/s1/local/download_lm_ch.sh +++ /dev/null @@ -1 +0,0 @@ -../../s0/local/download_lm_ch.sh \ No newline at end of file diff --git a/examples/dataset/librispeech/librispeech.py b/examples/dataset/librispeech/librispeech.py index f549a95f..d34c3223 100644 --- a/examples/dataset/librispeech/librispeech.py +++ b/examples/dataset/librispeech/librispeech.py @@ -114,7 +114,7 @@ def create_manifest(data_dir, manifest_path): for line in json_lines: out_file.write(line + '\n') - subset = os.path.splitext(manifest_path)[1] + subset = manifest_path with open(subset + '.meta', 'w') as f: print(f"{subset}:", file=f) print(f"{total_num} utts", file=f) diff --git a/examples/librispeech/s0/conf/augmentation.json b/examples/librispeech/s0/conf/augmentation.json index 5635d9c8..1987ad42 100644 --- a/examples/librispeech/s0/conf/augmentation.json +++ b/examples/librispeech/s0/conf/augmentation.json @@ -15,5 +15,20 @@ "max_shift_ms": 5 }, "prob": 1.0 + }, + { + "type": "specaug", + "params": { + "F": 10, + "T": 50, + "n_freq_masks": 2, + "n_time_masks": 2, + "p": 1.0, + "W": 80, + "adaptive_number_ratio": 0, + "adaptive_size_ratio": 0, + "max_n_time_masks": 20 + }, + "prob": 1.0 } ] diff --git a/examples/librispeech/s1/README.md b/examples/librispeech/s1/README.md index 5b4130bb..17afa1c0 100644 --- a/examples/librispeech/s1/README.md +++ b/examples/librispeech/s1/README.md @@ -15,10 +15,10 @@ | Model | Params | Config | Augmentation| Test set | Decode method | Chunk Size & Left Chunks | Loss | WER | | --- | --- | --- | --- | --- | --- | --- | --- | --- | -| conformer | 47.63 M | conf/chunk_conformer.yaml | spec_aug + shift | test-clean | attention | 16, -1 | 7.01250648 | | -| conformer | 47.63 M | conf/chunk_conformer.yaml | spec_aug + shift | test-clean | ctc_greedy_search | 16, -1 | 7.01250648 | | +| conformer | 47.63 M | conf/chunk_conformer.yaml | spec_aug + shift | test-clean | attention | 16, -1 | 7.01250648 | 0.069548 | +| conformer | 47.63 M | conf/chunk_conformer.yaml | spec_aug + shift | test-clean | ctc_greedy_search | 16, -1 | 7.01250648 | 0.094753 | | conformer | 47.63 M | conf/chunk_conformer.yaml | spec_aug + shift | test-clean | ctc_prefix_beam_search | 16, -1 | 7.01250648 | | -| conformer | 47.63 M | conf/chunk_conformer.yaml | spec_aug + shift | test-clean | attention_rescoring | 16, -1 | 7.01250648 | | +| conformer | 47.63 M | conf/chunk_conformer.yaml | spec_aug + shift | test-clean | attention_rescoring | 16, -1 | 7.01250648 | | diff --git a/examples/librispeech/s1/conf/chunk_confermer.yaml b/examples/librispeech/s1/conf/chunk_conformer.yaml similarity index 99% rename from examples/librispeech/s1/conf/chunk_confermer.yaml rename to examples/librispeech/s1/conf/chunk_conformer.yaml index d78ce740..7a4ddf5d 100644 --- a/examples/librispeech/s1/conf/chunk_confermer.yaml +++ b/examples/librispeech/s1/conf/chunk_conformer.yaml @@ -81,7 +81,7 @@ model: training: - n_epoch: 120 + n_epoch: 240 accum_grad: 8 global_grad_clip: 5.0 optim: adam diff --git a/examples/tiny/s1/local/download_lm_en.sh b/examples/tiny/s1/local/download_lm_en.sh deleted file mode 120000 index 831f3c31..00000000 --- a/examples/tiny/s1/local/download_lm_en.sh +++ /dev/null @@ -1 +0,0 @@ -../../s0/local/download_lm_en.sh \ No newline at end of file diff --git a/tools/Makefile b/tools/Makefile index 94e5ea2f..08cb9955 100644 --- a/tools/Makefile +++ b/tools/Makefile @@ -18,7 +18,7 @@ kenlm.done: apt install -y build-essential cmake libboost-system-dev libboost-thread-dev libboost-program-options-dev libboost-test-dev libeigen3-dev zlib1g-dev libbz2-dev liblzma-dev apt-get install -y gcc-5 g++-5 && update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-5 50 && update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-5 50 test -d kenlm || wget -O - https://kheafield.com/code/kenlm.tar.gz | tar xz - mkdir -p kenlm/build && cd kenlm/build && cmake .. && make -j4 && make install + rm -rf kenlm/build && mkdir -p kenlm/build && cd kenlm/build && cmake .. && make -j4 && make install source venv/bin/activate; cd kenlm && python setup.py install touch kenlm.done