format

4 years ago · 5d4f3fbd7b
parent 65346b83ee
commit 5d4f3fbd7b
20 changed files with 43 additions and 41 deletions
--- a/deepspeech/init.py
+++ b/deepspeech/init.py
@ -421,7 +421,6 @@ logger.warn(
 )
 F.ctc_loss = ctc_loss

-
 ########### hcak paddle.nn #############
 if not hasattr(paddle.nn, 'Module'):
    logger.warn("register user Module to paddle.nn, remove this when fixed!")
--- a/deepspeech/frontend/normalizer.py
+++ b/deepspeech/frontend/normalizer.py
@ -179,7 +179,8 @@ class FeatureNormalizer(object):
                wav_number += batch_size

                if wav_number % 1000 == 0:
-                    logger.info(f'process {wav_number} wavs,{all_number} frames.')
+                    logger.info(
+                        f'process {wav_number} wavs,{all_number} frames.')

        self.cmvn_info = {
            'mean_stat': list(all_mean_stat.tolist()),
--- a/deepspeech/modules/mask.py
+++ b/deepspeech/modules/mask.py
@ -23,6 +23,7 @@ __all__ = [
    "mask_finished_preds"
 ]

+
 def make_pad_mask(lengths: paddle.Tensor) -> paddle.Tensor:
    """Make mask tensor containing indices of padded part.
    See description of make_non_pad_mask.
--- a/doc/src/alignment.md
+++ b/doc/src/alignment.md
@ -18,4 +18,3 @@

 * [ctc alignment](https://mp.weixin.qq.com/s/4aGehNN7PpIvCh03qTT5oA)
 * [时间戳和N-Best](https://mp.weixin.qq.com/s?__biz=MzU2NjUwMTgxOQ==&mid=2247483956&idx=1&sn=80ce595238d84155d50f08c0d52267d3&chksm=fcaacae0cbdd43f62b1da60c8e8671a9e0bb2aeee94f58751839b03a1c45b9a3889b96705080&scene=21#wechat_redirect)
-
--- a/doc/src/benchmark.md
+++ b/doc/src/benchmark.md
@ -14,4 +14,3 @@ We compare the training time with 1, 2, 4, 8 Tesla V100 GPUs (with a subset of L
 | 8         | 6.95 X |

 `utils/profile.sh` provides such a demo profiling tool, you can change it as need.
-
--- a/doc/src/decoding.md
+++ b/doc/src/decoding.md
@ -3,4 +3,3 @@
 ## Reference

 * [时间戳和N-Best](https://mp.weixin.qq.com/s?__biz=MzU2NjUwMTgxOQ==&mid=2247483956&idx=1&sn=80ce595238d84155d50f08c0d52267d3&chksm=fcaacae0cbdd43f62b1da60c8e8671a9e0bb2aeee94f58751839b03a1c45b9a3889b96705080&scene=21#wechat_redirect)
-
--- a/doc/src/praat_textgrid.md
+++ b/doc/src/praat_textgrid.md
@ -256,4 +256,3 @@ pip3 install textgrid

 * https://zh.wikipedia.org/wiki/Praat%E8%AF%AD%E9%9F%B3%E5%AD%A6%E8%BD%AF%E4%BB%B6
 * https://blog.csdn.net/duxin_csdn/article/details/88966295
-
--- a/doc/src/tools.md
+++ b/doc/src/tools.md
@ -1,4 +1,3 @@
 # Useful Tools

 * [正则可视化和常用正则表达式](https://wangwl.net/static/projects/visualRegex/#)
-
--- a/doc/src/vad.md
+++ b/doc/src/vad.md
@ -29,4 +29,3 @@
 * [Endpoint 检测](https://mp.weixin.qq.com/s?__biz=MzU2NjUwMTgxOQ==&mid=2247484024&idx=1&sn=12da2ee76347de4a18856274ba6ba61f&chksm=fcaacaaccbdd43ba6b3e996bbf1e2ac6d5f1b449dfd80fcaccfbbe0a240fa1668b931dbf4bd5&scene=21#wechat_redirect)
 * Kaldi: *https://github.com/kaldi-asr/kaldi/blob/6260b27d146e466c7e1e5c60858e8da9fd9c78ae/src/online2/online-endpoint.h#L132-L150*
 * End-to-End Automatic Speech Recognition Integrated with CTC-Based Voice Activity Detection: *https://arxiv.org/pdf/2002.00551.pdf*
-
--- a/examples/aishell/s1/conf/conformer.yaml
+++ b/examples/aishell/s1/conf/conformer.yaml
@ -24,7 +24,7 @@ data:
  n_fft: None
  stride_ms: 10.0
  window_ms: 25.0
-  use_dB_normalization: False 
+  use_dB_normalization: True 
  target_dB: -20
  random_seed: 0
  keep_transcription_text: False
@ -76,7 +76,7 @@ model:
 training:
  n_epoch: 240 
  accum_grad: 2
-  global_grad_clip: 5.0
+  global_grad_clip: 3.0
  optim: adam
  optim_conf:
    lr: 0.002
--- a/examples/cc-cedict/local/parser.py
+++ b/examples/cc-cedict/local/parser.py
@ -1,18 +1,24 @@
+# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
 # https://github.com/rubber-duck-dragon/rubber-duck-dragon.github.io/blob/master/cc-cedict_parser/parser.py
-
 #A parser for the CC-Cedict. Convert the Chinese-English dictionary into a list of python dictionaries with "traditional","simplified", "pinyin", and "english" keys.
-
 #Make sure that the cedict_ts.u8 file is in the same folder as this file, and that the name matches the file name on line 13.
-
 #Before starting, open the CEDICT text file and delete the copyright information at the top. Otherwise the program will try to parse it and you will get an error message.
-
 #Characters that are commonly used as surnames have two entries in CC-CEDICT. This program will remove the surname entry if there is another entry for the character. If you want to include the surnames, simply delete lines 59 and 60.
-
 #This code was written by Franki Allegra in February 2020.
-
-
-import sys
 import json
+import sys

 # usage: bin ccedict dump.json

@ -50,9 +56,10 @@ with open(sys.argv[1], 'rt') as file:
        list_of_dicts.append(parsed)

    def remove_surnames():
-        for x in range(len(list_of_dicts)-1, -1, -1):
+        for x in range(len(list_of_dicts) - 1, -1, -1):
            if "surname " in list_of_dicts[x]['english']:
-                if list_of_dicts[x]['traditional'] == list_of_dicts[x+1]['traditional']:
+                if list_of_dicts[x]['traditional'] == list_of_dicts[x + 1][
+                        'traditional']:
                    list_of_dicts.pop(x)

    def main():
@ -66,7 +73,6 @@ with open(sys.argv[1], 'rt') as file:
        print("Removing Surnames . . .")
        remove_surnames()

-
        print("Saving to database (this may take a few minutes) . . .")
        with open(sys.argv[2], 'wt') as fout:
            for one_dict in list_of_dicts:
@ -74,5 +80,6 @@ with open(sys.argv[1], 'rt') as file:
                fout.write(json_str + "\n")
        print('Done!')

+
 list_of_dicts = []
 parsed_dict = main()
--- a/requirements.txt
+++ b/requirements.txt
@ -1,5 +1,6 @@
 coverage
 pre-commit
+pybind11
 resampy==0.2.2
 scipy==1.2.1
 sentencepiece
@ -7,7 +8,6 @@ snakeviz
 SoundFile==0.9.0.post1
 sox
 tensorboardX
+textgrid
 typeguard
 yacs
-pybind11
-textgrid