fix compliance test bug, and format

pull/1597/head
Hui Zhang 3 years ago
parent fc1bee35c4
commit 4051e7b762

2
.gitignore vendored

@ -35,3 +35,5 @@ tools/miniconda.sh
tools/CRF++-0.58/ tools/CRF++-0.58/
speechx/fc_patch/ speechx/fc_patch/
third_party/ctc_decoders/paddlespeech_ctcdecoders.py

@ -1,12 +1,11 @@
soundfile==0.10.3.post1 diskcache==5.2.1
fastapi
librosa==0.8.0 librosa==0.8.0
numpy numpy
pydantic pymilvus==2.0.1
pymysql pymysql
fastapi
uvicorn
diskcache==5.2.1
pymilvus==2.0.1
python-multipart python-multipart
typing soundfile==0.10.3.post1
starlette starlette
pydantic typing
uvicorn

@ -11,7 +11,6 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
import os import os
############### Milvus Configuration ############### ############### Milvus Configuration ###############

@ -11,7 +11,6 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
import codecs
import datetime import datetime
import logging import logging
import os import os
@ -124,7 +123,7 @@ class MultiprocessHandler(logging.FileHandler):
logging.FileHandler.emit(self, record) logging.FileHandler.emit(self, record)
except (KeyboardInterrupt, SystemExit): except (KeyboardInterrupt, SystemExit):
raise raise
except: except Exception as e:
self.handleError(record) self.handleError(record)

@ -26,8 +26,7 @@ def get_audios(path):
""" """
supported_formats = [".wav", ".mp3", ".ogg", ".flac", ".m4a"] supported_formats = [".wav", ".mp3", ".ogg", ".flac", ".m4a"]
return [ return [
item item for sublist in [[os.path.join(dir, file) for file in files]
for sublist in [[os.path.join(dir, file) for file in files]
for dir, _, files in list(os.walk(path))] for dir, _, files in list(os.walk(path))]
for item in sublist if os.path.splitext(item)[1] in supported_formats for item in sublist if os.path.splitext(item)[1] in supported_formats
] ]

@ -18,7 +18,6 @@ Download: http://groups.inf.ed.ac.uk/ami/download/
Prepares metadata files (JSON) from manual annotations "segments/" using RTTM format (Oracle VAD). Prepares metadata files (JSON) from manual annotations "segments/" using RTTM format (Oracle VAD).
""" """
import argparse import argparse
import glob import glob
import json import json

@ -0,0 +1,2 @@
.eggs
*.wav

@ -5,18 +5,14 @@
# This file does only contain a selection of the most common options. For a # This file does only contain a selection of the most common options. For a
# full list see the documentation: # full list see the documentation:
# http://www.sphinx-doc.org/en/master/config # http://www.sphinx-doc.org/en/master/config
# -- Path setup -------------------------------------------------------------- # -- Path setup --------------------------------------------------------------
# If extensions (or modules to document with autodoc) are in another directory, # If extensions (or modules to document with autodoc) are in another directory,
# add these directories to sys.path here. If the directory is relative to the # add these directories to sys.path here. If the directory is relative to the
# documentation root, use os.path.abspath to make it absolute, like shown here. # documentation root, use os.path.abspath to make it absolute, like shown here.
import os import os
import sys import sys
sys.path.insert(0, os.path.abspath('../..')) sys.path.insert(0, os.path.abspath('../..'))
# -- Project information ----------------------------------------------------- # -- Project information -----------------------------------------------------
project = 'PaddleAudio' project = 'PaddleAudio'
@ -28,7 +24,6 @@ version = ''
# The full version, including alpha/beta/rc tags # The full version, including alpha/beta/rc tags
release = '0.2.0' release = '0.2.0'
# -- General configuration --------------------------------------------------- # -- General configuration ---------------------------------------------------
# If your documentation needs a minimal Sphinx version, state it here. # If your documentation needs a minimal Sphinx version, state it here.
@ -75,7 +70,6 @@ exclude_patterns = []
# The name of the Pygments (syntax highlighting) style to use. # The name of the Pygments (syntax highlighting) style to use.
pygments_style = None pygments_style = None
# -- Options for HTML output ------------------------------------------------- # -- Options for HTML output -------------------------------------------------
# The theme to use for HTML and HTML Help pages. See the documentation for # The theme to use for HTML and HTML Help pages. See the documentation for
@ -112,13 +106,11 @@ html_css_files = [
# #
# html_sidebars = {} # html_sidebars = {}
# -- Options for HTMLHelp output --------------------------------------------- # -- Options for HTMLHelp output ---------------------------------------------
# Output file base name for HTML help builder. # Output file base name for HTML help builder.
htmlhelp_basename = 'PaddleAudiodoc' htmlhelp_basename = 'PaddleAudiodoc'
# -- Options for LaTeX output ------------------------------------------------ # -- Options for LaTeX output ------------------------------------------------
latex_elements = { latex_elements = {
@ -143,20 +135,16 @@ latex_elements = {
# (source start file, target name, title, # (source start file, target name, title,
# author, documentclass [howto, manual, or own class]). # author, documentclass [howto, manual, or own class]).
latex_documents = [ latex_documents = [
(master_doc, 'PaddleAudio.tex', 'PaddleAudio Documentation', (master_doc, 'PaddleAudio.tex', 'PaddleAudio Documentation', 'PaddlePaddle',
'PaddlePaddle', 'manual'), 'manual'),
] ]
# -- Options for manual page output ------------------------------------------ # -- Options for manual page output ------------------------------------------
# One entry per manual page. List of tuples # One entry per manual page. List of tuples
# (source start file, name, description, authors, manual section). # (source start file, name, description, authors, manual section).
man_pages = [ man_pages = [(master_doc, 'paddleaudio', 'PaddleAudio Documentation', [author],
(master_doc, 'paddleaudio', 'PaddleAudio Documentation', 1)]
[author], 1)
]
# -- Options for Texinfo output ---------------------------------------------- # -- Options for Texinfo output ----------------------------------------------
@ -164,12 +152,10 @@ man_pages = [
# (source start file, target name, title, author, # (source start file, target name, title, author,
# dir menu entry, description, category) # dir menu entry, description, category)
texinfo_documents = [ texinfo_documents = [
(master_doc, 'PaddleAudio', 'PaddleAudio Documentation', (master_doc, 'PaddleAudio', 'PaddleAudio Documentation', author,
author, 'PaddleAudio', 'One line description of project.', 'PaddleAudio', 'One line description of project.', 'Miscellaneous'),
'Miscellaneous'),
] ]
# -- Options for Epub output ------------------------------------------------- # -- Options for Epub output -------------------------------------------------
# Bibliographic Dublin Core info. # Bibliographic Dublin Core info.
@ -187,7 +173,6 @@ epub_title = project
# A list of files that should not be packed into the epub file. # A list of files that should not be packed into the epub file.
epub_exclude_files = ['search.html'] epub_exclude_files = ['search.html']
# -- Extension configuration ------------------------------------------------- # -- Extension configuration -------------------------------------------------
# -- Options for intersphinx extension --------------------------------------- # -- Options for intersphinx extension ---------------------------------------

@ -11,3 +11,5 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
from . import kaldi
from . import librosa

@ -22,7 +22,9 @@ __all__ = [
] ]
def mcd_distance(xs: np.ndarray, ys: np.ndarray, cost_fn: Callable=mt.logSpecDbDist) -> float: def mcd_distance(xs: np.ndarray,
ys: np.ndarray,
cost_fn: Callable=mt.logSpecDbDist) -> float:
"""Mel cepstral distortion (MCD), dtw distance. """Mel cepstral distortion (MCD), dtw distance.
Dynamic Time Warping. Dynamic Time Warping.

@ -64,7 +64,7 @@ def replace_time(match) -> str:
result = f"{num2str(hour)}" result = f"{num2str(hour)}"
if minute.lstrip('0'): if minute.lstrip('0'):
if int(minute) == 30: if int(minute) == 30:
result += f"" result += ""
else: else:
result += f"{_time_num2str(minute)}" result += f"{_time_num2str(minute)}"
if second and second.lstrip('0'): if second and second.lstrip('0'):
@ -75,7 +75,7 @@ def replace_time(match) -> str:
result += f"{num2str(hour_2)}" result += f"{num2str(hour_2)}"
if minute_2.lstrip('0'): if minute_2.lstrip('0'):
if int(minute) == 30: if int(minute) == 30:
result += f"" result += ""
else: else:
result += f"{_time_num2str(minute_2)}" result += f"{_time_num2str(minute_2)}"
if second_2 and second_2.lstrip('0'): if second_2 and second_2.lstrip('0'):

@ -16,22 +16,20 @@ This script contains basic functions used for speaker diarization.
This script has an optional dependency on open source sklearn library. This script has an optional dependency on open source sklearn library.
A few sklearn functions are modified in this script as per requirement. A few sklearn functions are modified in this script as per requirement.
""" """
import argparse import argparse
import warnings import warnings
import scipy
import numpy as np
from distutils.util import strtobool from distutils.util import strtobool
import numpy as np
import scipy
import sklearn
from scipy import sparse from scipy import sparse
from scipy.sparse.linalg import eigsh
from scipy.sparse.csgraph import connected_components from scipy.sparse.csgraph import connected_components
from scipy.sparse.csgraph import laplacian as csgraph_laplacian from scipy.sparse.csgraph import laplacian as csgraph_laplacian
from scipy.sparse.linalg import eigsh
import sklearn
from sklearn.neighbors import kneighbors_graph
from sklearn.cluster import SpectralClustering from sklearn.cluster import SpectralClustering
from sklearn.cluster._kmeans import k_means from sklearn.cluster._kmeans import k_means
from sklearn.neighbors import kneighbors_graph
def _graph_connected_component(graph, node_id): def _graph_connected_component(graph, node_id):

Loading…
Cancel
Save