From dc56c11de06b6e8100fe39c5bc0b914257d8c3f7 Mon Sep 17 00:00:00 2001 From: Hui Zhang Date: Tue, 2 Feb 2021 08:26:02 +0000 Subject: [PATCH 1/3] remove useless comma --- data_utils/data.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/data_utils/data.py b/data_utils/data.py index 3628e067..4a5224ef 100644 --- a/data_utils/data.py +++ b/data_utils/data.py @@ -276,8 +276,8 @@ class DataGenerator(object): def reader(): for instance in manifest: inst = self.process_utterance(instance["audio_filepath"], - instance["text"]), - yield inst[0] + instance["text"]) + yield inst return reader From 457323e26b473152396ffbbe51a0b7f4b567812a Mon Sep 17 00:00:00 2001 From: Hui Zhang Date: Tue, 2 Feb 2021 08:26:39 +0000 Subject: [PATCH 2/3] using china data source --- data/aishell/aishell.py | 1 + data/librispeech/librispeech.py | 1 + 2 files changed, 2 insertions(+) diff --git a/data/aishell/aishell.py b/data/aishell/aishell.py index d3340fc6..e81d2085 100644 --- a/data/aishell/aishell.py +++ b/data/aishell/aishell.py @@ -19,6 +19,7 @@ from data_utils.utility import download, unpack DATA_HOME = os.path.expanduser('~/.cache/paddle/dataset/speech') URL_ROOT = 'http://www.openslr.org/resources/33' +URL_ROOT = 'https://openslr.magicdatatech.com/resources/33' DATA_URL = URL_ROOT + '/data_aishell.tgz' MD5_DATA = '2f494334227864a8a8fec932999db9d8' diff --git a/data/librispeech/librispeech.py b/data/librispeech/librispeech.py index 07cc0933..770b7110 100644 --- a/data/librispeech/librispeech.py +++ b/data/librispeech/librispeech.py @@ -20,6 +20,7 @@ import io from data_utils.utility import download, unpack URL_ROOT = "http://www.openslr.org/resources/12" +URL_ROOT = "https://openslr.magicdatatech.com/resources/12" URL_TEST_CLEAN = URL_ROOT + "/test-clean.tar.gz" URL_TEST_OTHER = URL_ROOT + "/test-other.tar.gz" URL_DEV_CLEAN = URL_ROOT + "/dev-clean.tar.gz" From 71f37a8a9078d7599a56981031ad1b5fc0211ffc Mon Sep 17 00:00:00 2001 From: Hui Zhang Date: Tue, 2 Feb 2021 
10:04:55 +0000 Subject: [PATCH 3/3] add missing imports --- data/voxforge/voxforge.py | 1 + data_utils/speech.py | 1 + 2 files changed, 2 insertions(+) diff --git a/data/voxforge/voxforge.py b/data/voxforge/voxforge.py index b86b0f00..b7cc38bd 100644 --- a/data/voxforge/voxforge.py +++ b/data/voxforge/voxforge.py @@ -11,6 +11,7 @@ from __future__ import print_function import os import codecs +import datetime import soundfile import json import argparse diff --git a/data_utils/speech.py b/data_utils/speech.py index 0cea8873..e64109dc 100644 --- a/data_utils/speech.py +++ b/data_utils/speech.py @@ -3,6 +3,7 @@ from __future__ import absolute_import from __future__ import division from __future__ import print_function +import numpy as np from data_utils.audio import AudioSegment