parent
14efbf5b15
commit
60d73bb7bd
@ -0,0 +1,60 @@
|
||||
import argparse
|
||||
import os
|
||||
|
||||
import numpy as np
|
||||
import paddle
|
||||
from paddle.io import BatchSampler
|
||||
from paddle.io import DataLoader
|
||||
from paddle.io import DistributedBatchSampler
|
||||
|
||||
from paddleaudio.datasets.voxceleb import VoxCeleb1
|
||||
from paddleaudio.features.core import melspectrogram
|
||||
from paddlespeech.s2t.utils.log import Log
|
||||
from paddlespeech.vector.io.augment import build_augment_pipeline
|
||||
from paddlespeech.vector.io.augment import waveform_augment
|
||||
from paddlespeech.vector.io.batch import feature_normalize
|
||||
from paddlespeech.vector.io.batch import waveform_collate_fn
|
||||
from paddlespeech.vector.models.ecapa_tdnn import EcapaTdnn
|
||||
from paddlespeech.vector.modules.loss import AdditiveAngularMargin
|
||||
from paddlespeech.vector.modules.loss import LogSoftmaxWrapper
|
||||
from paddlespeech.vector.modules.lr import CyclicLRScheduler
|
||||
from paddlespeech.vector.modules.sid_model import SpeakerIdetification
|
||||
from paddlespeech.vector.training.seeding import seed_everything
|
||||
from paddlespeech.vector.utils.time import Timer
|
||||
|
||||
# Module-level logger, obtained from the project's Log helper under this module's name.
logger = Log(__name__).getlog()
|
||||
|
||||
def main(args):
    """Run the data-preparation stages for VoxCeleb1.

    Args:
        args: Parsed command-line namespace. This function reads
            ``args.seed``, ``args.data_dir`` and ``args.augment``.
    """
    # Stage 0: all data preparation is done in CPU mode.
    paddle.set_device("cpu")
    # Seeding is required for multiprocess training.
    seed_everything(args.seed)

    # Stage 1: generate the VoxCeleb csv files by instantiating each split.
    # Note: this may raise a C++ exception, but the program still executes
    # fine, so that exception can be ignored.
    # The dataset objects are not used further here; they are kept referenced
    # until the function returns.
    voxceleb_splits = [
        VoxCeleb1(split_name, target_dir=args.data_dir)
        for split_name in ('train', 'dev')
    ]

    # Stage 2: generate the augment noise csv file, only when requested.
    if not args.augment:
        return
    noise_pipeline = build_augment_pipeline(target_dir=args.data_dir)
|
||||
|
||||
if __name__ == "__main__":
    # Script entry point: parse the command-line options and hand them to main().
    # yapf: disable
    # The first positional parameter of ArgumentParser is `prog`, so the module
    # docstring must be passed explicitly as `description`.
    parser = argparse.ArgumentParser(description=__doc__)
    parser.add_argument("--seed",
                        default=0,
                        type=int,
                        help="random seed for paddle, numpy and python random package")
    parser.add_argument("--data-dir",
                        default="./data/",
                        type=str,
                        help="data directory")
    parser.add_argument("--augment",
                        action="store_true",
                        default=False,
                        help="Apply audio augments.")
    args = parser.parse_args()
    # yapf: enable

    main(args)
|
Loading…
Reference in new issue