|
|
|
@ -215,8 +215,14 @@ class U2Trainer(Trainer):
|
|
|
|
|
# Select the training manifest on the shared config object; from_config below
# reads whatever config.data.manifest holds at call time.
config.data.manifest = config.data.train_manifest
|
|
|
|
|
# Build the training dataset from the config as it stands at this point.
train_dataset = ManifestDataset.from_config(config)
|
|
|
|
|
|
|
|
|
|
# Dev dataset: override augmentation and the length/ratio bounds on the shared
# config before building the dataset. The training dataset has already been
# constructed above, so these overrides only affect datasets built from here on.
#
# NOTE: every override must be a real `=` assignment. The form
# `config.data.x: value` is an annotation-only statement: Python evaluates the
# target and stores nothing, so the override would silently be skipped.
# NOTE(review): assumes `config` accepts attribute writes here (the manifest
# assignment already relies on that) — confirm the new keys are permitted.
config.data.augmentation_config = ""
config.data.min_input_len = 0.0  # second
config.data.max_input_len = 100.0  # second
config.data.min_output_len = 0.0  # tokens
config.data.max_output_len = 400.0  # tokens
config.data.min_output_input_ratio = 0.00
config.data.max_output_input_ratio = 100.0
# Select the dev manifest last, immediately before the dataset is built.
config.data.manifest = config.data.dev_manifest
dev_dataset = ManifestDataset.from_config(config)
|
|
|
|
|
|
|
|
|
|
# Collator constructed with keep_transcription_text=False.
# NOTE(review): presumably this makes batches carry encoded ids rather than the
# raw transcript string — confirm against SpeechCollator.
collate_fn = SpeechCollator(keep_transcription_text=False)
|
|
|
|
@ -253,6 +259,12 @@ class U2Trainer(Trainer):
|
|
|
|
|
# Test dataset: keep the raw transcription text, and override augmentation and
# the length/ratio bounds on the shared config before building the dataset.
#
# NOTE: every override must be a real `=` assignment. The form
# `config.data.x: value` is an annotation-only statement: Python evaluates the
# target and stores nothing, so the override would silently be skipped.
# NOTE(review): assumes `config` accepts attribute writes here (the manifest
# assignment already relies on that) — confirm the new keys are permitted.
config.data.keep_transcription_text = True
config.data.augmentation_config = ""
config.data.min_input_len = 0.0  # second
config.data.max_input_len = 100.0  # second
config.data.min_output_len = 0.0  # tokens
config.data.max_output_len = 400.0  # tokens
config.data.min_output_input_ratio = 0.00
config.data.max_output_input_ratio = 100.0
# Select the test manifest last, immediately before the dataset is built.
config.data.manifest = config.data.test_manifest
test_dataset = ManifestDataset.from_config(config)
|
|
|
|
|
# return text ord id
|
|
|
|
|