|
|
|
@ -264,12 +264,12 @@ class U2Trainer(Trainer):
|
|
|
|
|
config.data.manifest = config.data.test_manifest
|
|
|
|
|
# filter test examples: this yields fewer examples, but avoids a mismatch with training
|
|
|
|
|
# and allows a large batch size, which saves training time, so filter test examples now.
|
|
|
|
|
# config.data.min_input_len = 0.0 # second
|
|
|
|
|
# config.data.max_input_len = float('inf') # second
|
|
|
|
|
# config.data.min_output_len = 0.0 # tokens
|
|
|
|
|
# config.data.max_output_len = float('inf') # tokens
|
|
|
|
|
# config.data.min_output_input_ratio = 0.00
|
|
|
|
|
# config.data.max_output_input_ratio = float('inf')
|
|
|
|
|
config.data.min_input_len = 0.0 # second
|
|
|
|
|
config.data.max_input_len = float('inf') # second
|
|
|
|
|
config.data.min_output_len = 0.0 # tokens
|
|
|
|
|
config.data.max_output_len = float('inf') # tokens
|
|
|
|
|
config.data.min_output_input_ratio = 0.00
|
|
|
|
|
config.data.max_output_input_ratio = float('inf')
|
|
|
|
|
|
|
|
|
|
test_dataset = ManifestDataset.from_config(config)
|
|
|
|
|
# return text ord id
|
|
|
|
|