Merge pull request #691 from PaddlePaddle/bugfix

fix audio shape bug for audio len
pull/692/head
Hui Zhang 4 years ago committed by GitHub
commit d1c280cce8
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@@ -154,8 +154,8 @@ class SpeechCollator():
random_seed (int, optional): for random generator. Defaults to 0.
keep_transcription_text (bool, optional): If True (used when not in training mode), the transcription is not tokenized. Defaults to False.
If ``keep_transcription_text`` is False, the text is a sequence of token ids; otherwise it is the raw string.
- Do augmentations
+ Do augmentations
Padding audio features with zeros to make them have the same shape (or
a user-defined shape) within one batch.
"""
@@ -271,7 +271,7 @@ class SpeechCollator():
utts.append(utt)
# audio
audios.append(audio) # [T, D]
- audio_lens.append(audio.shape[1])
+ audio_lens.append(audio.shape[0])
# text
# for training, text is token ids
# else text is string, convert to unicode ord

Loading…
Cancel
Save