From f7fc54badef36151e77509e24ddfc8356e3659e8 Mon Sep 17 00:00:00 2001 From: Luzhenhui Date: Thu, 24 Aug 2023 18:20:41 +0800 Subject: [PATCH] bugfix: audio_len should be 1D, not 0D; a 0D audio_len raises a "list index out of range" error in the following decode process --- paddlespeech/cli/asr/infer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/paddlespeech/cli/asr/infer.py b/paddlespeech/cli/asr/infer.py index 231a00f4d..4001f957f 100644 --- a/paddlespeech/cli/asr/infer.py +++ b/paddlespeech/cli/asr/infer.py @@ -274,7 +274,7 @@ class ASRExecutor(BaseExecutor): # fbank audio = preprocessing(audio, **preprocess_args) - audio_len = paddle.to_tensor(audio.shape[0]).unsqueeze(axis=0) + audio_len = paddle.to_tensor([audio.shape[0]]).unsqueeze(axis=0) audio = paddle.to_tensor(audio, dtype='float32').unsqueeze(axis=0) self._inputs["audio"] = audio