From 6316514329764151e1a409f0a31631c51924920c Mon Sep 17 00:00:00 2001 From: megemini Date: Wed, 30 Oct 2024 17:41:17 +0800 Subject: [PATCH 1/3] [Fix] type promotion (#3817) --- paddlespeech/audio/utils/tensor_utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/paddlespeech/audio/utils/tensor_utils.py b/paddlespeech/audio/utils/tensor_utils.py index 93883c94d..43dcac0ac 100644 --- a/paddlespeech/audio/utils/tensor_utils.py +++ b/paddlespeech/audio/utils/tensor_utils.py @@ -248,7 +248,7 @@ def st_reverse_pad_list(ys_pad: paddle.Tensor, # >>> tensor([[ 2, 1, 0], # >>> [ 2, 1, 0], # >>> [ 0, -1, -2]]) - index = index * seq_mask + index = index * seq_mask.astype(index.dtype) # >>> index # >>> tensor([[2, 1, 0], From e41a8794c4d505ff7b8e8be99cfafa184c4b6599 Mon Sep 17 00:00:00 2001 From: 131 <11222509+Netrvin@users.noreply.github.com> Date: Mon, 4 Nov 2024 14:56:07 +0800 Subject: [PATCH 2/3] fix pydantic dependency (#3715) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * fix pydantic dependency pydantic>=2.0时,str不能为None * remove extra space --- setup.py | 1 + 1 file changed, 1 insertion(+) diff --git a/setup.py b/setup.py index 48c684855..927f7edb6 100644 --- a/setup.py +++ b/setup.py @@ -59,6 +59,7 @@ base = [ "paddlespeech_feat", "praatio>=5.0.0, <=5.1.1", "prettytable", + "pydantic>=1.10.14, <2.0", "pypinyin<=0.44.0", "pypinyin-dict", "python-dateutil", From d5b0020e9a492abb96286590316044d5a8b9417f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=BC=A0=E6=98=A5=E4=B9=94?= <83450930+Liyulingyue@users.noreply.github.com> Date: Mon, 4 Nov 2024 17:48:23 +0800 Subject: [PATCH 3/3] =?UTF-8?q?Fix=20missing=20=E2=80=99=20(#3869)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- demos/speech_ssl/README_cn.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/demos/speech_ssl/README_cn.md b/demos/speech_ssl/README_cn.md index a18c778a7..5b209419a 100644 --- a/demos/speech_ssl/README_cn.md +++ b/demos/speech_ssl/README_cn.md @@ -56,7 +56,7 @@ wget -c https://paddlespeech.bj.bcebos.com/PaddleAudio/en.wav # 识别文本 text = ssl_executor( - model='wav2vec2, + model='wav2vec2', task='asr', lang='en', sample_rate=16000,