diff --git a/paddlespeech/cli/whisper/infer.py b/paddlespeech/cli/whisper/infer.py index a739487fd..7056e7f94 100644 --- a/paddlespeech/cli/whisper/infer.py +++ b/paddlespeech/cli/whisper/infer.py @@ -140,7 +140,7 @@ class WhisperExecutor(BaseExecutor): model_type: str='whisper', lang: str='', task: str='transcribe', - size: str='large', + size: str='turbo', language: str='None', sample_rate: int=16000, cfg_path: Optional[os.PathLike]=None, diff --git a/paddlespeech/resource/pretrained_models.py b/paddlespeech/resource/pretrained_models.py index 50ad5f311..c5285a875 100644 --- a/paddlespeech/resource/pretrained_models.py +++ b/paddlespeech/resource/pretrained_models.py @@ -939,9 +939,9 @@ whisper_dynamic_pretrained_models = { 'params': 'whisper-turbo-model.pdparams', 'resource_data': - 'https://paddlespeech.cdn.bcebos.com/whisper/whisper_model_20221108/assets.tar', + 'https://paddlespeech.bj.bcebos.com/whisper/whisper_model_20250825/assets.tar', 'resource_data_md5': - '37a0a8abdb3641a51194f79567a93b61', + 'dd61d092d362f1fdbae6ede08282e177', }, }, } diff --git a/paddlespeech/s2t/models/whisper/whisper.py b/paddlespeech/s2t/models/whisper/whisper.py index dc38eca4d..9914d0dd8 100644 --- a/paddlespeech/s2t/models/whisper/whisper.py +++ b/paddlespeech/s2t/models/whisper/whisper.py @@ -1557,7 +1557,7 @@ def hann_window(n_fft: int=N_FFT): """ return paddle.to_tensor( [0.5 - 0.5 * np.cos(2 * np.pi * n / n_fft) for n in range(n_fft)], - dtype=paddle.float32) + dtype="float32") @lru_cache(maxsize=None)