From 7d825c42b1fb0399f681818cbb29c723dea1071f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E5=BC=A0=E6=98=A5=E4=B9=94?= <83450930+Liyulingyue@users.noreply.github.com>
Date: Wed, 6 Nov 2024 08:23:42 +0800
Subject: [PATCH] Apply suggestions from code review

---
 paddlespeech/s2t/models/wav2vec2/wav2vec2_ASR.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/paddlespeech/s2t/models/wav2vec2/wav2vec2_ASR.py b/paddlespeech/s2t/models/wav2vec2/wav2vec2_ASR.py
index b19d967e2..65a5f8e59 100755
--- a/paddlespeech/s2t/models/wav2vec2/wav2vec2_ASR.py
+++ b/paddlespeech/s2t/models/wav2vec2/wav2vec2_ASR.py
@@ -84,15 +84,18 @@ class Wav2vec2ASR(nn.Layer):
     def extract_features(self, wav):
         if self.normalize_wav:
             wav = F.layer_norm(wav, wav.shape[-1])
+
         # Extract wav2vec output
         out = self.wav2vec2(wav)[0]
         # We normalize the output if required
         if self.output_norm:
             out = F.layer_norm(out, out.shape[-1])
+
         if self.training and hasattr(self.config, 'spec_augment'):
             feats = self.spec_augment(out)
         else:
             feats = out
+
         return feats
 
     @paddle.no_grad()