Fix CTC CUDA memcpy error

5 years ago · 8c4f60be09
parent 4dc75c40c9
commit 8c4f60be09
3 changed files with 7 additions and 6 deletions
--- a/examples/tiny/local/run_train.sh
+++ b/examples/tiny/local/run_train.sh
@@ -17,6 +17,7 @@ export FLAGS_sync_nccl_allreduce=0
 #CUDA_VISIBLE_DEVICES=0,1,2,3 \
 CUDA_VISIBLE_DEVICES=1,2,3 \
 python3 -u ${MAIN_ROOT}/train.py \
+--device 'gpu' \
 --nproc 1 \
 --config conf/deepspeech2.yaml \
 --output ckpt
--- a/model_utils/model.py
+++ b/model_utils/model.py
@@ -149,8 +149,8 @@ class DeepSpeech2Trainer(Trainer):
        self.logger.info("Setup model/optimizer/criterion!")

    def compute_losses(self, inputs, outputs):
-        _, texts, logits_len, texts_len = inputs
-        logits = outputs
+        _, texts, _, texts_len = inputs
+        logits, logits_len = outputs
        loss = self.criterion(logits, texts, logits_len, texts_len)
        return loss

--- a/model_utils/network.py
+++ b/model_utils/network.py
@@ -517,11 +517,11 @@ class DeepSpeech2(nn.Layer):
        #ctcdecoder need probs, not log_probs
        probs = F.softmax(logits)

-        return logits, probs
+        return logits, probs, audio_len

    @paddle.no_grad()
    def infer(self, audio, audio_len):
-        _, probs = self.predict(audio, audio_len)
+        _, probs, audio_len = self.predict(audio, audio_len)
        return probs

    def forward(self, audio, text, audio_len, text_len):
@@ -531,8 +531,8 @@ class DeepSpeech2(nn.Layer):
        audio_len: shape [B]
        text_len: shape [B]
        """
-        logits, _ = self.predict(audio, audio_len)
-        return logits
+        logits, _, audio_len = self.predict(audio, audio_len)
+        return logits, audio_len


 class DeepSpeech2Loss(nn.Layer):