diff --git a/paddlespeech/t2s/models/diffsinger/diffsinger_updater.py b/paddlespeech/t2s/models/diffsinger/diffsinger_updater.py index 5321d1061..9d2924ef3 100644 --- a/paddlespeech/t2s/models/diffsinger/diffsinger_updater.py +++ b/paddlespeech/t2s/models/diffsinger/diffsinger_updater.py @@ -210,7 +210,7 @@ class DiffSingerEvaluator(StandardEvaluator): spk_id = None # Here show diffsinger eval - mel, mel_masks = self.model( + mel, mel_ref, mel_masks = self.model( text=batch["text"], note=batch["note"], note_dur=batch["note_dur"], @@ -226,9 +226,10 @@ class DiffSingerEvaluator(StandardEvaluator): train_fs2=False, ) mel = mel.transpose((0, 2, 1)) + mel_ref = mel_ref.transpose((0, 2, 1)) mel_masks = mel_masks.transpose((0, 2, 1)) l1_loss_ds = self.criterion_ds( - ref_mels=batch["speech"], + ref_mels=mel_ref, out_mels=mel, mel_masks=mel_masks, ) loss_ds = l1_loss_ds