|
|
@ -940,8 +940,6 @@ class StyleFastSpeech2Inference(FastSpeech2Inference):
|
|
|
|
Tensor
|
|
|
|
Tensor
|
|
|
|
Output sequence of features (L, odim).
|
|
|
|
Output sequence of features (L, odim).
|
|
|
|
"""
|
|
|
|
"""
|
|
|
|
if spk_id:
|
|
|
|
|
|
|
|
spk_id = paddle.to_tensor(spk_id)
|
|
|
|
|
|
|
|
normalized_mel, d_outs, p_outs, e_outs = self.acoustic_model.inference(
|
|
|
|
normalized_mel, d_outs, p_outs, e_outs = self.acoustic_model.inference(
|
|
|
|
text,
|
|
|
|
text,
|
|
|
|
durations=None,
|
|
|
|
durations=None,
|
|
|
|