@ -146,7 +146,7 @@ class DeepSpeech2Trainer(Trainer):
learning_rate=config.training.lr,
gamma=config.training.lr_decay,
verbose=True)
optimizer = paddle.optimizer.SGD( #Adam
optimizer = paddle.optimizer.Adam(
learning_rate=lr_scheduler,
parameters=model.parameters(),
weight_decay=paddle.regularizer.L2Decay(
@ -30,6 +30,4 @@ class Conv2dSubsampling4Online(Conv2dSubsampling4):
#b, c, t, f = paddle.shape(x) #not work under jit
x = x.transpose([0, 2, 1, 3]).reshape([0, 0, -1])
# Length after two successive reductions, each mapping len -> (len - 1) // 2.
x_len = ((x_len - 1) // 2 - 1) // 2
# Clamp any negative result to 0. zeros_like must receive the tensor itself
# (not its shape list); it also keeps x_len's dtype, so both value operands
# given to paddle.where have the same dtype.
x_len = paddle.where(x_len >= 0, x_len, paddle.zeros_like(x_len))
return x, x_len