From 414de3747c9ac9a7422dc45f0c945d135245de6f Mon Sep 17 00:00:00 2001 From: WongLaw Date: Thu, 20 Apr 2023 11:18:06 +0000 Subject: [PATCH 1/4] VITS learning rate revised, test=tts --- examples/csmsc/vits/conf/default.yaml | 2 +- paddlespeech/t2s/models/vits/vits_updater.py | 6 ++++-- 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/examples/csmsc/vits/conf/default.yaml b/examples/csmsc/vits/conf/default.yaml index a2aef998..e0572535 100644 --- a/examples/csmsc/vits/conf/default.yaml +++ b/examples/csmsc/vits/conf/default.yaml @@ -179,7 +179,7 @@ generator_first: False # whether to start updating generator first # OTHER TRAINING SETTING # ########################################################## num_snapshots: 10 # max number of snapshots to keep while training -train_max_steps: 350000 # Number of training steps. == total_iters / ngpus, total_iters = 1000000 +max_epoch: 1000 # Number of training epochs. save_interval_steps: 1000 # Interval steps to save checkpoint. eval_interval_steps: 250 # Interval steps to evaluate the network. 
seed: 777 # random seed number diff --git a/paddlespeech/t2s/models/vits/vits_updater.py b/paddlespeech/t2s/models/vits/vits_updater.py index 9f8be680..7926bb6a 100644 --- a/paddlespeech/t2s/models/vits/vits_updater.py +++ b/paddlespeech/t2s/models/vits/vits_updater.py @@ -166,7 +166,8 @@ class VITSUpdater(StandardUpdater): gen_loss.backward() self.optimizer_g.step() - self.scheduler_g.step() + if self.state.iteration % self.updates_per_epoch == 0: + self.scheduler_g.step() # reset cache if self.model.reuse_cache_gen or not self.model.training: @@ -202,7 +203,8 @@ class VITSUpdater(StandardUpdater): dis_loss.backward() self.optimizer_d.step() - self.scheduler_d.step() + if self.state.iteration % self.updates_per_epoch == 0: + self.scheduler_d.step() # reset cache if self.model.reuse_cache_dis or not self.model.training: From 47e31f46cb229676c81273596958ba8672a80fa7 Mon Sep 17 00:00:00 2001 From: WongLaw Date: Thu, 20 Apr 2023 11:34:20 +0000 Subject: [PATCH 2/4] VITS learning rate revised, test=tts --- paddlespeech/t2s/exps/vits/train.py | 2 +- paddlespeech/t2s/models/vits/vits_updater.py | 2 ++ 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/paddlespeech/t2s/exps/vits/train.py b/paddlespeech/t2s/exps/vits/train.py index 0e74bf63..8e166beb 100644 --- a/paddlespeech/t2s/exps/vits/train.py +++ b/paddlespeech/t2s/exps/vits/train.py @@ -231,7 +231,7 @@ def train_sp(args, config): trainer = Trainer( updater, - stop_trigger=(config.train_max_steps, "iteration"), + stop_trigger=(config.max_epoch, 'epoch'), out=output_dir) if dist.get_rank() == 0: diff --git a/paddlespeech/t2s/models/vits/vits_updater.py b/paddlespeech/t2s/models/vits/vits_updater.py index 7926bb6a..e61e617c 100644 --- a/paddlespeech/t2s/models/vits/vits_updater.py +++ b/paddlespeech/t2s/models/vits/vits_updater.py @@ -166,6 +166,7 @@ class VITSUpdater(StandardUpdater): gen_loss.backward() self.optimizer_g.step() + # learning rate updates on each epoch. 
if self.state.iteration % self.updates_per_epoch == 0: self.scheduler_g.step() @@ -203,6 +204,7 @@ class VITSUpdater(StandardUpdater): dis_loss.backward() self.optimizer_d.step() + # learning rate updates on each epoch. if self.state.iteration % self.updates_per_epoch == 0: self.scheduler_d.step() From fdeb9b88a79f5a2e297666f5eb0b9a3aec63ba76 Mon Sep 17 00:00:00 2001 From: WongLaw Date: Mon, 24 Apr 2023 03:01:10 +0000 Subject: [PATCH 3/4] VITS learning rate revised, test=tts --- examples/csmsc/vits/conf/default.yaml | 2 +- paddlespeech/t2s/exps/vits/train.py | 6 ++---- 2 files changed, 3 insertions(+), 5 deletions(-) diff --git a/examples/csmsc/vits/conf/default.yaml b/examples/csmsc/vits/conf/default.yaml index e0572535..a897569a 100644 --- a/examples/csmsc/vits/conf/default.yaml +++ b/examples/csmsc/vits/conf/default.yaml @@ -180,6 +180,6 @@ generator_first: False # whether to start updating generator first ########################################################## num_snapshots: 10 # max number of snapshots to keep while training max_epoch: 1000 # Number of training epochs. -save_interval_steps: 1000 # Interval steps to save checkpoint. +save_interval_epochs: 1 # Interval epochs to save checkpoint. eval_interval_steps: 250 # Interval steps to evaluate the network. 
seed: 777 # random seed number diff --git a/paddlespeech/t2s/exps/vits/train.py b/paddlespeech/t2s/exps/vits/train.py index 8e166beb..fefa6a01 100644 --- a/paddlespeech/t2s/exps/vits/train.py +++ b/paddlespeech/t2s/exps/vits/train.py @@ -230,9 +230,7 @@ def train_sp(args, config): output_dir=output_dir) trainer = Trainer( - updater, - stop_trigger=(config.max_epoch, 'epoch'), - out=output_dir) + updater, stop_trigger=(config.max_epoch, 'epoch'), out=output_dir) if dist.get_rank() == 0: trainer.extend( @@ -240,7 +238,7 @@ def train_sp(args, config): trainer.extend(VisualDL(output_dir), trigger=(1, 'iteration')) trainer.extend( Snapshot(max_size=config.num_snapshots), - trigger=(config.save_interval_steps, 'iteration')) + trigger=(config.save_interval_epochs, 'epoch')) print("Trainer Done!") trainer.run() From 305375c310680e59980bcc3302ebdfca7a292642 Mon Sep 17 00:00:00 2001 From: WongLaw Date: Mon, 24 Apr 2023 03:15:02 +0000 Subject: [PATCH 4/4] VITS learning rate revised, test=tts --- examples/csmsc/vits/conf/default.yaml | 2 +- paddlespeech/t2s/exps/vits/train.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/csmsc/vits/conf/default.yaml b/examples/csmsc/vits/conf/default.yaml index a897569a..7e9e9c1d 100644 --- a/examples/csmsc/vits/conf/default.yaml +++ b/examples/csmsc/vits/conf/default.yaml @@ -181,5 +181,5 @@ generator_first: False # whether to start updating generator first num_snapshots: 10 # max number of snapshots to keep while training max_epoch: 1000 # Number of training epochs. save_interval_epochs: 1 # Interval epochs to save checkpoint. -eval_interval_steps: 250 # Interval steps to evaluate the network. +eval_interval_epochs: 1 # Interval epochs to evaluate the network. 
seed: 777 # random seed number diff --git a/paddlespeech/t2s/exps/vits/train.py b/paddlespeech/t2s/exps/vits/train.py index fefa6a01..cdfd3003 100644 --- a/paddlespeech/t2s/exps/vits/train.py +++ b/paddlespeech/t2s/exps/vits/train.py @@ -234,7 +234,7 @@ def train_sp(args, config): if dist.get_rank() == 0: trainer.extend( - evaluator, trigger=(config.eval_interval_steps, 'iteration')) + evaluator, trigger=(config.eval_interval_epochs, 'epoch')) trainer.extend(VisualDL(output_dir), trigger=(1, 'iteration')) trainer.extend( Snapshot(max_size=config.num_snapshots),