Tighten PR scope to single-GPU training path fixes

2026-07-23 02:45:48 +08:00 · 2026-04-18 15:02:38 +08:00 · 2026-04-18 15:02:38 +08:00 · 43506a8a69
commit 43506a8a69
parent e8c53643e7
1 changed file with 16 additions and 22 deletions
--- a/GPT_SoVITS/s2_train_v3_lora.py
+++ b/GPT_SoVITS/s2_train_v3_lora.py
@@ -342,28 +342,22 @@ def train_and_evaluate(rank, epoch, hps, nets, optims, schedulers, scaler, loade

        global_step += 1
    if epoch % hps.train.save_every_epoch == 0 and rank == 0:
-        try:
-            if hps.train.if_save_latest == 0:
-                utils.save_checkpoint(
-                    net_g,
-                    optim_g,
-                    hps.train.learning_rate,
-                    epoch,
-                    os.path.join(save_root, "G_{}.pth".format(global_step)),
-                )
-            else:
-                utils.save_checkpoint(
-                    net_g,
-                    optim_g,
-                    hps.train.learning_rate,
-                    epoch,
-                    os.path.join(save_root, "G_{}.pth".format(233333333333)),
-                )
-        except Exception as e:
-            if logger is not None:
-                logger.warning(f"skip large checkpoint save due to error: {e}")
-            else:
-                print(f"skip large checkpoint save due to error: {e}")
+        if hps.train.if_save_latest == 0:
+            utils.save_checkpoint(
+                net_g,
+                optim_g,
+                hps.train.learning_rate,
+                epoch,
+                os.path.join(save_root, "G_{}.pth".format(global_step)),
+            )
+        else:
+            utils.save_checkpoint(
+                net_g,
+                optim_g,
+                hps.train.learning_rate,
+                epoch,
+                os.path.join(save_root, "G_{}.pth".format(233333333333)),
+            )
        if rank == 0 and hps.train.if_save_every_weights == True:
            if hasattr(net_g, "module"):
                ckpt = net_g.module.state_dict()