From 2a8d041806df41fa3719505d1b3379bbbd369574 Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Sat, 08 Jun 2024 21:35:21 +0800
Subject: [PATCH] train: fix epoch loop upper bound; reset data-split index and running train metrics each epoch

---
 funasr/bin/train.py |    5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/funasr/bin/train.py b/funasr/bin/train.py
index d20915c..c3556d1 100644
--- a/funasr/bin/train.py
+++ b/funasr/bin/train.py
@@ -198,7 +198,7 @@
         writer = None
 
     dataloader_tr, dataloader_val = None, None
-    for epoch in range(trainer.start_epoch, trainer.max_epoch + 1):
+    for epoch in range(trainer.start_epoch, trainer.max_epoch):
         time1 = time.perf_counter()
 
         for data_split_i in range(trainer.start_data_split_i, dataloader.data_split_num):
@@ -223,6 +223,7 @@
 
             torch.cuda.empty_cache()
 
+        trainer.start_data_split_i = 0
         trainer.validate_epoch(
             model=model, dataloader_val=dataloader_val, epoch=epoch + 1, writer=writer
         )
@@ -240,6 +241,8 @@
             f"estimated to finish {trainer.max_epoch} "
             f"epoch: {(trainer.max_epoch - epoch) * time_escaped:.3f} hours\n"
         )
+        trainer.train_acc_avg = 0.0
+        trainer.train_loss_avg = 0.0
 
     if trainer.rank == 0:
         average_checkpoints(trainer.output_dir, trainer.avg_nbest_model)

--
Gitblit v1.9.1