From 4152cf4615e234b9892703a8e088cdd51937fc13 Mon Sep 17 00:00:00 2001
From: haoneng.lhn <haoneng.lhn@alibaba-inc.com>
Date: Thu, 07 Dec 2023 14:49:34 +0800
Subject: [PATCH] fix loss normalization for ddp training

---
 funasr/models/e2e_asr.py |    3 +++
 1 file changed, 3 insertions(+), 0 deletions(-)

diff --git a/funasr/models/e2e_asr.py b/funasr/models/e2e_asr.py
index 79c5387..162bfba 100644
--- a/funasr/models/e2e_asr.py
+++ b/funasr/models/e2e_asr.py
@@ -122,6 +122,7 @@
             self.ctc = ctc
 
         self.extract_feats_in_collect_stats = extract_feats_in_collect_stats
+        self.length_normalized_loss = length_normalized_loss
 
     def forward(
             self,
@@ -220,6 +221,8 @@
         stats["loss"] = torch.clone(loss.detach())
 
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
+        if self.length_normalized_loss:
+            batch_size = (text_lengths + 1).sum().type_as(batch_size)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
 

--
Gitblit v1.9.1