Merge pull request #1161 from alibaba-damo-academy/dev_lhn

fix loss normalization for ddp training
2025-09-15 14:48:36 +08:00 · 2023-12-08 16:43:48 +08:00 · 2023-12-08 16:43:48 +08:00 · 202ab8a2c9
commit 202ab8a2c9
parent aab1fcd6b6 ace42e5043
1 changed files with 1 additions and 1 deletions
--- a/funasr/models/e2e_uni_asr.py
+++ b/funasr/models/e2e_uni_asr.py
@ -442,7 +442,7 @@ class UniASR(FunASRModel):
        stats["loss"] = torch.clone(loss.detach())
        # force_gatherable: to-device and to-tensor if scalar for DataParallel
        if self.length_normalized_loss:
-            batch_size = (text_lengths + 1).sum().type_as(batch_size)
+            batch_size = int((text_lengths + 1).sum())
        loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
        return loss, stats, weight