Merge pull request #1161 from alibaba-damo-academy/dev_lhn

Fix loss normalization for DDP training
This commit is contained in:
hnluo 2023-12-08 16:43:48 +08:00 committed by GitHub
commit 202ab8a2c9
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -442,7 +442,7 @@ class UniASR(FunASRModel):
stats["loss"] = torch.clone(loss.detach())
# force_gatherable: to-device and to-tensor if scalar for DataParallel
if self.length_normalized_loss:
-batch_size = (text_lengths + 1).sum().type_as(batch_size)
+batch_size = int((text_lengths + 1).sum())
loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
return loss, stats, weight