diff --git a/funasr/bin/train_ds.py b/funasr/bin/train_ds.py
index 415904ed3..69c2712fe 100644
--- a/funasr/bin/train_ds.py
+++ b/funasr/bin/train_ds.py
@@ -81,7 +81,12 @@ def main(**kwargs):
         deepspeed.init_distributed(dist_backend=kwargs.get("backend", "nccl"))
     elif use_ddp or use_fsdp:
         logging.info(f"use_ddp: {use_ddp}, use_fsdp: {use_fsdp}")
-        dist.init_process_group(backend=kwargs.get("backend", "nccl"), init_method="env://")
+        # `find_unused_parameters` is a DistributedDataParallel constructor option;
+        # init_process_group() does not accept it, so it must not be passed here.
+        dist.init_process_group(
+            backend=kwargs.get("backend", "nccl"),
+            init_method="env://",
+        )
         torch.cuda.set_device(local_rank)
 
     # rank = dist.get_rank()
diff --git a/funasr/version.txt b/funasr/version.txt
index db1527897..a5e428299 100644
--- a/funasr/version.txt
+++ b/funasr/version.txt
@@ -1 +1 @@
-1.1.8
\ No newline at end of file
+1.1.9
\ No newline at end of file