From 310006dd60bf464c0fbeb2b81771eef53539f1c6 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=B8=B8=E9=9B=81?= Date: Sat, 8 Jun 2024 17:19:32 +0800 Subject: [PATCH] fix bug: build attention_mask as a per-token vector of ones instead of a single-element tensor holding the sequence length --- funasr/datasets/openai_datasets/datasets.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/funasr/datasets/openai_datasets/datasets.py b/funasr/datasets/openai_datasets/datasets.py index 0d12a1c4f..3bc6aa011 100644 --- a/funasr/datasets/openai_datasets/datasets.py +++ b/funasr/datasets/openai_datasets/datasets.py @@ -162,7 +162,7 @@ class OpenAIDataset(torch.utils.data.Dataset): if badcase_flag: continue input_ids = torch.tensor(input_ids, dtype=torch.int64) # [: self.max_token_length] - attention_mask = torch.tensor([len(input_ids)], dtype=torch.int32) + attention_mask = torch.tensor([1] * len(input_ids), dtype=torch.int32) labels = torch.tensor(labels, dtype=torch.int64) # [: self.max_token_length] fbank = speech[0, :, :]