diff --git a/funasr/models/e2e_asr_paraformer.py b/funasr/models/e2e_asr_paraformer.py index ef8c0ca2e..cc6f54ba0 100644 --- a/funasr/models/e2e_asr_paraformer.py +++ b/funasr/models/e2e_asr_paraformer.py @@ -906,9 +906,9 @@ class ParaformerBert(Paraformer): self.step_cur += 1 # for data-parallel text = text[:, : text_lengths.max()] - speech = speech[:, :speech_lengths.max(), :] + speech = speech[:, :speech_lengths.max()] if embed is not None: - embed = embed[:, :embed_lengths.max(), :] + embed = embed[:, :embed_lengths.max()] # 1. Encoder encoder_out, encoder_out_lens = self.encode(speech, speech_lengths)