Merge pull request #14 from alibaba-damo-academy/dev

wav
2025-09-15 14:48:36 +08:00 · 2022-12-12 21:32:36 +08:00 · 2022-12-12 21:32:36 +08:00 · 22f0bd8265
commit 22f0bd8265
parent 7817db2e20 aa340bc2c8
1 changed files with 3 additions and 3 deletions
--- a/funasr/bin/asr_inference_paraformer.py
+++ b/funasr/bin/asr_inference_paraformer.py
@@ -197,9 +197,9 @@ class Speech2Text:

        # data: (Nsamples,) -> (1, Nsamples)
        # lengths: (1,)
-        if len(speech.size()) < 3:
-            speech = speech.unsqueeze(0).to(getattr(torch, self.dtype))
-            speech_lengths = speech.new_full([1], dtype=torch.long, fill_value=speech.size(1))
+        # if len(speech.size()) < 3:
+        #     speech = speech.unsqueeze(0).to(getattr(torch, self.dtype))
+        #     speech_lengths = speech.new_full([1], dtype=torch.long, fill_value=speech.size(1))
        lfr_factor = max(1, (speech.size()[-1]//80)-1)
        
        batch = {"speech": speech, "speech_lengths": speech_lengths}