add extract token run_mode

2025-09-15 14:48:36 +08:00 · 2024-09-24 17:15:30 +08:00 · 2024-09-24 17:15:30 +08:00 · ce5b79d234
commit ce5b79d234
parent 1fb762d9be
1 changed file with 2 additions and 2 deletions
--- a/funasr/models/sense_voice/model_small.py
+++ b/funasr/models/sense_voice/model_small.py
@@ -2034,11 +2034,11 @@ class SenseVoiceL(nn.Module):
            lfr_n = frontend.lfr_n if hasattr(frontend, "lfr_n") else 1
            meta_data["batch_data_time"] = speech_lengths.sum().item() * frame_shift * lfr_n / 1000

-        speech = speech.to(device=kwargs["device"])[0, :, :]
+        speech = speech.to(device=kwargs["device"])
        speech_lengths = speech_lengths.to(device=kwargs["device"])

        (outs, ret_dict), out_lens = self.model.encoder(
-            speech.permute(0, 2, 1), speech_lengths,
+            speech, speech_lengths,
            only_extract_tokens=True
        )
        tokens = ret_dict["indices"]