mirror of
https://github.com/FunAudioLLM/SenseVoice.git
synced 2025-09-15 15:08:35 +08:00
add postprocess for sensevoice
This commit is contained in:
parent
771252c097
commit
831cd02798
@ -118,6 +118,7 @@ print(res)
|
||||
|
||||
```python
|
||||
from funasr import AutoModel
|
||||
from funasr.utils.postprocess_utils import rich_transcription_postprocess
|
||||
|
||||
model_dir = "iic/SenseVoiceSmall"
|
||||
input_file = (
|
||||
@ -137,7 +138,9 @@ res = model.generate(
|
||||
batch_size_s=0,
|
||||
)
|
||||
|
||||
print(res)
|
||||
text = rich_transcription_postprocess(res[0]["text"])
|
||||
|
||||
print(text)
|
||||
```
|
||||
|
||||
The funasr version integrates a VAD (Voice Activity Detection) model and therefore supports audio input of any duration; `batch_size_s` is specified in seconds.
|
||||
|
||||
@ -118,6 +118,7 @@ print(res)
|
||||
|
||||
```python
|
||||
from funasr import AutoModel
|
||||
from funasr.utils.postprocess_utils import rich_transcription_postprocess
|
||||
|
||||
model_dir = "iic/SenseVoiceSmall"
|
||||
input_file = (
|
||||
@ -137,7 +138,9 @@ res = model.generate(
|
||||
batch_size_s=0,
|
||||
)
|
||||
|
||||
print(res)
|
||||
text = rich_transcription_postprocess(res[0]["text"])
|
||||
|
||||
print(text)
|
||||
```
|
||||
|
||||
funasr版本已经集成了vad模型,支持任意时长音频输入,`batch_size_s`单位为秒。
|
||||
|
||||
@ -4,6 +4,7 @@
|
||||
# MIT License (https://opensource.org/licenses/MIT)
|
||||
|
||||
from funasr import AutoModel
|
||||
from funasr.utils.postprocess_utils import rich_transcription_postprocess
|
||||
|
||||
model_dir = "iic/SenseVoiceSmall"
|
||||
input_file = (
|
||||
@ -22,4 +23,6 @@ res = model.generate(
|
||||
use_itn=False,
|
||||
)
|
||||
|
||||
print(res)
|
||||
text = rich_transcription_postprocess(res[0]["text"])
|
||||
|
||||
print(text)
|
||||
|
||||
Loading…
Reference in New Issue
Block a user