Merge branch 'dev_gzf_funasr2' of github.com:alibaba-damo-academy/FunASR into dev_gzf_funasr2

add
2025-09-15 14:48:36 +08:00 · 2023-12-27 23:05:49 +08:00 · 2023-12-27 23:05:49 +08:00 · fddb28f026
commit fddb28f026
parent ccb9488954 840657e54e
9 changed files with 45 additions and 18 deletions
--- a/examples/industrial_data_pretraining/contextual_paraformer/demo.py
+++ b/examples/industrial_data_pretraining/contextual_paraformer/demo.py
@ -0,0 +1,12 @@
+#!/usr/bin/env python3
+# -*- encoding: utf-8 -*-
+# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
+#  MIT License  (https://opensource.org/licenses/MIT)
+
+from funasr import AutoModel
+
+model_path = "../modelscope_models/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404"  # local model directory
+wav_path = "../modelscope_models/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404/example/asr_example.wav"  # example audio inside it
+model = AutoModel(model=model_path)
+res = model(input=wav_path, hotword='达魔院 魔搭')
+print(res)
--- a/examples/industrial_data_pretraining/neat_contextual_paraformer/infer.sh
+++ b/examples/industrial_data_pretraining/neat_contextual_paraformer/infer.sh
@ -1,6 +1,6 @@

 # download model
-local_path_root=./modelscope_models
+local_path_root=../modelscope_models
 mkdir -p ${local_path_root}
 local_path=${local_path_root}/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404
 git clone https://www.modelscope.cn/damo/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404.git ${local_path}
--- a/examples/industrial_data_pretraining/neat_contextual_paraformer/demo.py
+++ b/examples/industrial_data_pretraining/neat_contextual_paraformer/demo.py
@ -1,12 +0,0 @@
-#!/usr/bin/env python3
-# -*- encoding: utf-8 -*-
-# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
-#  MIT License  (https://opensource.org/licenses/MIT)
-
-from funasr import AutoModel
-
-model = AutoModel(model="/Users/zhifu/Downloads/modelscope_models/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404")
-
-res = model(input="/Users/zhifu/Downloads/modelscope_models/speech_paraformer-large-contextual_asr_nat-zh-cn-16k-common-vocab8404/example/asr_example.wav",
-            hotword='达魔院 魔搭')
-print(res)
--- a/examples/industrial_data_pretraining/seaco_paraformer/demo.py
+++ b/examples/industrial_data_pretraining/seaco_paraformer/demo.py
@ -0,0 +1,12 @@
+#!/usr/bin/env python3
+# -*- encoding: utf-8 -*-
+# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
+#  MIT License  (https://opensource.org/licenses/MIT)
+
+from funasr import AutoModel
+
+# Directory that infer.sh (same example folder) clones the SeACo-Paraformer repository into.
+model_dir = "../modelscope_models/speech_seaco_paraformer_large_asr_nat-zh-cn-16k-common-vocab8404-pytorch"
+model = AutoModel(model=model_dir)
+res = model(input=f"{model_dir}/example/asr_example.wav", hotword='达魔院 魔搭')
+print(res)
--- a/examples/industrial_data_pretraining/seaco_paraformer/infer.sh
+++ b/examples/industrial_data_pretraining/seaco_paraformer/infer.sh
@ -0,0 +1,15 @
+
+# download the SeACo-Paraformer model into a directory named after its own repository
+local_path_root=../modelscope_models
+mkdir -p "${local_path_root}"
+local_path=${local_path_root}/speech_seaco_paraformer_large_asr_nat-zh-cn-16k-common-vocab8404-pytorch
+git clone https://www.modelscope.cn/damo/speech_seaco_paraformer_large_asr_nat-zh-cn-16k-common-vocab8404-pytorch.git "${local_path}"
+
+# run inference on the example audio shipped in the cloned repository, on CPU, with a hotword string
+python funasr/bin/inference.py \
+model="${local_path}" \
+input="${local_path}/example/asr_example.wav" \
+output_dir="./outputs/debug" \
+device="cpu" \
+"hotword='达魔院 魔搭'"
+
--- a/funasr/models/neat_contextual_paraformer/__init__.py
+++ b/funasr/models/neat_contextual_paraformer/__init__.py
--- a/funasr/models/neat_contextual_paraformer/decoder.py
+++ b/funasr/models/neat_contextual_paraformer/decoder.py
--- a/funasr/models/neat_contextual_paraformer/model.py
+++ b/funasr/models/neat_contextual_paraformer/model.py
@ -55,12 +55,12 @@ from funasr.models.paraformer.model import Paraformer

 from funasr.register import tables

-@tables.register("model_classes", "NeatContextualParaformer")
-class NeatContextualParaformer(Paraformer):
+@tables.register("model_classes", "ContextualParaformer")
+class ContextualParaformer(Paraformer):
 	"""
 	Author: Speech Lab of DAMO Academy, Alibaba Group
-	Paraformer: Fast and Accurate Parallel Transformer for Non-autoregressive End-to-End Speech Recognition
-	https://arxiv.org/abs/2206.08317
+	FunASR: A Fundamental End-to-End Speech Recognition Toolkit
+	https://arxiv.org/abs/2305.11013
 	"""
 	
 	def __init__(
--- a/funasr/models/neat_contextual_paraformer/template.yaml
+++ b/funasr/models/neat_contextual_paraformer/template.yaml
@ -6,7 +6,7 @@
 # tables.print()

 # network architecture
-model: NeatContextualParaformer
+model: ContextualParaformer
 model_conf:
    ctc_weight: 0.0
    lsm_weight: 0.1