From 43af70b129ab49c9f34268bba49857ed1a2bd3f8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=BF=97=E6=B5=A9?= Date: Tue, 24 Sep 2024 20:09:30 +0800 Subject: [PATCH] add support for a mixture of kaldi_ark or sound --- funasr/utils/load_utils.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/funasr/utils/load_utils.py b/funasr/utils/load_utils.py index 5ccd2161d..868f00229 100644 --- a/funasr/utils/load_utils.py +++ b/funasr/utils/load_utils.py @@ -114,6 +114,9 @@ def load_audio_text_image_video( elif isinstance(data_or_path_or_list, np.ndarray): # audio sample point data_or_path_or_list = torch.from_numpy(data_or_path_or_list).squeeze() # [n_samples,] elif isinstance(data_or_path_or_list, str) and data_type in ["kaldi_ark", "kaldi_ark_or_sound"]: + if len(data_or_path_or_list.split()) == 2: + data_or_path_or_list, audio_fs = data_or_path_or_list.split() + audio_fs = int(audio_fs) data_mat = kaldiio.load_mat(data_or_path_or_list) if isinstance(data_mat, tuple): audio_fs, mat = data_mat