From b1857837dd5873a8308eb770c50f4fc4c8eab752 Mon Sep 17 00:00:00 2001 From: "shixian.shi" Date: Wed, 17 Jan 2024 16:47:41 +0800 Subject: [PATCH] update --- funasr/auto/auto_model.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/funasr/auto/auto_model.py b/funasr/auto/auto_model.py index 0bc5e0eaf..740614c74 100644 --- a/funasr/auto/auto_model.py +++ b/funasr/auto/auto_model.py @@ -309,6 +309,7 @@ class AutoModel: time_speech_total_per_sample = speech_lengths/16000 time_speech_total_all_samples += time_speech_total_per_sample + all_segments = [] for j, _ in enumerate(range(0, n)): batch_size_ms_cum += (sorted_data[j][0][1] - sorted_data[j][0][0]) if j < n - 1 and ( @@ -320,7 +321,7 @@ class AutoModel: speech_j, speech_lengths_j = slice_padding_audio_samples(speech, speech_lengths, sorted_data[beg_idx:end_idx]) results = self.inference(speech_j, input_len=None, model=model, kwargs=kwargs, **cfg) if self.spk_model is not None: - all_segments = [] + # compose vad segments: [[start_time_sec, end_time_sec, speech], [...]] for _b in range(len(speech_j)): vad_segments = [[sorted_data[beg_idx:end_idx][_b][0][0]/1000.0, \