mirror of
https://github.com/modelscope/FunASR
synced 2025-09-15 14:48:36 +08:00
update
This commit is contained in:
parent
dcc310e1a8
commit
b1857837dd
@ -309,6 +309,7 @@ class AutoModel:
|
|||||||
time_speech_total_per_sample = speech_lengths/16000
|
time_speech_total_per_sample = speech_lengths/16000
|
||||||
time_speech_total_all_samples += time_speech_total_per_sample
|
time_speech_total_all_samples += time_speech_total_per_sample
|
||||||
|
|
||||||
|
all_segments = []
|
||||||
for j, _ in enumerate(range(0, n)):
|
for j, _ in enumerate(range(0, n)):
|
||||||
batch_size_ms_cum += (sorted_data[j][0][1] - sorted_data[j][0][0])
|
batch_size_ms_cum += (sorted_data[j][0][1] - sorted_data[j][0][0])
|
||||||
if j < n - 1 and (
|
if j < n - 1 and (
|
||||||
@ -320,7 +321,7 @@ class AutoModel:
|
|||||||
speech_j, speech_lengths_j = slice_padding_audio_samples(speech, speech_lengths, sorted_data[beg_idx:end_idx])
|
speech_j, speech_lengths_j = slice_padding_audio_samples(speech, speech_lengths, sorted_data[beg_idx:end_idx])
|
||||||
results = self.inference(speech_j, input_len=None, model=model, kwargs=kwargs, **cfg)
|
results = self.inference(speech_j, input_len=None, model=model, kwargs=kwargs, **cfg)
|
||||||
if self.spk_model is not None:
|
if self.spk_model is not None:
|
||||||
all_segments = []
|
|
||||||
# compose vad segments: [[start_time_sec, end_time_sec, speech], [...]]
|
# compose vad segments: [[start_time_sec, end_time_sec, speech], [...]]
|
||||||
for _b in range(len(speech_j)):
|
for _b in range(len(speech_j)):
|
||||||
vad_segments = [[sorted_data[beg_idx:end_idx][_b][0][0]/1000.0, \
|
vad_segments = [[sorted_data[beg_idx:end_idx][_b][0][0]/1000.0, \
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user