From 31b4a9837a5836b809de276c1bc781dfa5b3189f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E5=BF=97=E6=B5=A9?=
Date: Thu, 23 Feb 2023 23:03:40 +0800
Subject: [PATCH] sond pipeline

Scale every matrix returned by kaldiio.load_mat to unit L2 norm along its
last axis before the matrices are concatenated and averaged, in both
calc_rand_ivc and calculate_embedding.

The norm is taken with keepdims=True so the division broadcasts row by row
for a matrix with any number of rows. Without it the (N,) norm vector only
lines up with an (N, D) matrix when N is 1 (or when N happens to equal D,
in which case the wrong axis is scaled without any error).
---
 .../sd/scripts/real_meeting_process/dump_real_meeting_chunks.py | 1 +
 egs/mars/sd/scripts/simu_chunk_with_labels.py                   | 2 ++
 2 files changed, 3 insertions(+)

diff --git a/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py b/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py
index c6ff1f547..a2bcd390a 100644
--- a/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py
+++ b/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py
@@ -26,6 +26,7 @@ def calc_rand_ivc(spk, spk2utt, utt2ivc, utt2frames, total_len=3000):
         short_spk_list.append(spk)
 
     ivc_list = [kaldiio.load_mat(utt2ivc[utt]) for utt in utt_list]
+    ivc_list = [x / np.linalg.norm(x, axis=-1, keepdims=True) for x in ivc_list]
     ivc = np.concatenate(ivc_list, axis=0)
     ivc = np.mean(ivc, axis=0, keepdims=False)
     return ivc
diff --git a/egs/mars/sd/scripts/simu_chunk_with_labels.py b/egs/mars/sd/scripts/simu_chunk_with_labels.py
index 3f9fe1e9e..226784bff 100644
--- a/egs/mars/sd/scripts/simu_chunk_with_labels.py
+++ b/egs/mars/sd/scripts/simu_chunk_with_labels.py
@@ -103,6 +103,8 @@ def calculate_embedding(spk, spk2utts, utt2xvec, embedding_dim, average_emb_num)
         xvec_list = [kaldiio.load_mat(utt2xvec[utt]) for utt in utt_list]
     else:
         xvec_list = [kaldiio.load_mat(utt2xvec[utt]) for utt in random.sample(utt_list, average_emb_num)]
+    # TODO: rerun the simulation
+    xvec_list = [x / np.linalg.norm(x, axis=-1, keepdims=True) for x in xvec_list]
     xvec = np.mean(np.concatenate(xvec_list, axis=0), axis=0)
 
     return xvec