diff --git a/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py b/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py index c6ff1f547..a2bcd390a 100644 --- a/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py +++ b/egs/mars/sd/scripts/real_meeting_process/dump_real_meeting_chunks.py @@ -26,6 +26,7 @@ def calc_rand_ivc(spk, spk2utt, utt2ivc, utt2frames, total_len=3000): short_spk_list.append(spk) ivc_list = [kaldiio.load_mat(utt2ivc[utt]) for utt in utt_list] + ivc_list = [x/np.linalg.norm(x, axis=-1) for x in ivc_list] ivc = np.concatenate(ivc_list, axis=0) ivc = np.mean(ivc, axis=0, keepdims=False) return ivc diff --git a/egs/mars/sd/scripts/simu_chunk_with_labels.py b/egs/mars/sd/scripts/simu_chunk_with_labels.py index 3f9fe1e9e..226784bff 100644 --- a/egs/mars/sd/scripts/simu_chunk_with_labels.py +++ b/egs/mars/sd/scripts/simu_chunk_with_labels.py @@ -103,6 +103,8 @@ def calculate_embedding(spk, spk2utts, utt2xvec, embedding_dim, average_emb_num) xvec_list = [kaldiio.load_mat(utt2xvec[utt]) for utt in utt_list] else: xvec_list = [kaldiio.load_mat(utt2xvec[utt]) for utt in random.sample(utt_list, average_emb_num)] + # TODO: rerun the simulation + xvec_list = [x / np.linalg.norm(x, axis=-1) for x in xvec_list] xvec = np.mean(np.concatenate(xvec_list, axis=0), axis=0) return xvec