Merge pull request #403 from alibaba-damo-academy/dev_lhn

update data filtering recipe
This commit is contained in:
zhifu gao 2023-04-23 15:06:15 +08:00 committed by GitHub
commit b58f412eac
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -299,7 +299,7 @@ def filter_wav_text(data_dir, dataset):
wav_dict = {}
for line in wav_lines:
parts = line.strip().split()
-if len(parts) < 2:
+if len(parts) != 2:
continue
sample_name, wav_path = parts
wav_dict[sample_name] = wav_path