Update wav_utils.py

The dictionary contains no uppercase letters, so any uppercase letters in the annotated text cause the fine-tuning result to be "unk". To avoid this, the annotated text is now uniformly converted to lowercase when it is read.
This commit is contained in:
zhuzizyf 2023-03-03 10:33:51 +08:00 committed by GitHub
parent 5d4b0c3994
commit 1a39b6f981
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@ -309,7 +309,7 @@ def filter_wav_text(data_dir, dataset):
if len(parts) < 2:
continue
sample_name = parts[0]
text_dict[sample_name] = " ".join(parts[1:])
text_dict[sample_name] = " ".join(parts[1:]).lower()
filter_count = 0
with open(wav_file, "w") as f_wav, open(text_file, "w") as f_text:
for sample_name, wav_path in wav_dict.items():