mirror of
https://github.com/modelscope/FunASR
synced 2025-09-15 14:48:36 +08:00
Update wav_utils.py
Because the dictionary contains no uppercase letters, any uppercase letters in the annotated text cause the fine-tuning result to be "unk". To avoid this, the annotated text is now uniformly converted to lowercase when it is read.
This commit is contained in:
parent
5d4b0c3994
commit
1a39b6f981
@ -309,7 +309,7 @@ def filter_wav_text(data_dir, dataset):
|
||||
if len(parts) < 2:
|
||||
continue
|
||||
sample_name = parts[0]
|
||||
text_dict[sample_name] = " ".join(parts[1:])
|
||||
text_dict[sample_name] = " ".join(parts[1:]).lower()
|
||||
filter_count = 0
|
||||
with open(wav_file, "w") as f_wav, open(text_file, "w") as f_text:
|
||||
for sample_name, wav_path in wav_dict.items():
|
||||
|
||||
Loading…
Reference in New Issue
Block a user