mirror of
https://github.com/modelscope/FunASR
synced 2025-09-15 14:48:36 +08:00
update
This commit is contained in:
parent
41481008e2
commit
bbea0265f1
@@ -59,7 +59,7 @@ def tokenize(data,
|
||||
pre_index = None
|
||||
for hw in hw_config['pre_hwlist']:
|
||||
hw = " ".join(seg_tokenize(hw, seg_dict))
|
||||
-_find = " ".join(text.find(hw))
|
||||
+_find = " ".join(text).find(hw)
|
||||
if _find != -1:
|
||||
_find = text[:_find].count(" ") # bpe sometimes
|
||||
pre_index = [_find, _find + max(hw.count(" "), 1)]
|
||||
|
||||
Loading…
Reference in New Issue
Block a user