This commit is contained in:
shixian.shi 2023-06-27 19:13:02 +08:00
parent 35ea75e9e5
commit 79ec916cab

View File

@ -58,7 +58,7 @@ def tokenize(data,
# enable preset hotword detection during sampling
pre_index = None
for hw in hw_config['pre_hwlist']:
hw = " ".join(seg_tokenize(hw))
hw = " ".join(seg_tokenize(hw, seg_dict))
_find = text.find(hw)
if _find != -1:
_find = text[:_find].count(" ") # bpe sometimes