From ac00b7deee093773ee2f42f2694746dfbbd8163f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=98=89=E6=B8=8A?= Date: Thu, 15 Jun 2023 16:53:26 +0800 Subject: [PATCH] update repo --- funasr/build_utils/build_diar_model.py | 14 +++++++++----- 1 file changed, 9 insertions(+), 5 deletions(-) diff --git a/funasr/build_utils/build_diar_model.py b/funasr/build_utils/build_diar_model.py index 640640484..d21df8546 100644 --- a/funasr/build_utils/build_diar_model.py +++ b/funasr/build_utils/build_diar_model.py @@ -178,14 +178,18 @@ class_choices_list = [ def build_diar_model(args): # token_list - if args.token_list is not None: - with open(args.token_list) as f: + if isinstance(args.token_list, str): + with open(args.token_list, encoding="utf-8") as f: token_list = [line.rstrip() for line in f] + + # Overwriting token_list to keep it as "portable". args.token_list = list(token_list) - vocab_size = len(token_list) - logging.info(f"Vocabulary size: {vocab_size}") + elif isinstance(args.token_list, (tuple, list)): + token_list = list(args.token_list) else: - vocab_size = None + raise RuntimeError("token_list must be str or list") + vocab_size = len(token_list) + logging.info(f"Vocabulary size: {vocab_size}") # frontend if args.input_size is None: