mirror of
https://github.com/modelscope/FunASR
synced 2025-09-15 14:48:36 +08:00
25 lines
1.1 KiB
Python
25 lines
1.1 KiB
Python
import os
|
|
import argparse
|
|
|
|
if __name__ == '__main__':
|
|
parser = argparse.ArgumentParser()
|
|
parser.add_argument("--root_path", type=str)
|
|
parser.add_argument("--out_path", type=str)
|
|
parser.add_argument("--split_num", type=int, default=64)
|
|
args = parser.parse_args()
|
|
root_path = args.root_path
|
|
out_path = args.out_path
|
|
split_num = args.split_num
|
|
|
|
with open(os.path.join(out_path, "feats.scp"), "w") as out_f:
|
|
for i in range(split_num):
|
|
idx = str(i + 1)
|
|
feature_file = os.path.join(root_path, "feature.scp.{}".format(idx))
|
|
label_file = os.path.join(root_path, "label.scp.{}".format(idx))
|
|
with open(feature_file) as ff, open(label_file) as fl:
|
|
ff_lines = ff.readlines()
|
|
fl_lines = fl.readlines()
|
|
for ff_line, fl_line in zip(ff_lines, fl_lines):
|
|
sample_name, f_path = ff_line.strip().split()
|
|
_, l_path = fl_line.strip().split()
|
|
out_f.write("{} {} {}\n".format(sample_name, f_path, l_path)) |