FunASR/funasr/datasets/small_datasets/build_loader.py
speech_asr 9f90bad3f5 update
2023-04-17 17:11:05 +08:00

17 lines
692 B
Python

import torch
from funasr.datasets.small_datasets.dataset import ESPnetDataset
from funasr.datasets.small_datasets.build_preprocess import build_preprocess
def build_dataloader(args):
    """Construct the small-dataset ``ESPnetDataset`` from training arguments.

    Args:
        args: Configuration object. This function reads
            ``args.frontend_conf`` (``None``, or a container that may hold
            the destination sample rate under the key ``"fs"``) and
            ``args.train_dtype``.

    Returns:
        None. The dataset is constructed and bound to a local name only.
        NOTE(review): given the function name, a dataset or loader is
        presumably meant to be returned -- confirm the intended result.

    NOTE(review): ``iter_options`` is not a parameter, not a local, and not
    imported in the visible part of this module. Unless it is defined
    elsewhere at module level, the ``ESPnetDataset(...)`` call below raises
    ``NameError``. Confirm where these options are supposed to come from.
    """
    # Always bind ``dest_sample_rate``. It used to be assigned only inside an
    # ``if args.frontend_conf is not None:`` branch, so a missing frontend
    # config led to UnboundLocalError instead of the 16000 fallback.
    frontend_conf = args.frontend_conf
    if frontend_conf is not None and "fs" in frontend_conf:
        dest_sample_rate = frontend_conf["fs"]
    else:
        dest_sample_rate = 16000

    preprocess_fn = build_preprocess()

    # NOTE(review): ``iter_options`` is unresolved here (see docstring).
    dataset = ESPnetDataset(
        iter_options.data_path_and_name_and_type,
        float_dtype=args.train_dtype,
        preprocess=preprocess_fn,
        max_cache_size=iter_options.max_cache_size,
        max_cache_fd=iter_options.max_cache_fd,
        dest_sample_rate=dest_sample_rate,
    )