# Patch summary (WenetSpeech conformer recipe; two files are touched):
#   egs/wenetspeech/conformer/local/data.sh
#     - adds an empty `WENETSPEECH=` default after `data_dir="data"` and before
#       the `. utils/parse_options.sh` line (presumably so the path can be
#       supplied as `--WENETSPEECH <dir>` -- confirm against parse_options.sh);
#     - removes the sourcing of ./path.sh, ./cmd.sh and ./db.sh;
#     - removes the `[ ! -e "${WENETSPEECH}" ]` guard and its two log messages.
#   egs/wenetspeech/conformer/run.sh
#     - stage 0 now calls local/data.sh with separate words
#       (--set, --nj 64, --data_dir, --WENETSPEECH) instead of the single
#       quoted argument "--set ${set}".
# NOTE(review): the added run.sh call leaves ${set}, $feats_dir and $raw_data
#   unquoted, so values containing whitespace or glob characters would be
#   word-split; consider quoting each expansion.
# NOTE(review): the remaining check in data.sh joins its two tests with `&&`,
#   so it only reports an error when BOTH the audio directory and
#   WenetSpeech.json are missing -- confirm `||` was not intended.
# NOTE(review): with the `-e` guard gone and the default empty, an unset
#   WENETSPEECH makes that check test "/audio" and "/WenetSpeech.json".
# NOTE(review): `--nj 64` is passed, but no `nj` default is visible in this
#   hunk -- verify data.sh declares it before parse_options.sh is sourced.
# NOTE(review): in this view the patch text sits on one physical line; the
#   original line breaks and indentation are not recoverable from here, so the
#   patch body below is left exactly as found.
diff --git a/egs/wenetspeech/conformer/local/data.sh b/egs/wenetspeech/conformer/local/data.sh index dcfba5f58..d5c548f40 100755 --- a/egs/wenetspeech/conformer/local/data.sh +++ b/egs/wenetspeech/conformer/local/data.sh @@ -17,20 +17,11 @@ stage=1 stop_stage=100 set=L data_dir="data" +WENETSPEECH= log "$0 $*" . utils/parse_options.sh -. ./path.sh || exit 1; -. ./cmd.sh || exit 1; -. ./db.sh || exit 1; - -if [ ! -e "${WENETSPEECH}" ]; then - log "Fill the value of 'WENETSPEECH' of db.sh" - log "or download the data set follwing the instruction in https://wenet-e2e.github.io/WenetSpeech/" - exit 1 -fi - if [ ! -d "${WENETSPEECH}/audio" ] && [ ! -f "${WENETSPEECH}/WenetSpeech.json" ]; then echo "Valid WENETSPEECH data not found in ${WENETSPEECH}." echo "Please follow the instruction in https://wenet-e2e.github.io/WenetSpeech/" diff --git a/egs/wenetspeech/conformer/run.sh b/egs/wenetspeech/conformer/run.sh index 0945e668d..bf0dc1f9a 100644 --- a/egs/wenetspeech/conformer/run.sh +++ b/egs/wenetspeech/conformer/run.sh @@ -72,7 +72,7 @@ fi if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then echo "stage 0: Data preparation" # Data preparation - local/data.sh "--set ${set}" + local/data.sh --set ${set} --nj 64 --data_dir $feats_dir --WENETSPEECH $raw_data # mkdir $feats_dir/data # mv $feats_dir/$train_set $feats_dir/data/$train_set # for x in $test_sets; do