mirror of
https://github.com/modelscope/FunASR
synced 2025-09-15 14:48:36 +08:00
55 lines
1.3 KiB
Bash
Executable File
55 lines
1.3 KiB
Bash
Executable File
#!/usr/bin/env bash
|
|
|
|
. ./path.sh || exit 1;
|
|
# Begin configuration section.
|
|
nj=32
|
|
cmd=./utils/run.pl
|
|
|
|
# feature configuration
|
|
feats_dim=80
|
|
sample_frequency=16000
|
|
speed_perturb="1.0"
|
|
window_type="hamming"
|
|
max_lengths=1500
|
|
|
|
echo "$0 $@"
|
|
|
|
. utils/parse_options.sh || exit 1;
|
|
|
|
data=$1
|
|
logdir=$2
|
|
fbankdir=$3
|
|
|
|
[ ! -f $data/wav.scp ] && echo "$0: no such file $data/wav.scp" && exit 1;
|
|
[ ! -f $data/text ] && echo "$0: no such file $data/text" && exit 1;
|
|
|
|
python utils/split_data.py $data $data $nj
|
|
|
|
ark_dir=${fbankdir}/ark; mkdir -p ${ark_dir}
|
|
text_dir=${fbankdir}/txt; mkdir -p ${text_dir}
|
|
mkdir -p ${logdir}
|
|
|
|
$cmd JOB=1:$nj $logdir/make_fbank.JOB.log \
|
|
python utils/compute_fbank.py -w $data/split${nj}/JOB/wav.scp -t $data/split${nj}/JOB/text \
|
|
-d $feats_dim -s $sample_frequency -m ${max_lengths} -p ${speed_perturb} -a JOB -o ${fbankdir} \
|
|
--window-type ${window_type} \
|
|
|| exit 1;
|
|
|
|
for n in $(seq $nj); do
|
|
cat ${ark_dir}/feats.$n.scp || exit 1
|
|
done > $fbankdir/feats.scp || exit 1
|
|
|
|
for n in $(seq $nj); do
|
|
cat ${text_dir}/text.$n.txt || exit 1
|
|
done > $fbankdir/text || exit 1
|
|
|
|
for n in $(seq $nj); do
|
|
cat ${ark_dir}/len.$n || exit 1
|
|
done > $fbankdir/speech_shape || exit 1
|
|
|
|
for n in $(seq $nj); do
|
|
cat ${text_dir}/len.$n || exit 1
|
|
done > $fbankdir/text_shape || exit 1
|
|
|
|
echo "$0: Succeeded compute FBANK features"
|