#!/usr/bin/env bash
#
# compute_fbank.sh
#
# Splits a data directory into per-job shards, runs utils/compute_fbank.py on
# every shard through the job launcher in $cmd, and concatenates the per-job
# outputs into single index files.
#
# Usage:
#   compute_fbank.sh [options] <data-dir> <log-dir> <fbank-dir>
#
# Arguments:
#   <data-dir>   Must contain wav.scp and text. Shards are read from
#                <data-dir>/split<nj>/<job>/ (expected to be produced by
#                utils/split_data.py -- confirm against that script).
#   <log-dir>    Created if missing; passed to $cmd as
#                <log-dir>/make_fbank.JOB.log.
#   <fbank-dir>  Output root. Per-job files are read back from
#                <fbank-dir>/ark and <fbank-dir>/txt; the merged files
#                feats.scp, text, speech_shape and text_shape are written
#                directly into <fbank-dir>.
#
# Options:
#   The variables in the configuration section below are the script's
#   defaults; utils/parse_options.sh is sourced after them and is presumably
#   what lets callers override them from the command line (see that file).
#
# Exit status: 0 on success, 1 on any failure.
#
# NOTE: strict mode (set -euo pipefail) is intentionally not enabled here,
# because path.sh and utils/parse_options.sh are sourced into this shell and
# may not be written with -u / -e in mind.

. ./path.sh || exit 1

# Begin configuration section.
nj=32
cmd=./utils/run.pl
# feature configuration
feats_dim=80
sample_frequency=16000
speed_perturb="1.0"
window_type="hamming"
max_lengths=1500
# End configuration section.

# Log the full invocation ("$*" joins the arguments with spaces).
echo "$0 $*"

. utils/parse_options.sh || exit 1

# Extra positional arguments are tolerated (as before); too few is an error.
if [ $# -lt 3 ]; then
  echo "Usage: $0 [options] <data-dir> <log-dir> <fbank-dir>" >&2
  exit 1
fi

data=$1
logdir=$2
fbankdir=$3

if [ ! -f "$data/wav.scp" ]; then
  echo "$0: no such file $data/wav.scp" >&2
  exit 1
fi
if [ ! -f "$data/text" ]; then
  echo "$0: no such file $data/text" >&2
  exit 1
fi

#######################################
# Concatenate the per-job files <dir>/<prefix><job><suffix> for
# job = 1..nj, in job order, into a single destination file.
# Globals:   nj (read)
# Arguments: $1 - directory holding the per-job files
#            $2 - file name part before the job number
#            $3 - file name part after the job number (may be empty)
#            $4 - destination file (truncated, then written)
# Exits:     terminates the script with status 1 if any part cannot be read
#            or the destination cannot be written.
#######################################
merge_job_files() {
  local src_dir=$1
  local prefix=$2
  local suffix=$3
  local dest=$4
  local n

  # The redirection is on the loop itself, so the loop runs in the current
  # shell and `exit 1` aborts the whole script, not just a subshell.
  for n in $(seq "$nj"); do
    cat "${src_dir}/${prefix}${n}${suffix}" || exit 1
  done > "$dest" || exit 1
}

# Shard the data directory in place: input and output directory are both $data.
python utils/split_data.py "$data" "$data" "$nj" || exit 1

ark_dir="${fbankdir}/ark"
text_dir="${fbankdir}/txt"
mkdir -p "$ark_dir" "$text_dir" "$logdir" || exit 1

# $cmd is deliberately left unquoted: it may be a launcher plus its own
# options (several words), which must be split into separate arguments.
# The literal token JOB is left for $cmd to handle.
# shellcheck disable=SC2086
$cmd JOB=1:"$nj" "$logdir/make_fbank.JOB.log" \
  python utils/compute_fbank.py \
    -w "$data/split${nj}/JOB/wav.scp" \
    -t "$data/split${nj}/JOB/text" \
    -d "$feats_dim" \
    -s "$sample_frequency" \
    -m "$max_lengths" \
    -p "$speed_perturb" \
    -a JOB \
    -o "$fbankdir" \
    --window-type "$window_type" \
  || exit 1

# Merge the per-job outputs into the final index files.
merge_job_files "$ark_dir"  "feats." ".scp" "$fbankdir/feats.scp"
merge_job_files "$text_dir" "text."  ".txt" "$fbankdir/text"
merge_job_files "$ark_dir"  "len."   ""     "$fbankdir/speech_shape"
merge_job_files "$text_dir" "len."   ""     "$fbankdir/text_shape"

echo "$0: Succeeded compute FBANK features"