Blame view
egs/sprakbanken/s5/local/nnet2/run_5b_gpu.sh
3.09 KB
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 |
#!/bin/bash stage=0 train_stage=-100 temp_dir= # This trains only unadapted (just cepstral mean normalized) features, # and uses various combinations of VTLN warping factor and time-warping # factor to artificially expand the amount of data. . ./cmd.sh . utils/parse_options.sh # to parse the --stage option, if given if [ $# != 0 ]; then echo "Usage: $0 [--stage <stage> --train-stage <train-stage>]" echo "Options: " echo " --stage <stage> # controls partial re-runs" echo " --train-stage <train-stage> # use with --stage 2 to control partial rerun of training" echo " --temp-dir <temp-dir> # e.g. --temp-dir /export/my-machine/dpovey/wsj-temp-5b" echo " # (puts temporary data including MFCC and egs at this location)" exit 1; fi set -e if [ $stage -le 0 ]; then # Create the training data. if [ ! -z "$temp_dir" ]; then mkdir -p $temp_dir/mfcc_5b_gpu featdir=$temp_dir/mfcc_5b_gpu else featdir=`pwd`/mfcc/nnet5b_gpu; mkdir -p $featdir fi fbank_conf=conf/fbank_40.conf echo "--num-mel-bins=40" > $fbank_conf steps/nnet2/get_perturbed_feats.sh --cmd "$train_cmd" \ $fbank_conf $featdir exp/perturbed_fbanks_si284 data/train_si284 data/train_si284_perturbed_fbank & steps/nnet2/get_perturbed_feats.sh --cmd "$train_cmd" --feature-type mfcc \ conf/mfcc.conf $featdir exp/perturbed_mfcc_si284 data/train_si284 data/train_si284_perturbed_mfcc & wait fi if [ $stage -le 1 ]; then steps/align_fmllr.sh --nj 30 --cmd "$train_cmd" \ data/train_si284_perturbed_mfcc data/lang exp/tri4b exp/tri4b_ali_si284_perturbed_mfcc fi if [ $stage -le 2 ]; then if [ ! -z "$temp_dir" ] && [ ! -e exp/nnet5b_gpu/egs ]; then mkdir -p exp/nnet5b_gpu mkdir -p $temp_dir/nnet5b_gpu/egs ln -s $temp_dir/nnet5b_gpu/egs exp/nnet5b_gpu/ fi steps/nnet2/train_block.sh --stage "$train_stage" \ --num-threads 1 --max-change 40.0 --minibatch-size 512 --num-jobs-nnet 8 \ --parallel-opts "--gpu 1" \ --initial-learning-rate 0.0075 --final-learning-rate 0.00075 \ --num-epochs 10 --num-epochs-extra 5 \ --cmd "$decode_cmd" \ --hidden-layer-dim 1536 \ --num-block-layers 3 --num-normal-layers 3 \ data/train_si284_perturbed_fbank data/lang exp/tri4b_ali_si284_perturbed_mfcc exp/nnet5b_gpu || exit 1 fi if [ $stage -le 3 ]; then # create testing fbank data. featdir=`pwd`/mfcc fbank_conf=conf/fbank_40.conf for x in test_eval92 test_eval93 test_dev93; do mkdir -p data/${x}_fbank cp data/$x/* data/${x}_fbank || true steps/make_fbank.sh --fbank-config "$fbank_conf" --nj 8 \ --cmd "$train_cmd" data/${x}_fbank exp/make_fbank/$x $featdir || exit 1; steps/compute_cmvn_stats.sh data/${x}_fbank exp/make_fbank/$x $featdir || exit 1; done fi if [ $stage -le 4 ]; then steps/nnet2/decode.sh --cmd "$decode_cmd" --nj 10 \ exp/tri4b/graph_bd_tgpr data/test_dev93_fbank exp/nnet5b_gpu/decode_bd_tgpr_dev93 steps/nnet2/decode.sh --cmd "$decode_cmd" --nj 8 \ exp/tri4b/graph_bd_tgpr data/test_eval92_fbank exp/nnet5b_gpu/decode_bd_tgpr_eval92 fi exit 0; |