run_bnf.sh
3.51 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
#!/bin/bash
# Note: In order to run BNF, run run_bnf.sh
#
# Trains an nnet2 tanh bottleneck network, dumps bottleneck features (BNF) for
# the training and test sets, and appends them to fMLLR features.
#
# The option defaults assigned below can be overridden on the command line via
# utils/parse_options.sh, e.g.:
#   run_bnf.sh --bnf-train-stage 10 --exp-dir exp_bnf2

# Environment setup: path.sh / cmd.sh are sourced from the current directory;
# $train_cmd used further down is expected to come from cmd.sh.
. ./path.sh
. ./cmd.sh

# Abort on the first failing command, on a failure anywhere in a pipeline,
# and on use of an unset variable.
set -e
set -o pipefail
set -u

# Option defaults. These MUST be assigned before parse_options.sh is sourced:
# the parser only accepts --name options whose shell variable already exists,
# and any assignment made after it would silently overwrite the user's value.
bnf_train_stage=-100                  # value passed to the trainer's --stage option
align_dir=exp/tri4b_ali_si284         # alignments (also used as --transform-dir)
train_data_dir=data/train_si284       # training data directory
exp_dir=exp_bnf                       # root directory for everything this script writes

. utils/parse_options.sh

# Derived after option parsing so that it follows an --exp-dir override.
bnf_exp_dir=$exp_dir/tri6_bnf
# Train the bottleneck network unless an earlier run already completed it;
# completion is recorded by the .done stamp file in the network directory.
if [[ ! -f "$bnf_exp_dir/.done" ]]; then
  mkdir -p "$exp_dir"
  mkdir -p "$bnf_exp_dir"

  banner=---------------------------------------------------------------------
  printf '%s\n' "$banner" "Starting training the bottleneck network" "$banner"

  # Trainer options, collected in an array so that each one sits on its own line.
  bnf_train_opts=(
    --stage "$bnf_train_stage"
    --num-jobs-nnet 4
    --num-threads 1
    --mix-up 5000
    --max-change 40
    --minibatch-size 512
    --initial-learning-rate 0.005
    --final-learning-rate 0.0005
    --num-hidden-layers 5
    --bottleneck-dim 42
    --hidden-layer-dim 1024
    --cmd "$train_cmd"
  )

  steps/nnet2/train_tanh_bottleneck.sh "${bnf_train_opts[@]}" \
    "$train_data_dir" data/lang "$align_dir" "$bnf_exp_dir" || exit 1

  # Stamp the directory so a re-run skips this stage.
  touch "$bnf_exp_dir/.done"
fi
# Directory that receives the feature archives written by the steps below.
if [[ ! -d param_bnf ]]; then
  mkdir -p param_bnf
fi

# Dump bottleneck features for the training set, skipping the work when the
# .done stamp from a previous run is present.
train_bnf_dir=data_bnf/train_bnf
if [[ ! -f "$train_bnf_dir/.done" ]]; then
  mkdir -p data_bnf

  # put the archives in param_bnf/.
  steps/nnet2/dump_bottleneck_features.sh \
    --cmd "$train_cmd" \
    --transform-dir "$align_dir" \
    "$train_data_dir" "$train_bnf_dir" "$bnf_exp_dir" param_bnf "$exp_dir/dump_bnf"

  touch "$train_bnf_dir/.done"
fi
# Verify that the test data directories and the tri4b decode directories
# (passed as --transform-dir below) exist before starting any work.
for required_dir in \
  data/test_eval92 \
  data/test_dev93 \
  exp/tri4b/decode_bd_tgpr_eval92 \
  exp/tri4b/decode_bd_tgpr_dev93; do
  if [[ ! -d "$required_dir" ]]; then
    echo "No such directory $required_dir" && exit 1
  fi
done

# Dump bottleneck features for both test sets; the archives go to param_bnf/.
# Each entry is <set-name>:<number-of-jobs>.
for test_spec in eval92:8 dev93:10; do
  test_name=${test_spec%%:*}
  test_nj=${test_spec##*:}
  steps/nnet2/dump_bottleneck_features.sh --nj "$test_nj" \
    --transform-dir "exp/tri4b/decode_bd_tgpr_$test_name" \
    "data/test_$test_name" "data_bnf/${test_name}_bnf" \
    "$bnf_exp_dir" param_bnf "$exp_dir/dump_bnf"
done
# Build the combined training features in data_bnf/train. The stage runs
# unless its own .done stamp is newer than the stamp of the dumped training
# bottleneck features, so re-dumping the BNF features triggers a rebuild.
train_feats_dir=data_bnf/train
if [[ ! "$train_feats_dir/.done" -nt data_bnf/train_bnf/.done ]]; then
  # fMLLR features for the training data, written to a temporary data dir.
  steps/nnet/make_fmllr_feats.sh \
    --cmd "$train_cmd --max-jobs-run 10" \
    --transform-dir "$align_dir" \
    data_bnf/train_sat "$train_data_dir" \
    exp/tri4b "$exp_dir/make_fmllr_feats/log" param_bnf/

  # Append the bottleneck and fMLLR feature streams.
  steps/append_feats.sh --cmd "$train_cmd" --nj 4 \
    data_bnf/train_bnf data_bnf/train_sat "$train_feats_dir" \
    "$exp_dir/append_feats/log" param_bnf/

  # --fake: presumably writes placeholder CMVN stats -- confirm against
  # steps/compute_cmvn_stats.sh.
  steps/compute_cmvn_stats.sh --fake \
    "$train_feats_dir" "$exp_dir/make_fmllr_feats" param_bnf

  # The intermediate fMLLR data dir is not needed once the append is done.
  rm -r data_bnf/train_sat
  touch "$train_feats_dir/.done"
fi
## Prepare the combined (bottleneck + fMLLR) features for eval92 and dev93.
## Every step handles eval92 first and dev93 second.

# Step 1: fMLLR features. Each entry is <set-name>:<number-of-jobs>.
for sat_spec in eval92:8 dev93:10; do
  sat_name=${sat_spec%%:*}
  sat_nj=${sat_spec##*:}
  steps/nnet/make_fmllr_feats.sh \
    --nj "$sat_nj" --transform-dir "exp/tri4b/decode_bd_tgpr_$sat_name" \
    "data_bnf/${sat_name}_sat" "data/test_$sat_name" \
    "$align_dir" "$exp_dir/make_fmllr_feats/log" param_bnf/
done

# Step 2: append the bottleneck and fMLLR feature streams.
for eval_set in eval92 dev93; do
  steps/append_feats.sh --nj 4 \
    "data_bnf/${eval_set}_bnf" "data_bnf/${eval_set}_sat" "data_bnf/$eval_set" \
    "$exp_dir/append_feats/log" param_bnf/
done

# Step 3: CMVN stats for the combined features (run with --fake).
for eval_set in eval92 dev93; do
  steps/compute_cmvn_stats.sh --fake \
    "data_bnf/$eval_set" "$exp_dir/make_fmllr_feats" param_bnf
done

# Step 4: remove the intermediate fMLLR data directories.
for eval_set in eval92 dev93; do
  rm -r "data_bnf/${eval_set}_sat"
done

exit 0