Blame view
egs/vystadial_en/s5/env_voip_en.sh
1.21 KB
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 |
#!/bin/bash # EVERY_N utterance is used for training # EVERY_N=3 -> we use one third of training data export EVERY_N=1 export TEST_SETS="dev test" # Directories set up export DATA_ROOT=`pwd`/data # expects subdirectories train + $TEST_SETS export WORK=`pwd`/lang_prep export EXP=`pwd`/exp export TGT_MODELS=trained_models # Specify paths to arpa models. Paths may not contain spaces. # Specify build0 or build1 or build2, .. for building (zero|uni|bi)-gram LM. # Note: The LM file name should not contain underscore "_"! # Otherwise the results will be reported without the LM with underscore." export LMs="build0 build2" # Use path to prebuilt dictionary or 'build' command in order to build dictionary # export DICTIONARY="../../resources/lm/caminfo/dict" export DICTIONARY="build" # Borders for estimating LM model weight. # LMW is tuned on development set and applied on test set. export min_lmw=9 export max_lmw=20 # Number of states for phonem training export pdf=1200 # Maximum number of Gaussians used for training export gauss=19200 export train_mmi_boost=0.05 export mmi_beam=16.0 export mmi_lat_beam=10.0 # --fake -> NO CMVN; empty -> CMVN (pykaldi decoders can not handle CMVN -> fake) export fake="--fake" |