Blame view
egs/heroico/s5/local/prepare_dict.sh
836 Bytes
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 |
#!/bin/bash

# Copyright 2017 John Morgan
# Apache 2.0.

# Builds the dictionary directory data/local/dict from the pronunciation
# lexicon ./santiago.txt, which is read from the current working directory.
#
# Files written under data/local/dict:
#   nonsilence_phones.txt  unique phones found in the lexicon, one per line
#   lexicon.txt            sorted, de-duplicated lexicon plus "<UNK> SPN"
#   silence_phones.txt     SIL and SPN, one per line
#   optional_silence.txt   SIL
#   extra_questions.txt    line 1: silence phones, line 2: non-silence phones

# Options are set here rather than on the shebang line so that they still
# apply when the script is started as "bash prepare_dict.sh".
set -o nounset
set -o errexit

[ -f ./path.sh ] && . ./path.sh

readonly lexicon_src=./santiago.txt
readonly dict_dir=data/local/dict

# mkdir -p is a no-op when the directory already exists.
mkdir -p "$dict_dir"

# Byte-wise collation so that sort -u output is locale-independent.
export LC_ALL=C

# Phone inventory: keep everything after the first tab-delimited field,
# put every whitespace-separated token on its own line, drop SPN (it is
# listed as a silence phone below) and de-duplicate.
cut -f2- "$lexicon_src" \
  | tr -s '[:space:]' '[\n*]' \
  | grep -v SPN \
  | sort -u >"$dict_dir/nonsilence_phones.txt"

# Lexicon: turn each tab into a single space, sort and de-duplicate.
# sed "1d" deletes the FIRST line of the sorted output.
# NOTE(review): presumably that first line is a blank or header entry that
# sorts to the top - confirm against the contents of santiago.txt.
expand -t 1 "$lexicon_src" | sort -u | sed "1d" >"$dict_dir/lexicon.txt"

# Pronunciation entry for out-of-vocabulary words.
echo "<UNK> SPN" >>"$dict_dir/lexicon.txt"

# Silence phones, one per line.
printf '%s\n' SIL SPN >"$dict_dir/silence_phones.txt"

echo SIL >"$dict_dir/optional_silence.txt"

# Two lines: every silence phone joined by spaces on the first line, every
# non-silence phone on the second. tr replaces each newline with a space and
# the bare echo terminates the line.
{
  tr '\n' ' ' <"$dict_dir/silence_phones.txt"
  echo
  tr '\n' ' ' <"$dict_dir/nonsilence_phones.txt"
  echo
} >"$dict_dir/extra_questions.txt"

echo "Finished dictionary preparation."