Blame view
egs/swahili/s5/local/prepare_data.sh
1.05 KB
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 |
#!/bin/bash
#
# Prepare the train and test data directories from the asr_swahili corpus.
#
# Usage: ./prepare_data.sh train test
#
# Must be run from the directory that contains asr_swahili/ (all paths below
# are relative to it, and the paths written into wav.scp are too).
#
# Reads:
#   asr_swahili/data/$1/wav.scp                 ready-made list, copied as is
#   asr_swahili/data/$2/wav5/<dir>/<utt>.wav    scanned to build wav.scp
#   asr_swahili/data/{$1,$2}/{spk2utt,utt2spk,text}
#   asr_swahili/LM/swahili.arpa.zip             only if data/local/swahili.arpa
#                                               does not exist yet
# Writes:
#   data/{$1,$2}/{wav.scp,spk2utt,utt2spk,text}
#   data/local/   (contents of swahili.arpa.zip)
# Removes:
#   data/mfcc data/log
#
# Exit status: 0 on success, non-zero if an argument is missing or any step
# fails.

#######################################
# Build a wav.scp ("<utt-id><TAB><path>") from every <dir>/<utt>.wav file
# found two levels below a directory. The utterance id is the file name
# without its .wav suffix.
# Arguments: $1 - directory to scan; also used verbatim as the path prefix
#            $2 - output file
# Returns:   0 on success, 1 if the output cannot be written or no .wav file
#            was found
#######################################
make_wav_scp() {
  local wav_dir=$1
  local out_file=$2
  local wav utt
  local count=0

  # Glob instead of parsing `ls`; the redirection is on the loop itself so
  # the loop still runs in the current shell and $count survives.
  for wav in "$wav_dir"/*/*.wav; do
    # An unmatched glob is left as the literal pattern: skip it.
    [[ -e "$wav" ]] || continue
    utt=${wav##*/}
    printf '%s\t%s\n' "${utt%.wav}" "$wav"
    count=$((count + 1))
  done > "$out_file" || return 1

  if (( count == 0 )); then
    echo "ERROR: no .wav files found under $wav_dir" >&2
    return 1
  fi
}

#######################################
# Entry point; see the header of this file for the full contract.
# Arguments: $1 - name of the train set, $2 - name of the test set
# Returns:   0 on success, 1 on any failure
#######################################
main() {
  if [[ -z "${1:-}" || -z "${2:-}" ]]; then
    echo "ERROR: Preparing train and test data failed !" >&2
    echo "You must have forgotten to precise train test directories" >&2
    echo "Usage: ./prepare_data.sh train test" >&2
    return 1
  fi

  local train_set=$1
  local test_set=$2
  local corpus=asr_swahili/data
  local part file

  # Validate the corpus layout before creating or deleting anything.
  if [[ ! -d "$corpus/$train_set" ]]; then
    echo "ERROR: directory not found: $corpus/$train_set" >&2
    return 1
  fi
  if [[ ! -d "$corpus/$test_set/wav5" ]]; then
    echo "ERROR: directory not found: $corpus/$test_set/wav5" >&2
    return 1
  fi

  mkdir -p -- data/local "data/$train_set" "data/$test_set" || return 1

  echo "Preparing train and test data"
  echo "make wav.scp for $train_set $test_set"
  rm -rf -- data/mfcc data/log

  # The first set ships its own wav.scp; the second one is generated from the
  # audio files, using the actual set name in the paths.
  cp -- "$corpus/$train_set/wav.scp" "data/$train_set/wav.scp" || return 1
  make_wav_scp "$corpus/$test_set/wav5" "data/$test_set/wav.scp" || return 1

  echo "copy spk2utt, utt2spk, text for $train_set $test_set"
  for part in "$train_set" "$test_set"; do
    for file in spk2utt utt2spk text; do
      cp -- "$corpus/$part/$file" "data/$part/$file" || return 1
    done
  done

  # Unpack the language model only once.
  if [[ ! -f data/local/swahili.arpa ]]; then
    unzip asr_swahili/LM/swahili.arpa.zip -d data/local/ || return 1
  fi

  echo "Preparing data OK."
}

# Keep this as the last command: its status is the script's exit status.
main "$@"