Blame view
egs/voxforge/s5/getdata.sh
932 Bytes
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 |
#!/bin/bash # Copyright 2012 Vassil Panayotov # Apache 2.0 # Downloads and extracts the data from VoxForge website # defines the "DATA_ROOT" variable - the location to store data source ./path.sh DATA_SRC="http://www.repository.voxforge1.org/downloads/SpeechCorpus/Trunk/Audio/Main/16kHz_16bit" DATA_TGZ=${DATA_ROOT}/tgz DATA_EXTRACT=${DATA_ROOT}/extracted source utils/parse_options.sh mkdir -p ${DATA_TGZ} 2>/dev/null # Check if the executables needed for this script are present in the system command -v wget >/dev/null 2>&1 ||\ { echo "\"wget\" is needed but not found"'!'; exit 1; } echo "--- Starting VoxForge data download (may take some time) ..." wget -P ${DATA_TGZ} -l 1 -N -nd -c -e robots=off -A tgz -r -np ${DATA_SRC} || \ { echo "WGET error"'!' ; exit 1 ; } mkdir -p ${DATA_EXTRACT} echo "--- Starting VoxForge archives extraction ..." for a in ${DATA_TGZ}/*.tgz; do tar -C ${DATA_EXTRACT} -xf $a done |