download_data.sh
852 Bytes
#!/bin/bash
# Copyright 2014 Nickolay V. Shmyrev
# 2014 Brno University of Technology (Author: Karel Vesely)
# Apache 2.0
# All corpora and language models are stored under ./db.
# Abort if the directory cannot be created or entered; otherwise the
# downloads below would land in the caller's working directory.
mkdir -p db || exit 1
pushd db || exit 1
# TED-LIUM database:
# On hosts whose fully-qualified name ends in .clsp.jhu.edu the corpus is
# linked from /export/corpora5; everywhere else the release-1 tarball is
# downloaded from OpenSLR and unpacked in the current directory.
if [[ "$(hostname -f)" == *.clsp.jhu.edu ]]; then
  # Only create the link when nothing by that name exists yet (the -L test
  # also catches a dangling link), so re-running the script does not make
  # 'ln' fail with "File exists".
  if [[ ! -e TEDLIUM_release1 && ! -L TEDLIUM_release1 ]]; then
    ln -s /export/corpora5/TEDLIUM_release1 || exit 1
  fi
# Assumes the tarball unpacks into ./TEDLIUM_release1 (the same name the
# symlink above provides) -- TODO confirm against the archive layout.
elif [[ ! -d TEDLIUM_release1 ]]; then
  if [[ ! -f TEDLIUM_release1.tar.gz ]]; then
    # Download under a temporary name and rename only on success, so an
    # interrupted transfer is never mistaken for a complete tarball on the
    # next run.
    wget --output-document=TEDLIUM_release1.tar.gz.part \
      http://www.openslr.org/resources/7/TEDLIUM_release1.tar.gz || exit 1
    mv TEDLIUM_release1.tar.gz.part TEDLIUM_release1.tar.gz || exit 1
  fi
  # Extraction is retried whenever the corpus directory is missing, even if
  # the tarball is already present from an earlier run.
  tar xf TEDLIUM_release1.tar.gz || exit 1
fi
# Language models (Cantab Research):
# Stream the archive from OpenSLR, unpack it, and gzip the two ARPA language
# models. The work is done in a scratch directory and moved into place only
# after every step has succeeded, so the presence of ./cantab-TEDLIUM always
# means a complete installation and a failed run is retried next time.
if [[ ! -d cantab-TEDLIUM ]]; then
  echo "Downloading \"http://www.openslr.org/resources/27/cantab-TEDLIUM.tar.bz2\". "
  rm -rf cantab-TEDLIUM.tmp
  mkdir cantab-TEDLIUM.tmp || exit 1
  # pipefail (scoped to this subshell) makes a failure in wget or bzcat count,
  # not just the exit status of the final tar.
  if ! (
    set -o pipefail
    wget --no-verbose --output-document=- \
      http://www.openslr.org/resources/27/cantab-TEDLIUM.tar.bz2 \
      | bzcat \
      | tar --extract --file=- --directory=cantab-TEDLIUM.tmp
  ); then
    rm -rf cantab-TEDLIUM.tmp
    exit 1
  fi
  gzip cantab-TEDLIUM.tmp/cantab-TEDLIUM/cantab-TEDLIUM-pruned.lm3 || exit 1
  gzip cantab-TEDLIUM.tmp/cantab-TEDLIUM/cantab-TEDLIUM-unpruned.lm4 || exit 1
  mv cantab-TEDLIUM.tmp/cantab-TEDLIUM cantab-TEDLIUM || exit 1
  rmdir cantab-TEDLIUM.tmp
fi
# Leave ./db again: pops the directory pushed by the 'pushd db' above.
popd