Blame view

egs/tunisian_msa/s5/local/subs_download.sh 506 Bytes
8dcb6dfcb   Yannick Estève   first commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
  #!/bin/bash
  
  # Copyright 2018 John Morgan
  # Apache 2.0.
  
  # Downloads the gzipped subs corpus and extracts it to plain text.
  #
  # Usage: subs_download.sh <subs-corpus-url>
  #
  # Produces subs.txt.gz and subs.txt in the directory the script is invoked
  # from. Either step is skipped when its output file already exists. Exits
  # non-zero if the URL is missing, or if the download or extraction fails.

  # Begin configuration
  # URL of the gzipped corpus (first positional argument).
  subs_src=${1:-}
  download_dir=$(pwd)
  datadir=$(pwd)
  # End configuration

  if [ -z "$subs_src" ]; then
    echo "Usage: $0 <subs-corpus-url>" >&2
    exit 1
  fi

  archive=$download_dir/subs.txt.gz
  extracted=$datadir/subs.txt

  # download the subs corpus
  if [ ! -f "$archive" ]; then
    # wget -O creates its output file even when the transfer fails. Fetch to a
    # temporary name and rename only on success, so that a failed attempt is
    # not mistaken for a finished download on the next run.
    if ! wget -O "$archive.part" "$subs_src"; then
      rm -f "$archive.part"
      echo "$0: failed to download $subs_src" >&2
      exit 1
    fi
    mv "$archive.part" "$archive" || exit 1
  else
    echo "$0: The corpus $subs_src was already downloaded."
  fi

  if [ ! -f "$extracted" ]; then
    # Same reasoning as above: the output redirection creates the target file
    # before zcat runs, so decompress to a temporary name first.
    if ! zcat < "$archive" > "$extracted.part"; then
      rm -f "$extracted.part"
      echo "$0: failed to extract $archive" >&2
      exit 1
    fi
    mv "$extracted.part" "$extracted" || exit 1
  else
    echo "$0: subs file already extracted."
  fi