Blame view

egs/yesno/s5/local/prepare_data.sh 1.04 KB
8dcb6dfcb   Yannick Estève   first commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
  #!/bin/bash
  #
  # Builds the yes/no train/test file lists inside data/local.
  #
  # Usage: prepare_data.sh <waves_dir>
  #   <waves_dir>  directory whose entries are listed into
  #                data/local/waves_all.list and which is passed on to
  #                create_yesno_wav_scp.pl.
  #
  # Must be run from the recipe directory: every path below (data/, local/,
  # input/) is relative to the current working directory.

  # Without an argument `ls` would silently list the current directory.
  if [ $# -lt 1 ] || [ -z "$1" ]; then
    echo "Usage: $0 <waves_dir>" >&2
    exit 1
  fi

  mkdir -p data/local
  # Not referenced again in this script; kept for backward compatibility.
  local="$(pwd)/local"
  scripts="$(pwd)/scripts"

  export PATH="$PATH:$(pwd)/../../../tools/irstlm/bin"

  echo "Preparing train and test data"

  train_base_name=train_yesno
  test_base_name=test_yesno
  waves_dir=$1

  # Quoted so a directory name containing spaces or glob characters is kept
  # as a single argument.
  ls -1 "$waves_dir" > data/local/waves_all.list

  # Stop here rather than run the helpers (and their output redirections)
  # from the wrong directory.
  cd data/local || exit 1

  # Presumably splits waves_all.list into waves.test and waves.train; the
  # following commands read both of those files.
  ../../local/create_yesno_waves_test_train.pl waves_all.list waves.test waves.train

  ../../local/create_yesno_wav_scp.pl "${waves_dir}" waves.test > "${test_base_name}_wav.scp"

  ../../local/create_yesno_wav_scp.pl "${waves_dir}" waves.train > "${train_base_name}_wav.scp"

  ../../local/create_yesno_txt.pl waves.test > "${test_base_name}.txt"

  ../../local/create_yesno_txt.pl waves.train > "${train_base_name}.txt"

  cp ../../input/task.arpabo lm_tg.arpa

  # Back to the recipe directory for the steps that follow.
  cd ../.. || exit 1
  
  # This stage was copied from WSJ example

  # Prints "<first field> global" for every line of the file given as $1,
  # i.e. maps each utterance id to the single speaker label "global".
  # The "\n" must be written as an escape: awk string constants cannot
  # contain a raw line break.
  write_utt2spk() {
    awk '{printf("%s global\n", $1);}' "$1"
  }

  # For each data set, populate data/<set> with wav.scp, text, utt2spk and
  # spk2utt, taking the first two from the files prepared in data/local.
  for x in train_yesno test_yesno; do
    mkdir -p "data/$x"
    cp "data/local/${x}_wav.scp" "data/$x/wav.scp"
    cp "data/local/$x.txt" "data/$x/text"
    write_utt2spk "data/$x/text" > "data/$x/utt2spk"
    utils/utt2spk_to_spk2utt.pl <"data/$x/utt2spk" >"data/$x/spk2utt"
  done