#!/bin/bash
#
# run_corpus.sh
#
# Drives the Ruby helpers under bin/ to prepare the corpora for task1..task3:
#   1. runs bin/decoupe.rb on each db/<task>-train.csv (the "K-Fold" step),
#   2. runs bin/tokenize_file.rb on the data/<task>_{train,dev}_<fold>.txt files,
#   3. runs bin/tokenize_file_gold.rb on each db/<task>-testGold.csv.
#
# Every path is relative, so the script must be started from the directory
# that contains bin/, db/ and data/.

# Stop at the first failing command, unset variable or failed pipeline stage,
# so a broken step is not silently followed by steps that depend on its output.
set -euo pipefail

# Add bin/ to RUBYLIB (Ruby's extra library search path) so the helper scripts
# can require files that live next to them. The ${VAR:+...} form only inserts
# the ':' separator when RUBYLIB already has a value, which avoids a leading
# empty entry and keeps the expansion safe under `set -u`.
export RUBYLIB="${RUBYLIB:+${RUBYLIB}:}bin/"

#######################################
# Run bin/decoupe.rb once per task on that task's training CSV.
# Arguments: none
# Outputs:   one "[x] <task>" progress line per task on stdout, followed by
#            whatever decoupe.rb itself prints.
# Returns:   exit status of the last decoupe.rb invocation.
#######################################
create_kfolds() {
  local file
  for file in task1 task2 task3; do
    echo "[x] $file"
    # The second argument used to be the literal data/task1 for every task,
    # while the tokenization steps read data/<task>_train_<fold>.txt and
    # data/<task>_dev_<fold>.txt for all three tasks. It is now derived from
    # the task name.
    # NOTE(review): assumes decoupe.rb treats this argument as an output
    # prefix -- confirm against bin/decoupe.rb.
    # The trailing 4 is presumably the fold count; the tokenization loops
    # iterate over folds 0..3, so keep the two in sync.
    ruby bin/decoupe.rb "db/${file}-train.csv" "data/${file}" 4
  done
}

echo "***** Create K-Fold *****"
create_kfolds

#######################################
# Tokenize every fold of one split for all three tasks.
# For each fold 0..3 and each task, runs bin/tokenize_file.rb on
# data/<task>_<split>_<fold>.txt and stores its stdout in
# data/<task>_<split>_<fold>.tokenize.
# Arguments: $1 - split name used in the file names ("train" or "dev")
# Outputs:   one "[x] <task>" progress line per processed file on stdout.
# Returns:   exit status of the last tokenize_file.rb invocation.
#######################################
tokenize_split() {
  local split=$1
  local kfold file
  # Brace expansion yields the same 0 1 2 3 sequence as `seq 0 1 3`
  # without spawning an external process.
  for kfold in {0..3}; do
    for file in task1 task2 task3; do
      echo "[x] $file"
      ruby bin/tokenize_file.rb "data/${file}_${split}_${kfold}.txt" \
        > "data/${file}_${split}_${kfold}.tokenize"
    done
  done
}

echo "***** CREATE TRAIN CORPUS *****"
tokenize_split train


echo "***** CREATE DEV CORPUS *****"
tokenize_split dev


# Test corpus: feed each task's db/<task>-testGold.csv to
# bin/tokenize_file_gold.rb and keep its stdout as data/<task>_test.tokenize.
echo "***** CREATE TEST CORPUS *****"
for task in task1 task2 task3; do
  printf '[x] %s\n' "$task"
  gold_csv="db/${task}-testGold.csv"
  tokenized="data/${task}_test.tokenize"
  ruby bin/tokenize_file_gold.rb "$gold_csv" > "$tokenized"
done