Blame view

run-measures.sh 2.93 KB
42b4edb5a   Mathias Quillot   This file aims to...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
  # For the moment, this run only executes
  # a few small commands that we want
  # to test.
  
  # Experiment layout. All paths are relative to the directory the script
  # is launched from.
  OUTDIR="exp/kmeans_teacher_1/pvector-1"   # root of the per-fold outputs
  DATADIR="data"                            # root of the input data
  NEW_LSTDIR="${OUTDIR}/lst"                # holds the *_type.lst lists

  # Inclusive bounds of the k values iterated over by the loop further down.
  kmin=2
  kmax=100

  # `mkdir -p` succeeds silently when a directory already exists, so no
  # separate `-d` test is needed. Stop right away if the output tree cannot
  # be created: every later step writes below ${OUTDIR}.
  if ! mkdir -p -- "${OUTDIR}" "${NEW_LSTDIR}"; then
      echo "Cannot create output directories under ${OUTDIR}" >&2
      exit 1
  fi
  
  # For each fold index (1..4): concatenate the fold's train and validation
  # `*_type.lst` lists into one metadata list, then, for every k in
  # [kmin, kmax], run bin/measure_clustering.py and bin/plot-count-matrix.py
  # (train and validation) on ${OUTDIR}/<kfold>/<k>/clustered_<k>.txt.
  #
  # Reads:  OUTDIR, DATADIR, NEW_LSTDIR, kmin, kmax (set earlier in this file).
  # Writes: ${NEW_LSTDIR}/metas_<kfold>_type.lst and, under
  #         ${OUTDIR}/<kfold>/<k>/, measures_type.json,
  #         train_count_matrix_type.pdf and val_count_matrix_type.pdf.
  for kfold in {1..4}; do
      # pvector_file is only referenced by the disabled commands below; it is
      # kept so they can be re-enabled unchanged.
      pvector_file="${DATADIR}/pvectors_1rst/pvectors_teacher_${kfold}.txt"
      lst_dir="${DATADIR}/pvectors_1rst/lst"
      output_kfold="${OUTDIR}/${kfold}"
      train_lst="${lst_dir}/train_${kfold}.lst"
      val_lst="${lst_dir}/val_${kfold}.lst"
      metas_lst="${NEW_LSTDIR}/metas_${kfold}_type.lst"

      # Disabled: presumably the step that produced the *_type.lst files
      # consumed by the `cat` below -- TODO confirm before re-enabling.
      #python3 "bin/replace_label.py" \
      #    "${DATADIR}/masseffect.lst" \
      #    "${DATADIR}/character_information.csv" \
      #    --field "type" --lst "data/pvectors_1rst/lst/train_${kfold}.lst" \
      #    --outfile "${NEW_LSTDIR}/train_${kfold}_type.lst"

      #python3 "bin/replace_label.py" \
      #    "${DATADIR}/masseffect.lst" \
      #    "${DATADIR}/character_information.csv" \
      #    --field "type" --lst "data/pvectors_1rst/lst/val_${kfold}.lst" \
      #    --outfile "${NEW_LSTDIR}/val_${kfold}_type.lst"

      # Build the combined metadata list. If an input list is missing or the
      # output cannot be written, skip this fold instead of running every k
      # against an empty or partial metadata file.
      if ! cat "${NEW_LSTDIR}/train_${kfold}_type.lst" \
               "${NEW_LSTDIR}/val_${kfold}_type.lst" > "${metas_lst}"; then
          echo "Cannot build ${metas_lst}; skipping fold ${kfold}" >&2
          continue
      fi

      echo "Clustering - ${kfold}"

      # Arithmetic loop: same inclusive kmin..kmax range as `seq`, without
      # spawning an external process or relying on word splitting.
      for ((k = kmin; k <= kmax; k++)); do
          echo "Kmeans Measuring and ploting - ${k}"

          k_dir="${output_kfold}/${k}"
          clustered_file="${k_dir}/clustered_${k}.txt"

          # Disabled: same measure script, fed with the p-vector file instead
          # of the "type" metadata list.
          #python3 bin/measure_clustering.py "${output_kfold}/${k}/clustered_${k}.txt" "${pvector_file}" "${lst_dir}/train_${kfold}.lst" "${lst_dir}/val_${kfold}.lst" --outfile "${output_kfold}/${k}/measures.json"

          # Compute the measures for this clustering.
          python3 bin/measure_clustering.py "${clustered_file}" \
              "${metas_lst}" "${train_lst}" \
              "${val_lst}" \
              --outfile "${k_dir}/measures_type.json"

          # Plot the count matrix of the train set.
          python3 bin/plot-count-matrix.py "${clustered_file}" \
              "${metas_lst}" "${train_lst}" \
              --outfile "${k_dir}/train_count_matrix_type.pdf"

          # Plot the count matrix of the validation set.
          python3 bin/plot-count-matrix.py "${clustered_file}" \
              "${metas_lst}" "${val_lst}" \
              --outfile "${k_dir}/val_count_matrix_type.pdf"

          # Disabled: count matrix of the train set, p-vector file variant.
          #python3 bin/plot-count-matrix.py ${output_kfold}/${k}/clustered_${k}.txt \
          #${pvector_file} ${lst_dir}/train_${kfold}.lst \
          #--outfile ${output_kfold}/${k}/train_count_matrix.pdf

          # Disabled: count matrix of the validation set, p-vector file variant.
          #python3 bin/plot-count-matrix.py ${output_kfold}/${k}/clustered_${k}.txt \
          #${pvector_file} ${lst_dir}/val_${kfold}.lst \
          #--outfile ${output_kfold}/${k}/val_count_matrix.pdf
      done
  done