Blame view

egs/chime4/s5_1ch/local/chime4_calc_wers.sh 2.74 KB
8dcb6dfcb   Yannick Estève   first commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
  #!/bin/bash
  
  #  Copyright  2015  Mitsubishi Electric Research Laboratories (Author: Shinji Watanabe)
  #  Apache 2.0.
  
  set -e
  
  # Config:
  eval_flag=true # make it true when the evaluation data are released
  
  . utils/parse_options.sh || exit 1;
  
  if [ $# -ne 3 ]; then
    printf "
  USAGE: %s <training experiment directory> <enhancement method> <graph_dir>
  
  " `basename $0`
    printf "%s exp/tri3b_tr05_sr_noisy noisy exp/tri4a_dnn_tr05_sr_noisy/graph_tgpr_5k
  
  " `basename $0`
    exit 1;
  fi
  
  echo "$0 $@"  # Print the command line for logging
  
  . ./path.sh
  
  dir=$1
  enhan=$2
  graph_dir=$3
  
  echo "compute dt05 WER for each location"
  echo ""
  mkdir -p $dir/log
  for a in `find $dir/decode_tgpr_5k_dt05_real_$enhan/ | grep "\/wer_" | awk -F'[/]' '{print $NF}' | sort`; do
    echo -n "$a "
    if [ -e $dir/decode_tgpr_5k_dt05_simu_$enhan ]; then
      cat $dir/decode_tgpr_5k_dt05_{real,simu}_$enhan/$a | grep WER | awk '{err+=$4} {wrd+=$6} END{printf("%.2f
  ",err/wrd*100)}'
    else
      cat $dir/decode_tgpr_5k_dt05_real_$enhan/$a | grep WER | awk '{err+=$4} {wrd+=$6} END{printf("%.2f
  ",err/wrd*100)}'
    fi
  done | sort -n -k 2 | head -n 1 > $dir/log/best_wer_$enhan
  
  lmw=`cut -f 1 -d" " $dir/log/best_wer_$enhan | cut -f 2 -d"_"`
  echo "-------------------"
  printf "best overall dt05 WER %s" `cut -f 2 -d" " $dir/log/best_wer_$enhan`
  echo -n "%"
  printf " (language model weight = %s)
  " $lmw
  echo "-------------------"
  if $eval_flag; then
    tasks="dt05 et05"
  else
    tasks="dt05"
  fi
  for e_d in $tasks; do
    for task in simu real; do
      rdir=$dir/decode_tgpr_5k_${e_d}_${task}_$enhan
      if [ -e $rdir ]; then
        for a in _BUS _CAF _PED _STR; do
          grep $a $rdir/scoring/test_filt.txt \
            > $rdir/scoring/test_filt_$a.txt
          cat $rdir/scoring/$lmw.tra \
            | utils/int2sym.pl -f 2- $graph_dir/words.txt \
            | sed s:\<UNK\>::g \
            | compute-wer --text --mode=present ark:$rdir/scoring/test_filt_$a.txt ark,p:- \
            1> $rdir/${a}_wer_$lmw 2> /dev/null
        done
        echo -n "${e_d}_${task} WER: `grep WER $rdir/wer_$lmw | cut -f 2 -d" "`% (Average), "
        echo -n "`grep WER $rdir/_BUS_wer_$lmw | cut -f 2 -d" "`% (BUS), "
        echo -n "`grep WER $rdir/_CAF_wer_$lmw | cut -f 2 -d" "`% (CAFE), "
        echo -n "`grep WER $rdir/_PED_wer_$lmw | cut -f 2 -d" "`% (PEDESTRIAN), "
        echo -n "`grep WER $rdir/_STR_wer_$lmw | cut -f 2 -d" "`% (STREET)"
        echo ""
        echo "-------------------"
      fi
    done
  done
  echo ""
  
  for e_d in $tasks; do
    echo "-----------------------------"
    echo "1-best transcription for $e_d"
    echo "-----------------------------"
    for task in simu real; do
      rdir=$dir/decode_tgpr_5k_${e_d}_${task}_$enhan
      cat $rdir/scoring/$lmw.tra \
        | utils/int2sym.pl -f 2- $graph_dir/words.txt \
        | sed s:\<UNK\>::g
    done
  done