score_sclite.sh
1.46 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
#!/bin/bash
# Copyright 2010-2011 Microsoft Corporation
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
# WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
# MERCHANTABLITY OR NON-INFRINGEMENT.
# See the Apache 2 License for the specific language governing permissions and
# limitations under the License.
# Scores the decoding output found in <decode-dir> against a reference
# transcript using the sclite program from SCTK.
#
# Usage: scripts/score_sclite.sh <decode-dir> <ref>
#   <decode-dir>  directory containing the *.tra files to score
#   <ref>         reference transcript file
#
# Writes <decode-dir>/scoring/hyp and <decode-dir>/scoring/ref, then runs
# sclite on the pair. The exit status of a successful run is sclite's own.
#
# The helper scripts (scripts/int2sym.pl, scripts/transcript2hyp.pl), the
# word table (data/words.txt) and the sclite binary are all referenced by
# relative path, so the script must be started from the directory that
# contains scripts/ and data/.

# Make a failure in any pipeline stage visible instead of only the last one.
set -o pipefail

if [ $# -ne 2 ]; then
  echo "Usage: scripts/score_sclite.sh <decode-dir> <ref>" >&2
  exit 1
fi

sclite=../../../tools/sctk/bin/sclite
if [ ! -f "$sclite" ]; then
  echo "The sclite program is not there. Follow the INSTALL instructions in ../../../tools" >&2
  exit 1
fi

dir=$1
ref=$2

if [ ! -d "$dir" ]; then
  echo "Decode directory $dir is not there" >&2
  exit 1
fi

if [ ! -f "$ref" ]; then
  echo "Reference file $ref is not there" >&2
  exit 1
fi

# Collect the transcripts up front: without this check an unmatched glob
# would be handed to cat literally and an empty hypothesis would be scored.
tra_files=("$dir"/*.tra)
if [ ! -e "${tra_files[0]}" ]; then
  echo "No .tra files found in $dir" >&2
  exit 1
fi

scoredir=$dir/scoring
# -p keeps reruns on an already-scored directory from failing.
if ! mkdir -p "$scoredir"; then
  echo "Could not create $scoredir" >&2
  exit 1
fi

# Hypothesis: map the .tra contents through data/words.txt (the first field
# is left untouched; presumably it is the utterance id), drop the first
# <s> and </s> on each line and every <UNK>, then reformat for scoring.
if ! cat "${tra_files[@]}" \
  | scripts/int2sym.pl --ignore-first-field data/words.txt \
  | sed -e 's:<s>::' -e 's:</s>::' -e 's:<UNK>::g' \
  | scripts/transcript2hyp.pl > "$scoredir/hyp"; then
  echo "Failed to create $scoredir/hyp" >&2
  exit 1
fi

# Reference: same reformatting, with the noise markers removed.
if ! scripts/transcript2hyp.pl < "$ref" \
  | sed -e 's:<NOISE>::g' -e 's:<SPOKEN_NOISE>::g' > "$scoredir/ref"; then
  echo "Failed to create $scoredir/ref" >&2
  exit 1
fi

# Both files are passed in "trn" format; utterance ids are interpreted with
# the "wsj" id scheme, and the "all" and "dtl" reports are requested.
"$sclite" -r "$scoredir/ref" trn -h "$scoredir/hyp" trn -i wsj -o all -o dtl