add-self-loops.cc
4.36 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
// bin/add-self-loops.cc
// Copyright 2009-2011 Microsoft Corporation
// 2015 Johns Hopkins University (author: Daniel Povey)
// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.
#include "hmm/transition-model.h"
#include "hmm/hmm-utils.h"
#include "tree/context-dep.h"
#include "util/common-utils.h"
#include "fst/fstlib.h"
#include "fstext/table-matcher.h"
#include "fstext/fstext-utils.h"
#include "fstext/context-fst.h"
/** @brief Add self-loops and transition probabilities to transducer, expanding to transition-ids.
*/
int main(int argc, char *argv[]) {
try {
using namespace kaldi;
typedef kaldi::int32 int32;
using fst::SymbolTable;
using fst::VectorFst;
using fst::StdArc;
const char *usage =
"Add self-loops and transition probabilities to transducer. Input transducer\n"
"has transition-ids on the input side, but only the forward transitions, not the\n"
"self-loops. Output transducer has transition-ids on the input side, but with\n"
"self-loops added. The --reorder option controls whether the loop is added before\n"
"the forward transition (if false), or afterward (if true). The default (true)\n"
"is recommended as the decoding will in that case be faster.\n"
"Usage: add-self-loops [options] transition-gmm/acoustic-model [fst-in] [fst-out]\n"
"e.g.: \n"
" add-self-loops --self-loop-scale=0.1 1.mdl HCLGa.fst HCLG.fst\n"
"or: add-self-loops --self-loop-scale=0.1 1.mdl <HCLGa.fst >HCLG.fst\n";
BaseFloat self_loop_scale = 1.0;
bool reorder = true;
std::string disambig_in_filename;
ParseOptions po(usage);
po.Register("self-loop-scale", &self_loop_scale,
"Scale for self-loop probabilities relative to LM.");
po.Register("disambig-syms", &disambig_in_filename,
"List of disambiguation symbols on input of fst-in [input file]");
po.Register("reorder", &reorder,
"If true, reorder symbols for more decoding efficiency");
po.Read(argc, argv);
if (po.NumArgs() < 1 || po.NumArgs() > 3) {
po.PrintUsage();
exit(1);
}
std::string model_in_filename = po.GetArg(1);
std::string fst_in_filename = po.GetOptArg(2);
if (fst_in_filename == "-") fst_in_filename = "";
std::string fst_out_filename = po.GetOptArg(3);
if (fst_out_filename == "-") fst_out_filename = "";
#if _MSC_VER
if (fst_in_filename == "")
_setmode(_fileno(stdin), _O_BINARY);
if (fst_out_filename == "")
_setmode(_fileno(stdout), _O_BINARY);
#endif
std::vector<int32> disambig_syms_in;
if (disambig_in_filename != "") {
if (disambig_in_filename == "-") disambig_in_filename = "";
if (!ReadIntegerVectorSimple(disambig_in_filename, &disambig_syms_in))
KALDI_ERR << "add-self-loops: could not read disambig symbols from "
<<(disambig_in_filename == "" ?
"standard input" : disambig_in_filename);
}
TransitionModel trans_model;
ReadKaldiObject(model_in_filename, &trans_model);
fst::VectorFst<fst::StdArc> *fst =
fst::VectorFst<fst::StdArc>::Read(fst_in_filename);
if (!fst)
KALDI_ERR << "add-self-loops: error reading input FST.";
bool check_no_self_loops = true;
// The work gets done here.
AddSelfLoops(trans_model,
disambig_syms_in,
self_loop_scale,
reorder, check_no_self_loops, fst);
if (! fst->Write(fst_out_filename) )
KALDI_ERR << "add-self-loops: error writing FST to "
<< (fst_out_filename == "" ?
"standard output" : fst_out_filename);
delete fst;
return 0;
} catch(const std::exception &e) {
std::cerr << e.what();
return -1;
}
}