Blame view

tools/openfst-1.6.7/src/extensions/pdt/pdtexpand.cc 1.88 KB
8dcb6dfcb   Yannick Estève   first commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
  // See www.openfst.org for extensive documentation on this weighted
  // finite-state transducer library.
  //
  // Expands a (bounded-stack) PDT as an FST.
  
  #include <cstring>
  
  #include <memory>
  #include <string>
  #include <vector>
  
  #include <fst/flags.h>
  #include <fst/log.h>
  
  #include <fst/extensions/pdt/pdtscript.h>
  #include <fst/util.h>
  
  // Command-line flags for this tool. Each DEFINE_* below is read in main()
  // through the corresponding FLAGS_<name> variable.

  // Required: main() logs an error and exits with status 1 when this is empty.
  // Its value is handed to ReadLabelPairs to populate the parenthesis pairs.
  DEFINE_string(pdt_parentheses, "", "PDT parenthesis label pairs");
  // Forwarded as the first argument of PdtExpandOptions.
  DEFINE_bool(connect, true, "Trim output?");
  // Forwarded as the second argument of PdtExpandOptions.
  DEFINE_bool(keep_parentheses, false, "Keep PDT parentheses in result?");
  // When empty, main() uses WeightClass::Zero of the input FST's weight type;
  // otherwise the text is parsed as a weight of that type.
  DEFINE_string(weight, "", "Weight threshold");
  
  // Entry point of the pdtexpand tool: expands a (bounded-stack) PDT as an FST.
  //
  // Command line: pdtexpand [flags] in.pdt [out.fst]
  //   argv[1]  input PDT; when missing or "-", an empty name is passed to
  //            FstClass::Read (presumably meaning standard input -- confirm
  //            against FstClass::Read).
  //   argv[2]  output FST; when missing, an empty name is passed to Write
  //            (presumably meaning standard output -- confirm).
  //
  // Returns 0 on success and 1 when: too many positional arguments are given,
  // the input cannot be read, --pdt_parentheses is empty, the label pairs
  // cannot be read, or the result cannot be written.
  int main(int argc, char **argv) {
    namespace s = fst::script;
    using fst::script::FstClass;
    using fst::script::VectorFstClass;
    using fst::script::WeightClass;
    using fst::ReadLabelPairs;

    // The embedded newlines must be written as escapes; a string literal may
    // not span physical source lines.
    std::string usage = "Expand a (bounded-stack) PDT as an FST.\n\n  Usage: ";
    usage += argv[0];
    usage += " in.pdt [out.fst]\n";

    std::set_new_handler(FailedNewHandler);
    SET_FLAGS(usage.c_str(), &argc, &argv, true);
    if (argc > 3) {
      ShowUsage();
      return 1;
    }

    // "-" is treated the same as an omitted input name.
    const std::string in_name =
        (argc > 1 && (strcmp(argv[1], "-") != 0)) ? argv[1] : "";
    const std::string out_name = argc > 2 ? argv[2] : "";

    std::unique_ptr<FstClass> ifst(FstClass::Read(in_name));
    if (!ifst) return 1;

    if (FLAGS_pdt_parentheses.empty()) {
      LOG(ERROR) << argv[0] << ": No PDT parenthesis label pairs provided";
      return 1;
    }

    std::vector<s::LabelPair> parens;
    if (!ReadLabelPairs(FLAGS_pdt_parentheses, &parens, false)) return 1;

    // An unset --weight falls back to the Zero weight of the input's weight
    // type; otherwise the flag text is parsed as a weight of that type.
    const auto weight_threshold =
        FLAGS_weight.empty() ? WeightClass::Zero(ifst->WeightType())
                             : WeightClass(ifst->WeightType(), FLAGS_weight);

    VectorFstClass ofst(ifst->ArcType());
    s::PdtExpand(*ifst, parens, &ofst,
                 s::PdtExpandOptions(FLAGS_connect, FLAGS_keep_parentheses,
                                     weight_threshold));

    // Propagate a failed write to the exit status instead of always
    // reporting success.
    return ofst.Write(out_name) ? 0 : 1;
  }