Blame view

tools/openfst-1.6.7/src/extensions/mpdt/mpdtcompose.cc 2.55 KB
8dcb6dfcb   Yannick Estève   first commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
  // See www.openfst.org for extensive documentation on this weighted
  // finite-state transducer library.
  //
  // Composes an MPDT and an FST.
  
  #include <cstring>
  
  #include <memory>
  #include <string>
  #include <vector>
  
  #include <fst/flags.h>
  #include <fst/log.h>
  
  #include <fst/extensions/mpdt/mpdtscript.h>
  #include <fst/extensions/mpdt/read_write_utils.h>
  #include <fst/extensions/pdt/getters.h>
  #include <fst/util.h>
  
  DEFINE_string(mpdt_parentheses, "",
                "MPDT parenthesis label pairs with assignments");
  DEFINE_bool(left_mpdt, true, "Is the first argument the MPDT?");
  DEFINE_bool(connect, true, "Trim output?");
  DEFINE_string(compose_filter, "paren",
                "Composition filter, one of: \"expand\", \"expand_paren\", "
                "\"paren\"");
  
  int main(int argc, char **argv) {
    namespace s = fst::script;
    using fst::MPdtComposeOptions;
    using fst::PdtComposeFilter;
    using fst::ReadLabelTriples;
    using fst::script::FstClass;
    using fst::script::VectorFstClass;
  
    string usage = "Compose an MPDT and an FST.
  
    Usage: ";
    usage += argv[0];
    usage += " in.pdt in.fst [out.mpdt]
  ";
    usage += " in.fst in.pdt [out.mpdt]
  ";
  
    std::set_new_handler(FailedNewHandler);
    SET_FLAGS(usage.c_str(), &argc, &argv, true);
    if (argc < 3 || argc > 4) {
      ShowUsage();
      return 1;
    }
  
    const string in1_name = strcmp(argv[1], "-") == 0 ? "" : argv[1];
    const string in2_name = strcmp(argv[2], "-") == 0 ? "" : argv[2];
    const string out_name = argc > 3 ? argv[3] : "";
  
    if (in1_name.empty() && in2_name.empty()) {
      LOG(ERROR) << argv[0] << ": Can't take both inputs from standard input.";
      return 1;
    }
  
    std::unique_ptr<FstClass> ifst1(FstClass::Read(in1_name));
    if (!ifst1) return 1;
    std::unique_ptr<FstClass> ifst2(FstClass::Read(in2_name));
    if (!ifst2) return 1;
  
    if (FLAGS_mpdt_parentheses.empty()) {
      LOG(ERROR) << argv[0] << ": No MPDT parenthesis label pairs provided";
      return 1;
    }
  
    std::vector<s::LabelPair> parens;
    std::vector<int64> assignments;
    if (!ReadLabelTriples(FLAGS_mpdt_parentheses, &parens, &assignments, false))
      return 1;
  
    VectorFstClass ofst(ifst1->ArcType());
  
    PdtComposeFilter compose_filter;
    if (!s::GetPdtComposeFilter(FLAGS_compose_filter, &compose_filter)) {
      LOG(ERROR) << argv[0] << ": Unknown or unsupported compose filter type: "
                 << FLAGS_compose_filter;
      return 1;
    }
  
    const MPdtComposeOptions opts(FLAGS_connect, compose_filter);
  
    s::MPdtCompose(*ifst1, *ifst2, parens, assignments, &ofst, opts,
                   FLAGS_left_mpdt);
  
    ofst.Write(out_name);
  
    return 0;
  }