Blame view

tools/openfst-1.6.7/include/fst/add-on.h 7.27 KB
8dcb6dfcb   Yannick Estève   first commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
  // See www.openfst.org for extensive documentation on this weighted
  // finite-state transducer library.
  //
  // FST implementation class to attach an arbitrary object with a read/write
  // method to an FST and its file representation. The FST is given a new type
  // name.
  
  #ifndef FST_ADD_ON_H_
  #define FST_ADD_ON_H_
  
  #include <stddef.h>
  #include <memory>
  #include <string>
  #include <utility>
  
  #include <fst/log.h>
  
  #include <fst/fst.h>
  
  
  namespace fst {
  
  // Identifies stream data as an add-on FST.
  static constexpr int32 kAddOnMagicNumber = 446681434;
  
  // Nothing to save.
  class NullAddOn {
   public:
    NullAddOn() {}
  
    static NullAddOn *Read(std::istream &strm, const FstReadOptions &opts) {
      return new NullAddOn();
    }
  
    bool Write(std::ostream &ostrm, const FstWriteOptions &opts) const {
      return true;
    }
  };
  
  // Create a new add-on from a pair of add-ons.
  template <class A1, class A2>
  class AddOnPair {
   public:
    // Argument reference count incremented.
    AddOnPair(std::shared_ptr<A1> a1, std::shared_ptr<A2> a2)
        : a1_(std::move(a1)), a2_(std::move(a2)) {}
  
    const A1 *First() const { return a1_.get(); }
  
    const A2 *Second() const { return a2_.get(); }
  
    std::shared_ptr<A1> SharedFirst() const { return a1_; }
  
    std::shared_ptr<A2> SharedSecond() const { return a2_; }
  
    static AddOnPair<A1, A2> *Read(std::istream &istrm,
                                   const FstReadOptions &opts) {
      A1 *a1 = nullptr;
      bool have_addon1 = false;
      ReadType(istrm, &have_addon1);
      if (have_addon1) a1 = A1::Read(istrm, opts);
  
      A2 *a2 = nullptr;
      bool have_addon2 = false;
      ReadType(istrm, &have_addon2);
      if (have_addon2) a2 = A2::Read(istrm, opts);
  
      return new AddOnPair<A1, A2>(std::shared_ptr<A1>(a1),
                                   std::shared_ptr<A2>(a2));
    }
  
    bool Write(std::ostream &ostrm, const FstWriteOptions &opts) const {
      bool have_addon1 = a1_ != nullptr;
      WriteType(ostrm, have_addon1);
      if (have_addon1) a1_->Write(ostrm, opts);
      bool have_addon2 = a2_ != nullptr;
      WriteType(ostrm, have_addon2);
      if (have_addon2) a2_->Write(ostrm, opts);
      return true;
    }
  
   private:
    std::shared_ptr<A1> a1_;
    std::shared_ptr<A2> a2_;
  };
  
  namespace internal {
  
  // Adds an object of type T to an FST. T must support:
  //
  //     T* Read(std::istream &);
  //     bool Write(std::ostream &);
  //
  // The resulting type is a new FST implementation.
  template <class FST, class T>
  class AddOnImpl : public FstImpl<typename FST::Arc> {
   public:
    using Arc = typename FST::Arc;
    using Label = typename Arc::Label;
    using StateId = typename Arc::StateId;
    using Weight = typename Arc::Weight;
  
    using FstImpl<Arc>::SetType;
    using FstImpl<Arc>::SetInputSymbols;
    using FstImpl<Arc>::SetOutputSymbols;
    using FstImpl<Arc>::SetProperties;
    using FstImpl<Arc>::WriteHeader;
  
    // We make a thread-safe copy of the FST by default since an FST
    // implementation is expected to not share mutable data between objects.
    AddOnImpl(const FST &fst, const string &type,
              std::shared_ptr<T> t = std::shared_ptr<T>())
        : fst_(fst, true), t_(std::move(t)) {
      SetType(type);
      SetProperties(fst_.Properties(kFstProperties, false));
      SetInputSymbols(fst_.InputSymbols());
      SetOutputSymbols(fst_.OutputSymbols());
    }
  
    // Conversion from const Fst<Arc> & to F always copies the underlying
    // implementation.
    AddOnImpl(const Fst<Arc> &fst, const string &type,
              std::shared_ptr<T> t = std::shared_ptr<T>())
        : fst_(fst), t_(std::move(t)) {
      SetType(type);
      SetProperties(fst_.Properties(kFstProperties, false));
      SetInputSymbols(fst_.InputSymbols());
      SetOutputSymbols(fst_.OutputSymbols());
    }
  
    // We make a thread-safe copy of the FST by default since an FST
    // implementation is expected to not share mutable data between objects.
    AddOnImpl(const AddOnImpl<FST, T> &impl)
        : fst_(impl.fst_, true), t_(impl.t_) {
      SetType(impl.Type());
      SetProperties(fst_.Properties(kCopyProperties, false));
      SetInputSymbols(fst_.InputSymbols());
      SetOutputSymbols(fst_.OutputSymbols());
    }
  
    StateId Start() const { return fst_.Start(); }
  
    Weight Final(StateId s) const { return fst_.Final(s); }
  
    size_t NumArcs(StateId s) const { return fst_.NumArcs(s); }
  
    size_t NumInputEpsilons(StateId s) const { return fst_.NumInputEpsilons(s); }
  
    size_t NumOutputEpsilons(StateId s) const {
      return fst_.NumOutputEpsilons(s);
    }
  
    size_t NumStates() const { return fst_.NumStates(); }
  
    static AddOnImpl<FST, T> *Read(std::istream &strm,
                                   const FstReadOptions &opts) {
      FstReadOptions nopts(opts);
      FstHeader hdr;
      if (!nopts.header) {
        hdr.Read(strm, nopts.source);
        nopts.header = &hdr;
      }
      std::unique_ptr<AddOnImpl<FST, T>> impl(
          new AddOnImpl<FST, T>(nopts.header->FstType()));
      if (!impl->ReadHeader(strm, nopts, kMinFileVersion, &hdr)) return nullptr;
      impl.reset();
      int32 magic_number = 0;
      ReadType(strm, &magic_number);  // Ensures this is an add-on FST.
      if (magic_number != kAddOnMagicNumber) {
        LOG(ERROR) << "AddOnImpl::Read: Bad add-on header: " << nopts.source;
        return nullptr;
      }
      FstReadOptions fopts(opts);
      fopts.header = nullptr;  // Contained header was written out.
      std::unique_ptr<FST> fst(FST::Read(strm, fopts));
      if (!fst) return nullptr;
      std::shared_ptr<T> t;
      bool have_addon = false;
      ReadType(strm, &have_addon);
      if (have_addon) {  // Reads add-on object if present.
        t = std::shared_ptr<T>(T::Read(strm, fopts));
        if (!t) return nullptr;
      }
      return new AddOnImpl<FST, T>(*fst, nopts.header->FstType(), t);
    }
  
    bool Write(std::ostream &strm, const FstWriteOptions &opts) const {
      FstHeader hdr;
      FstWriteOptions nopts(opts);
      nopts.write_isymbols = false;  // Allows contained FST to hold any symbols.
      nopts.write_osymbols = false;
      WriteHeader(strm, nopts, kFileVersion, &hdr);
      WriteType(strm, kAddOnMagicNumber);  // Ensures this is an add-on FST.
      FstWriteOptions fopts(opts);
      fopts.write_header = true;  // Forces writing contained header.
      if (!fst_.Write(strm, fopts)) return false;
      bool have_addon = !!t_;
      WriteType(strm, have_addon);
      // Writes add-on object if present.
      if (have_addon) t_->Write(strm, opts);
      return true;
    }
  
    void InitStateIterator(StateIteratorData<Arc> *data) const {
      fst_.InitStateIterator(data);
    }
  
    void InitArcIterator(StateId s, ArcIteratorData<Arc> *data) const {
      fst_.InitArcIterator(s, data);
    }
  
    FST &GetFst() { return fst_; }
  
    const FST &GetFst() const { return fst_; }
  
    const T *GetAddOn() const { return t_.get(); }
  
    std::shared_ptr<T> GetSharedAddOn() const { return t_; }
  
    void SetAddOn(std::shared_ptr<T> t) { t_ = t; }
  
   private:
    explicit AddOnImpl(const string &type) : t_() {
      SetType(type);
      SetProperties(kExpanded);
    }
  
    // Current file format version.
    static constexpr int kFileVersion = 1;
    // Minimum file format version supported.
    static constexpr int kMinFileVersion = 1;
  
    FST fst_;
    std::shared_ptr<T> t_;
  
    AddOnImpl &operator=(const AddOnImpl &) = delete;
  };
  
  template <class FST, class T>
  constexpr int AddOnImpl<FST, T>::kFileVersion;
  
  template <class FST, class T>
  constexpr int AddOnImpl<FST, T>::kMinFileVersion;
  
  }  // namespace internal
  }  // namespace fst
  
  #endif  // FST_ADD_ON_H_