Blame view
src/lm/kaldi-rnnlm.h
3.13 KB
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 |
// lm/kaldi-rnnlm.h // Copyright 2015 Guoguo Chen // See ../../COPYING for clarification regarding multiple authors // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE, // MERCHANTABLITY OR NON-INFRINGEMENT. // See the Apache 2 License for the specific language governing permissions and // limitations under the License. #ifndef KALDI_LM_KALDI_RNNLM_H_ #define KALDI_LM_KALDI_RNNLM_H_ #include <string> #include <vector> #include "base/kaldi-common.h" #include "fstext/deterministic-fst.h" #include "lm/mikolov-rnnlm-lib.h" #include "util/common-utils.h" namespace kaldi { struct KaldiRnnlmWrapperOpts { std::string unk_symbol; std::string eos_symbol; KaldiRnnlmWrapperOpts() : unk_symbol("<RNN_UNK>"), eos_symbol("</s>") {} void Register(OptionsItf *opts) { opts->Register("unk-symbol", &unk_symbol, "Symbol for out-of-vocabulary " "words in rnnlm."); opts->Register("eos-symbol", &eos_symbol, "End of setence symbol in " "rnnlm."); } }; class KaldiRnnlmWrapper { public: KaldiRnnlmWrapper(const KaldiRnnlmWrapperOpts &opts, const std::string &unk_prob_rspecifier, const std::string &word_symbol_table_rxfilename, const std::string &rnnlm_rxfilename); int32 GetHiddenLayerSize() const { return rnnlm_.getHiddenLayerSize(); } int32 GetEos() const { return eos_; } BaseFloat GetLogProb(int32 word, const std::vector<int32> &wseq, const std::vector<float> &context_in, std::vector<float> *context_out); private: rnnlm::CRnnLM rnnlm_; std::vector<std::string> label_to_word_; int32 eos_; KALDI_DISALLOW_COPY_AND_ASSIGN(KaldiRnnlmWrapper); }; class RnnlmDeterministicFst : public fst::DeterministicOnDemandFst<fst::StdArc> { public: typedef fst::StdArc::Weight Weight; typedef fst::StdArc::StateId StateId; typedef fst::StdArc::Label Label; // Does not take ownership. RnnlmDeterministicFst(int32 max_ngram_order, KaldiRnnlmWrapper *rnnlm); // We cannot use "const" because the pure virtual function in the interface is // not const. virtual StateId Start() { return start_state_; } // We cannot use "const" because the pure virtual function in the interface is // not const. virtual Weight Final(StateId s); virtual bool GetArc(StateId s, Label ilabel, fst::StdArc* oarc); private: typedef unordered_map<std::vector<Label>, StateId, VectorHasher<Label> > MapType; StateId start_state_; MapType wseq_to_state_; std::vector<std::vector<Label> > state_to_wseq_; KaldiRnnlmWrapper *rnnlm_; int32 max_ngram_order_; std::vector<std::vector<float> > state_to_context_; }; } // namespace kaldi #endif // KALDI_LM_KALDI_RNNLM_H_ |