Merge branch 'master' of github.com:redpony/cdec

author: armatthews <armatthe@cmu.edu> 2014-10-13 14:59:23 -0400
committer: armatthews <armatthe@cmu.edu> 2014-10-13 14:59:23 -0400
commit: b26cda84e05d4523eee069234a975a0153bf8608 (patch)
tree: 61c9da4f8dd6070f27c8e81812a76fc0a8cf2d8d /klm/lm/wrappers/nplm.hh
parent: cd7bc67f475fdfd07fba003ac4cca40e83944740 (diff)
parent: b1ed81ef3216b212295afa76c5d20a56fb647204 (diff)
1 files changed, 83 insertions, 0 deletions
diff --git a/klm/lm/wrappers/nplm.hh b/klm/lm/wrappers/nplm.hh
new file mode 100644
index 00000000..b7dd4a21
--- /dev/null
+++ b/klm/lm/wrappers/nplm.hh
@@ -0,0 +1,83 @@
+#ifndef LM_WRAPPERS_NPLM_H
+#define LM_WRAPPERS_NPLM_H
+
+#include "lm/facade.hh"
+#include "lm/max_order.hh"
+#include "util/string_piece.hh"
+
+#include <boost/thread/tss.hpp>
+#include <boost/scoped_ptr.hpp>
+
+/* Wrapper to NPLM "by Ashish Vaswani, with contributions from David Chiang
+ * and Victoria Fossum."  
+ * http://nlg.isi.edu/software/nplm/
+ */
+
+namespace nplm {
+class vocabulary;
+class neuralLM;
+} // namespace nplm
+
+namespace lm {
+namespace np {
+
+class Vocabulary : public base::Vocabulary {
+  public:
+    Vocabulary(const nplm::vocabulary &vocab);
+
+    ~Vocabulary();
+
+    WordIndex Index(const std::string &str) const;
+
+    // TODO: lobby them to support StringPiece
+    WordIndex Index(const StringPiece &str) const {
+      return Index(std::string(str.data(), str.size()));
+    }
+
+    lm::WordIndex NullWord() const { return null_word_; }
+
+  private:
+    const nplm::vocabulary &vocab_;
+
+    const lm::WordIndex null_word_;
+};
+
+// Sorry for imposing my limitations on your code.
+#define NPLM_MAX_ORDER 7
+
+struct State {
+  WordIndex words[NPLM_MAX_ORDER - 1];
+};
+
+class Model : public lm::base::ModelFacade<Model, State, Vocabulary> {
+  private:
+    typedef lm::base::ModelFacade<Model, State, Vocabulary> P;
+
+  public:
+    // Does this look like an NPLM?
+    static bool Recognize(const std::string &file);
+
+    explicit Model(const std::string &file, std::size_t cache_size = 1 << 20);
+
+    ~Model();
+
+    FullScoreReturn FullScore(const State &from, const WordIndex new_word, State &out_state) const;
+
+    FullScoreReturn FullScoreForgotState(const WordIndex *context_rbegin, const WordIndex *context_rend, const WordIndex new_word, State &out_state) const;
+
+  private:
+    boost::scoped_ptr<nplm::neuralLM> base_instance_;
+
+    mutable boost::thread_specific_ptr<nplm::neuralLM> backend_;
+
+    Vocabulary vocab_;
+
+    lm::WordIndex null_word_;
+
+    const std::size_t cache_size_;
+};
+
+} // namespace np
+} // namespace lm
+
+#endif // LM_WRAPPERS_NPLM_H
author	armatthews <armatthe@cmu.edu>	2014-10-13 14:59:23 -0400
committer	armatthews <armatthe@cmu.edu>	2014-10-13 14:59:23 -0400
commit	b26cda84e05d4523eee069234a975a0153bf8608 (patch)
tree	61c9da4f8dd6070f27c8e81812a76fc0a8cf2d8d /klm/lm/wrappers/nplm.hh
parent	cd7bc67f475fdfd07fba003ac4cca40e83944740 (diff)
parent	b1ed81ef3216b212295afa76c5d20a56fb647204 (diff)