Merge branch 'const_reorder_2' into softsyn_2

author: Wu, Ke <wuke@cs.umd.edu> 2014-12-17 16:15:13 -0500
committer: Wu, Ke <wuke@cs.umd.edu> 2014-12-17 16:15:13 -0500
commit: 17dbb7d5ab1544899b1b9e867d2246a0a93e3aa8 (patch)
tree: 7fa2a51763a1b67fb325e86b0e3f764dd119cd70 /klm/lm/wrappers/nplm.hh
parent: 1983c75c35b7f5dc3f356a2f9a9345d632b87650 (diff)
parent: 1613f1fc44ca67820afd7e7b21eb54b316c8ce55 (diff)
1 files changed, 83 insertions, 0 deletions
diff --git a/klm/lm/wrappers/nplm.hh b/klm/lm/wrappers/nplm.hh
new file mode 100644
index 00000000..b7dd4a21
--- /dev/null
+++ b/klm/lm/wrappers/nplm.hh
@@ -0,0 +1,83 @@
+#ifndef LM_WRAPPERS_NPLM_H
+#define LM_WRAPPERS_NPLM_H
+
+#include "lm/facade.hh"
+#include "lm/max_order.hh"
+#include "util/string_piece.hh"
+
+#include <boost/thread/tss.hpp>
+#include <boost/scoped_ptr.hpp>
+
+/* Wrapper to NPLM "by Ashish Vaswani, with contributions from David Chiang
+ * and Victoria Fossum."  
+ * http://nlg.isi.edu/software/nplm/
+ */
+
+namespace nplm {
+class vocabulary;
+class neuralLM;
+} // namespace nplm
+
+namespace lm {
+namespace np {
+
+class Vocabulary : public base::Vocabulary {
+  public:
+    Vocabulary(const nplm::vocabulary &vocab);
+
+    ~Vocabulary();
+
+    WordIndex Index(const std::string &str) const;
+
+    // TODO: lobby them to support StringPiece
+    WordIndex Index(const StringPiece &str) const {
+      return Index(std::string(str.data(), str.size()));
+    }
+
+    lm::WordIndex NullWord() const { return null_word_; }
+
+  private:
+    const nplm::vocabulary &vocab_;
+
+    const lm::WordIndex null_word_;
+};
+
+// Sorry for imposing my limitations on your code.
+#define NPLM_MAX_ORDER 7
+
+struct State {
+  WordIndex words[NPLM_MAX_ORDER - 1];
+};
+
+class Model : public lm::base::ModelFacade<Model, State, Vocabulary> {
+  private:
+    typedef lm::base::ModelFacade<Model, State, Vocabulary> P;
+
+  public:
+    // Does this look like an NPLM?
+    static bool Recognize(const std::string &file);
+
+    explicit Model(const std::string &file, std::size_t cache_size = 1 << 20);
+
+    ~Model();
+
+    FullScoreReturn FullScore(const State &from, const WordIndex new_word, State &out_state) const;
+
+    FullScoreReturn FullScoreForgotState(const WordIndex *context_rbegin, const WordIndex *context_rend, const WordIndex new_word, State &out_state) const;
+
+  private:
+    boost::scoped_ptr<nplm::neuralLM> base_instance_;
+
+    mutable boost::thread_specific_ptr<nplm::neuralLM> backend_;
+
+    Vocabulary vocab_;
+
+    lm::WordIndex null_word_;
+
+    const std::size_t cache_size_;
+};
+
+} // namespace np
+} // namespace lm
+
+#endif // LM_WRAPPERS_NPLM_H
author	Wu, Ke <wuke@cs.umd.edu>	2014-12-17 16:15:13 -0500
committer	Wu, Ke <wuke@cs.umd.edu>	2014-12-17 16:15:13 -0500
commit	17dbb7d5ab1544899b1b9e867d2246a0a93e3aa8 (patch)
tree	7fa2a51763a1b67fb325e86b0e3f764dd119cd70 /klm/lm/wrappers/nplm.hh
parent	1983c75c35b7f5dc3f356a2f9a9345d632b87650 (diff)
parent	1613f1fc44ca67820afd7e7b21eb54b316c8ce55 (diff)