summaryrefslogtreecommitdiff
path: root/src/csplit.h
diff options
context:
space:
mode:
authorChris Dyer <redpony@gmail.com>2009-12-07 01:50:49 -0500
committerChris Dyer <redpony@gmail.com>2009-12-07 01:50:49 -0500
commitec7edcc7e398bdb040d810094b8416ad9f279d98 (patch)
treebdaea01e4317d04946de432d8b3a187881e63e96 /src/csplit.h
parentd6c82eaee9489a4d187a266a7d76a3e09cde119f (diff)
minor changes to the way the phonotactic prob is calculated
Diffstat (limited to 'src/csplit.h')
-rw-r--r--src/csplit.h7
1 files changed, 7 insertions, 0 deletions
diff --git a/src/csplit.h b/src/csplit.h
index 5911af77..54e5329d 100644
--- a/src/csplit.h
+++ b/src/csplit.h
@@ -4,6 +4,13 @@
#include "translator.h"
#include "lattice.h"
+// this "translator" takes single words (with NO SPACES) and segments
+// them using the approach described in:
+//
+// C. Dyer. (2009) Using a maximum entropy model to build segmentation
+// lattices for MT. In Proceedings of NAACL HLT 2009.
+// Note: an extra word-space marker ('#') is inserted at the left edge
+// of the forest!
struct CompoundSplitImpl;
struct CompoundSplit : public Translator {
CompoundSplit(const boost::program_options::variables_map& conf);