diff options
author | Chris Dyer <redpony@gmail.com> | 2009-12-07 01:50:49 -0500 |
---|---|---|
committer | Chris Dyer <redpony@gmail.com> | 2009-12-07 01:50:49 -0500 |
commit | ec7edcc7e398bdb040d810094b8416ad9f279d98 (patch) | |
tree | bdaea01e4317d04946de432d8b3a187881e63e96 /src/csplit.h | |
parent | d6c82eaee9489a4d187a266a7d76a3e09cde119f (diff) |
minor changes to the way the phonotactic prob is calculated
Diffstat (limited to 'src/csplit.h')
-rw-r--r-- | src/csplit.h | 7 |
1 files changed, 7 insertions, 0 deletions
diff --git a/src/csplit.h b/src/csplit.h
index 5911af77..54e5329d 100644
--- a/src/csplit.h
+++ b/src/csplit.h
@@ -4,6 +4,13 @@
 #include "translator.h"
 #include "lattice.h"
 
+// this "translator" takes single words (with NO SPACES) and segments
+// them using the approach described in:
+//
+// C. Dyer. (2009) Using a maximum entropy model to build segmentation
+// lattices for MT. In Proceedings of NAACL HLT 2009.
+// note, an extra word space marker # is inserted at the left edge of
+// the forest!
 struct CompoundSplitImpl;
 struct CompoundSplit : public Translator {
   CompoundSplit(const boost::program_options::variables_map& conf);