diff options
| author | Michael Denkowski <mdenkows@cs.cmu.edu> | 2014-02-24 23:25:27 -0800 | 
|---|---|---|
| committer | Michael Denkowski <mdenkows@cs.cmu.edu> | 2014-02-24 23:25:27 -0800 | 
| commit | 73bc12bb80316362c3ba0c5a745bfc9591f88c55 (patch) | |
| tree | 96b69ce6b035c79a54e3fb456cb3c3cce751c161 /python/cdec | |
| parent | 9cf584746a55fd724de6af39f2fbe7bff1b79643 (diff) | |
refactoring
Diffstat (limited to 'python/cdec')
| -rw-r--r-- | python/cdec/sa/features.py | 12 | 
1 files changed, 3 insertions, 9 deletions
```diff
diff --git a/python/cdec/sa/features.py b/python/cdec/sa/features.py
index fe3fb2bd..f5cbdb8d 100644
--- a/python/cdec/sa/features.py
+++ b/python/cdec/sa/features.py
@@ -142,17 +142,11 @@ def IsSupportedOnline(ctx): # Occurs in online data?
         return False
 
 def CountExceptLM(vocab):
-    def CountExceptLM(ctx): # In bitext (inc online data) but NOT mono text
+    def CountExceptLM(ctx): # Word count in bitext (inc online data) but NOT mono text
         return sum(1 for e in ctx.ephrase.words if e not in vocab)
     return CountExceptLM
 
 def CountExceptLex(ttable):
-    def CountExceptLex(ctx):
-        count = 0.0
-        for e in ctx.ephrase.words:
-            if not ttable.contains_e_word(e):
-                count += 1
-        return count
+    def CountExceptLex(ctx): # Word count in online data but NOT original bitext
+        return sum(1 for e in ctx.ephrase.words if not ttable.contains_e_word(e))
     return CountExceptLex
-
-
```
