summaryrefslogtreecommitdiff
path: root/python/cdec
diff options
context:
space:
mode:
author Michael Denkowski <mdenkows@cs.cmu.edu> 2014-02-24 23:25:27 -0800
committer Michael Denkowski <mdenkows@cs.cmu.edu> 2014-02-24 23:25:27 -0800
commit 3cb43f4e3980457cbb7b749cee51a5bb777e18f8 (patch)
tree 839a04a281d0673b718e837960f3333b42923446 /python/cdec
parent 6b0afcb161141cdb64e249adfb3708682febc089 (diff)
refactoring
Diffstat (limited to 'python/cdec')
-rw-r--r-- python/cdec/sa/features.py 12
1 files changed, 3 insertions, 9 deletions
diff --git a/python/cdec/sa/features.py b/python/cdec/sa/features.py
index fe3fb2bd..f5cbdb8d 100644
--- a/python/cdec/sa/features.py
+++ b/python/cdec/sa/features.py
@@ -142,17 +142,11 @@ def IsSupportedOnline(ctx): # Occurs in online data?
return False
def CountExceptLM(vocab):
- def CountExceptLM(ctx): # In bitext (inc online data) but NOT mono text
+ def CountExceptLM(ctx): # Word count in bitext (inc online data) but NOT mono text
return sum(1 for e in ctx.ephrase.words if e not in vocab)
return CountExceptLM
def CountExceptLex(ttable):
- def CountExceptLex(ctx):
- count = 0.0
- for e in ctx.ephrase.words:
- if not ttable.contains_e_word(e):
- count += 1
- return count
+ def CountExceptLex(ctx): # Word count in online data but NOT original bitext
+ return sum(1 for e in ctx.ephrase.words if not ttable.contains_e_word(e))
return CountExceptLex
-
-