diff options
author | philblunsom@gmail.com <philblunsom@gmail.com@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-06-29 23:21:55 +0000 |
---|---|---|
committer | philblunsom@gmail.com <philblunsom@gmail.com@ec762483-ff6d-05da-a07a-a48fb63a330f> | 2010-06-29 23:21:55 +0000 |
commit | 7390212db70aa86e55210cc621a06b91626d635a (patch) | |
tree | 6cc94e53486b31936b2c54d44cfba9cf01569847 /gi | |
parent | 5791e37a13c657528588e4d84c588c76065545c7 (diff) |
Added singleton filter.
git-svn-id: https://ws10smt.googlecode.com/svn/trunk@72 ec762483-ff6d-05da-a07a-a48fb63a330f
Diffstat (limited to 'gi')
-rw-r--r-- | gi/pyp-topics/src/contexts_corpus.cc | 2 |
1 file changed, 1 insertion, 1 deletion
```diff
diff --git a/gi/pyp-topics/src/contexts_corpus.cc b/gi/pyp-topics/src/contexts_corpus.cc
index e9644d5a..ad9554f5 100644
--- a/gi/pyp-topics/src/contexts_corpus.cc
+++ b/gi/pyp-topics/src/contexts_corpus.cc
@@ -35,7 +35,7 @@ void read_callback(const ContextsLexer::PhraseContextsType& new_contexts, void*
 // filter out singleton contexts
 if (!counts->empty()) {
 map<string,int>::const_iterator find_it = counts->find(context_str);
- if (find_it == counts->end() || find_it->second == 1)
+ if (find_it == counts->end() || find_it->second < 5)
 continue;
 }
```