From ae3cfd5700d20d30a06f5c27ea1c5e39a458c783 Mon Sep 17 00:00:00 2001
From: Michael Denkowski
Date: Mon, 23 Sep 2013 08:21:58 -0700
Subject: One extractor, multiple online contexts.

---
 python/cdec/sa/extractor.py | 14 ++++----------
 1 file changed, 4 insertions(+), 10 deletions(-)

(limited to 'python/cdec/sa/extractor.py')

diff --git a/python/cdec/sa/extractor.py b/python/cdec/sa/extractor.py
index acc13cbc..23534712 100644
--- a/python/cdec/sa/extractor.py
+++ b/python/cdec/sa/extractor.py
@@ -84,23 +84,17 @@ class GrammarExtractor:
         for fn in cdec.sa._SA_CONFIGURE:
             fn(config)
 
-    def grammar(self, sentence):
+    def grammar(self, sentence, ctx_name=None):
         if isinstance(sentence, unicode):
             sentence = sentence.encode('utf8')
         words = tuple(chain(('',), sentence.split(), ('',)))
         meta = cdec.sa.annotate(words)
         cnet = cdec.sa.make_lattice(words)
-        return self.factory.input(cnet, meta)
+        return self.factory.input(cnet, meta, ctx_name)
 
     # Add training instance to data
-    def add_instance(self, sentence, reference, alignment):
+    def add_instance(self, sentence, reference, alignment, ctx_name=None):
         f_words = cdec.sa.encode_words(sentence.split())
         e_words = cdec.sa.encode_words(reference.split())
         al = sorted(tuple(int(i) for i in pair.split('-')) for pair in alignment.split())
-        self.factory.add_instance(f_words, e_words, al)
-
-    # Debugging
-    def dump_online_stats(self):
-        self.factory.dump_online_stats()
-    def dump_online_rules(self):
-        self.factory.dump_online_rules()
\ No newline at end of file
+        self.factory.add_instance(f_words, e_words, al, ctx_name)
-- 
cgit v1.2.3