diff options
author | Patrick Simianer <p@simianer.de> | 2014-10-13 19:03:48 +0100 |
---|---|---|
committer | Patrick Simianer <p@simianer.de> | 2014-10-13 19:03:48 +0100 |
commit | cb9fb7088dde35881516c088db402abe747d49fa (patch) | |
tree | a91e4935a7941f1b261f76d88ab41fa3078a1891 /python/cdec/sa/rule.pxi | |
parent | 0a00e57e921c8eca8e02364db7d2e6607bfdcebc (diff) | |
parent | b1ed81ef3216b212295afa76c5d20a56fb647204 (diff) |
Merge remote-tracking branch 'upstream/master'
Diffstat (limited to 'python/cdec/sa/rule.pxi')
-rw-r--r-- | python/cdec/sa/rule.pxi | 19 |
1 files changed, 19 insertions, 0 deletions
diff --git a/python/cdec/sa/rule.pxi b/python/cdec/sa/rule.pxi index 7fde3e06..af8fabea 100644 --- a/python/cdec/sa/rule.pxi +++ b/python/cdec/sa/rule.pxi @@ -154,6 +154,25 @@ cdef class Phrase: property words: def __get__(self): return [sym_tostring(w) for w in self if not sym_isvar(w)] + + def iterspans(self, nt_flag = False, to_str = True): + """iterate over (terminal and nonterminal) spans, it generates pairs of the kind (terminal span, !nt_flag) or (nonterminal, nt_flag) + Example: iterspans(False, False) --> ([-1], False), ([2,3], True), ([-1], False), ([4], True), ([-1], False) + for the sequence -1 2 3 -1 4 -1""" + span = [] + cdef int i, s + get_sym = lambda sym : sym_tostring(sym) if to_str else lambda sym : sym + for i from 0 <= i < self.n: + s = self.syms[i] + if sym_isvar(s): + if len(span): + yield (span, not nt_flag) + span = [] + yield ([get_sym(s)], nt_flag) + else: + span.append(get_sym(s)) + if len(span): + yield (span, not nt_flag) cdef class Rule: |