1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
|
cimport lattice
from utils cimport *
cdef class Lattice:
    """Python wrapper around a heap-allocated C++ ``lattice.Lattice``.

    The wrapper behaves like a fixed-length sequence of nodes.  Indexing a
    node returns a tuple of ``(label, dist2next)`` pairs, one per outgoing
    arc, where ``label`` is a unicode string and ``dist2next`` is the value
    of the arc's ``dist2next`` field.
    """
    # Owned C++ object: allocated in __cinit__, released in __dealloc__.
    cdef lattice.Lattice* lattice

    def __cinit__(self):
        self.lattice = new lattice.Lattice()

    def __init__(self, inp):
        """Lattice(tuple) -> Lattice from node list.
        Lattice(string) -> Lattice from PLF representation.

        A tuple input must contain one tuple of ``(label, dist2next)`` arcs
        per node.  Any other input type raises TypeError.
        """
        if isinstance(inp, tuple):
            # Size the lattice first: __setitem__ bounds-checks against len(self).
            self.lattice.resize(len(inp))
            for i, arcs in enumerate(inp):
                self[i] = arcs
        elif isinstance(inp, basestring):
            lattice.ConvertTextOrPLF(as_str(inp), self.lattice)
        else:
            raise TypeError('cannot create lattice from %s' % type(inp))

    def __dealloc__(self):
        del self.lattice

    def __getitem__(self, int index):
        """Return the arcs leaving node ``index`` as a tuple of
        ``(label, dist2next)`` pairs.

        Raises IndexError unless ``0 <= index < len(self)``; negative
        indices are not supported.
        """
        if not 0 <= index < len(self):
            raise IndexError('lattice index out of range')
        # Local copy of the node's arc vector.
        cdef vector[lattice.LatticeArc] arc_vector = self.lattice[0][index]
        cdef lattice.LatticeArc* arc
        cdef unsigned i
        arcs = []
        for i in range(arc_vector.size()):
            arc = &arc_vector[i]
            label = unicode(TDConvert(arc.label).c_str(), 'utf8')
            # NOTE: only (label, dist2next) is exposed; a three-field variant
            # that also returned arc.features was disabled in the original.
            arcs.append((label, arc.dist2next))
        return tuple(arcs)

    def __setitem__(self, int index, tuple arcs):
        """Append the given ``(label, dist2next)`` arcs to node ``index``.

        Arcs are added with push_back; arcs already stored on the node are
        not cleared first.  Only the ``label`` and ``dist2next`` fields are
        set; every other field keeps its default-constructed value.

        Raises IndexError unless ``0 <= index < len(self)``.
        """
        cdef lattice.LatticeArc* arc
        if not 0 <= index < len(self):
            raise IndexError('lattice index out of range')
        for (label, dist2next) in arcs:
            label_str = as_str(label)
            arc = new lattice.LatticeArc()
            try:
                # Previously the default-constructed arc was stored as-is, so
                # the supplied label and distance were silently dropped.
                arc.label = TDConvert(label_str)
                arc.dist2next = dist2next
                # push_back stores a copy, so the temporary can be freed.
                self.lattice[0][index].push_back(arc[0])
            finally:
                # Free the temporary even if a value conversion above raised.
                del arc

    def __len__(self):
        """Return the number of nodes in the lattice."""
        return self.lattice.size()

    def __str__(self):
        """Return the PLF string produced by ``hypergraph.AsPLF``."""
        return str(hypergraph.AsPLF(self.lattice[0], True).c_str())

    def __unicode__(self):
        """Return ``str(self)`` decoded as UTF-8."""
        return unicode(str(self), 'utf8')

    def __iter__(self):
        """Yield the arc tuple of every node, in index order."""
        cdef unsigned i
        for i in range(len(self)):
            yield self[i]

    def todot(self):
        """lattice.todot() -> Representation of the lattice in GraphViz dot format.

        The result is a UTF-8 encoded string.  Each arc becomes an edge from
        its node index ``i`` to ``i + dist2next``, labelled with the arc
        label (double quotes escaped).
        """
        def lines():
            yield 'digraph lattice {'
            yield 'rankdir = LR;'
            yield 'node [shape=circle];'
            for i, arcs in enumerate(self):
                # Arcs are (label, dist2next) pairs, matching __getitem__;
                # unpacking three values here used to raise ValueError.
                for label, delta in arcs:
                    yield '%d -> %d [label="%s"];' % (i, i+delta, label.replace('"', '\\"'))
            # The state just past the last node is drawn as the final state.
            yield '%d [shape=doublecircle]' % len(self)
            yield '}'
        return '\n'.join(lines()).encode('utf8')

    def as_hypergraph(self):
        """lattice.as_hypergraph() -> Hypergraph representation of the lattice."""
        # __new__ is used so the wrapper's hg pointer can be set directly here.
        cdef Hypergraph result = Hypergraph.__new__(Hypergraph)
        result.hg = new hypergraph.Hypergraph()
        # Conversion goes through the PLF text form of this lattice.
        cdef bytes plf = str(self)
        hypergraph.ReadFromPLF(plf, result.hg)
        return result
|