1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
|
module Grammar
# Terminal symbol of a rule: a thin wrapper around one word.
class T
  attr_accessor :word

  # word - the token this terminal carries.
  def initialize(word)
    @word = word
  end

  # Renders the terminal as "T<word>".
  def to_s
    "T<#{word}>"
  end
end
# Non-terminal symbol with an optional index.
#
# symbol - the category name (e.g. 'S', 'X').
# index  - integer position of the non-terminal; nil or a negative value
#          means "no index". When parsed from a string the written number
#          is decremented by one, so "[X,1]" is stored with index 0 and
#          "[X]" with index -1.
class NT
  attr_accessor :symbol, :index

  def initialize(symbol = nil, index = nil)
    @symbol = symbol
    @index = index
  end

  # Fills this instance from a bracketed string such as "[X,1]" or "[S]".
  #
  # Raises ArgumentError when the string holds no symbol at all (e.g. "[]"),
  # instead of failing later with an opaque NoMethodError on nil.
  # Returns the stored index.
  def from_s(s)
    symbol, index = s.delete('[]').split(',')
    raise ArgumentError, "no symbol in non-terminal #{s.inspect}" if symbol.nil?
    @symbol = symbol.strip
    # nil.to_i is 0, so a missing index becomes -1 ("unindexed").
    @index = index.to_i - 1
  end

  # Builds a new non-terminal from its bracketed string form.
  def self.from_s(s)
    nt = new
    nt.from_s(s)
    nt
  end

  # "NT<symbol,index>" when an index is present, otherwise "NT<symbol>".
  # A nil index (as produced by NT.new('S')) is treated as "no index".
  def to_s
    return "NT<#{@symbol},#{@index}>" if @index && @index >= 0
    "NT<#{@symbol}>"
  end
end
# A grammar rule with a left-hand side non-terminal, a source right-hand
# side, a target side and a feature vector.
#
# lhs    - NT on the left of the arrow.
# rhs    - Array of T / NT items (source side).
# target - Array of T / NT items (target side).
# map    - Array holding, for each NT on the target side in order, that
#          NT's index.
# f      - feature vector; defaults to SparseVector.new (SparseVector is
#          defined outside this section).
class Rule
  attr_accessor :lhs, :rhs, :target, :map, :f

  def initialize(lhs = nil, rhs = nil, target = nil, map = nil, f = SparseVector.new)
    @lhs = lhs
    @rhs = rhs
    @target = target
    @map = map || []
    @f = f
    @arity_ = nil
  end

  # "LHS -> rhs items ||| target items [arity=N]".
  def to_s
    source_side = @rhs.map { |i| i.to_s }.join(' ')
    target_side = @target.map { |i| i.to_s }.join(' ')
    "#{@lhs} -> #{source_side} ||| #{target_side} [arity=#{arity}]"
  end

  # Number of non-terminals on the source side. The value is cached after
  # the first call; from_s clears the cache when it replaces rhs.
  def arity
    @arity_ ||= rhs.count { |i| i.instance_of?(NT) }
  end

  # Parses one whitespace-separated side of a rule into T / NT objects.
  # Tokens wrapped in square brackets become NTs, everything else a T.
  # With fill_map set, each NT's index is appended to @map.
  def read_right_(s, fill_map = false)
    s.split.map do |token|
      if token.start_with?('[') && token.end_with?(']')
        nt = NT.from_s(token)
        @map << nt.index if fill_map
        nt
      else
        T.new(token)
      end
    end
  end

  # Fills this rule from its string form.
  #
  # The line is cut into lhs, rhs, target and an optional feature field by
  # splitpipe (helper defined elsewhere; presumably splits on '|||' --
  # confirm). Without a feature field, f is set to nil.
  def from_s(s)
    lhs, rhs, target, f = splitpipe(s, 3)
    # Start from a clean slate so re-parsing into an existing rule does not
    # accumulate alignment entries or keep a stale cached arity.
    @map = []
    @arity_ = nil
    @lhs = NT.from_s(lhs)
    @rhs = read_right_(rhs)
    @target = read_right_(target, true)
    @f = (f ? SparseVector.from_kv(f) : nil)
  end

  # Builds a new rule from its string form.
  def self.from_s(s)
    rule = new
    rule.from_s(s)
    rule
  end

  # Older name for Rule.from_s, kept so existing callers keep working.
  def self.from_s_x(s)
    from_s(s)
  end
end
# A set of rules read from a file, bucketed by how their source side starts.
#
# rules  - every rule, in insertion order.
# startn - rules whose source side starts with a non-terminal.
# startt - rules that start with something else and contain at least one
#          non-terminal.
# flat   - rules that start with something else and contain no
#          non-terminal.
class Grammar
  attr_accessor :rules, :startn, :startt, :flat

  # Reads one rule per line from fn via ReadFile.readlines_strip (defined
  # elsewhere; presumably yields the stripped lines of the file -- confirm).
  # Progress is reported on STDERR: one dot per rule and the running count
  # after every 80th rule.
  def initialize(fn)
    @rules = []
    @startn = []
    @startt = []
    @flat = []
    ReadFile.readlines_strip(fn).each_with_index do |s, i|
      STDERR.write '.'
      STDERR.write " #{i + 1}\n" if ((i + 1) % 80).zero?
      # Rule.from_s_x is the string constructor Rule defines in this file.
      rule = Rule.from_s_x(s)
      @rules << rule
      if rule.rhs.first.instance_of?(NT)
        @startn << rule
      elsif rule.arity == 0
        @flat << rule
      else
        @startt << rule
      end
    end
    STDERR.write "\n"
  end

  # All rules, one per line.
  def to_s
    @rules.map { |r| "#{r}\n" }.join
  end

  # For every left-hand-side symbol other than 'S', adds the glue rules
  #   S -> symbol(0)   and   S -> S(0) X(1)
  # to both rules and startn.
  # NOTE(review): the binary rule is appended once per symbol, so several
  # identical copies exist when the grammar has several symbols -- confirm
  # this is intended.
  def add_glue_rules
    symbols = @rules.map { |r| r.lhs.symbol }.reject { |s| s == 'S' }.uniq
    symbols.each do |symbol|
      @rules << Rule.new(NT.new('S'), [NT.new(symbol, 0)], [NT.new(symbol, 0)], [0])
      @startn << @rules.last
      # Both sides are exactly two non-terminals: S at index 0, X at index 1.
      @rules << Rule.new(NT.new('S'),
                         [NT.new('S', 0), NT.new('X', 1)],
                         [NT.new('S', 0), NT.new('X', 1)],
                         [0, 1])
      @startn << @rules.last
    end
  end

  # Adds an identity rule X -> word ||| word for every word in s, and
  # registers it as a flat rule.
  def add_pass_through_rules(s)
    s.each do |word|
      @rules << Rule.new(NT.new('X'), [T.new(word)], [T.new(word)])
      @flat << @rules.last
    end
  end
end
end # module
|