summaryrefslogtreecommitdiff
path: root/test_parse.rb
blob: 018767576757e201a19522b7b00d6c0106284172 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
#!/usr/bin/env ruby

require_relative 'parse'


# Escapes +word+ so it can sit inside a double-quoted JSON string literal:
# every backslash and every double quote gets a leading backslash.
def chart2json_escape word
  # Block form: the replacement is used literally, so backslashes in it are
  # not interpreted as backreferences by gsub.
  word.gsub(/["\\]/) { |c| "\\#{c}" }
end

# Renders one side of a rule (an array of grammar symbols) as space-separated
# text. Grammar::NT elements become "[symbol,index]"; every other element
# contributes its escaped +word+. If +index_offset+ is given, it is added to
# each non-terminal index before printing.
def chart2json_side symbols, index_offset=nil
  symbols.map { |x|
    if x.class == Grammar::NT
      index = index_offset ? x.index+index_offset : x.index
      "[#{x.symbol},#{index}]"
    else
      chart2json_escape x.word
    end
  }.join ' '
end

# Builds the JSON object text for the edge that +item+ (found in chart cell
# i,j) contributes. +spancat2id+ maps "symbol,left,right" keys to node ids.
def chart2json_edge item, i, j, spancat2id
  head = spancat2id["#{item.lhs.symbol},#{i},#{j}"]
  if item.tail_spans.empty?
    # No tails: the edge hangs off the artificial root node (id -1).
    target_offset = 0
    tails = '-1'
  else
    # NOTE(review): target indices are printed one higher than stored when the
    # item has tails, while rhs indices are printed as stored -- presumably the
    # consumer wants 1-based target indices; confirm.
    target_offset = 1
    # tail_spans is looked up by rhs position; only non-terminal positions
    # contribute a tail node.
    tails = item.rhs.each_with_index.select { |x, _| x.class == Grammar::NT }.map { |x, q|
      span = item.tail_spans[q]
      spancat2id["#{x.symbol},#{span.left},#{span.right}"]
    }.join ', '
  end
  rule = "[#{item.lhs.symbol}] ||| #{chart2json_side(item.rhs)} ||| #{chart2json_side(item.target, target_offset)} |||"
  # NOTE(review): relies on item.f.to_s looking like a Ruby hash literal whose
  # "=>" can be swapped for ":" to give JSON -- confirm for the real type of f.
  "{ \"head\":#{head}, \"rule\":\"#{rule}\", \"tails\":[#{tails}], \"f\":#{item.f.to_s.gsub('=>',':')} }"
end

# Prints the passive chart to stdout as a JSON hypergraph with three keys:
# "weights" (fixed values), "nodes" and "edges".
#
# Nodes: one per distinct lhs symbol per visited cell, numbered from 0 in
# visiting order, followed by an artificial "root" node with id -1.
# Edges: one per chart item, pointing at the node for the item's lhs/span.
#
# passive_chart - object whose at(i,j) returns the items of cell (i,j).
# n             - upper bound handed to visit(1, 0, n); main passes the
#                 number of input tokens.
#
# Returns nil (the value of the final puts).
def chart2json passive_chart, n
  id = 0
  spancat2id = {}
  puts "{"
  puts "\"weights\":{ \"logp\":2.0, \"use_shell\":1.0 },"
  puts "\"nodes\":"
  puts "["
  visit(1, 0, n) { |i,j|
    seen = {}
    passive_chart.at(i,j).each { |item|
      cat = item.lhs.symbol
      # Several items in a cell may share an lhs symbol; emit the node once.
      next if seen[cat]
      seen[cat] = true
      puts "{ \"id\":#{id}, \"cat\":\"#{cat}\", \"span\":[#{i},#{j}] },"
      spancat2id["#{cat},#{i},#{j}"] = id
      id += 1
    }
  }
  # The root node closes the list, so it is the only entry without a comma.
  puts "{ \"id\":-1, \"cat\":\"root\", \"span\":[-1, -1] }"
  puts "],"
  puts "\"edges\":"
  puts "["
  edges = []
  visit(1, 0, n) { |i,j|
    passive_chart.at(i,j).each { |item|
      edges << chart2json_edge(item, i, j, spancat2id)
    }
  }
  puts edges.join(",\n")
  puts "]"
  puts "}"
end


# Script driver: tokenizes one hard-coded sentence, loads the grammar from
# example/3/grammar.3.gz, adds glue rules, runs init and parse over a pair of
# fresh charts and finally hands the passive chart to chart2json.
# Progress messages are written to STDERR.
def main
  STDERR.print "> reading input from TODO\n"
  # Other sentences that can be swapped in:
  #tokens = 'ich sah ein kleines haus'.split
  #tokens = 'lebensmittel schuld an europäischer inflation'.split
  tokens = 'offizielle prognosen sind von nur 3 prozent ausgegangen , meldete bloomberg .'.split
  length = tokens.size

  STDERR.print "> reading grammar\n"
  grammar = Grammar::Grammar.new('example/3/grammar.3.gz')
  STDERR.print ">> adding glue grammar\n"
  grammar.add_glue_rules
  # NOTE(review): the message below is still logged although the
  # pass-through step itself is commented out.
  STDERR.print ">> adding pass-through grammar\n"
  #grammar.add_pass_through_rules tokens

  STDERR.print "> initializing charts\n"
  passive = Chart.new(length)
  active = Chart.new(length)
  init(tokens, length, active, passive, grammar)

  STDERR.print "> parsing\n"
  parse(tokens, length, active, passive, grammar)

  # Debug dump of the passive chart, kept for reference:
  #puts "\n---\npassive chart"
  #visit(1, 0, 5) { |i,j| puts "#{i},#{j}"; passive.at(i,j).each { |item| puts " #{j} #{item.to_s}" }; puts }

  chart2json(passive, length)
end


# Run the driver as soon as this file is executed or loaded.
main