summaryrefslogtreecommitdiff
path: root/prototype/weaver.rb
diff options
context:
space:
mode:
authorPatrick Simianer <p@simianer.de>2015-03-23 11:01:45 +0100
committerPatrick Simianer <p@simianer.de>2015-03-23 11:01:45 +0100
commite84265273b121eb5fbf465b80ea39d43602703fe (patch)
treea9d81c8493eec4fb360c86d3645c5845ee034268 /prototype/weaver.rb
parentcaf2fa0398fc29d373bce5b3a6cd54e3948e9866 (diff)
fix prototype
Diffstat (limited to 'prototype/weaver.rb')
-rwxr-xr-xprototype/weaver.rb82
1 files changed, 0 insertions, 82 deletions
diff --git a/prototype/weaver.rb b/prototype/weaver.rb
deleted file mode 100755
index 5cda844..0000000
--- a/prototype/weaver.rb
+++ /dev/null
@@ -1,82 +0,0 @@
-#!/usr/bin/env ruby
-
-require 'trollop'
-require 'xmlsimple'
-require_relative 'parse'
-
-def read_grammar fn, add_glue, add_pass_through, input=nil
- STDERR.write "> reading grammar '#{fn}'\n"
- grammar = Grammar::Grammar.new fn
- if add_glue
- STDERR.write ">> adding glue rules\n"
- grammar.add_glue_rules
- end
- if add_pass_through
- STDERR.write ">> adding pass-through rules\n"
- grammar.add_pass_through_rules input
- end
- return grammar
-end
-
-def main
- cfg = Trollop::options do
- opt :input, "", :type => :string, :default => '-', :short => '-i'
- opt :grammar, "", :type => :string, :required => true, :short => '-g'
- opt :weights, "", :type => :string, :required => true, :short => '-w'
- opt :add_glue, "", :type => :bool, :default => false, :short => '-l'
- opt :add_pass_through, "", :type => :bool, :default => false, :short => '-p'
- end
-
- grammar = nil
- if cfg[:grammar]
- grammar = read_grammar cfg[:grammar], cfg[:add_glue], cfg[:add_pass_through]
- end
-
- sgm_input = false
- if ['sgm', 'xml'].include? cfg[:input].split('.')[-1]
- sgm_input = true
- end
-
- STDERR.write "> reading input from '#{cfg[:input]}'\n"
- ReadFile.readlines_strip(cfg[:input]).each { |input|
-
- if sgm_input
- x = XmlSimple.xml_in(input)
- input = x['content'].split
- else
- input = input.split
- end
- n = input.size
-
- if sgm_input && x['grammar']
- grammar = read_grammar x['grammar'], cfg[:add_glue], cfg[:add_pass_through], input
- elsif cfg[:add_pass_through]
- grammar.add_pass_through_rules input
- end
-
-
- STDERR.write "> initializing charts\n"
- passive_chart = Parse::Chart.new n
- active_chart = Parse::Chart.new n
- Parse::init input, n, active_chart, passive_chart, grammar
-
- STDERR.write "> parsing\n"
- Parse::parse input, n, active_chart, passive_chart, grammar
-
- weights = SparseVector.from_kv(ReadFile.read(cfg[:weights]), ' ', "\n")
- if !weights
- weights = SparseVector.new
- end
-
- hypergraph = passive_chart.to_hg weights
-
- STDERR.write "> viterbi\n"
- semiring = ViterbiSemiring.new
- path, score = HG::viterbi_path hypergraph, hypergraph.nodes_by_id[-1], semiring
- s = HG::derive path, path.last.head, []
- STDOUT.write "#{s.map { |i| i.word }.join ' '} ||| #{Math.log score}\n"
- }
-end
-
-main
-