From 60f93614186ebd6150602cae140b7a96dc4bca8a Mon Sep 17 00:00:00 2001 From: Patrick Simianer
#!/usr/bin/env ruby
#
# util/wrapper.rb -- nanomsg front end for an external text-processing script.
# (Script body of the patch "better wrapper script", dated 2015-06-24, which
# creates util/wrapper.rb with mode 100755.)
#
# The wrapper binds a NanoMsg pair socket on --addr and announces itself with
# "hello". It then starts one of the scripts found under --ext
# (detokenizer.perl, tokenizer-no-escape.perl or truecase.perl) and relays
# text through it: every message received on the socket is written to the
# script's stdin as a single line, and the line the script prints in response
# is sent back over the socket. The message "shutdown" ends the loop; the
# wrapper then closes the pipes to the script and sends "off".

require 'nanomsg'
require 'open3'
require 'trollop'

conf = Trollop::options do
  opt :action, "tokenize, detokenize or truecase", :short => "-a", :type => :string, :required => true
  opt :addr, "socket address", :short => "-S", :type => :string, :required => true
  opt :ext, "path to externals", :short => "-e", :type => :string, :required => true
  opt :lang, "language", :short => "-l", :type => :string
  opt :truecase_model, "model file for truecaser", :short => "-t", :type => :string
end

sock = NanoMsg::PairSocket.new
sock.bind conf[:addr]
sock.send "hello"

# Build the child command as an argv array (program first, then one element
# per argument). Passing an array instead of one interpolated string keeps the
# shell out of the picture, so paths or option values containing spaces or
# shell metacharacters reach the script unchanged.
# Missing or unknown options abort with a message on stderr and a non-zero
# exit status.
cmd = case conf[:action]
      when "detokenize"
        abort "[detokenizer] No language given, exiting!" unless conf[:lang]
        ["#{conf[:ext]}/detokenizer.perl", "-q", "-b", "-u", "-l", conf[:lang]]
      when "tokenize"
        abort "[tokenizer] No language given, exiting!" unless conf[:lang]
        ["#{conf[:ext]}/tokenizer-no-escape.perl", "-q", "-b", "-a", "-l", conf[:lang]]
      when "truecase"
        abort "[truecaser] No model given for truecaser, exiting!" unless conf[:truecase_model]
        ["#{conf[:ext]}/truecase.perl", "-b", "--model", conf[:truecase_model]]
      else
        abort "[wrapper] Unknown action #{conf[:action]}, exiting!"
      end

# The child's stderr is never consumed by this script, so it is sent to the
# null device instead of a pipe: an unread pipe would eventually fill up and
# block the child.
child_in, child_out, _waiter = Open3.popen2(*cmd, :err => File::NULL)

loop do
  msg = sock.recv
  break if msg.nil?

  # Compare the bare message, before the line terminator is appended;
  # otherwise "shutdown" could never match.
  line = msg.strip
  break if line == "shutdown"

  begin
    child_in.write "#{line}\n"
    reply = child_out.gets
  rescue Errno::EPIPE
    # The child is gone and can no longer be written to.
    reply = nil
  end

  if reply.nil?
    # EOF on the child's stdout: there is nothing left to relay.
    STDERR.write "[wrapper] #{cmd.first} closed its pipe, exiting!\n"
    break
  end

  sock.send reply.strip
end

child_in.close
child_out.close
sock.send "off"