From 5339c8fdb1df47a2dab688bf1469e02a28eb0c89 Mon Sep 17 00:00:00 2001
From: Patrick Simianer
Date: Fri, 4 Nov 2016 17:04:12 +0100
Subject: rename, remove non nlp stuff

---
 svm-light-fmt-conv | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100755 svm-light-fmt-conv

(limited to 'svm-light-fmt-conv')

diff --git a/svm-light-fmt-conv b/svm-light-fmt-conv
new file mode 100755
index 0000000..a9ce98f
--- /dev/null
+++ b/svm-light-fmt-conv
@@ -0,0 +1,22 @@
+#!/usr/bin/env ruby
+
+require 'zipf'
+
+fd = Marshal.load ReadFile.read ARGV[0]
+d = fd.size
+
+not_quiet = ARGV[1]
+train = []
+l_i = 1
+while line = STDIN.gets
+  STDERR.write "#{l_i}\n" if l_i%1000==0&&not_quiet
+  s = []
+  line.split.each { |i|
+    k,w = i.split '=', 2
+    s << [fd[k]+1, w.to_f]
+  }
+  s.sort_by! { |i| i.first }
+  puts "+1 #{s.map{|i| "#{i.first}:#{i[1]}" }.join(' ')}"
+  l_i+= 1
+end
+
-- 
cgit v1.2.3