diff options
author | Patrick Simianer <p@simianer.de> | 2016-07-05 11:01:46 +0200 |
---|---|---|
committer | Patrick Simianer <p@simianer.de> | 2016-07-05 11:01:46 +0200 |
commit | 2b1d7f881c19c4d4b5afae194e02d3300c7675d0 (patch) | |
tree | 5a06ee7de98640a39244b57bb369697176b44ebf /convert-to-svm-light-format | |
parent | 69949dda35c3ea21d8e926e5f0a596a0a0f61c6a (diff) |
mv
Diffstat (limited to 'convert-to-svm-light-format')
-rwxr-xr-x | convert-to-svm-light-format | 22 |
1 files changed, 22 insertions, 0 deletions
```diff
diff --git a/convert-to-svm-light-format b/convert-to-svm-light-format
new file mode 100755
index 0000000..a9ce98f
--- /dev/null
+++ b/convert-to-svm-light-format
@@ -0,0 +1,22 @@
+#!/usr/bin/env ruby
+
+require 'zipf'
+
+fd = Marshal.load ReadFile.read ARGV[0]
+d = fd.size
+
+not_quiet = ARGV[1]
+train = []
+l_i = 1
+while line = STDIN.gets
+  STDERR.write "#{l_i}\n" if l_i%1000==0&&not_quiet
+  s = []
+  line.split.each { |i|
+    k,w = i.split '=', 2
+    s << [fd[k]+1, w.to_f]
+  }
+  s.sort_by! { |i| i.first }
+  puts "+1 #{s.map{|i| "#{i.first}:#{i[1]}" }.join(' ')}"
+  l_i+= 1
+end
+
```