summary | refs | log | tree | commit | diff
path: root/convert-to-svm-light-format
diff options
context:
space:
mode:
author Patrick Simianer <p@simianer.de> 2016-07-05 11:01:46 +0200
committer Patrick Simianer <p@simianer.de> 2016-07-05 11:01:46 +0200
commit 2b1d7f881c19c4d4b5afae194e02d3300c7675d0 (patch)
tree 5a06ee7de98640a39244b57bb369697176b44ebf /convert-to-svm-light-format
parent 69949dda35c3ea21d8e926e5f0a596a0a0f61c6a (diff)
mv
Diffstat (limited to 'convert-to-svm-light-format')
-rwxr-xr-x convert-to-svm-light-format 22
1 files changed, 22 insertions, 0 deletions
diff --git a/convert-to-svm-light-format b/convert-to-svm-light-format
new file mode 100755
index 0000000..a9ce98f
--- /dev/null
+++ b/convert-to-svm-light-format
@@ -0,0 +1,22 @@
+#!/usr/bin/env ruby
+
+require 'zipf'
+
+fd = Marshal.load ReadFile.read ARGV[0]
+d = fd.size
+
+not_quiet = ARGV[1]
+train = []
+l_i = 1
+while line = STDIN.gets
+ STDERR.write "#{l_i}\n" if l_i%1000==0&&not_quiet
+ s = []
+ line.split.each { |i|
+ k,w = i.split '=', 2
+ s << [fd[k]+1, w.to_f]
+ }
+ s.sort_by! { |i| i.first }
+ puts "+1 #{s.map{|i| "#{i.first}:#{i[1]}" }.join(' ')}"
+ l_i+= 1
+end
+