summaryrefslogtreecommitdiff
path: root/feature-dict
blob: 6849769c76a1d5600f6dd228a9a7fa9df4bddfbe (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
#!/usr/bin/env ruby

# Builds a feature dictionary from the text on standard input and stores it,
# Marshal-serialized, in a file.
#
# Usage: feature-dict OUTPUT_FILE [SHOW_PROGRESS] < input
#
# Every line of input is split on whitespace into tokens. For each token, the
# text before the first '=' is taken as the feature name (a token without '='
# is used whole); whatever follows the '=' is ignored. Each distinct feature
# name is mapped to an integer id, assigned in order of first appearance
# starting at 0.
#
# OUTPUT_FILE   - path that receives Marshal.dump of the resulting Hash.
# SHOW_PROGRESS - optional; when any second argument is present, the current
#                 line number is written to STDERR every 1000 lines.
#
# The final number of distinct features is always reported on STDERR.

output_path = ARGV[0]
# Fail fast with a readable message instead of consuming all of STDIN and then
# crashing while trying to open a nil path.
abort "usage: #{File.basename($PROGRAM_NAME)} OUTPUT_FILE [SHOW_PROGRESS] < input" if output_path.nil?

# ARGV entries are Strings, so the mere presence of a second argument enables
# progress output, whatever its value.
show_progress = !ARGV[1].nil?

feature_dict = {}
STDIN.each_line.with_index(1) do |line, line_no|
  STDERR.write "#{line_no}\n" if show_progress && (line_no % 1000).zero?
  line.split.each do |token|
    feature = token.split('=', 2).first
    # The next free id is the current size of the dictionary, so ids stay
    # dense and follow first-appearance order.
    feature_dict[feature] = feature_dict.size unless feature_dict.key?(feature)
  end
end

# Marshal produces binary data: binary mode keeps the bytes untouched on
# platforms that translate newlines in text mode, and the block form closes
# the file even if serialization or the write raises.
File.open(output_path, 'wb') { |out| out.write Marshal.dump(feature_dict) }

STDERR.write "size = #{feature_dict.size}\n"