blob: 2c3928f3274144b01134e58c6a29b37abe6501d9 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
  | 
#!/usr/bin/env ruby
require 'bloom-filter'
require 'trollop'
# Builds a Bloom filter from phrase pairs read on STDIN.
#
# Each input line is expected to hold at least two fields separated by "|||".
# The first two fields are stripped of surrounding whitespace and inserted
# into the filter as the single key "<src> ||| <tgt>". Once STDIN is
# exhausted, the filter is dumped via dump('pt.bloom').
#
# Options (parsed by Trollop):
#   --size        number of entries in the filter (required, int)
#   --error-rate  error rate (float, default 0.01)
STDIN.set_encoding 'utf-8'
STDOUT.set_encoding 'utf-8'

cfg = Trollop::options do
  opt :size, "number of entries in the filter", :type => :int, :required => true
  opt :error_rate, "error rate", :type => :float, :default => 0.01
end

f = BloomFilter.new cfg[:size], cfg[:error_rate]

STDIN.each_line.with_index(1) do |line, lineno|
  # Split on the "|||" field delimiter with the standard library; the
  # `splitpipe` helper used previously is not defined or required anywhere
  # in this script. Only the first two fields are used.
  src, tgt = line.split('|||')

  # A line without a delimiter yields no target field. Skip it with a
  # diagnostic instead of failing on nil with an opaque NoMethodError.
  if src.nil? || tgt.nil?
    warn "skipping line #{lineno}: expected at least two '|||'-separated fields"
    next
  end

  f.insert("#{src.strip} ||| #{tgt.strip}")
end

f.dump('pt.bloom')
f.close
  |