blob: 2c3928f3274144b01134e58c6a29b37abe6501d9 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
|
#!/usr/bin/env ruby
require 'bloom-filter'
require 'trollop'
# Reads phrase-table style lines from STDIN, inserts the first two
# '|||'-separated fields of each line into a Bloom filter as the key
# "src ||| tgt", then dumps the filter to 'pt.bloom'.
STDIN.set_encoding 'utf-8'
STDOUT.set_encoding 'utf-8'

# Command-line options: --size is mandatory, --error-rate defaults to 0.01.
cfg = Trollop::options do
  opt :size, "number of entries in the filter", :type => :int, :required => true
  opt :error_rate, "error rate", :type => :float, :default => 0.01
end

f = BloomFilter.new cfg[:size], cfg[:error_rate]

STDIN.each_line.with_index(1) do |line, lineno|
  # Split on the '|||' field delimiter with String#split so the script does
  # not depend on a helper that is not defined by anything required here.
  fields = line.strip.split('|||')

  # A line without both a source and a target field cannot form a key;
  # skip it (with a note on STDERR) instead of crashing on nil.
  if fields.size < 2
    STDERR.puts "skipping line #{lineno}: expected at least two '|||'-separated fields"
    next
  end

  src = fields[0].strip
  tgt = fields[1].strip
  f.insert("#{src} ||| #{tgt}")
end

# Persist the populated filter to the fixed output path.
f.dump('pt.bloom')
f.close
|