# path: root/dtrain/hstreaming/rule_count/rulecount.rb
# blob: 035bdf0631dd7c976ec466ead9cc797ecd7b969c
# Reads tab-separated records from STDIN and, for every rule found from the
# fourth field onwards, writes one "<rule id>\t1" line to STDOUT.
# NOTE(review): the "<key>\t1" output shape suggests this feeds a downstream
# summing/counting step -- confirm against the surrounding pipeline.

STDIN.set_encoding 'utf-8'
STDOUT.set_encoding 'utf-8'

# Extracts the rule ids contained in one input line.
#
# The line is stripped and split on tabs; the first three fields are skipped
# and every remaining field is treated as a rule. A rule's id is its first
# three "|||"-separated parts, re-joined with "|||", stripped, with every
# space replaced by an underscore.
#
# @param line [String] one raw input record (trailing newline allowed)
# @return [Array<String>] one id per rule field; empty when the line has
#   three or fewer fields
def rule_ids(line)
  fields = line.strip.split("\t")
  # Array#drop yields [] for short lines, whereas slicing with a range that
  # starts past the end yields nil and would crash on blank/truncated input.
  fields.drop(3).map do |rule|
    rule.split('|||').first(3).join('|||').strip.tr(' ', '_')
  end
end

while (line = STDIN.gets)
  rule_ids(line).each { |id| puts "#{id}\t1" }
end