summaryrefslogtreecommitdiff
path: root/dtrain/hstreaming/rule_count/rulecount.rb
diff options
context:
space:
mode:
Diffstat (limited to 'dtrain/hstreaming/rule_count/rulecount.rb')
-rw-r--r--dtrain/hstreaming/rule_count/rulecount.rb13
1 files changed, 13 insertions, 0 deletions
diff --git a/dtrain/hstreaming/rule_count/rulecount.rb b/dtrain/hstreaming/rule_count/rulecount.rb
new file mode 100644
index 00000000..67361fa4
--- /dev/null
+++ b/dtrain/hstreaming/rule_count/rulecount.rb
@@ -0,0 +1,13 @@
#!/usr/bin/env ruby
#
# Reads tab-separated lines from STDIN and, for every field from the fourth
# one onward, prints "<id>\t1" to STDOUT, where <id> is derived from the
# first three "|||"-separated parts of that field (see rule_id).
# NOTE(review): the "key<TAB>1" output looks like mapper output meant to be
# summed per key by a downstream reducer -- confirm against the pipeline.

STDIN.set_encoding 'utf-8'
STDOUT.set_encoding 'utf-8'

# Builds the identifier for one rule field: keeps the first three
# "|||"-separated parts, strips surrounding whitespace and replaces every
# remaining space with an underscore so the id contains no spaces.
def rule_id(rule)
  rule.split('|||').first(3).join('|||').strip.tr(' ', '_')
end

# Returns the identifiers for all rule fields of one input line, i.e. the
# tab-separated fields at index 3 and beyond (after stripping the line).
# Lines with three or fewer fields yield an empty array.
def rule_ids(line)
  fields = line.strip.split("\t")
  # Array#drop always returns an array; slicing with a range that starts
  # beyond the end (fields[3..] on a shorter array) would return nil and
  # make the subsequent iteration raise NoMethodError.
  fields.drop(3).map { |rule| rule_id(rule) }
end

STDIN.each_line do |line|
  rule_ids(line).each { |id| puts "#{id}\t1" }
end
+