summaryrefslogtreecommitdiff
path: root/dtrain/hstreaming/rule_count/rulecount.rb
diff options
context:
space:
mode:
Diffstat (limited to 'dtrain/hstreaming/rule_count/rulecount.rb')
-rw-r--r--dtrain/hstreaming/rule_count/rulecount.rb11
1 files changed, 11 insertions, 0 deletions
diff --git a/dtrain/hstreaming/rule_count/rulecount.rb b/dtrain/hstreaming/rule_count/rulecount.rb
new file mode 100644
index 00000000..035bdf06
--- /dev/null
+++ b/dtrain/hstreaming/rule_count/rulecount.rb
@@ -0,0 +1,11 @@
+# For each rule in the 4th and later tab fields of a STDIN line, print "<id>\t1" (id = first three "|||" parts, spaces as "_").
+STDIN.set_encoding 'utf-8'
+STDOUT.set_encoding 'utf-8'
+STDIN.each_line do |line|
+  # drop(3) yields [] (not nil) when a line has fewer than three fields, so short or blank lines are skipped instead of raising.
+  line.strip.split("\t").drop(3).each do |rule|
+    id = rule.split('|||').first(3).join('|||').strip.tr(' ', '_')
+    puts "#{id}\t1"
+  end
+end
+