summaryrefslogtreecommitdiff
path: root/dtrain/hstreaming/rule_count/red.rb
diff options
context:
space:
mode:
authorPatrick Simianer <p@simianer.de>2011-12-03 21:38:59 +0100
committerPatrick Simianer <p@simianer.de>2011-12-03 21:38:59 +0100
commit578ed26bf818c1f18d5a319cde9b13ef9ff59f46 (patch)
treeb315bbaa2d44e8f54b1d70b1b1bb21704d89a266 /dtrain/hstreaming/rule_count/red.rb
parent4d1679b517ff46a1d6a152796f1033a4c380492c (diff)
new rule count
Diffstat (limited to 'dtrain/hstreaming/rule_count/red.rb')
-rw-r--r--dtrain/hstreaming/rule_count/red.rb22
1 files changed, 22 insertions, 0 deletions
diff --git a/dtrain/hstreaming/rule_count/red.rb b/dtrain/hstreaming/rule_count/red.rb
new file mode 100644
index 00000000..8f9109cc
--- /dev/null
+++ b/dtrain/hstreaming/rule_count/red.rb
@@ -0,0 +1,22 @@
+STDIN.set_encoding 'utf-8'
+STDOUT.set_encoding 'utf-8'
+
+def output(key, val)
+ puts "#{key}\t#{val}"
+end
+
+prev_key = nil
+sum = 0
+while line = STDIN.gets
+ key, val = line.strip.split /\t/
+ if key != prev_key && sum > 0
+ output prev_key, sum
+ prev_key = key
+ sum = 0
+ elsif !prev_key
+ prev_key = key
+ end
+ sum += val.to_i
+end
+output prev_key, sum
+