diff options
Diffstat (limited to 'dtrain/hstreaming/red-avg.rb')
-rwxr-xr-x | dtrain/hstreaming/red-avg.rb | 9 |
1 file changed, 5 insertions, 4 deletions
diff --git a/dtrain/hstreaming/red-avg.rb b/dtrain/hstreaming/red-avg.rb
index 048128f5..771f4c0e 100755
--- a/dtrain/hstreaming/red-avg.rb
+++ b/dtrain/hstreaming/red-avg.rb
@@ -1,10 +1,11 @@
 #!/usr/bin/env ruby1.9.1
 
-STDIN.set_encoding 'utf-8'
-
 
 shard_count_key = "__SHARD_COUNT__"
 
+STDIN.set_encoding 'utf-8'
+STDOUT.set_encoding 'utf-8'
+
 w = {}
 c = {}
 w.default = 0
@@ -12,11 +13,11 @@ c.default = 0
 while line = STDIN.gets
   key, val = line.split /\t/
   w[key] += val.to_f
-  c[key] += 1.0
+  c[key] += 1
 end
 
+puts "# dtrain reducer: average"
 shard_count = w["__SHARD_COUNT__"]
-
 w.each_key { |k|
   if k == shard_count_key then next end
   puts "#{k}\t#{w[k]/shard_count}"