From 26c490f404731d053a6205719b6246502c07b449 Mon Sep 17 00:00:00 2001
From: Patrick Simianer
Date: Sat, 14 Jun 2014 16:46:27 +0200
Subject: init

---
Reviewer note (free-text area; not part of the commit or the diff):
  The script added below runs a single Hadoop streaming job via `hadoop jar`
  using the CDH 4.1.2 streaming jar at a hard-coded path.
    * mapper:  word_pair_keys.rb
    * reducer: /bin/cat (emits the reducer input unchanged)
    * input:   overlap/newstest2008-grammar+index
    * output:  overlap/newstest2008-grammar_word-pair-keys
    * -D mapred.reduce.tasks=24, -D mapred.task.timeout=1200000000
    * word_pair_keys.rb and util.rb are passed with -file, so both must be
      present in the directory the script is started from.
  All paths and settings are hard-coded; the script takes no arguments.

 overlapping_rules/word_pair_keys_mapred.sh | 12 ++++++++++++
 1 file changed, 12 insertions(+)
 create mode 100755 overlapping_rules/word_pair_keys_mapred.sh

(limited to 'overlapping_rules/word_pair_keys_mapred.sh')

diff --git a/overlapping_rules/word_pair_keys_mapred.sh b/overlapping_rules/word_pair_keys_mapred.sh
new file mode 100755
index 0000000..3c6a3c3
--- /dev/null
+++ b/overlapping_rules/word_pair_keys_mapred.sh
@@ -0,0 +1,12 @@
+#!/bin/sh
+
+hadoop jar /usr/lib/hadoop-0.20-mapreduce/contrib/streaming/hadoop-streaming-2.0.0-mr1-cdh4.1.2.jar \
+  -D mapred.reduce.tasks=24 \
+  -D mapred.task.timeout=1200000000 \
+  -input overlap/newstest2008-grammar+index \
+  -output overlap/newstest2008-grammar_word-pair-keys \
+  -mapper word_pair_keys.rb \
+  -reducer "/bin/cat" \
+  -file word_pair_keys.rb \
+  -file util.rb
+
-- 
cgit v1.2.3