diff options
author | Chris Dyer <redpony@gmail.com> | 2013-03-18 05:14:48 -0700 |
---|---|---|
committer | Chris Dyer <redpony@gmail.com> | 2013-03-18 05:14:48 -0700 |
commit | 3aeab176d9068b13e3ca3394be4f9089f5952517 (patch) | |
tree | f0d458ee427a3dd3632c99ea7febe463dc571e07 /training/dtrain/hstreaming/hadoop-streaming-job.sh | |
parent | 4f452c5bf5cd0ed3cb50d31012f93a50366b3aac (diff) | |
parent | a416615b81380d664246f11a8047098c59185838 (diff) |
Merge pull request #17 from pks/master
dtrain
Diffstat (limited to 'training/dtrain/hstreaming/hadoop-streaming-job.sh')
-rwxr-xr-x | training/dtrain/hstreaming/hadoop-streaming-job.sh | 30 |
1 files changed, 0 insertions, 30 deletions
diff --git a/training/dtrain/hstreaming/hadoop-streaming-job.sh b/training/dtrain/hstreaming/hadoop-streaming-job.sh
deleted file mode 100755
index 92419956..00000000
--- a/training/dtrain/hstreaming/hadoop-streaming-job.sh
+++ /dev/null
@@ -1,30 +0,0 @@
-#!/bin/sh
-
-EXP=a_simple_test
-
-# change these vars to fit your hadoop installation
-HADOOP_HOME=/usr/lib/hadoop-0.20
-JAR=contrib/streaming/hadoop-streaming-0.20.2-cdh3u1.jar
-HSTREAMING="$HADOOP_HOME/bin/hadoop jar $HADOOP_HOME/$JAR"
-
- IN=input_on_hdfs
-OUT=output_weights_on_hdfs
-
-# you can -reducer to NONE if you want to
-# do feature selection/averaging locally (e.g. to
-# keep weights of all epochs)
-$HSTREAMING \
-    -mapper "dtrain.sh" \
-    -reducer "ruby lplp.rb l2 select_k 100000" \
-    -input $IN \
-    -output $OUT \
-    -file dtrain.sh \
-    -file lplp.rb \
-    -file ../dtrain \
-    -file dtrain.ini \
-    -file cdec.ini \
-    -file ../test/example/nc-wmt11.en.srilm.gz \
-    -jobconf mapred.reduce.tasks=30 \
-    -jobconf mapred.max.map.failures.percent=0 \
-    -jobconf mapred.job.name="dtrain $EXP"
-