Skip to content

Commit

Permalink
removed local file path prefixes
Browse files Browse the repository at this point in the history
Since we're storing results in HDFS, I had to remove the local path
prefix ($NLTK_HOME/) from the input/output locations.
  • Loading branch information
zbsimon committed Apr 20, 2015
1 parent 7c978de commit 8b56fa3
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions map_reduce_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -61,8 +61,8 @@ def run_map_job(mapper, input_dir, output_dir,
-libjars {1} \
-D mapreduce.job.reduces=0 \
-D stream.map.output.field.separator={2} \
- -input $NLTK_HOME/{3} \
- -output $NLTK_HOME/{4} \
+ -input {3} \
+ -output {4} \
-mapper "$NLTK_HOME/{5}" \
-inputformat {6} \
-outputformat {7}
Expand Down Expand Up @@ -96,8 +96,8 @@ def run_map_reduce_job(mapper, reducer, input_dir, output_dir,
-D stream.map.output.field.separator={2} \
-mapper "$NLTK_HOME/{3}" \
-reducer "$NLTK_HOME/{4}" \
- -input $NLTK_HOME/{5} \
- -output $NLTK_HOME/{6} \
+ -input {5} \
+ -output {6} \
-inputformat {7} \
-outputformat {8}
'''.format(files, "$AVRO_JAR,$HADOOP_JAR", kv_separator, mapper, reducer,
Expand Down

0 comments on commit 8b56fa3

Please sign in to comment.