about summary refs log tree commit diff stats
path: root/mapreduce/mrjob.conf
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2018-04-07 00:55:02 +0000
committer Bryan Newbold <bnewbold@archive.org> 2018-04-07 00:55:02 +0000
commit 683844f6bb26d867ea6bd2fd89d7669ace45075a (patch)
tree f013ac467116f5982409bf2a05eb4bf354dafecf /mapreduce/mrjob.conf
parent 1b7f579a881777a8e6fe517e9ee860ff875fe51f (diff)
download sandcrawler-683844f6bb26d867ea6bd2fd89d7669ace45075a.tar.gz
sandcrawler-683844f6bb26d867ea6bd2fd89d7669ace45075a.zip
configs and README updates
Diffstat (limited to 'mapreduce/mrjob.conf')
-rw-r--r-- mapreduce/mrjob.conf 4
1 files changed, 4 insertions, 0 deletions
diff --git a/mapreduce/mrjob.conf b/mapreduce/mrjob.conf
index cb286f1..66724cb 100644
--- a/mapreduce/mrjob.conf
+++ b/mapreduce/mrjob.conf
@@ -1,4 +1,8 @@
 runners:
   hadoop:
+    no_output: true
+    upload_files:
+      - common.py
+      - grobid2json.py
     setup:
       - export PYTHONPATH=$PYTHONPATH:venv/lib/python3.5/site-packages/