about | summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2018-04-15 05:44:07 +0000
committer: Bryan Newbold <bnewbold@archive.org> 2018-04-19 05:15:02 +0000
commit: a8a568f03d7f537a8683adf23f6643c7704e8d3d (patch)
tree: dcaa8defc9a604304d6f234d42b084e22485d9c2
parent: c3e925cdd00c28531ee37ac7ada5cdee229762db (diff)
download: sandcrawler-a8a568f03d7f537a8683adf23f6643c7704e8d3d.tar.gz
download: sandcrawler-a8a568f03d7f537a8683adf23f6643c7704e8d3d.zip
local mrjob config
-rw-r--r-- mapreduce/mrjob.conf 6
1 files changed, 6 insertions, 0 deletions
diff --git a/mapreduce/mrjob.conf b/mapreduce/mrjob.conf
index 6e75505..6f36196 100644
--- a/mapreduce/mrjob.conf
+++ b/mapreduce/mrjob.conf
@@ -1,4 +1,10 @@
 runners:
+  local:
+    upload_files:
+      - common.py
+      - grobid2json.py
+    setup:
+      - export PYTHONPATH=$PYTHONPATH:venv/lib/python3.5/site-packages/
   hadoop:
     no_output: true
     upload_files: