diff options
-rwxr-xr-x | please | 8 |
1 files changed, 4 insertions, 4 deletions
@@ -22,7 +22,7 @@ GROBID_URI = "http://wbgrp-svc096.us.archive.org:8070"
 
 def rebuild_python():
     print("Rebuilding python venv...")
-    cmd = """cd python;
+    cmd = """cd python_hadoop;
         export PIPENV_VENV_IN_PROJECT=1;
         pipenv install --deploy
         tar -czf venv-current.tar.gz -C .venv ."""
@@ -41,7 +41,7 @@ def run_backfill(args):
         HDFS_DIR,
         args.env,
         datetime.strftime(datetime.now(), "%Y-%m-%d-%H%M.%S"))
-    cmd = """cd python;
+    cmd = """cd python_hadoop;
         pipenv run ./backfill_hbase_from_cdx.py \
             --hbase-host {hbase_host} \
             --hbase-table wbgrp-journal-extract-0-{env} \
@@ -61,7 +61,7 @@ def run_extract(args):
         HDFS_DIR,
         args.env,
         datetime.strftime(datetime.now(), "%Y-%m-%d-%H%M.%S"))
-    cmd = """cd python;
+    cmd = """cd python_hadoop;
         pipenv run ./extraction_cdx_grobid.py \
             --hbase-host {hbase_host} \
             --hbase-table wbgrp-journal-extract-0-{env} \
@@ -89,7 +89,7 @@ def run_extract_ungrobided(args):
         HDFS_DIR,
         args.env,
         datetime.strftime(datetime.now(), "%Y-%m-%d-%H%M.%S"))
-    cmd = """cd python;
+    cmd = """cd python_hadoop;
         pipenv run ./extraction_ungrobided.py \
             --hbase-host {hbase_host} \
             --hbase-table wbgrp-journal-extract-0-{env} \