about | summary | refs | log | tree | commit | diff | stats
path: root/python/grobid_tool.py
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2022-05-03 17:12:48 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2022-05-03 17:12:48 -0700
commit: 00ae74378413e87f230c88113ff8163a6f969d63 (patch)
tree: 16cdcbde7a002704e80f494b7fd13fc5c19dd695 /python/grobid_tool.py
parent: ef0421567dd67a248d0f92f32ad4e14ae0776920 (diff)
download: sandcrawler-00ae74378413e87f230c88113ff8163a6f969d63.tar.gz
sandcrawler-00ae74378413e87f230c88113ff8163a6f969d63.zip
switch default kafka-broker host from wbgrp-svc263 to wbgrp-svc350
Diffstat (limited to 'python/grobid_tool.py')
-rwxr-xr-x python/grobid_tool.py 2
1 files changed, 1 insertions, 1 deletions
diff --git a/python/grobid_tool.py b/python/grobid_tool.py
index 029cbf1..3ffac98 100755
--- a/python/grobid_tool.py
+++ b/python/grobid_tool.py
@@ -5,7 +5,7 @@ might go to stdout, or might go to Kafka topic.
Example of large parallel run, locally:
- cat /srv/sandcrawler/tasks/ungrobided.2019-09-23.json | pv -l | parallel -j30 --pipe ./grobid_tool.py --kafka-env prod --kafka-hosts wbgrp-svc263.us.archive.org:9092,wbgrp-svc284.us.archive.org:9092,wbgrp-svc285.us.archive.org:9092 --kafka-mode --grobid-host http://localhost:8070 -j0 extract-json -
+ cat /srv/sandcrawler/tasks/ungrobided.2019-09-23.json | pv -l | parallel -j30 --pipe ./grobid_tool.py --kafka-env prod --kafka-hosts wbgrp-svc350.us.archive.org:9092,wbgrp-svc284.us.archive.org:9092,wbgrp-svc285.us.archive.org:9092 --kafka-mode --grobid-host http://localhost:8070 -j0 extract-json -
"""
import argparse