about summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-02-13 23:11:14 -0800
committer Bryan Newbold <bnewbold@archive.org> 2020-02-13 23:11:14 -0800
commit f613f69a40fcc9a445f21cadd35d7c36c8061db8 (patch)
tree 30bbbc7a3463625adf9b567cb91623c917ea5562
parent 2db64d580e3b5995e328c719e2bd014124179d0b (diff)
download sandcrawler-f613f69a40fcc9a445f21cadd35d7c36c8061db8.tar.gz
sandcrawler-f613f69a40fcc9a445f21cadd35d7c36c8061db8.zip
ingest: bulk workers don't hit SPNv2
-rwxr-xr-x python/sandcrawler_worker.py 2
1 files changed, 2 insertions, 0 deletions
diff --git a/python/sandcrawler_worker.py b/python/sandcrawler_worker.py
index 02d075c..0ba4d03 100755
--- a/python/sandcrawler_worker.py
+++ b/python/sandcrawler_worker.py
@@ -108,6 +108,8 @@ def run_ingest_file(args):
grobid_client=grobid_client,
sink=sink,
grobid_sink=grobid_sink,
+ # don't SPNv2 for --bulk backfill
+ try_spn2=not args.bulk,
)
pusher = KafkaJsonPusher(
worker=worker,