aboutsummaryrefslogtreecommitdiffstats
path: root/python
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-06-25 14:31:28 -0700
committer Bryan Newbold <bnewbold@archive.org> 2020-06-25 14:31:28 -0700
commit f651f171499d011a83a247eefb23c4e8a789b1c8 (patch)
tree 4d36b07839a9532afc1a823d97fd02f274cf47bf /python
parent be5a45fdf0622e6b65663d08f577aa41e0e89be0 (diff)
download sandcrawler-f651f171499d011a83a247eefb23c4e8a789b1c8.tar.gz
sandcrawler-f651f171499d011a83a247eefb23c4e8a789b1c8.zip
args.kafka_env refactor didn't happen (yet)
Diffstat (limited to 'python')
-rwxr-xr-x python/sandcrawler_worker.py 4
1 files changed, 2 insertions, 2 deletions
diff --git a/python/sandcrawler_worker.py b/python/sandcrawler_worker.py
index 638dc35..0fd0194 100755
--- a/python/sandcrawler_worker.py
+++ b/python/sandcrawler_worker.py
@@ -51,8 +51,8 @@ def run_grobid_extract(args):
def run_pdf_extract(args):
consume_topic = "sandcrawler-{}.unextracted".format(args.env)
- text_topic = "sandcrawler-{}.pdf-text".format(args.kafka_env)
- thumbnail_topic = "sandcrawler-{}.pdf-thumbnail-180px-jpg".format(args.kafka_env)
+ text_topic = "sandcrawler-{}.pdf-text".format(args.env)
+ thumbnail_topic = "sandcrawler-{}.pdf-thumbnail-180px-jpg".format(args.env)
text_sink = KafkaCompressSink(
kafka_hosts=args.kafka_hosts,
produce_topic=text_topic,