summary refs log tree commit diff stats
path: root/python
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@robocracy.org> 2021-09-30 15:31:03 -0700
committer Bryan Newbold <bnewbold@robocracy.org> 2021-09-30 15:31:38 -0700
commit 519c7e77cf3a54b9620adef07fedac9b37a5f9f2 (patch)
tree c5b120c48ed5aaff087984078341cffbae1b30b8 /python
parent b5bf0697b3d3b074fd9a6a8836ac114fbd8c1df1 (diff)
download fatcat-519c7e77cf3a54b9620adef07fedac9b37a5f9f2.tar.gz
fatcat-519c7e77cf3a54b9620adef07fedac9b37a5f9f2.zip
default ingest request topic now '-daily'; configurable for ingest_tool.py
Diffstat (limited to 'python')
-rw-r--r-- python/example.env 2
-rwxr-xr-x python/fatcat_ingest.py 7
-rw-r--r-- python/fatcat_web/web_config.py 2
-rwxr-xr-x python/fatcat_worker.py 2
4 files changed, 9 insertions, 4 deletions
diff --git a/python/example.env b/python/example.env
index 3a83d5b3..79cbe3ad 100644
--- a/python/example.env
+++ b/python/example.env
@@ -9,7 +9,7 @@ ELASTICSEARCH_CONTAINER_INDEX="fatcat_container"
# for local dev use:
#KAFKA_PIXY_ENDPOINT="http://localhost:19092"
KAFKA_PIXY_ENDPOINT=""
-KAFKA_SAVEPAPERNOW_TOPIC="sandcrawler-dev.ingest-file-requests"
+KAFKA_SAVEPAPERNOW_TOPIC="sandcrawler-dev.ingest-file-requests-priority"
GITLAB_CLIENT_ID=""
GITLAB_CLIENT_SECRET=""
IA_XAUTH_CLIENT_ID=""
diff --git a/python/fatcat_ingest.py b/python/fatcat_ingest.py
index 1a53a7dc..b62cb8a4 100755
--- a/python/fatcat_ingest.py
+++ b/python/fatcat_ingest.py
@@ -37,7 +37,10 @@ def _run_search_dump(args, search):
print("=== THIS IS A DRY RUN ===")
kafka_producer = None
- ingest_file_request_topic = "sandcrawler-{}.ingest-file-requests".format(args.env)
+ if args.kafka_request_topic:
+ ingest_file_request_topic = args.kafka_request_topic
+ else:
+ ingest_file_request_topic = "sandcrawler-{}.ingest-file-requests-daily".format(args.env)
if args.enqueue_kafka:
print("Will send ingest requests to kafka topic: {}".format(ingest_file_request_topic), file=sys.stderr)
kafka_producer = simple_kafka_producer(args.kafka_hosts)
@@ -185,6 +188,8 @@ def main():
parser.add_argument('--kafka-hosts',
default="localhost:9092",
help="list of Kafka brokers (host/port) to use")
+ parser.add_argument('--kafka-request-topic',
+ help="exact Kafka ingest request topic to use")
parser.add_argument('--elasticsearch-endpoint',
default="https://search.fatcat.wiki",
help="elasticsearch API. internal endpoint preferred, but public is default")
diff --git a/python/fatcat_web/web_config.py b/python/fatcat_web/web_config.py
index 98b89aea..f48a7b60 100644
--- a/python/fatcat_web/web_config.py
+++ b/python/fatcat_web/web_config.py
@@ -34,7 +34,7 @@ class Config(object):
# for save-paper-now. set to None if not configured, so we don't display forms/links
KAFKA_PIXY_ENDPOINT = os.environ.get("KAFKA_PIXY_ENDPOINT", default=None) or None
- KAFKA_SAVEPAPERNOW_TOPIC = os.environ.get("KAFKA_SAVEPAPERNOW_TOPIC", default="sandcrawler-dev.ingest-file-requests")
+ KAFKA_SAVEPAPERNOW_TOPIC = os.environ.get("KAFKA_SAVEPAPERNOW_TOPIC", default="sandcrawler-dev.ingest-file-requests-priority")
# for flask things, like session cookies
FLASK_SECRET_KEY = os.environ.get("FLASK_SECRET_KEY", default=None)
diff --git a/python/fatcat_worker.py b/python/fatcat_worker.py
index 95f5024a..c3efb5f4 100755
--- a/python/fatcat_worker.py
+++ b/python/fatcat_worker.py
@@ -23,7 +23,7 @@ def run_entity_updates(args):
file_topic = "fatcat-{}.file-updates".format(args.env)
container_topic = "fatcat-{}.container-updates".format(args.env)
work_ident_topic = "fatcat-{}.work-ident-updates".format(args.env)
- ingest_file_request_topic = "sandcrawler-{}.ingest-file-requests".format(args.env)
+ ingest_file_request_topic = "sandcrawler-{}.ingest-file-requests-daily".format(args.env)
worker = EntityUpdatesWorker(args.api, args.kafka_hosts,
changelog_topic,
release_topic=release_topic,