diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2020-03-02 16:41:02 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2020-03-02 16:41:02 -0800 |
commit | f4cce5a765a9f80f9c5e9c907689c06dc9ebf102 (patch) | |
tree | ae2b668c680c4163845e9b06b271f823aa963239 | |
parent | 3ff5c1f371fb6764df415e816884e1be0577088c (diff) | |
download | fatcat-f4cce5a765a9f80f9c5e9c907689c06dc9ebf102.tar.gz fatcat-f4cce5a765a9f80f9c5e9c907689c06dc9ebf102.zip |
add --force-recrawl flag to ingest tool
-rwxr-xr-x | python/fatcat_ingest.py | 5 |
1 files changed, 5 insertions, 0 deletions
```diff
diff --git a/python/fatcat_ingest.py b/python/fatcat_ingest.py
index 6fda74c5..9ba95015 100755
--- a/python/fatcat_ingest.py
+++ b/python/fatcat_ingest.py
@@ -90,6 +90,8 @@ def _run_search_dump(args, search):
         )
         if not ingest_request:
             continue
+        if args.force_recrawl:
+            ingest_request['force_recrawl'] = True
         counts['ingest_request'] += 1
         if args.dry_run:
             continue
@@ -206,6 +208,9 @@ def main():
     parser.add_argument('--allow-non-oa',
         action='store_true',
         help="By default, we limit to OA releases. This removes that filter")
+    parser.add_argument('--force-recrawl',
+        action='store_true',
+        help="Tell ingest worker to skip GWB history lookup and do SPNv2 crawl")
     subparsers = parser.add_subparsers()
 
     sub_container = subparsers.add_parser('container',
```