diff options
Diffstat (limited to 'python/fatcat_import.py')
-rwxr-xr-x | python/fatcat_import.py | 25 |
1 files changed, 25 insertions, 0 deletions
diff --git a/python/fatcat_import.py b/python/fatcat_import.py index e80c5d5b..91fa2279 100755 --- a/python/fatcat_import.py +++ b/python/fatcat_import.py @@ -31,6 +31,16 @@ def run_arxiv(args): else: Bs4XmlFilePusher(ari, args.xml_file, "record").run() +def run_pubmed(args): + pi = PubmedImporter(args.api, + args.issn_map_file, + edit_batch_size=args.batch_size) + if args.kafka_mode: + raise NotImplementedError + #KafkaBs4XmlPusher(pi, args.kafka_hosts, args.kafka_env, "api-pubmed", "fatcat-import").run() + else: + Bs4XmlFilePusher(pi, args.xml_file, "PubmedArticle").run() + def run_orcid(args): foi = OrcidImporter(args.api, edit_batch_size=args.batch_size) @@ -185,6 +195,21 @@ def main(): action='store_true', help="consume from kafka topic (not stdin)") + sub_pubmed = subparsers.add_parser('pubmed') + sub_pubmed.set_defaults( + func=run_pubmed, + auth_var="FATCAT_AUTH_WORKER_PUBMED", + ) + sub_pubmed.add_argument('xml_file', + help="Pubmed XML file to import from", + default=sys.stdin, type=argparse.FileType('r')) + sub_pubmed.add_argument('issn_map_file', + help="ISSN to ISSN-L mapping file", + default=None, type=argparse.FileType('r')) + sub_pubmed.add_argument('--kafka-mode', + action='store_true', + help="consume from kafka topic (not stdin)") + sub_orcid = subparsers.add_parser('orcid') sub_orcid.set_defaults( func=run_orcid, |