From fa11747574f086e99459914f93d24bad7a8eacce Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Thu, 17 Jun 2021 16:26:50 -0700 Subject: more consistent and defensive lower-casing of DOIs This follows more upper/lower-case ambiguity noticed in production. In particular, some old ingest requests in the sandcrawler DB, which get re-submitted/re-tried, have capitalized DOIs in the link source id field. --- python/fatcat_tools/importers/ingest.py | 4 ++++ 1 file changed, 4 insertions(+) (limited to 'python/fatcat_tools/importers/ingest.py') diff --git a/python/fatcat_tools/importers/ingest.py b/python/fatcat_tools/importers/ingest.py index 483932ad..ae3e147a 100644 --- a/python/fatcat_tools/importers/ingest.py +++ b/python/fatcat_tools/importers/ingest.py @@ -133,6 +133,8 @@ class IngestFileResultImporter(EntityImporter): extid = request['ext_ids'].get(extid_type) if not extid: continue + if extid_type == 'doi': + extid = extid.lower() try: release = self.api.lookup_release(**{extid_type: extid}) except fatcat_openapi_client.rest.ApiException as err: @@ -217,6 +219,8 @@ class IngestFileResultImporter(EntityImporter): if request.get('link_source') and request.get('link_source_id'): edit_extra['link_source'] = request['link_source'] edit_extra['link_source_id'] = request['link_source_id'] + if edit_extra['link_source'] == 'doi': + edit_extra['link_source_id'] = edit_extra['link_source_id'].lower() return edit_extra -- cgit v1.2.3