summary refs log tree commit diff stats
path: root/python
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@robocracy.org> 2019-05-22 16:01:37 -0700
committer Bryan Newbold <bnewbold@robocracy.org> 2019-05-22 16:01:37 -0700
commit 5af153683cdd9b883bc142a4bd7bb447612d494a (patch)
tree fd1332dbce1db1dd5019008bc8ba67e939544f08 /python
parent a9752a685be5a0ff7794ba652ca7954cb7508124 (diff)
download fatcat-5af153683cdd9b883bc142a4bd7bb447612d494a.tar.gz
fatcat-5af153683cdd9b883bc142a4bd7bb447612d494a.zip
more strict pubmed DOI handling
Diffstat (limited to 'python')
-rw-r--r-- python/fatcat_tools/importers/pubmed.py 4
1 files changed, 3 insertions, 1 deletions
diff --git a/python/fatcat_tools/importers/pubmed.py b/python/fatcat_tools/importers/pubmed.py
index b33bbf13..e5d413a7 100644
--- a/python/fatcat_tools/importers/pubmed.py
+++ b/python/fatcat_tools/importers/pubmed.py
@@ -380,7 +380,9 @@ class PubmedImporter(EntityImporter):
doi = doi.string.lower()
if doi.startswith('doi:'):
doi = doi[4:]
- assert doi.startswith('10.')
+ if not (doi.startswith('10.') and '/' in doi and doi.split('/')[1]):
+ sys.stderr.write("BOGUS DOI: {}\n".format(doi))
+ doi = None
pmcid = identifiers.find("ArticleId", IdType="pmc")
if pmcid: