aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@robocracy.org> 2020-01-15 14:03:50 -0800
committer Bryan Newbold <bnewbold@robocracy.org> 2020-01-15 14:03:50 -0800
commit 234dfa11d4e552d4ef784d8c7b13bfdaf42c597c (patch)
tree 91e8ac4c9e60f54b0fc4480cbaf5a452d0797b77
parent ec445720e768d3f0cc56c03052833b86d5068547 (diff)
download fatcat-234dfa11d4e552d4ef784d8c7b13bfdaf42c597c.tar.gz
fatcat-234dfa11d4e552d4ef784d8c7b13bfdaf42c597c.zip
ingest: allow more sources to auto-import
-rw-r--r-- python/fatcat_tools/importers/ingest.py 3
1 files changed, 2 insertions, 1 deletions
diff --git a/python/fatcat_tools/importers/ingest.py b/python/fatcat_tools/importers/ingest.py
index 16643eb5..e53dcae5 100644
--- a/python/fatcat_tools/importers/ingest.py
+++ b/python/fatcat_tools/importers/ingest.py
@@ -29,6 +29,7 @@ class IngestFileResultImporter(EntityImporter):
self.ingest_request_source_whitelist = [
'fatcat-changelog',
'fatcat-ingest-container',
+ 'fatcat-ingest',
'arabesque',
]
if kwargs.get('skip_source_whitelist', False):
@@ -57,7 +58,7 @@ class IngestFileResultImporter(EntityImporter):
self.counts['skip-ingest_request_source'] += 1
return False
if source.startswith('arabesque'):
- if row['reqeust'].get('link_source') not in ('arxiv', 'pmc'):
+ if row['reqeust'].get('link_source') not in ('arxiv', 'pmc', 'unpaywall', 'doi'):
self.counts['skip-arabesque-source'] += 1
return False
if source.startswith('savepapernow'):