summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@robocracy.org> 2019-04-22 19:47:21 -0700
committer Bryan Newbold <bnewbold@robocracy.org> 2019-04-22 19:49:07 -0700
commit 0bac91e6b124aff9e722f206d58e72c7c4ad861b (patch)
tree 4ed68b0bf4a84b9ac67570fd62e0b2aee402178c
parent 5b328d8a7ddeb641d588231c1f412fa0520c0f3d (diff)
download fatcat-0bac91e6b124aff9e722f206d58e72c7c4ad861b.tar.gz
fatcat-0bac91e6b124aff9e722f206d58e72c7c4ad861b.zip
archive.org isn't really a repository
-rw-r--r-- python/fatcat_tools/importers/common.py 4
1 files changed, 3 insertions, 1 deletions
diff --git a/python/fatcat_tools/importers/common.py b/python/fatcat_tools/importers/common.py
index 49931542..beec99df 100644
--- a/python/fatcat_tools/importers/common.py
+++ b/python/fatcat_tools/importers/common.py
@@ -50,7 +50,9 @@ def test_clean():
assert clean('<b>a&amp;b</b>', force_xml=True) == '<b>a&b</b>'
DOMAIN_REL_MAP = {
- "archive.org": "repository",
+ "archive.org": "archive",
+ # LOCKSS, Portico, DuraSpace, etc would also be "archive"
+
"arxiv.org": "repository",
"babel.hathitrust.org": "repository",
"cds.cern.ch": "repository",