summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Martin Czygan <martin.czygan@gmail.com> 2020-01-08 03:35:41 +0100
committer: Martin Czygan <martin.czygan@gmail.com> 2020-01-08 03:35:41 +0100
commit: a23f73e37cd88de5467c47aa5f84b96448c5713d (patch)
tree: f52950549744c6f3d197e019d272d8bd6f58fb41
parent: 7d3ccb1c079f619ce664a984eef4f295294dd741 (diff)
download: fatcat-a23f73e37cd88de5467c47aa5f84b96448c5713d.tar.gz
download: fatcat-a23f73e37cd88de5467c47aa5f84b96448c5713d.zip
datacite: CCDC are entries, mostly
-rw-r--r-- python/fatcat_tools/importers/datacite.py 4
-rw-r--r-- python/tests/files/datacite/datacite_result_14.json 2
2 files changed, 5 insertions, 1 deletions
diff --git a/python/fatcat_tools/importers/datacite.py b/python/fatcat_tools/importers/datacite.py
index 58dfc556..587a65aa 100644
--- a/python/fatcat_tools/importers/datacite.py
+++ b/python/fatcat_tools/importers/datacite.py
@@ -543,6 +543,10 @@ class DataciteImporter(EntityImporter):
if publisher == 'The Global Biodiversity Information Facility':
release_type = 'stub'
+ # release_type exception: lots of "Experimental Crystal Structure Determination"
+ if publisher == 'Cambridge Crystallographic Data Centre':
+ release_type = 'entry'
+
# Language values are varied ("ger", "es", "English", "ENG", "en-us",
# "other", ...). Try to crush it with langcodes: "It may sound to you
# like langcodes solves a pretty boring problem. At one level, that's
diff --git a/python/tests/files/datacite/datacite_result_14.json b/python/tests/files/datacite/datacite_result_14.json
index e28ee5c3..20f6bfd4 100644
--- a/python/tests/files/datacite/datacite_result_14.json
+++ b/python/tests/files/datacite/datacite_result_14.json
@@ -37,7 +37,7 @@
}
},
"title": "CCDC 222635: Experimental Crystal Structure Determination",
- "release_type": "dataset",
+ "release_type": "entry",
"release_stage": "published",
"release_year": 2004,
"ext_ids": {