From 53756811572bab0679cb8cee1b9de95e7b29b96a Mon Sep 17 00:00:00 2001
From: Martin Czygan
Date: Fri, 17 Jan 2020 14:03:00 +0100
Subject: do not normalize "en dash" in DOI

Technically, [...] DOI names may incorporate any printable characters
from the Universal Character Set (UCS-2), of ISO/IEC 10646, which is
the character set defined by Unicode
(https://www.doi.org/doi_handbook/2_Numbering.html#2.5.1).

Mostly for QA reasons, we currently treat a DOI with an "en dash" as
invalid.
---
 python/tests/files/datacite/datacite_doc_23.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'python/tests/files/datacite')

diff --git a/python/tests/files/datacite/datacite_doc_23.json b/python/tests/files/datacite/datacite_doc_23.json
index b755f1a5..8eaa8c21 100644
--- a/python/tests/files/datacite/datacite_doc_23.json
+++ b/python/tests/files/datacite/datacite_doc_23.json
@@ -23,7 +23,7 @@
  "dateType": "Issued"
  }
  ],
- "doi": "10.7916/d86x0cg1–xxx",
+ "doi": "10.7916/d86x0cg1-xxx",
  "isActive": true,
  "language": "GERMAN",
  "publicationYear": 2017,
-- 
cgit v1.2.3