From fcc6f24a95a7b77bda4ec813daecc2b737a82412 Mon Sep 17 00:00:00 2001 From: Martin Czygan Date: Tue, 7 Jul 2020 02:08:26 +0200 Subject: datacite: address duplicated contributor issue Use string comparison. * https://fatcat.wiki/release/spjysmrnsrgyzgq6ise5o44rlu/contribs * https://api.datacite.org/dois/10.25940/roper-31098406 --- python/tests/files/datacite/datacite_doc_33.json | 62 ++++++++++++++++++++++ .../tests/files/datacite/datacite_result_05.json | 3 -- .../tests/files/datacite/datacite_result_08.json | 7 --- .../tests/files/datacite/datacite_result_33.json | 31 +++++++++++ 4 files changed, 93 insertions(+), 10 deletions(-) create mode 100644 python/tests/files/datacite/datacite_doc_33.json create mode 100644 python/tests/files/datacite/datacite_result_33.json (limited to 'python/tests/files/datacite') diff --git a/python/tests/files/datacite/datacite_doc_33.json b/python/tests/files/datacite/datacite_doc_33.json new file mode 100644 index 00000000..571d1220 --- /dev/null +++ b/python/tests/files/datacite/datacite_doc_33.json @@ -0,0 +1,62 @@ +{ + "id": "10.17912/micropub.biology.000143", + "type": "dois", + "attributes": { + "doi": "10.17912/micropub.biology.000143", + "identifiers": null, + "creators": [ + { + "name": "ABC News", + "givenName": "", + "familyName": "", + "affiliation": [], + "role": "author" + } + ], + "titles": [ + { + "title": "Sample" + } + ], + "publisher": "microPublication Biology", + "publicationYear": 2019, + "types": { + "resourceTypeGeneral": "DataPaper" + }, + "relatedIdentifiers": [], + "sizes": [], + "formats": [], + "version": null, + "rightsList": [], + "descriptions": [ + { + "description": 1234567890, + "descriptionType": "Abstract" + } + ], + "geoLocations": [], + "fundingReferences": [], + "url": "https://www.micropublication.org/journals/biology/micropub.biology.000143", + "created": "2019-08-19T14:43:08.000Z", + "registered": "2019-08-19T14:43:09.000Z", + "published": "2019", + "updated": "2019-11-09T12:32:02.000Z", + "contributors": [ + { + "name": "ABC News", + "givenName": "", + "familyName": "", + "affiliation": [], + "role": "" + } + ] + }, + "relationships": { + "client": { + "data": { + "id": "caltech.micropub", + "type": "clients" + } + } + } +} diff --git a/python/tests/files/datacite/datacite_result_05.json b/python/tests/files/datacite/datacite_result_05.json index 79c2a8fb..d634490d 100644 --- a/python/tests/files/datacite/datacite_result_05.json +++ b/python/tests/files/datacite/datacite_result_05.json @@ -504,9 +504,6 @@ "role": "author", "surname": "Wurzbacher" }, - { - "raw_name": "Kessy Abarenkov" - }, { "raw_name": "NHM UT-University Of Tartu; Natural History Museum And Botanic Garden" } diff --git a/python/tests/files/datacite/datacite_result_08.json b/python/tests/files/datacite/datacite_result_08.json index 70237280..5a46ef50 100644 --- a/python/tests/files/datacite/datacite_result_08.json +++ b/python/tests/files/datacite/datacite_result_08.json @@ -13,13 +13,6 @@ "raw_name": "Kei Kajisa", "role": "author", "surname": "Kajisa" - }, - { - "given_name": "Kei", - "index": 1, - "raw_name": "Kei Kajisa", - "role": "author", - "surname": "Kajisa" } ], "ext_ids": { diff --git a/python/tests/files/datacite/datacite_result_33.json b/python/tests/files/datacite/datacite_result_33.json new file mode 100644 index 00000000..bcb72469 --- /dev/null +++ b/python/tests/files/datacite/datacite_result_33.json @@ -0,0 +1,31 @@ +{ + "abstracts": [ + { + "content": "1234567890", + "mimetype": "text/plain" + } + ], + "contribs": [ + { + "given_name": "", + "surname": "", + "index": 0, + "raw_name": "ABC News", + "role": "author" + } + ], + "ext_ids": { + "doi": "10.17912/micropub.biology.000143" + }, + "extra": { + "datacite": { + "resourceTypeGeneral": "DataPaper" + }, + "container_name": "microPublication Biology" + }, + "refs": [], + "release_stage": "published", + "release_year": 2019, + "publisher": "microPublication Biology", + "title": "Sample" +} -- cgit v1.2.3 From 40f77b78aa331ca67b510dfece77e6a6000f8c2f Mon Sep 17 00:00:00 2001 From: Martin Czygan Date: Fri, 10 Jul 2020 00:50:34 +0200 Subject: wip: contrib, GH59 --- python/tests/files/datacite/datacite_doc_34.json | 61 ++++++++++++++++++++++ .../tests/files/datacite/datacite_result_05.json | 3 +- .../tests/files/datacite/datacite_result_09.json | 3 +- .../tests/files/datacite/datacite_result_26.json | 3 +- .../tests/files/datacite/datacite_result_34.json | 38 ++++++++++++++ 5 files changed, 105 insertions(+), 3 deletions(-) create mode 100644 python/tests/files/datacite/datacite_doc_34.json create mode 100644 python/tests/files/datacite/datacite_result_34.json (limited to 'python/tests/files/datacite') diff --git a/python/tests/files/datacite/datacite_doc_34.json b/python/tests/files/datacite/datacite_doc_34.json new file mode 100644 index 00000000..5dcf65f4 --- /dev/null +++ b/python/tests/files/datacite/datacite_doc_34.json @@ -0,0 +1,61 @@ +{ + "id": "10.17912/micropub.biology.000143", + "type": "dois", + "attributes": { + "doi": "10.17912/micropub.biology.000143", + "identifiers": null, + "creators": [ + { + "name": "Paul Katz", + "givenName": "", + "familyName": "", + "affiliation": [], + "role": "author" + } + ], + "titles": [ + { + "title": "Sample" + } + ], + "publisher": "microPublication Biology", + "publicationYear": 2019, + "types": { + "resourceTypeGeneral": "DataPaper" + }, + "relatedIdentifiers": [], + "sizes": [], + "formats": [], + "version": null, + "rightsList": [], + "descriptions": [ + { + "description": 1234567890, + "descriptionType": "Abstract" + } + ], + "geoLocations": [], + "fundingReferences": [], + "url": "https://www.micropublication.org/journals/biology/micropub.biology.000143", + "created": "2019-08-19T14:43:08.000Z", + "registered": "2019-08-19T14:43:09.000Z", + "published": "2019", + "updated": "2019-11-09T12:32:02.000Z", + "contributors": [ + { + "name": "Paul Katz", + "givenName": "", + "familyName": "", + "affiliation": [], + "role": "illustrator" + } ] + }, + "relationships": { + "client": { + "data": { + "id": "caltech.micropub", + "type": "clients" + } + } + } +} diff --git a/python/tests/files/datacite/datacite_result_05.json b/python/tests/files/datacite/datacite_result_05.json index d634490d..c91f3a7f 100644 --- a/python/tests/files/datacite/datacite_result_05.json +++ b/python/tests/files/datacite/datacite_result_05.json @@ -505,7 +505,8 @@ "surname": "Wurzbacher" }, { - "raw_name": "NHM UT-University Of Tartu; Natural History Museum And Botanic Garden" + "raw_name": "NHM UT-University Of Tartu; Natural History Museum And Botanic Garden", + "role": "author" } ], "ext_ids": { diff --git a/python/tests/files/datacite/datacite_result_09.json b/python/tests/files/datacite/datacite_result_09.json index 09e02fc7..f6ec524a 100644 --- a/python/tests/files/datacite/datacite_result_09.json +++ b/python/tests/files/datacite/datacite_result_09.json @@ -17,7 +17,8 @@ "extra": { "type": "DataManager" }, - "raw_name": "Technische Informationsbibliothek (TIB)" + "raw_name": "Technische Informationsbibliothek (TIB)", + "role": "author" } ], "ext_ids": { diff --git a/python/tests/files/datacite/datacite_result_26.json b/python/tests/files/datacite/datacite_result_26.json index 267eb9c2..f6e589ef 100644 --- a/python/tests/files/datacite/datacite_result_26.json +++ b/python/tests/files/datacite/datacite_result_26.json @@ -13,7 +13,8 @@ }, "given_name": "David", "raw_name": "David Wemmer", - "surname": "Wemmer" + "surname": "Wemmer", + "role": "author" } ], "ext_ids": { diff --git a/python/tests/files/datacite/datacite_result_34.json b/python/tests/files/datacite/datacite_result_34.json new file mode 100644 index 00000000..8e087ab5 --- /dev/null +++ b/python/tests/files/datacite/datacite_result_34.json @@ -0,0 +1,38 @@ +{ + "abstracts": [ + { + "content": "1234567890", + "mimetype": "text/plain" + } + ], + "contribs": [ + { + "given_name": "", + "surname": "", + "index": 0, + "raw_name": "Paul Katz", + "role": "author" + }, + { + "given_name": "", + "surname": "", + "index": 0, + "raw_name": "Paul Katz", + "role": "illustrator" + } + ], + "ext_ids": { + "doi": "10.17912/micropub.biology.000143" + }, + "extra": { + "datacite": { + "resourceTypeGeneral": "DataPaper" + }, + "container_name": "microPublication Biology" + }, + "refs": [], + "release_stage": "published", + "release_year": 2019, + "publisher": "microPublication Biology", + "title": "Sample" +} -- cgit v1.2.3 From fdf1028c19b0623e30b91e49ffa65ed130dcfdc1 Mon Sep 17 00:00:00 2001 From: Martin Czygan Date: Fri, 10 Jul 2020 18:29:47 +0200 Subject: datacite: adjust tests --- python/tests/files/datacite/datacite_result_27.json | 3 ++- python/tests/files/datacite/datacite_result_28.json | 3 ++- python/tests/files/datacite/datacite_result_29.json | 3 ++- python/tests/files/datacite/datacite_result_34.json | 7 ------- 4 files changed, 6 insertions(+), 10 deletions(-) (limited to 'python/tests/files/datacite') diff --git a/python/tests/files/datacite/datacite_result_27.json b/python/tests/files/datacite/datacite_result_27.json index 3d033e6a..e934fb41 100644 --- a/python/tests/files/datacite/datacite_result_27.json +++ b/python/tests/files/datacite/datacite_result_27.json @@ -13,7 +13,8 @@ }, "given_name": "David", "raw_name": "David Wemmer", - "surname": "Wemmer" + "surname": "Wemmer", + "role": "author" } ], "ext_ids": { diff --git a/python/tests/files/datacite/datacite_result_28.json b/python/tests/files/datacite/datacite_result_28.json index 84bed9c8..bcb1caaf 100644 --- a/python/tests/files/datacite/datacite_result_28.json +++ b/python/tests/files/datacite/datacite_result_28.json @@ -13,7 +13,8 @@ }, "given_name": "David", "raw_name": "David Wemmer", - "surname": "Wemmer" + "surname": "Wemmer", + "role": "author" } ], "ext_ids": { diff --git a/python/tests/files/datacite/datacite_result_29.json b/python/tests/files/datacite/datacite_result_29.json index 84bed9c8..bcb1caaf 100644 --- a/python/tests/files/datacite/datacite_result_29.json +++ b/python/tests/files/datacite/datacite_result_29.json @@ -13,7 +13,8 @@ }, "given_name": "David", "raw_name": "David Wemmer", - "surname": "Wemmer" + "surname": "Wemmer", + "role": "author" } ], "ext_ids": { diff --git a/python/tests/files/datacite/datacite_result_34.json b/python/tests/files/datacite/datacite_result_34.json index 8e087ab5..4a52e22c 100644 --- a/python/tests/files/datacite/datacite_result_34.json +++ b/python/tests/files/datacite/datacite_result_34.json @@ -12,13 +12,6 @@ "index": 0, "raw_name": "Paul Katz", "role": "author" - }, - { - "given_name": "", - "surname": "", - "index": 0, - "raw_name": "Paul Katz", - "role": "illustrator" } ], "ext_ids": { -- cgit v1.2.3