diff options
-rw-r--r-- | notes/known_issues.md | 8 | ||||
-rw-r--r-- | tests/data/release/s5a6e6wnlvdelge256xpha6oqu | 46 | ||||
-rw-r--r-- | tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy | 44 | ||||
-rw-r--r-- | tests/data/verify.csv | 1 |
4 files changed, 99 insertions, 0 deletions
diff --git a/notes/known_issues.md b/notes/known_issues.md index e80acdc..32194fd 100644 --- a/notes/known_issues.md +++ b/notes/known_issues.md @@ -26,6 +26,14 @@ Sometimes, a lexicon entry is a "dataset", sometimes a "book", e.g. "Unold, Max" * https://fatcat.wiki/release/2kpa6ynwjzhtbbokqyxcl25gmm * https://fatcat.wiki/release/o4dh7w7nqvdknm4j336yrom4wy +## Article and Erratum + +* https://fatcat.wiki/release/s5a6e6wnlvdelge256xpha6oqu +* https://fatcat.wiki/release/zoeto2mymzhi3l74fr2ps5qjyy + +We think "EXACT", but is an erratum and an article an exact match? They should +belong to the same cluster, that's probably ok. + # Ideas for fixes * [x] when title and authors match, check the year, and maybe the doi prefix; diff --git a/tests/data/release/s5a6e6wnlvdelge256xpha6oqu b/tests/data/release/s5a6e6wnlvdelge256xpha6oqu new file mode 100644 index 0000000..29d9f83 --- /dev/null +++ b/tests/data/release/s5a6e6wnlvdelge256xpha6oqu @@ -0,0 +1,46 @@ +{ + "abstracts": [], + "container_id": "jurtf7gsrbgzzm2hdpnmafjeju", + "contribs": [ + { + "index": 0, + "raw_name": "D. Daubner", + "role": "author" + }, + { + "index": 1, + "raw_name": "T. Juratli", + "role": "author" + }, + { + "index": 2, + "raw_name": "K. 
Engellandt", + "role": "author" + } + ], + "ext_ids": { + "doi": "10.1055/s-0032-1313212", + "pmid": "23023226", + "wikidata_qid": "Q45276716" + }, + "extra": { + "crossref": { + "type": "journal-article" + } + }, + "ident": "s5a6e6wnlvdelge256xpha6oqu", + "issue": "01", + "language": "de", + "pages": "71-73", + "publisher": "Georg Thieme Verlag KG", + "refs": [], + "release_date": "2012-09-21", + "release_stage": "published", + "release_type": "article-journal", + "release_year": 2012, + "revision": "b2141656-18d3-4325-a144-e3ece361bc0a", + "state": "active", + "title": "Ruptur eines reifen intrakraniellen Teratoms", + "volume": "185", + "work_id": "r7lldkbnvbbcniqnwdcwd5c2gm" +} diff --git a/tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy b/tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy new file mode 100644 index 0000000..952966d --- /dev/null +++ b/tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy @@ -0,0 +1,44 @@ +{ + "abstracts": [], + "container_id": "jurtf7gsrbgzzm2hdpnmafjeju", + "contribs": [ + { + "index": 0, + "raw_name": "D. Daubner", + "role": "author" + }, + { + "index": 1, + "raw_name": "T. Juratli", + "role": "author" + }, + { + "index": 2, + "raw_name": "K. 
Engellandt", + "role": "author" + } + ], + "ext_ids": { + "doi": "10.1055/s-0032-1330472" + }, + "extra": { + "crossref": { + "type": "journal-article" + } + }, + "ident": "zoeto2mymzhi3l74fr2ps5qjyy", + "issue": "01", + "language": "de", + "pages": "E2-E2", + "publisher": "Georg Thieme Verlag KG", + "refs": [], + "release_date": "2012-12-20", + "release_stage": "published", + "release_type": "article-journal", + "release_year": 2012, + "revision": "df95fb6f-ad31-45a2-8b97-322fc1fb3342", + "state": "active", + "title": "Ruptur eines reifen intrakraniellen Teratoms", + "volume": "185", + "work_id": "wb533kwwszbqfijj2lq7su3kva" +} diff --git a/tests/data/verify.csv b/tests/data/verify.csv index 313dc01..a9eaf0c 100644 --- a/tests/data/verify.csv +++ b/tests/data/verify.csv @@ -179,3 +179,4 @@ fppfjl5kt5dsnfl2i5rarhqaaq,zqqbuha3uzd2fcvekdy3ygxnni,Status.DIFFERENT,CONTRIB_I cq6xrtp5zvesrjsklvseej6l5y,ufjdsz5ejbafbdpnuygvbotx5m,Status.EXACT,TITLE_AUTHOR_MATCH cfrqezy7uzgnnnp542pa3mu4yi,dwlvdxtqdzdmzkdyd2jo3lztna,Status.STRONG,TOKENIZED_AUTHORS 3w7pt5hlu5bvjkyo2dtoxm4ltq,3waartzi5vfprewchjr4z5nbi4,, +s5a6e6wnlvdelge256xpha6oqu,zoeto2mymzhi3l74fr2ps5qjyy,, |