aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--notes/known_issues.md8
-rw-r--r--tests/data/release/s5a6e6wnlvdelge256xpha6oqu46
-rw-r--r--tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy44
-rw-r--r--tests/data/verify.csv1
4 files changed, 99 insertions, 0 deletions
diff --git a/notes/known_issues.md b/notes/known_issues.md
index e80acdc..32194fd 100644
--- a/notes/known_issues.md
+++ b/notes/known_issues.md
@@ -26,6 +26,14 @@ Sometimes, a lexicon entry is a "dataset", sometimes a "book", e.g. "Unold, Max"
* https://fatcat.wiki/release/2kpa6ynwjzhtbbokqyxcl25gmm
* https://fatcat.wiki/release/o4dh7w7nqvdknm4j336yrom4wy
+## Article and Erratum
+
+* https://fatcat.wiki/release/s5a6e6wnlvdelge256xpha6oqu
+* https://fatcat.wiki/release/zoeto2mymzhi3l74fr2ps5qjyy
+
+We think "EXACT", but are an erratum and an article an exact match? They should
+belong to the same cluster, so that's probably ok.
+
# Ideas for fixes
* [x] when title and authors match, check the year, and maybe the doi prefix;
diff --git a/tests/data/release/s5a6e6wnlvdelge256xpha6oqu b/tests/data/release/s5a6e6wnlvdelge256xpha6oqu
new file mode 100644
index 0000000..29d9f83
--- /dev/null
+++ b/tests/data/release/s5a6e6wnlvdelge256xpha6oqu
@@ -0,0 +1,46 @@
+{
+ "abstracts": [],
+ "container_id": "jurtf7gsrbgzzm2hdpnmafjeju",
+ "contribs": [
+ {
+ "index": 0,
+ "raw_name": "D. Daubner",
+ "role": "author"
+ },
+ {
+ "index": 1,
+ "raw_name": "T. Juratli",
+ "role": "author"
+ },
+ {
+ "index": 2,
+ "raw_name": "K. Engellandt",
+ "role": "author"
+ }
+ ],
+ "ext_ids": {
+ "doi": "10.1055/s-0032-1313212",
+ "pmid": "23023226",
+ "wikidata_qid": "Q45276716"
+ },
+ "extra": {
+ "crossref": {
+ "type": "journal-article"
+ }
+ },
+ "ident": "s5a6e6wnlvdelge256xpha6oqu",
+ "issue": "01",
+ "language": "de",
+ "pages": "71-73",
+ "publisher": "Georg Thieme Verlag KG",
+ "refs": [],
+ "release_date": "2012-09-21",
+ "release_stage": "published",
+ "release_type": "article-journal",
+ "release_year": 2012,
+ "revision": "b2141656-18d3-4325-a144-e3ece361bc0a",
+ "state": "active",
+ "title": "Ruptur eines reifen intrakraniellen Teratoms",
+ "volume": "185",
+ "work_id": "r7lldkbnvbbcniqnwdcwd5c2gm"
+}
diff --git a/tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy b/tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy
new file mode 100644
index 0000000..952966d
--- /dev/null
+++ b/tests/data/release/zoeto2mymzhi3l74fr2ps5qjyy
@@ -0,0 +1,44 @@
+{
+ "abstracts": [],
+ "container_id": "jurtf7gsrbgzzm2hdpnmafjeju",
+ "contribs": [
+ {
+ "index": 0,
+ "raw_name": "D. Daubner",
+ "role": "author"
+ },
+ {
+ "index": 1,
+ "raw_name": "T. Juratli",
+ "role": "author"
+ },
+ {
+ "index": 2,
+ "raw_name": "K. Engellandt",
+ "role": "author"
+ }
+ ],
+ "ext_ids": {
+ "doi": "10.1055/s-0032-1330472"
+ },
+ "extra": {
+ "crossref": {
+ "type": "journal-article"
+ }
+ },
+ "ident": "zoeto2mymzhi3l74fr2ps5qjyy",
+ "issue": "01",
+ "language": "de",
+ "pages": "E2-E2",
+ "publisher": "Georg Thieme Verlag KG",
+ "refs": [],
+ "release_date": "2012-12-20",
+ "release_stage": "published",
+ "release_type": "article-journal",
+ "release_year": 2012,
+ "revision": "df95fb6f-ad31-45a2-8b97-322fc1fb3342",
+ "state": "active",
+ "title": "Ruptur eines reifen intrakraniellen Teratoms",
+ "volume": "185",
+ "work_id": "wb533kwwszbqfijj2lq7su3kva"
+}
diff --git a/tests/data/verify.csv b/tests/data/verify.csv
index 313dc01..a9eaf0c 100644
--- a/tests/data/verify.csv
+++ b/tests/data/verify.csv
@@ -179,3 +179,4 @@ fppfjl5kt5dsnfl2i5rarhqaaq,zqqbuha3uzd2fcvekdy3ygxnni,Status.DIFFERENT,CONTRIB_I
cq6xrtp5zvesrjsklvseej6l5y,ufjdsz5ejbafbdpnuygvbotx5m,Status.EXACT,TITLE_AUTHOR_MATCH
cfrqezy7uzgnnnp542pa3mu4yi,dwlvdxtqdzdmzkdyd2jo3lztna,Status.STRONG,TOKENIZED_AUTHORS
3w7pt5hlu5bvjkyo2dtoxm4ltq,3waartzi5vfprewchjr4z5nbi4,,
+s5a6e6wnlvdelge256xpha6oqu,zoeto2mymzhi3l74fr2ps5qjyy,,