From 6a93537a0c9dd2c1b4a28486384e40c3d410b4ed Mon Sep 17 00:00:00 2001 From: Martin Czygan Date: Fri, 4 Dec 2020 00:32:35 +0100 Subject: case: ignore choice review --- fuzzycat/common.py | 1 + fuzzycat/verify.py | 10 ++++++++++ 2 files changed, 11 insertions(+) (limited to 'fuzzycat') diff --git a/fuzzycat/common.py b/fuzzycat/common.py index 07f62df..bbffcc9 100644 --- a/fuzzycat/common.py +++ b/fuzzycat/common.py @@ -45,6 +45,7 @@ class Miss(str, Enum): CONTRIB_INTERSECTION_EMPTY = 'miss.contrib_intersection_empty' CUSTOM_IOP_MA_PATTERN = 'miss.custom_iop_ma_pattern' CUSTOM_PREFIX_10_14288 = 'miss.custom_prefix_10_14288' + CUSTOM_PREFIX_10_5860_CHOICE_REVIEW = 'miss.custom_prefix_10_5860_choice_review' CUSTOM_PREFIX_10_7916 = 'miss.custom_prefix_10_7916' CUSTOM_VHS = 'miss.vhs' # https://fatcat.wiki/release/44gk5ben5vghljq6twm7lwmxla DATASET_DOI = 'miss.dataset_doi' diff --git a/fuzzycat/verify.py b/fuzzycat/verify.py index 6d824d4..b385c25 100644 --- a/fuzzycat/verify.py +++ b/fuzzycat/verify.py @@ -434,6 +434,16 @@ def compare(a, b): # https://fatcat.wiki/release/q66xv7drk5fnph7enwwlkyuwqm return (Status.DIFFERENT, Miss.CONTRIB_INTERSECTION_EMPTY) + # mark choicereview articles as ambiguous, as they seem to be behind a paywall + try: + a_doi = glom(a, "ext_ids.doi") + b_doi = glom(b, "ext_ids.doi") + if has_doi_prefix(a_doi, "10.5860") or has_doi_prefix(b_doi, "10.5860"): + return (Status.AMBIGUOUS, Miss.CUSTOM_PREFIX_10_5860_CHOICE_REVIEW) + except PathAccessError: + pass + + return (Status.AMBIGUOUS, OK.DUMMY) -- cgit v1.2.3