From b7618ddfbf83aecbfb44daddf28aa1435def13a8 Mon Sep 17 00:00:00 2001 From: Martin Czygan Date: Tue, 17 Nov 2020 03:34:39 +0100 Subject: update stats --- fuzzycat/verify.py | 18 +++++++++--------- 1 file changed, 9 insertions(+), 9 deletions(-) diff --git a/fuzzycat/verify.py b/fuzzycat/verify.py index 4e12dba..730a5ee 100644 --- a/fuzzycat/verify.py +++ b/fuzzycat/verify.py @@ -26,20 +26,20 @@ Examples from clustering stage (from a sample of 100k records): WIP: { - "miss.blacklisted": 956, - "miss.contrib_intersection_empty": 3217, + "miss.blacklisted": 2950, + "miss.contrib_intersection_empty": 3167, "miss.dataset_doi": 8723, - "miss.num_diff": 14914, - "miss.release_type": 14305, - "miss.short_title": 3315, - "miss.subtitle": 102, + "miss.num_diff": 14905, + "miss.release_type": 14204, + "miss.short_title": 3309, + "miss.subtitle": 98, "miss.vhs": 45, - "miss.year": 12321, + "miss.year": 11755, "ok.arxiv_version": 13, - "ok.dummy": 8622, + "ok.dummy": 7367, "ok.preprint_published": 7, "ok.slug_title_author_match": 498, - "ok.title_author_match": 6187, + "ok.title_author_match": 6184, "skip.container_name_blacklist": 71, "skip.publisher_blacklist": 22, "skip.too_large": 1077, -- cgit v1.2.3