From b2cba5cc78f9ce1e1602252e0bc3195551e09326 Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Fri, 6 Sep 2019 16:52:40 -0700 Subject: filter out bad ISSN{e,p} Unfortunately a few hundred of these got pushed into fatcat already; will probably fix with a new fixer bot tool. --- chocula.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/chocula.py b/chocula.py index 04595da..12b7ae1 100755 --- a/chocula.py +++ b/chocula.py @@ -1175,6 +1175,11 @@ class ChoculaDatabase(): if extra['color'] == 'green': out['is_oa'] = True + # filter out "NA" ISSNs + for k in ('issne', 'issnp'): + if out.get(k) and (len(out[k]) != 9 or out[k][4] != '-'): + out.pop(k) + cur = self.db.execute("SELECT * FROM homepage WHERE issnl = ?;", [issnl]) for hrow in cur: out['any_homepage'] = True -- cgit v1.2.3