diff options
| author | Bryan Newbold <bnewbold@robocracy.org> | 2018-06-25 10:40:20 -0700 | 
|---|---|---|
| committer | Bryan Newbold <bnewbold@robocracy.org> | 2018-06-25 10:40:20 -0700 | 
| commit | c2146fe7b5d299dab2692d2346d0037a944ac799 (patch) | |
| tree | 4da08d779872d1ed392bd7cd38945f403668ca1d | |
| parent | c7687e259cd003b3737a8bd9dd1ae51bf1f15a1e (diff) | |
| download | fatcat-c2146fe7b5d299dab2692d2346d0037a944ac799.tar.gz fatcat-c2146fe7b5d299dab2692d2346d0037a944ac799.zip | |
slightly more robust crossref import
| -rw-r--r-- | python/fatcat/crossref_importer.py | 9 | 
1 files changed, 9 insertions, 0 deletions
| diff --git a/python/fatcat/crossref_importer.py b/python/fatcat/crossref_importer.py index 06c162f0..18dd2498 100644 --- a/python/fatcat/crossref_importer.py +++ b/python/fatcat/crossref_importer.py @@ -22,6 +22,11 @@ class FatcatCrossrefImporter(FatcatImporter):          if (not 'author' in obj) or (not 'title' in obj):              return None +        # Other ways to be out of scope (provisionally) +        if ((not 'type' in obj) or (not 'container-title' in obj) or +                len(obj['container-title']) < 1): +            return None +          # contribs          contribs = []          for i, am in enumerate(obj['author']): @@ -62,6 +67,10 @@ class FatcatCrossrefImporter(FatcatImporter):          for i, rm in enumerate(obj.get('reference', [])):              try:                  year = int(rm.get('year')) +                if year > 2025 or year < 1000: +                    # NOTE: will need to update/config in the future! +                    # NOTE: are there crossref works with year < 1000? +                    return None              except:                  year = None              refs.append(fatcat_client.ReleaseRef( | 
