diff options
author | Martin Czygan <martin@archive.org> | 2020-07-06 18:53:24 +0000 |
---|---|---|
committer | Martin Czygan <martin@archive.org> | 2020-07-06 18:53:24 +0000 |
commit | 68cf95bd1d1588c0d3170b4032596756e07ae718 (patch) | |
tree | 3163a803dd6743c84c83a786b5aea7eda3bbca8e /python/fatcat_tools/importers/arxiv.py | |
parent | bea909f997bcef51e2624b9eea42c8fbe7115aaa (diff) | |
parent | 8583c6866f2bb89e8dfe5f5e5893048c2fd854e7 (diff) | |
download | fatcat-68cf95bd1d1588c0d3170b4032596756e07ae718.tar.gz fatcat-68cf95bd1d1588c0d3170b4032596756e07ae718.zip |
Merge branch 'bnewbold-lint' into 'master'
lint cleanups
See merge request webgroup/fatcat!62
Diffstat (limited to 'python/fatcat_tools/importers/arxiv.py')
-rw-r--r-- | python/fatcat_tools/importers/arxiv.py | 9 |
1 files changed, 4 insertions, 5 deletions
diff --git a/python/fatcat_tools/importers/arxiv.py b/python/fatcat_tools/importers/arxiv.py
index 719592fc..43325ebc 100644
--- a/python/fatcat_tools/importers/arxiv.py
+++ b/python/fatcat_tools/importers/arxiv.py
@@ -7,7 +7,7 @@ from bs4 import BeautifulSoup
 from pylatexenc.latex2text import LatexNodes2Text
 
 import fatcat_openapi_client
-from .common import EntityImporter, clean
+from .common import EntityImporter
 from .crossref import lookup_license_slug
 
 
@@ -97,7 +97,6 @@ class ArxivRawImporter(EntityImporter):
             **kwargs)
         self._test_override = False
 
-
     def parse_record(self, record):
 
         if not record:
@@ -188,7 +187,6 @@ class ArxivRawImporter(EntityImporter):
         if lang == 'en':
             lang = None
 
-
         # extra:
         # withdrawn_date
         # translation_of
@@ -244,7 +242,7 @@ class ArxivRawImporter(EntityImporter):
 
         For each version, do a lookup by full arxiv_id, and store work/release
         id results.
-        
+
         If a version has a DOI, also do a doi lookup and store that result. If
         there is an existing release with both matching, set that as the
         existing work. If they don't match, use the full arxiv_id match and
@@ -345,6 +343,7 @@ class ArxivRawImporter(EntityImporter):
             print(json.dumps(resp))
             #sys.exit(-1)
 
-if __name__=='__main__':
+
+if __name__ == '__main__':
     parser = ArxivRawImporter(None)
     parser.parse_file(open(sys.argv[1]))