aboutsummaryrefslogtreecommitdiffstats
path: root/python/fatcat_tools/harvest
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@robocracy.org> 2020-05-26 19:01:28 -0700
committer Bryan Newbold <bnewbold@robocracy.org> 2020-05-26 19:09:55 -0700
commit 670aed3800873869550b477846f48cb2b4193005 (patch)
tree 46fdb09a5cfe629b2581eaf195fd93ec87b399a3 /python/fatcat_tools/harvest
parent d7ebedc840d8fe27fe0b952986ec9d9161964123 (diff)
download fatcat-670aed3800873869550b477846f48cb2b4193005.tar.gz
fatcat-670aed3800873869550b477846f48cb2b4193005.zip
rename HarvestState.next() to HarvestState.next_span()
"span" is short for "timespan" to harvest; there may be a better name to use. The motivation for this is to work around a pylint error claiming that .next() was not callable. This might be a bug in pylint, but .next() is also a very generic name.
Diffstat (limited to 'python/fatcat_tools/harvest')
-rw-r--r-- python/fatcat_tools/harvest/doi_registrars.py 2
-rw-r--r-- python/fatcat_tools/harvest/harvest_common.py 4
-rw-r--r-- python/fatcat_tools/harvest/oaipmh.py 2
-rw-r--r-- python/fatcat_tools/harvest/pubmed.py 2
4 files changed, 5 insertions, 5 deletions
diff --git a/python/fatcat_tools/harvest/doi_registrars.py b/python/fatcat_tools/harvest/doi_registrars.py
index 4e027738..f84acb24 100644
--- a/python/fatcat_tools/harvest/doi_registrars.py
+++ b/python/fatcat_tools/harvest/doi_registrars.py
@@ -174,7 +174,7 @@ class HarvestCrossrefWorker:
def run(self, continuous=False):
while True:
- current = self.state.next(continuous) # pylint: disable=not-callable
+ current = self.state.next_span(continuous)
if current:
print("Fetching DOIs updated on {} (UTC)".format(current), file=sys.stderr)
self.fetch_date(current)
diff --git a/python/fatcat_tools/harvest/harvest_common.py b/python/fatcat_tools/harvest/harvest_common.py
index 5f7aa084..27ab8b4a 100644
--- a/python/fatcat_tools/harvest/harvest_common.py
+++ b/python/fatcat_tools/harvest/harvest_common.py
@@ -83,12 +83,12 @@ class HarvestState:
self.to_process.add(current)
current += datetime.timedelta(days=1)
- def next(self, continuous=False):
+ def next_span(self, continuous=False):
"""
Gets next timespan (date) to be processed, or returns None if completed.
If 'continuous' arg is True, will try to enqueue recent possibly valid
- timespans; the idea is to call next() repeatedly, and it will return a
+ timespans; the idea is to call next_span() repeatedly, and it will return a
new timespan when it becomes "available".
"""
if continuous:
diff --git a/python/fatcat_tools/harvest/oaipmh.py b/python/fatcat_tools/harvest/oaipmh.py
index af1ca0d5..d30f9507 100644
--- a/python/fatcat_tools/harvest/oaipmh.py
+++ b/python/fatcat_tools/harvest/oaipmh.py
@@ -98,7 +98,7 @@ class HarvestOaiPmhWorker:
def run(self, continuous=False):
while True:
- current = self.state.next(continuous) # pylint: disable=not-callable
+ current = self.state.next_span(continuous)
if current:
print("Fetching DOIs updated on {} (UTC)".format(current), file=sys.stderr)
self.fetch_date(current)
diff --git a/python/fatcat_tools/harvest/pubmed.py b/python/fatcat_tools/harvest/pubmed.py
index d78045c6..f6301b8d 100644
--- a/python/fatcat_tools/harvest/pubmed.py
+++ b/python/fatcat_tools/harvest/pubmed.py
@@ -144,7 +144,7 @@ class PubmedFTPWorker:
if len(self.date_file_map) == 0:
raise ValueError("map from dates to files should not be empty, maybe the HTML changed?")
- current = self.state.next(continuous) # pylint: disable=not-callable
+ current = self.state.next_span(continuous)
if current:
print("Fetching citations updated on {} (UTC)".format(current), file=sys.stderr)
self.fetch_date(current)