about | summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Martin Czygan <martin@archive.org> 2021-10-15 21:01:33 +0000
committer: Martin Czygan <martin@archive.org> 2021-10-15 21:01:33 +0000
commit: fa552aedaf8d0a898bba627be6bec5b579dd6b18 (patch)
tree: e2630189ca57d5b54c4ec21fdc5008e553aca5e6
parent: 4be667616ae209fa0efaaa2350c1b75eacf0e344 (diff)
parent: 1b4136d415cbe549c735d459cd0ab1345bb37011 (diff)
download: fatcat-fa552aedaf8d0a898bba627be6bec5b579dd6b18.tar.gz
download: fatcat-fa552aedaf8d0a898bba627be6bec5b579dd6b18.zip
Merge branch 'martin-pubmed-proxy-connection-refused-fix' into 'master'
pubmed: switch default http site to retrieve update files. See merge request webgroup/fatcat!122.
-rw-r--r-- python/fatcat_tools/harvest/pubmed.py 6
1 files changed, 4 insertions, 2 deletions
diff --git a/python/fatcat_tools/harvest/pubmed.py b/python/fatcat_tools/harvest/pubmed.py
index 579dd505..92798a99 100644
--- a/python/fatcat_tools/harvest/pubmed.py
+++ b/python/fatcat_tools/harvest/pubmed.py
@@ -263,10 +263,12 @@ def ftpretr(url, max_retries=10, retry_delay=1, proxy_hostport=None):
return f.name
-def ftpretr_via_http_proxy(url, proxy_hostport="159.69.240.245:15201", max_retries=10, retry_delay=1):
+def ftpretr_via_http_proxy(url, proxy_hostport="ftp.ncbi.nlm.nih.gov", max_retries=10, retry_delay=1):
"""
Fetch file from FTP via external HTTP proxy, e.g. ftp.host.com:/a/b/c would
- be retrievable via proxy.com/a/b/c.
+ be retrievable via proxy.com/a/b/c; (in 09/2021 we used
+ "159.69.240.245:15201" as proxy_hostport but that started to fail
+ 2021-10-15; just switch to NIH's http version).
"""
parsed = urlparse(url)
server, path = parsed.netloc, parsed.path