diff options
author | Martin Czygan <martin@archive.org> | 2021-10-15 21:01:33 +0000 |
---|---|---|
committer | Martin Czygan <martin@archive.org> | 2021-10-15 21:01:33 +0000 |
commit | fa552aedaf8d0a898bba627be6bec5b579dd6b18 (patch) | |
tree | e2630189ca57d5b54c4ec21fdc5008e553aca5e6 /python | |
parent | 4be667616ae209fa0efaaa2350c1b75eacf0e344 (diff) | |
parent | 1b4136d415cbe549c735d459cd0ab1345bb37011 (diff) | |
download | fatcat-fa552aedaf8d0a898bba627be6bec5b579dd6b18.tar.gz fatcat-fa552aedaf8d0a898bba627be6bec5b579dd6b18.zip |
Merge branch 'martin-pubmed-proxy-connection-refused-fix' into 'master'
pubmed: switch default http site to retrieve update files
See merge request webgroup/fatcat!122
Diffstat (limited to 'python')
-rw-r--r-- | python/fatcat_tools/harvest/pubmed.py | 6 |
1 file changed, 4 insertions, 2 deletions
diff --git a/python/fatcat_tools/harvest/pubmed.py b/python/fatcat_tools/harvest/pubmed.py
index 579dd505..92798a99 100644
--- a/python/fatcat_tools/harvest/pubmed.py
+++ b/python/fatcat_tools/harvest/pubmed.py
@@ -263,10 +263,12 @@ def ftpretr(url, max_retries=10, retry_delay=1, proxy_hostport=None):
     return f.name
 
 
-def ftpretr_via_http_proxy(url, proxy_hostport="159.69.240.245:15201", max_retries=10, retry_delay=1):
+def ftpretr_via_http_proxy(url, proxy_hostport="ftp.ncbi.nlm.nih.gov", max_retries=10, retry_delay=1):
     """
     Fetch file from FTP via external HTTP proxy, e.g. ftp.host.com:/a/b/c would
-    be retrievable via proxy.com/a/b/c.
+    be retrievable via proxy.com/a/b/c; (in 09/2021 we used
+    "159.69.240.245:15201" as proxy_hostport but that started to fail
+    2021-10-15; just switch to NIH's http version).
     """
     parsed = urlparse(url)
     server, path = parsed.netloc, parsed.path