From 9c39bb6469843825efe67f5e4849cab5ea1eea9d Mon Sep 17 00:00:00 2001
From: Bryan Newbold
Date: Mon, 19 Oct 2020 15:52:07 -0700
Subject: SPN: look for non-200 CDX responses

Suspect that this has been the source of many `spn2-cdx-lookup-failure`
---
 python/sandcrawler/ia.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/sandcrawler/ia.py b/python/sandcrawler/ia.py
index 936ee97..0067b7e 100644
--- a/python/sandcrawler/ia.py
+++ b/python/sandcrawler/ia.py
@@ -977,7 +977,7 @@ class SavePageNowClient:
         if not cdx_row:
             # lookup exact
             try:
-                filter_status_code = 200
+                filter_status_code = None
                 if spn_result.terminal_url.startswith("ftp://"):
                     filter_status_code = 226
                 cdx_row = wayback_client.cdx_client.fetch(
-- 
cgit v1.2.3