From 31672b40c358b6dfbf29520838c8064ed2891cee Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Wed, 13 Nov 2019 21:24:22 -0800 Subject: treat failure to get terminal capture as a SavePageNowError --- python/sandcrawler/ingest.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sandcrawler/ingest.py b/python/sandcrawler/ingest.py index 6e96763..29bb78e 100644 --- a/python/sandcrawler/ingest.py +++ b/python/sandcrawler/ingest.py @@ -68,7 +68,7 @@ class IngestFileWorker(SandcrawlerWorker): cdx = self.cdx_client.lookup_latest(url, follow_redirects=True) if not cdx: sys.stderr.write("{}\n".format(cdx_list)) - raise Exception("Failed to crawl PDF URL") + raise SavePageNowError("Failed to find terminal capture from SPNv2") else: return self.spn_client.save_url_now_v1(url) -- cgit v1.2.3