diff options
| author | Bryan Newbold <bnewbold@archive.org> | 2020-10-19 17:00:49 -0700 | 
|---|---|---|
| committer | Bryan Newbold <bnewbold@archive.org> | 2020-10-19 17:00:56 -0700 | 
| commit | f10b1772c08da8740f3d59dd6dd4a28383a550d4 (patch) | |
| tree | 711080759af3a14cb7547aacb37fd43756297f66 | |
| parent | 41b3ae7f7f1d90a8e2aa141448cddd7b174e92fb (diff) | |
| download | sandcrawler-f10b1772c08da8740f3d59dd6dd4a28383a550d4.tar.gz sandcrawler-f10b1772c08da8740f3d59dd6dd4a28383a550d4.zip  | |
ingest: fix old_failure datetime
| -rw-r--r-- | python/sandcrawler/ingest.py | 2 | 
1 files changed, 1 insertions, 1 deletions
```diff
diff --git a/python/sandcrawler/ingest.py b/python/sandcrawler/ingest.py
index b50bcee..6f9da86 100644
--- a/python/sandcrawler/ingest.py
+++ b/python/sandcrawler/ingest.py
@@ -176,7 +176,7 @@ class IngestFileWorker(SandcrawlerWorker):
         #    soft404 = True
 
         old_failure = False
-        if resource and not resource.hit and resource.terminal_dt < '20190000000000':
+        if resource and not resource.hit and resource.terminal_dt and resource.terminal_dt < '20190000000000':
             old_failure = True
 
         if self.try_spn2 and (resource == None or (resource.status == 'no-capture') or soft404 or old_failure):
```
