aboutsummaryrefslogtreecommitdiffstats
path: root/python
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-02-22 19:32:45 -0800
committer Bryan Newbold <bnewbold@archive.org> 2020-02-22 19:32:45 -0800
commit 43d9cc3d87654e6e3bd199fbb01972cc47df863e (patch)
tree ec503da6a4c9f40dfdb40db3a4c58c488abc179c /python
parent e608c22854c8796619e8d6cac1264a3e936eb9e9 (diff)
download sandcrawler-43d9cc3d87654e6e3bd199fbb01972cc47df863e.tar.gz
sandcrawler-43d9cc3d87654e6e3bd199fbb01972cc47df863e.zip
ingest: more revisit fixes
Diffstat (limited to 'python')
-rw-r--r-- python/sandcrawler/ia.py 8
1 files changed, 4 insertions, 4 deletions
diff --git a/python/sandcrawler/ia.py b/python/sandcrawler/ia.py
index 053fbbf..945c136 100644
--- a/python/sandcrawler/ia.py
+++ b/python/sandcrawler/ia.py
@@ -560,12 +560,12 @@ class WaybackClient:
start_url=start_url,
hit=True,
status="success",
- terminal_url=resource.revisit_cdx.url,
- terminal_dt=resource.revisit_cdx.datetime,
- terminal_status_code=resource.revisit_cdx.status_code,
+ terminal_url=cdx_row.url,
+ terminal_dt=cdx_row.datetime,
+ terminal_status_code=resource.revisit_cdx.status_code, # ?
body=resource.body,
cdx=cdx_row,
- revisit_cdx=revisit_cdx,
+ revisit_cdx=resource.revisit_cdx,
)
if cdx_row.status_code in (200, 226):