summaryrefslogtreecommitdiffstats
path: root/notes/cleanups/scripts/fetch_full_cdx_ts.py
diff options
context:
space:
mode:
Diffstat (limited to 'notes/cleanups/scripts/fetch_full_cdx_ts.py')
-rw-r--r--notes/cleanups/scripts/fetch_full_cdx_ts.py3
1 files changed, 2 insertions, 1 deletions
diff --git a/notes/cleanups/scripts/fetch_full_cdx_ts.py b/notes/cleanups/scripts/fetch_full_cdx_ts.py
index d5b0c476..ebcf0d62 100644
--- a/notes/cleanups/scripts/fetch_full_cdx_ts.py
+++ b/notes/cleanups/scripts/fetch_full_cdx_ts.py
@@ -115,7 +115,8 @@ def process_file(fe, session) -> dict:
seg = u.split('/')
assert seg[2] == "web.archive.org"
assert seg[3] == "web"
- assert seg[4].isdigit()
+ if not seg[4].isdigit():
+ continue
original_url = "/".join(seg[5:])
if len(seg[4]) == 12 or len(seg[4]) == 4:
short_urls.append(u)