From f157cc7a50e0fd9a1c79efb3c29be7d8508ffa66 Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Fri, 12 Nov 2021 11:45:48 -0800 Subject: document cleanups run this week --- notes/cleanups/wayback_timestamps.md | 13 +++++++++++++ 1 file changed, 13 insertions(+) (limited to 'notes/cleanups') diff --git a/notes/cleanups/wayback_timestamps.md b/notes/cleanups/wayback_timestamps.md index 38bc3f7d..e3ea942d 100644 --- a/notes/cleanups/wayback_timestamps.md +++ b/notes/cleanups/wayback_timestamps.md @@ -289,3 +289,16 @@ Ugh. | pv -l \ | gzip \ > files_20211105_moreshortts.fetched.json.gz + # 9.96M 6:38:43 [ 416 /s] + +Looks like the last small tweak was successful! This was with git commit +`cd09c6d6bd4deef0627de4f8a8a301725db01e14`. + + + zcat files_20211105_moreshortts.fetched.json.gz | jq .status | sort | uniq -c | sort -nr + 6228307 "success-db" + 2876033 "success-self" + 846844 "success-api" + 7583 "fail-not-found" + 87 "fail-cdx-403" + -- cgit v1.2.3