about | summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2020-07-02 10:55:44 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2020-07-02 10:55:44 -0700
commit: 4f9ac8aae155a74439f03aa2ab9aa95e1d813092 (patch)
tree: bb1ba217d0fe5b4f42d80a29831d5af9ebea76d0
parent: 059070e383e5790c1434ea1073704f0b42653d8a (diff)
download: sandcrawler-4f9ac8aae155a74439f03aa2ab9aa95e1d813092.tar.gz
sandcrawler-4f9ac8aae155a74439f03aa2ab9aa95e1d813092.zip
add another bad PDF sha1hex
-rw-r--r-- python/sandcrawler/pdfextract.py | 1
1 files changed, 1 insertions, 0 deletions
diff --git a/python/sandcrawler/pdfextract.py b/python/sandcrawler/pdfextract.py
index 350c591..4fd8712 100644
--- a/python/sandcrawler/pdfextract.py
+++ b/python/sandcrawler/pdfextract.py
@@ -19,6 +19,7 @@ from .ia import WaybackClient, WaybackError, PetaboxError
# these, maybe due to threading.
BAD_PDF_SHA1HEX = [
"373f84dfab4ed47047826e604e2918a9cd6a95b2",
+ "64d821d728f9a3dc944b4c03be00feea0b57e314",
"88edcbab1cac2d70af5870422974afc253f4f0c6",
"8e4f03c29ae1fe7227140ab4b625f375f6c00d31",
]