diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-07-02 10:55:44 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-07-02 10:55:44 -0700 |
commit | 4f9ac8aae155a74439f03aa2ab9aa95e1d813092 (patch) | |
tree | bb1ba217d0fe5b4f42d80a29831d5af9ebea76d0 | |
parent | 059070e383e5790c1434ea1073704f0b42653d8a (diff) | |
download | sandcrawler-4f9ac8aae155a74439f03aa2ab9aa95e1d813092.tar.gz sandcrawler-4f9ac8aae155a74439f03aa2ab9aa95e1d813092.zip |
add another bad PDF sha1hex
-rw-r--r-- | python/sandcrawler/pdfextract.py | 1 |
1 files changed, 1 insertions, 0 deletions
diff --git a/python/sandcrawler/pdfextract.py b/python/sandcrawler/pdfextract.py index 350c591..4fd8712 100644 --- a/python/sandcrawler/pdfextract.py +++ b/python/sandcrawler/pdfextract.py @@ -19,6 +19,7 @@ from .ia import WaybackClient, WaybackError, PetaboxError # these, maybe due to threading. BAD_PDF_SHA1HEX = [ "373f84dfab4ed47047826e604e2918a9cd6a95b2", + "64d821d728f9a3dc944b4c03be00feea0b57e314", "88edcbab1cac2d70af5870422974afc253f4f0c6", "8e4f03c29ae1fe7227140ab4b625f375f6c00d31", ] |