From c32b13949a06e9e834c1fac40e3609cb8eeb9f31 Mon Sep 17 00:00:00 2001
From: Bryan Newbold
Date: Wed, 13 Jul 2022 13:23:57 -0700
Subject: yet another bad PDF

---
 python/sandcrawler/pdfextract.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/python/sandcrawler/pdfextract.py b/python/sandcrawler/pdfextract.py
index 2e13278..11c54e9 100644
--- a/python/sandcrawler/pdfextract.py
+++ b/python/sandcrawler/pdfextract.py
@@ -99,6 +99,7 @@ BAD_PDF_SHA1HEX: List[str] = [
     "98b02eb70066c182c705ef4d14d8b723ad7f1fab",
     "993ca31f6974f8387bb18dd7d38987d290da8781",
     "9dbd05af3442e6f42d67868054751b76973f4171",
+    "a1cc781c694a48e018f4de110b58f561aa212051",
     "a2298c137b9c8c8975bad62eea9224edb95e6952",
     "a2671738755ab8b24775e95375dc72f1ca4e5fd6",
     "a26f299fb97c646effeebd4c5e2968786bd0f781",
-- 
cgit v1.2.3