From bbaa351a109c001a46e10f52549b43bcef48d348 Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Sun, 11 Sep 2022 23:48:48 -0700 Subject: bad PDF sha1 --- python/sandcrawler/pdfextract.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/python/sandcrawler/pdfextract.py b/python/sandcrawler/pdfextract.py index 2d8bad4..3eb7581 100644 --- a/python/sandcrawler/pdfextract.py +++ b/python/sandcrawler/pdfextract.py @@ -72,6 +72,7 @@ BAD_PDF_SHA1HEX: List[str] = [ "5c5b45c85eff07d4302844e00ec8baa57b988c60", "5e04779cbbae5ce88bb786064f756885dd6895fe", "5e6a3adde9f08c276c4efd72bfacb256f2ec35d9", + "62247fe6b8d3ca50477cafddbe24bf63832d6674", "623ff84b616383d0a3e0dd8dbce12f0b5fe9a6ac", "646c4a654270606256397684204ff0f3d17be2e7", "64d821d728f9a3dc944b4c03be00feea0b57e314", @@ -100,6 +101,7 @@ BAD_PDF_SHA1HEX: List[str] = [ "949dfb7d833da9576b2ccb9eb1ab5457469c53d3", "961ec451172f373f919c593737466300e42062cb", "976989fa6e447578d9ce16ec5b526f0e09d6df50", + "977f23723027d7052df9b49eb467e6c0b9af93ff", "98b02eb70066c182c705ef4d14d8b723ad7f1fab", "993ca31f6974f8387bb18dd7d38987d290da8781", "9dbd05af3442e6f42d67868054751b76973f4171", -- cgit v1.2.3