about | summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2022-07-13 13:23:57 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2022-07-13 13:23:57 -0700
commit: c32b13949a06e9e834c1fac40e3609cb8eeb9f31 (patch)
tree: 08b2c723af626bac3cfe147f6cad180a445e21e4
parent: 0202f325acd6436bf4753e62fd8803f29f4bd027 (diff)
download: sandcrawler-c32b13949a06e9e834c1fac40e3609cb8eeb9f31.tar.gz
sandcrawler-c32b13949a06e9e834c1fac40e3609cb8eeb9f31.zip
yet another bad PDF
-rw-r--r-- python/sandcrawler/pdfextract.py 1
1 files changed, 1 insertions, 0 deletions
diff --git a/python/sandcrawler/pdfextract.py b/python/sandcrawler/pdfextract.py
index 2e13278..11c54e9 100644
--- a/python/sandcrawler/pdfextract.py
+++ b/python/sandcrawler/pdfextract.py
@@ -99,6 +99,7 @@ BAD_PDF_SHA1HEX: List[str] = [
"98b02eb70066c182c705ef4d14d8b723ad7f1fab",
"993ca31f6974f8387bb18dd7d38987d290da8781",
"9dbd05af3442e6f42d67868054751b76973f4171",
+ "a1cc781c694a48e018f4de110b58f561aa212051",
"a2298c137b9c8c8975bad62eea9224edb95e6952",
"a2671738755ab8b24775e95375dc72f1ca4e5fd6",
"a26f299fb97c646effeebd4c5e2968786bd0f781",