From 3cdf4af9be4c762ff2ed79a57b5ad30637909f1e Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Tue, 26 Oct 2021 12:22:38 -0700 Subject: python: isort all imports --- python/sandcrawler/pdfextract.py | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) (limited to 'python/sandcrawler/pdfextract.py') diff --git a/python/sandcrawler/pdfextract.py b/python/sandcrawler/pdfextract.py index 9b4e834..2fb34b8 100644 --- a/python/sandcrawler/pdfextract.py +++ b/python/sandcrawler/pdfextract.py @@ -1,17 +1,16 @@ -import sys -import json import datetime -from io import BytesIO +import json +import sys from dataclasses import dataclass -from typing import Optional, Dict, Any +from io import BytesIO +from typing import Any, Dict, Optional import poppler from PIL import Image -from .workers import SandcrawlerWorker, SandcrawlerFetchWorker from .misc import gen_file_metadata - +from .workers import SandcrawlerFetchWorker, SandcrawlerWorker # This is a hack to work around timeouts when processing certain PDFs with # poppler. For some reason, the usual Kafka timeout catcher isn't working on -- cgit v1.2.3