about | summary | refs | log | tree | commit | diff | stats
path: root/mapreduce/common.py
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2018-04-06 15:16:44 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2018-04-06 15:16:44 -0700
commit: 3d3be7090d430d5dfa482bc5d9e5c348bcca36a6 (patch)
tree: f77cdb33f83b7c2a9b2c9babfb3b11a8faa5a1f8 /mapreduce/common.py
parent: 4c9538d80500500b1b60f4f2feb9d782035abc14 (diff)
download: sandcrawler-3d3be7090d430d5dfa482bc5d9e5c348bcca36a6.tar.gz
sandcrawler-3d3be7090d430d5dfa482bc5d9e5c348bcca36a6.zip
lint fixes
Diffstat (limited to 'mapreduce/common.py')
-rw-r--r-- mapreduce/common.py 10
1 files changed, 5 insertions, 5 deletions
diff --git a/mapreduce/common.py b/mapreduce/common.py
index 1b8e572..6710044 100644
--- a/mapreduce/common.py
+++ b/mapreduce/common.py
@@ -14,7 +14,7 @@ def normalize_mime(raw):
if raw.startswith(norm):
return norm
- # Special cases
+ # Special cases
if raw.startswith('application/xml'):
return 'text/xml'
if raw.startswith('application/x-pdf'):
@@ -23,14 +23,14 @@ def normalize_mime(raw):
def test_normalize_mime():
- assert normalize_mime("asdf") == None
+ assert normalize_mime("asdf") is None
assert normalize_mime("application/pdf") == "application/pdf"
assert normalize_mime("application/pdf+journal") == "application/pdf"
assert normalize_mime("Application/PDF") == "application/pdf"
- assert normalize_mime("application/p") == None
+ assert normalize_mime("application/p") is None
assert normalize_mime("application/xml+stuff") == "text/xml"
assert normalize_mime("application/x-pdf") == "application/pdf"
- assert normalize_mime("application/x-html") == None
+ assert normalize_mime("application/x-html") is None
def parse_cdx_line(raw_cdx):
@@ -65,7 +65,7 @@ def parse_cdx_line(raw_cdx):
warc_file = warc.split('/')[-1]
try:
dt_iso = datetime.strptime(dt, "%Y%m%d%H%M%S").isoformat()
- except:
+ except Exception:
return None
# 'i' intentionally not set