about summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-04-09 17:48:47 -0700
committer Bryan Newbold <bnewbold@archive.org> 2020-04-09 17:48:47 -0700
commit 042bd36c25206ff45e305d094028b6482a4c4074 (patch)
tree 5e25122ad6227855416fe964658e0581e048332c
parent 5b22495057fa9cb40271764c9e80166882ba3f21 (diff)
download fatcat-covid19-042bd36c25206ff45e305d094028b6482a4c4074.tar.gz
fatcat-covid19-042bd36c25206ff45e305d094028b6482a4c4074.zip
bugfix: handle missing file mimetypes
-rwxr-xr-x bin/deliver_file2disk.py 2
-rw-r--r-- fatcat_covid19/common.py 2
2 files changed, 2 insertions, 2 deletions
diff --git a/bin/deliver_file2disk.py b/bin/deliver_file2disk.py
index 49e0c73..e5f13c0 100755
--- a/bin/deliver_file2disk.py
+++ b/bin/deliver_file2disk.py
@@ -123,7 +123,7 @@ class DeliverFatcatDisk:
"""
good = []
for f in files:
- if f['mimetype'] and not 'pdf' in f['mimetype'].lower():
+ if f.get('mimetype') and not 'pdf' in f['mimetype'].lower():
continue
for url in f['urls']:
if 'archive.org/' in url['url']:
diff --git a/fatcat_covid19/common.py b/fatcat_covid19/common.py
index 97bc675..7b88344 100644
--- a/fatcat_covid19/common.py
+++ b/fatcat_covid19/common.py
@@ -80,7 +80,7 @@ def find_local_file(files, base_dir="."):
If found, returns the file entity; the path can be determined from the sha1hex field.
"""
for f in files:
- if f['mimetype'] and not 'pdf' in f['mimetype'].lower():
+ if f.get('mimetype') and not 'pdf' in f['mimetype'].lower():
continue
pdf_path = blob_path(f['sha1'], directory="pdf/", file_suffix=".pdf", base_dir=base_dir)
if os.path.isfile(pdf_path):