summary | refs | log | tree | commit | diff | stats
path: root/python/fatcat_tools/importers
diff options
context:
space:
mode:
Diffstat (limited to 'python/fatcat_tools/importers')
-rw-r--r-- python/fatcat_tools/importers/ingest.py 4
1 files changed, 2 insertions, 2 deletions
diff --git a/python/fatcat_tools/importers/ingest.py b/python/fatcat_tools/importers/ingest.py
index 4dcb1ec3..4fbd19f1 100644
--- a/python/fatcat_tools/importers/ingest.py
+++ b/python/fatcat_tools/importers/ingest.py
@@ -392,7 +392,7 @@ class IngestWebResultImporter(IngestFileResultImporter):
if row['request'].get('ingest_type') != 'html':
self.counts['skip-ingest-type'] += 1
return False
- if row['file_meta'].get('mimetype') not in ("text/html", "application/html"):
+ if row['file_meta'].get('mimetype') not in ("text/html", "application/xhtml+xml"):
self.counts['skip-mimetype'] += 1
return False
@@ -407,7 +407,7 @@ class IngestWebResultImporter(IngestFileResultImporter):
if request.get('ingest_type') != "html":
self.counts['skip-ingest-type'] += 1
return None
- if file_meta['mimetype'] not in ("text/html", "application/html"):
+ if file_meta['mimetype'] not in ("text/html", "application/xhtml+xml"):
self.counts['skip-mimetype'] += 1
return None