about | summary | refs | log | tree | commit | diff | stats
path: root/python/sandcrawler/ingest.py
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-11-03 22:40:57 -0800
committer Bryan Newbold <bnewbold@archive.org> 2020-11-03 22:42:05 -0800
commit 8f964b9b48572ac71f27ba64207816dfd3a6dc36 (patch)
tree 68a0146e71a0eef4e43f7b7d686b806eb210cda5 /python/sandcrawler/ingest.py
parent 653fac9632c6ae9dd036ad844454cf419cd5320b (diff)
download sandcrawler-8f964b9b48572ac71f27ba64207816dfd3a6dc36.tar.gz
sandcrawler-8f964b9b48572ac71f27ba64207816dfd3a6dc36.zip
small fixes from local testing for XML ingest
Diffstat (limited to 'python/sandcrawler/ingest.py')
-rw-r--r-- python/sandcrawler/ingest.py 2
1 files changed, 1 insertions, 1 deletions
diff --git a/python/sandcrawler/ingest.py b/python/sandcrawler/ingest.py
index 363485e..2e227bf 100644
--- a/python/sandcrawler/ingest.py
+++ b/python/sandcrawler/ingest.py
@@ -336,7 +336,7 @@ class IngestFileWorker(SandcrawlerWorker):
)
def want(self, request: dict) -> bool:
- if not request.get('ingest_type') in ('file', 'pdf'):
+ if not request.get('ingest_type') in ('file', 'pdf', 'xml'):
return False
return True