diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-11-03 22:40:57 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-11-03 22:42:05 -0800 |
commit | 8f964b9b48572ac71f27ba64207816dfd3a6dc36 (patch) | |
tree | 68a0146e71a0eef4e43f7b7d686b806eb210cda5 /python/sandcrawler/ingest.py | |
parent | 653fac9632c6ae9dd036ad844454cf419cd5320b (diff) | |
download | sandcrawler-8f964b9b48572ac71f27ba64207816dfd3a6dc36.tar.gz sandcrawler-8f964b9b48572ac71f27ba64207816dfd3a6dc36.zip |
small fixes from local testing for XML ingest
Diffstat (limited to 'python/sandcrawler/ingest.py')
-rw-r--r-- | python/sandcrawler/ingest.py | 2 |
1 file changed, 1 insertion, 1 deletion
```diff
diff --git a/python/sandcrawler/ingest.py b/python/sandcrawler/ingest.py
index 363485e..2e227bf 100644
--- a/python/sandcrawler/ingest.py
+++ b/python/sandcrawler/ingest.py
@@ -336,7 +336,7 @@ class IngestFileWorker(SandcrawlerWorker):
         )

     def want(self, request: dict) -> bool:
-        if not request.get('ingest_type') in ('file', 'pdf'):
+        if not request.get('ingest_type') in ('file', 'pdf', 'xml'):
             return False
         return True
```