aboutsummaryrefslogtreecommitdiffstats
path: root/python/sandcrawler/ingest_file.py
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2021-09-30 15:09:42 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2021-10-15 18:15:04 -0700
commit: 86107e39b761e5b799562af662219fda04ade1be (patch)
tree: 9a9801fc1d8a583a792457c2b8468ce6dbea22f1 /python/sandcrawler/ingest_file.py
parent: 7430ddbcdec76091220de474060b968f0ef1bb70 (diff)
download: sandcrawler-86107e39b761e5b799562af662219fda04ade1be.tar.gz
sandcrawler-86107e39b761e5b799562af662219fda04ade1be.zip
refactoring; progress on filesets
Diffstat (limited to 'python/sandcrawler/ingest_file.py')
-rw-r--r-- python/sandcrawler/ingest_file.py 5
1 files changed, 5 insertions, 0 deletions
diff --git a/python/sandcrawler/ingest_file.py b/python/sandcrawler/ingest_file.py
index b852c69..a02e923 100644
--- a/python/sandcrawler/ingest_file.py
+++ b/python/sandcrawler/ingest_file.py
@@ -25,6 +25,8 @@ from sandcrawler.workers import SandcrawlerWorker
from sandcrawler.db import SandcrawlerPostgrestClient
from sandcrawler.xml import xml_reserialize
+from sandcrawler.platforms.generic import DirectFileHelper
+
MAX_BODY_SIZE_BYTES = 128*1024*1024
@@ -520,6 +522,9 @@ class IngestFileWorker(SandcrawlerWorker):
return True
def process(self, request: dict, key: Any = None) -> dict:
+ return self.process_file(request, key=key)
+
+ def process_file(self, request: dict, key: Any = None) -> dict:
# old backwards compatibility
if request.get('ingest_type') == 'file':