diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-11-06 20:55:44 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-11-18 11:58:26 -0800 |
commit | c14e3a9d0ef68822da347e59e77c4b2b9a7b0828 (patch) | |
tree | 0642fce712478b5441809d99e2bdf03f4457b0f9 /fatcat_scholar/worker.py | |
parent | 4979c58ee91903148962f4d62d1a8d423349ad67 (diff) | |
download | fatcat-scholar-c14e3a9d0ef68822da347e59e77c4b2b9a7b0828.tar.gz fatcat-scholar-c14e3a9d0ef68822da347e59e77c4b2b9a7b0828.zip |
basic HTML transform/index support
Diffstat (limited to 'fatcat_scholar/worker.py')
-rw-r--r-- | fatcat_scholar/worker.py | 1 |
1 file changed, 1 insertion, 0 deletions
diff --git a/fatcat_scholar/worker.py b/fatcat_scholar/worker.py
index af84dd1..d2cc3cb 100644
--- a/fatcat_scholar/worker.py
+++ b/fatcat_scholar/worker.py
@@ -131,6 +131,7 @@ class IndexDocsWorker(KafkaWorker):
                 grobid_fulltext=obj.get("grobid_fulltext"),
                 pdftotext_fulltext=obj.get("pdftotext_fulltext"),
                 pdf_meta=obj.get("pdf_meta"),
+                html_fulltext=obj.get("html_fulltext"),
                 sim_fulltext=obj.get("sim_fulltext"),
             )
             es_doc = transform_heavy(bundle)