diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-11-06 19:51:00 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-11-18 11:58:26 -0800 |
commit | 4979c58ee91903148962f4d62d1a8d423349ad67 (patch) | |
tree | 09901de13601d058eb413614a0dc626e1e30f4d2 /fatcat_scholar/schema.py | |
parent | 7d38f46fc1970decfcfb1e3f4583b85605e5b8ee (diff) | |
download | fatcat-scholar-4979c58ee91903148962f4d62d1a8d423349ad67.tar.gz fatcat-scholar-4979c58ee91903148962f4d62d1a8d423349ad67.zip |
add basic html fulltext support to fetch pipeline
Diffstat (limited to 'fatcat_scholar/schema.py')
-rw-r--r-- | fatcat_scholar/schema.py | 1 |
1 file changed, 1 insertion, 0 deletions
diff --git a/fatcat_scholar/schema.py b/fatcat_scholar/schema.py
index 5637e0a..bec81ab 100644
--- a/fatcat_scholar/schema.py
+++ b/fatcat_scholar/schema.py
@@ -33,6 +33,7 @@ class IntermediateBundle(BaseModel):
     grobid_fulltext: Optional[Dict[str, Any]]
     pdftotext_fulltext: Optional[Dict[str, Any]]
     pdf_meta: Optional[Dict[str, Any]]
+    html_fulltext: Optional[Dict[str, Any]]
     sim_fulltext: Optional[Dict[str, Any]]
     fetched: Optional[datetime.datetime]
 