summary | refs | log | tree | commit | diff | stats
path: root/fatcat_scholar/schema.py
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2020-11-06 19:51:00 -0800
committer: Bryan Newbold <bnewbold@archive.org> 2020-11-18 11:58:26 -0800
commit: 4979c58ee91903148962f4d62d1a8d423349ad67 (patch)
tree: 09901de13601d058eb413614a0dc626e1e30f4d2 /fatcat_scholar/schema.py
parent: 7d38f46fc1970decfcfb1e3f4583b85605e5b8ee (diff)
download: fatcat-scholar-4979c58ee91903148962f4d62d1a8d423349ad67.tar.gz
download: fatcat-scholar-4979c58ee91903148962f4d62d1a8d423349ad67.zip
add basic html fulltext support to fetch pipeline
Diffstat (limited to 'fatcat_scholar/schema.py')
-rw-r--r-- fatcat_scholar/schema.py 1
1 file changed, 1 insertion, 0 deletions
diff --git a/fatcat_scholar/schema.py b/fatcat_scholar/schema.py
index 5637e0a..bec81ab 100644
--- a/fatcat_scholar/schema.py
+++ b/fatcat_scholar/schema.py
@@ -33,6 +33,7 @@ class IntermediateBundle(BaseModel):
grobid_fulltext: Optional[Dict[str, Any]]
pdftotext_fulltext: Optional[Dict[str, Any]]
pdf_meta: Optional[Dict[str, Any]]
+ html_fulltext: Optional[Dict[str, Any]]
sim_fulltext: Optional[Dict[str, Any]]
fetched: Optional[datetime.datetime]