aboutsummaryrefslogtreecommitdiffstats
path: root/fatcat_scholar/transform.py
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2020-05-20 18:17:43 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2020-05-20 18:17:43 -0700
commit: 1ccd50eca45667aaf232f3bfb6a5aafadf17fc09 (patch)
tree: 13e5bcc999f76938d8de65ec0f20fb2e1b8c19ce /fatcat_scholar/transform.py
parent: 73cde66c9ab0bcae733097e53f1b6c4f00a8ea86 (diff)
download: fatcat-scholar-1ccd50eca45667aaf232f3bfb6a5aafadf17fc09.tar.gz
fatcat-scholar-1ccd50eca45667aaf232f3bfb6a5aafadf17fc09.zip
fixes to release+sim pipeline
Diffstat (limited to 'fatcat_scholar/transform.py')
-rw-r--r-- fatcat_scholar/transform.py 3
1 files changed, 2 insertions, 1 deletions
diff --git a/fatcat_scholar/transform.py b/fatcat_scholar/transform.py
index a86fe15..d858a4c 100644
--- a/fatcat_scholar/transform.py
+++ b/fatcat_scholar/transform.py
@@ -184,11 +184,12 @@ def transform_heavy(heavy: IntermediateBundle) -> Optional[ScholarDoc]:
tags: List[str] = []
work_ident: Optional[str] = None
abstracts: List[ScholarAbstract] = []
- fulltext: Optional[ScholarFulltext]
+ fulltext: Optional[ScholarFulltext] = None
ia_sim: Optional[ScholarSim] = None
if heavy.sim_fulltext is not None:
ia_sim = es_sim_from_sim(heavy.sim_fulltext)
+ fulltext = es_fulltext_from_sim(heavy.sim_fulltext)
if heavy.doc_type == DocType.sim_page:
assert ia_sim is not None