summary | refs | log | tree | commit | diff | stats
path: root/fatcat_scholar/work_pipeline.py
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2021-01-22 19:31:50 -0800
committer: Bryan Newbold <bnewbold@archive.org> 2021-01-22 19:31:50 -0800
commit: 2b5cfb73097f17f383457380e36bf977cd0da5ed (patch)
tree: 67ab6bd2d53735f4394ad1ce6e98dd2e0c8e8ef3 /fatcat_scholar/work_pipeline.py
parent: 0591b388a55771ed0581102989e23ba22a720a27 (diff)
download: fatcat-scholar-2b5cfb73097f17f383457380e36bf977cd0da5ed.tar.gz
fatcat-scholar-2b5cfb73097f17f383457380e36bf977cd0da5ed.zip
bug fix: actually fetch/include HTML fulltext
Diffstat (limited to 'fatcat_scholar/work_pipeline.py')
-rw-r--r-- fatcat_scholar/work_pipeline.py 2
1 files changed, 1 insertions, 1 deletions
diff --git a/fatcat_scholar/work_pipeline.py b/fatcat_scholar/work_pipeline.py
index ea33a01..fd85089 100644
--- a/fatcat_scholar/work_pipeline.py
+++ b/fatcat_scholar/work_pipeline.py
@@ -317,7 +317,7 @@ class WorkPipeline:
html_fulltext: Optional[Any] = None
for ident in pref_idents:
release = release_dict[ident]
- if not release.files:
+ if not (release.files or release.webcaptures):
continue
for fe in release.files:
if not fe.sha1 or fe.mimetype not in (None, "application/pdf"):