about summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-02-03 20:15:09 -0800
committer Bryan Newbold <bnewbold@archive.org> 2020-02-03 20:15:09 -0800
commit e865b395f945e5d97a99ce269f23957cae01feaa (patch)
tree 2e5cf79f17c98ffbc61ee3b63009cbf809c84e75
parent 41d957152b4489312120bb9ec998c134db93fab8 (diff)
download sandcrawler-e865b395f945e5d97a99ce269f23957cae01feaa.tar.gz
sandcrawler-e865b395f945e5d97a99ce269f23957cae01feaa.zip
grobid petabox: fix fetch body/content
-rw-r--r-- python/sandcrawler/grobid.py 2
1 files changed, 1 insertions, 1 deletions
diff --git a/python/sandcrawler/grobid.py b/python/sandcrawler/grobid.py
index cbb499d..08e3a96 100644
--- a/python/sandcrawler/grobid.py
+++ b/python/sandcrawler/grobid.py
@@ -135,7 +135,7 @@ class GrobidWorker(SandcrawlerWorker):
source=record,
key=default_key,
)
- blob = resp.body
+ blob = resp.content
else:
raise ValueError("not a CDX (wayback) or petabox (archive.org) dict; not sure how to proceed")
if not blob: