diff options
-rw-r--r-- | python/sandcrawler/grobid.py | 5 |
1 file changed, 5 insertions, 0 deletions
diff --git a/python/sandcrawler/grobid.py b/python/sandcrawler/grobid.py
index f221830..791e0fe 100644
--- a/python/sandcrawler/grobid.py
+++ b/python/sandcrawler/grobid.py
@@ -95,9 +95,14 @@ class GrobidClient(object):
             self.host_url + "/api/processFulltextDocument",
             files={
                 "input": blob,
+            },
+            data={
                 "consolidateHeader": consolidate_mode,
                 "consolidateCitations": 0,  # too expensive for now
                 "includeRawCitations": 1,
+                "includeRawAffiliations": 1,
+                "teiCoordinates": ["ref", "figure", "persName", "formula", "biblStruct"],
+                "segmentSentences": 1,
             },
             timeout=180.0,
         )