about | summary | refs | log | tree | commit | diff | stats
path: root/python
diff options
context:
space:
mode:
Diffstat (limited to 'python')
-rw-r--r-- python/sandcrawler/grobid.py 3
1 files changed, 0 insertions, 3 deletions
diff --git a/python/sandcrawler/grobid.py b/python/sandcrawler/grobid.py
index a6858ff..f221830 100644
--- a/python/sandcrawler/grobid.py
+++ b/python/sandcrawler/grobid.py
@@ -83,8 +83,6 @@ class GrobidClient(object):
- status (slug)
- error_msg (if status == 'error')
- tei_xml (if status is 200)
-
- TODO: persist connection for performance?
"""
assert blob
@@ -188,7 +186,6 @@ class GrobidClient(object):
if len(ref.get("unstructured", "").strip()) <= 6:
return False
- # TODO: what other combinations are enough to skip parsing?
if (
ref.get("year")
and ref.get("author")