diff options
-rw-r--r-- | python/sandcrawler/grobid.py | 3 |
1 file changed, 0 insertions, 3 deletions
diff --git a/python/sandcrawler/grobid.py b/python/sandcrawler/grobid.py index a6858ff..f221830 100644 --- a/python/sandcrawler/grobid.py +++ b/python/sandcrawler/grobid.py @@ -83,8 +83,6 @@ class GrobidClient(object): - status (slug) - error_msg (if status == 'error') - tei_xml (if status is 200) - - TODO: persist connection for performance? """ assert blob @@ -188,7 +186,6 @@ class GrobidClient(object): if len(ref.get("unstructured", "").strip()) <= 6: return False - # TODO: what other combinations are enough to skip parsing? if ( ref.get("year") and ref.get("author") |