From e8eb959fbdd5d13cd53421ddf2487811d049c4e8 Mon Sep 17 00:00:00 2001
From: Bryan Newbold
Date: Wed, 4 Apr 2018 11:47:41 -0700
Subject: more WIP on extractor

---
 extraction/TODO | 2 ++
 1 file changed, 2 insertions(+)
 create mode 100644 extraction/TODO

(limited to 'extraction/TODO')

diff --git a/extraction/TODO b/extraction/TODO
new file mode 100644
index 0000000..ed10834
--- /dev/null
+++ b/extraction/TODO
@@ -0,0 +1,2 @@
+- abstract CDX line reading and HBase stuff out into a common library
+- actual GROBID_SERVER="http://wbgrp-svc096.us.archive.org:8070"
-- 
cgit v1.2.3