From 619410dd1cf19b1d4dc9b00b5b0c31e253264f8e Mon Sep 17 00:00:00 2001
From: Bryan Newbold
Date: Fri, 28 Sep 2018 18:01:21 -0700
Subject: update README_import with GROBID command

---
 python/README_import.md | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'python')

diff --git a/python/README_import.md b/python/README_import.md
index 38064a97..d3bbaddd 100644
--- a/python/README_import.md
+++ b/python/README_import.md
@@ -61,3 +61,5 @@ Unknown speed!
 # ... but do on the second
 zcat /srv/fatcat/datasets/2018-08-27-2352.17-matchcrossref.insertable.json.gz | pv -l | time parallel -j12 --round-robin --pipe ./fatcat_import.py import-matched -
+ # GROBID extracted (release+file)
+ time zcat /srv/fatcat/datasets/2018-09-23-0405.30-dumpgrobidmetainsertable.longtail_join.filtered.tsv.gz | pv -l | time parallel -j12 --round-robin --pipe ./fatcat_import.py import-grobid-metadata -
--
cgit v1.2.3