aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@robocracy.org> 2019-01-28 17:59:09 -0800
committer: Bryan Newbold <bnewbold@robocracy.org> 2019-01-28 17:59:09 -0800
commit: d7d42a21b0b652496d26a10457a23fe6b615da90 (patch)
tree: ee97d1b36b303b02295b81a38b4908da2ae08dd4
parent: b654c8f0bf4629b14e9fcb6b7cb10f07fa8c43eb (diff)
download: fatcat-d7d42a21b0b652496d26a10457a23fe6b615da90.tar.gz
download: fatcat-d7d42a21b0b652496d26a10457a23fe6b615da90.zip
add missing bezerk-mode flag to GROBID import
-rwxr-xr-x python/fatcat_import.py 11
1 files changed, 8 insertions, 3 deletions
diff --git a/python/fatcat_import.py b/python/fatcat_import.py
index fcb4941b..23f7e869 100755
--- a/python/fatcat_import.py
+++ b/python/fatcat_import.py
@@ -28,12 +28,14 @@ def run_journal_metadata(args):
def run_matched(args):
fmi = MatchedImporter(args.api,
- bezerk_mode=args.bezerk_mode,
edit_batch_size=args.batch_size)
JsonLinePusher(fmi, args.json_file).run()
def run_grobid_metadata(args):
- fmi = GrobidMetadataImporter(args.api, edit_batch_size=args.batch_size, longtail_oa=args.longtail_oa)
+ fmi = GrobidMetadataImporter(args.api,
+ edit_batch_size=args.batch_size,
+ longtail_oa=args.longtail_oa,
+ bezerk_mode=args.bezerk_mode)
LinePusher(fmi, args.tsv_file).run()
def main():
@@ -126,9 +128,12 @@ def main():
sub_grobid_metadata.add_argument('--group-size',
help="editgroup group size to use",
default=75, type=int)
- sub_matched.add_argument('--longtail-oa',
+ sub_grobid_metadata.add_argument('--longtail-oa',
action='store_true',
help="if this is an import of longtail OA content (sets an 'extra' flag)")
+ sub_grobid_metadata.add_argument('--bezerk-mode',
+ action='store_true',
+ help="don't lookup existing DOIs, just insert (clobbers; only for fast bootstrap)")
args = parser.parse_args()
if not args.__dict__.get("func"):