about summary refs log tree commit diff stats
path: root/python/pdftrio_tool.py
diff options
context:
space:
mode:
Diffstat (limited to 'python/pdftrio_tool.py')
-rwxr-xr-x python/pdftrio_tool.py 2
1 file changed, 1 insertion, 1 deletion
diff --git a/python/pdftrio_tool.py b/python/pdftrio_tool.py
index 9d3010e..24b749d 100755
--- a/python/pdftrio_tool.py
+++ b/python/pdftrio_tool.py
@@ -5,7 +5,7 @@ text extraction.
Example of large parallel run, locally:
-cat /srv/sandcrawler/tasks/something.cdx | pv -l | parallel -j30 --pipe ./pdftrio_tool.py --kafka-env prod --kafka-hosts wbgrp-svc263.us.archive.org:9092,wbgrp-svc284.us.archive.org:9092,wbgrp-svc285.us.archive.org:9092 --kafka-mode --pdftrio-host http://localhost:3939 -j0 classify-pdf-json -
+cat /srv/sandcrawler/tasks/something.cdx | pv -l | parallel -j30 --pipe ./pdftrio_tool.py --kafka-env prod --kafka-hosts wbgrp-svc350.us.archive.org:9092,wbgrp-svc284.us.archive.org:9092,wbgrp-svc285.us.archive.org:9092 --kafka-mode --pdftrio-host http://localhost:3939 -j0 classify-pdf-json -
"""
import argparse