diff options
Diffstat (limited to 'python/pdftrio_tool.py')
-rwxr-xr-x | python/pdftrio_tool.py | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/python/pdftrio_tool.py b/python/pdftrio_tool.py index 5cffa8c..e195bc7 100755 --- a/python/pdftrio_tool.py +++ b/python/pdftrio_tool.py @@ -9,10 +9,10 @@ Example of large parallel run, locally: cat /srv/sandcrawler/tasks/something.cdx | pv -l | parallel -j30 --pipe ./pdftrio_tool.py --kafka-env prod --kafka-hosts wbgrp-svc263.us.archive.org:9092,wbgrp-svc284.us.archive.org:9092,wbgrp-svc285.us.archive.org:9092 --kafka-mode --pdftrio-host http://localhost:3939 -j0 classify-pdf-json - """ -import sys -import json import argparse import datetime +import json +import sys from sandcrawler import * |