aboutsummaryrefslogtreecommitdiffstats
path: root/mapreduce/backfill_hbase_from_cdx.py
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2018-04-10 19:13:43 -0700
committer Bryan Newbold <bnewbold@archive.org> 2018-04-10 19:14:26 -0700
commit a0be9706997182b18e48000375c462856aafc5ef (patch)
tree 30a7ea934c041275adfeaae1d8f9d6349994e335 /mapreduce/backfill_hbase_from_cdx.py
parent 0a778bd6d46a71b7cbec04eb3a5bdb00d91da0de (diff)
download sandcrawler-a0be9706997182b18e48000375c462856aafc5ef.tar.gz
sandcrawler-a0be9706997182b18e48000375c462856aafc5ef.zip
TODO updates
Diffstat (limited to 'mapreduce/backfill_hbase_from_cdx.py')
-rwxr-xr-x mapreduce/backfill_hbase_from_cdx.py 7
1 file changed, 0 insertions, 7 deletions
diff --git a/mapreduce/backfill_hbase_from_cdx.py b/mapreduce/backfill_hbase_from_cdx.py
index 72331b0..6b2ec0b 100755
--- a/mapreduce/backfill_hbase_from_cdx.py
+++ b/mapreduce/backfill_hbase_from_cdx.py
@@ -7,13 +7,6 @@ formats.
Requires:
- happybase
- mrjob
-
-TODO:
-- argparse
-- refactor into an object
-- tests in separate file
-- nose tests
-- sentry integration for error reporting
"""
import json