aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@archive.org> 2018-08-20 19:14:41 -0700
committer: Bryan Newbold <bnewbold@archive.org> 2018-08-21 21:25:56 -0700
commit: f5c52210aa331b329cd36dbd711977b065a70eb2 (patch)
tree: dea837626286f69950516f170a061232a3282be0
parent: cce6047bdcf979729ec286d4c1f37676aeff2707 (diff)
download: sandcrawler-f5c52210aa331b329cd36dbd711977b065a70eb2.tar.gz
          sandcrawler-f5c52210aa331b329cd36dbd711977b065a70eb2.zip
HDFS doesn't like colons
-rwxr-xr-x please 2
1 file changed, 1 insertion, 1 deletion
diff --git a/please b/please
index c83f867..e328410 100755
--- a/please
+++ b/please
@@ -194,7 +194,7 @@ def run_colcount(args):
HDFS_DIR,
args.env,
datetime.strftime(datetime.now(), "%Y-%m-%d-%H%M.%S"),
- args.column)
+ args.column.replace(':', '_'))
cmd = """hadoop jar \
scalding/target/scala-2.11/sandcrawler-assembly-0.2.0-SNAPSHOT.jar \
com.twitter.scalding.Tool sandcrawler.HBaseColCountJob \