diff options
author | Bryan Newbold <bnewbold@archive.org> | 2018-05-21 12:09:25 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2018-05-21 12:09:27 -0700 |
commit | 174e5ec2766dca81e57ee455219b54a689b41e61 (patch) | |
tree | 12f6ee14b01e5b547308f9782d4871ff94c56f40 /scald-mvp/src/main/scala/example/WordCount.scala | |
parent | ca8c5dedea7907cf26ec63309f4e99030e644351 (diff) | |
download | sandcrawler-174e5ec2766dca81e57ee455219b54a689b41e61.tar.gz sandcrawler-174e5ec2766dca81e57ee455219b54a689b41e61.zip |
WordCount -> WordCountJob
Also use the exact file from scalding repo
Diffstat (limited to 'scald-mvp/src/main/scala/example/WordCount.scala')
-rw-r--r-- | scald-mvp/src/main/scala/example/WordCount.scala | 12 |
1 files changed, 0 insertions, 12 deletions
diff --git a/scald-mvp/src/main/scala/example/WordCount.scala b/scald-mvp/src/main/scala/example/WordCount.scala
deleted file mode 100644
index 0de6ae0..0000000
--- a/scald-mvp/src/main/scala/example/WordCount.scala
+++ /dev/null
@@ -1,12 +0,0 @@
-
-package example
-
-import com.twitter.scalding._
-
-class WordCount(args : Args) extends Job(args) {
-  TypedPipe.from(TextLine(args("input")))
-    .flatMap { line => line.split("""\s+""") }
-    .groupBy { word => word }
-    .size
-    .write(TypedTsv(args("output")))
-}