about | summary | refs | log | tree | commit | diff | stats
path: root/scalding/src
diff options
context:
space:
mode:
author: bnewbold <bnewbold@archive.org> 2018-07-13 22:02:59 +0000
committer: bnewbold <bnewbold@archive.org> 2018-07-13 22:02:59 +0000
commit: 0e74b5f49950c5c46d9be5e99066bee71cc8828f (patch)
tree: cc13851851bb3f20ba577881934942f54dc454c8 /scalding/src
parent: b3149a911df8150056c54f86cd77c3516fc9838c (diff)
parent: 309f1fcb9dfe6968e7b1a0640280adf1b6c1ffc2 (diff)
download: sandcrawler-0e74b5f49950c5c46d9be5e99066bee71cc8828f.tar.gz
download: sandcrawler-0e74b5f49950c5c46d9be5e99066bee71cc8828f.zip
Merge branch 'spertus-issue1' into 'master'
Changed grobid0:status to grobid0:status_code, per issue 1. See merge request webgroup/sandcrawler!7
Diffstat (limited to 'scalding/src')
-rw-r--r-- scalding/src/main/scala/sandcrawler/HBaseStatusCountJob.scala | 2
-rw-r--r-- scalding/src/test/scala/sandcrawler/HBaseStatusCountTest.scala | 2
2 files changed, 2 insertions, 2 deletions
diff --git a/scalding/src/main/scala/sandcrawler/HBaseStatusCountJob.scala b/scalding/src/main/scala/sandcrawler/HBaseStatusCountJob.scala
index 27b3177..aabf9f8 100644
--- a/scalding/src/main/scala/sandcrawler/HBaseStatusCountJob.scala
+++ b/scalding/src/main/scala/sandcrawler/HBaseStatusCountJob.scala
@@ -2,4 +2,4 @@ package sandcrawler
import com.twitter.scalding.Args
-class HBaseStatusCountJob(args: Args) extends HBaseCountJob(args, "grobid0:status")
+class HBaseStatusCountJob(args: Args) extends HBaseCountJob(args, "grobid0:status_code")
diff --git a/scalding/src/test/scala/sandcrawler/HBaseStatusCountTest.scala b/scalding/src/test/scala/sandcrawler/HBaseStatusCountTest.scala
index a0b313e..056347c 100644
--- a/scalding/src/test/scala/sandcrawler/HBaseStatusCountTest.scala
+++ b/scalding/src/test/scala/sandcrawler/HBaseStatusCountTest.scala
@@ -41,7 +41,7 @@ class HBaseStatusCountTest extends FunSpec with TupleConversions {
.arg("app.conf.path", "app.conf")
.arg("output", output)
.arg("debug", "true")
- .source[Tuple](HBaseCountJob.getHBaseSource("grobid0:status"),
+ .source[Tuple](HBaseCountJob.getHBaseSource("grobid0:status_code"),
sampleData.map(l => new Tuple(l.map(s => {new ImmutableBytesWritable(Bytes.toBytes(s))}):_*)))
.sink[Tuple](Tsv(output)) {
outputBuffer =>