about summary refs log tree commit diff stats
path: root/scalding/src/test/scala/sandcrawler
diff options
context:
space:
mode:
author Ellen Spertus <ellen.spertus@gmail.com> 2018-07-25 20:33:38 -0700
committer Ellen Spertus <ellen.spertus@gmail.com> 2018-07-25 20:33:38 -0700
commit 0f0152189cf6df0f4b56d92149a60e902eb20be6 (patch)
tree 8d22242ed5ae38caa086be16dee3a07a7fc44989 /scalding/src/test/scala/sandcrawler
parent 4b63570522e5ebbc73980356372c39ce7547ba68 (diff)
download sandcrawler-0f0152189cf6df0f4b56d92149a60e902eb20be6.tar.gz
sandcrawler-0f0152189cf6df0f4b56d92149a60e902eb20be6.zip
Fixed bug with reading from TextLine. (Thanks, Bryan!) Still had to comment out some tests.
Diffstat (limited to 'scalding/src/test/scala/sandcrawler')
-rw-r--r-- scalding/src/test/scala/sandcrawler/HBaseCrossrefScoreTest.scala 9
1 files changed, 4 insertions, 5 deletions
diff --git a/scalding/src/test/scala/sandcrawler/HBaseCrossrefScoreTest.scala b/scalding/src/test/scala/sandcrawler/HBaseCrossrefScoreTest.scala
index dc96003..96c7770 100644
--- a/scalding/src/test/scala/sandcrawler/HBaseCrossrefScoreTest.scala
+++ b/scalding/src/test/scala/sandcrawler/HBaseCrossrefScoreTest.scala
@@ -178,18 +178,17 @@ class HBaseCrossrefScoreTest extends FlatSpec with Matchers {
.arg("debug", "true")
.source[Tuple](HBaseCrossrefScore.getHBaseSource(testTable, testHost),
grobidSampleData.map(l => new Tuple(l.map(s => {new ImmutableBytesWritable(s)}):_*)))
- .source(TextLine(input), List((
+ .source(TextLine(input), List(
CrossrefString.replace("<<TITLE>>", "Title 1: TNG").replace("<<DOI>>", "DOI-0"),
CrossrefString.replace("<<TITLE>>", "Title 1: TNG").replace("<<DOI>>", "DOI-0.5"),
CrossrefString.replace("<<TITLE>>", "Title 1: TNG").replace("<<DOI>>", "DOI-0.75"),
- CrossrefString.replace("<<TITLE>>", "Title 2: Rebooted").replace("<<DOI>>", "DOI-1"))))
- .sink[(String, String, String, String, String,
- String)](TypedTsv[(String, String, String, String, String, String)](output)) {
+ CrossrefString.replace("<<TITLE>>", "Title 2: Rebooted").replace("<<DOI>>", "DOI-1")))
+ .sink[(String, String, String)](TypedTsv[(String, String, String)](output)) {
outputBuffer =>
- /*
it should "return a 3-element list" in {
outputBuffer should have length 3
}
+ /*
it should "return the right first entry" in {
val (slug, slug0, slug1, sha1, grobidJson, crossrefJson) = outputBuffer(0)
slug shouldBe "title1"