diff options
Diffstat (limited to 'scalding/src/test/scala')
| -rw-r--r-- | scalding/src/test/scala/sandcrawler/ScorableFeaturesTest.scala | 37 | ||||
| -rw-r--r-- | scalding/src/test/scala/sandcrawler/ScorableTest.scala | 32 | 
2 files changed, 37 insertions, 32 deletions
| diff --git a/scalding/src/test/scala/sandcrawler/ScorableFeaturesTest.scala b/scalding/src/test/scala/sandcrawler/ScorableFeaturesTest.scala new file mode 100644 index 0000000..7ec0c4d --- /dev/null +++ b/scalding/src/test/scala/sandcrawler/ScorableFeaturesTest.scala @@ -0,0 +1,37 @@ +package sandcrawler + +import org.scalatest._ + +class ScorableFeaturesTest extends FlatSpec with Matchers { +  private def titleToSlug(s : String) : String = { +    new ScorableFeatures(title = s).toSlug +  } + +  "mapToSlug()" should "extract the parts of titles before a colon" in { +    titleToSlug("HELLO:there") shouldBe "hello" +  } + +  it should "extract an entire colon-less string" in { +    titleToSlug("hello THERE") shouldBe "hellothere" +  } + +  it should "return Scorable.NoSlug if given empty string" in { +    titleToSlug("") shouldBe Scorable.NoSlug +  } + +  it should "return Scorable.NoSlug if given null" in { +    titleToSlug(null) shouldBe Scorable.NoSlug +  } + +  it should "strip punctuation" in { +    titleToSlug("HELLO!:the:re") shouldBe "hello" +    titleToSlug("a:b:c") shouldBe "a" +    titleToSlug( +      "If you're happy and you know it, clap your hands!") shouldBe "ifyourehappyandyouknowitclapyourhands" +  } + +  it should "remove whitespace" in { +    titleToSlug("foo bar : baz ::") shouldBe "foobar" +    titleToSlug("\na\t:b:c") shouldBe "a" +  } +} diff --git a/scalding/src/test/scala/sandcrawler/ScorableTest.scala b/scalding/src/test/scala/sandcrawler/ScorableTest.scala index 95faacc..fd44f57 100644 --- a/scalding/src/test/scala/sandcrawler/ScorableTest.scala +++ b/scalding/src/test/scala/sandcrawler/ScorableTest.scala @@ -54,38 +54,6 @@ class ScorableTest extends FlatSpec with Matchers {    "annex": null  }  """ -  private def titleToSlug(s : String) : String = { -    Scorable.mapToSlug(Scorable.toScorableMap(title = s)) -  } - -  "mapToSlug()" should "extract the parts of titles before a colon" in { -    titleToSlug("HELLO:there") shouldBe "hello" -  } - -  it should "extract an entire colon-less string" in { -    titleToSlug("hello THERE") shouldBe "hellothere" -  } - -  it should "return Scorable.NoSlug if given empty string" in { -    titleToSlug("") shouldBe Scorable.NoSlug -  } - -  it should "return Scorable.NoSlug if given null" in { -    titleToSlug(null) shouldBe Scorable.NoSlug -  } - -  it should "strip punctuation" in { -    titleToSlug("HELLO!:the:re") shouldBe "hello" -    titleToSlug("a:b:c") shouldBe "a" -    titleToSlug( -      "If you're happy and you know it, clap your hands!") shouldBe "ifyourehappyandyouknowitclapyourhands" -  } - -  it should "remove whitespace" in { -    titleToSlug("foo bar : baz ::") shouldBe "foobar" -    titleToSlug("\na\t:b:c") shouldBe "a" -  } -    "jsonToMap()" should "return a map, given a legal JSON string" in {      Scorable.jsonToMap(JsonString) should not be (None)    } | 
