diff options
author | Bryan Newbold <bnewbold@archive.org> | 2018-08-27 16:40:15 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2018-08-27 16:40:15 -0700 |
commit | b4eac17049e19d33b1a55664a7258c0f62f8a8c7 (patch) | |
tree | e71de0eb969f53765e4f7b8f5053b5ece3b28781 /scalding/src/test | |
parent | 309f40b66d474f12c0cfe60c449d43ae4bacb912 (diff) | |
download | sandcrawler-b4eac17049e19d33b1a55664a7258c0f62f8a8c7.tar.gz sandcrawler-b4eac17049e19d33b1a55664a7258c0f62f8a8c7.zip |
make similarity score case-insensitive
Diffstat (limited to 'scalding/src/test')
-rw-r--r-- | scalding/src/test/scala/sandcrawler/ScorableTest.scala | 8 |
1 files changed, 8 insertions, 0 deletions
diff --git a/scalding/src/test/scala/sandcrawler/ScorableTest.scala b/scalding/src/test/scala/sandcrawler/ScorableTest.scala
index f63bef8..2094543 100644
--- a/scalding/src/test/scala/sandcrawler/ScorableTest.scala
+++ b/scalding/src/test/scala/sandcrawler/ScorableTest.scala
@@ -70,4 +70,12 @@ class ScorableTest extends FlatSpec with Matchers {
       new ReduceFeatures(JsonString), new ReduceFeatures(JsonString))
     score shouldBe Scorable.MaxScore
   }
+
+  "computeOutput()" should "be case-insensitive" in {
+    val left = JsonString.replace("<<TITLE>>", "A TITLE UPPER CASE")
+    val right = JsonString.replace("<<TITLE>>", "a title upper case")
+    val score = Scorable.computeSimilarity(
+      new ReduceFeatures(left), new ReduceFeatures(right))
+    score shouldBe Scorable.MaxScore
+  }
 }