From 0e847f052b3347e74921361fa2ab001d54c75105 Mon Sep 17 00:00:00 2001
From: Bryan Newbold
Date: Thu, 23 Aug 2018 17:17:04 -0700
Subject: increase MaxTitleLength from 255 to 1023

Motivated after finding some long titles with MathML mixed in. Until
this issue can be investigated further, bumping this limit to pass the
handful of matches found.
---
 scalding/src/main/scala/sandcrawler/Scorable.scala | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'scalding')

diff --git a/scalding/src/main/scala/sandcrawler/Scorable.scala b/scalding/src/main/scala/sandcrawler/Scorable.scala
index c704ed9..5aac032 100644
--- a/scalding/src/main/scala/sandcrawler/Scorable.scala
+++ b/scalding/src/main/scala/sandcrawler/Scorable.scala
@@ -30,7 +30,7 @@ abstract class Scorable {
 }
 
 object Scorable {
-  val MaxTitleLength = 255
+  val MaxTitleLength = 1023
   val NoSlug = "NO SLUG" // Used for slug if title is empty or unparseable
 
   def isValidSlug(slug : String) : Boolean = {
-- 
cgit v1.2.3