diff options
author | Martin Czygan <martin.czygan@gmail.com> | 2021-05-12 21:14:41 +0200 |
---|---|---|
committer | Martin Czygan <martin.czygan@gmail.com> | 2021-05-12 21:14:41 +0200 |
commit | 4d185d6f050a87e908e772709b55a0a35e32f999 (patch) | |
tree | c85838b49556889da448627d68ed67d05eb85fd3 | |
parent | 245db6bb42eff602f710e2da7d49c340cc889f9e (diff) | |
download | refcat-4d185d6f050a87e908e772709b55a0a35e32f999.tar.gz refcat-4d185d6f050a87e908e772709b55a0a35e32f999.zip |
fix formatting
-rw-r--r-- | skate/url.go | 13 |
1 files changed, 5 insertions, 8 deletions
```diff
diff --git a/skate/url.go b/skate/url.go
index 0f7ad7f..af4ac0c 100644
--- a/skate/url.go
+++ b/skate/url.go
@@ -19,24 +19,23 @@ var (
 // http://agingmind.utdallas.edu/facedb/view/neutral-faces.doi:10.3758/BF03206543.
 // http://10.3386/w20634https://doi.org/10.3386/w20634
 func SanitizeURL(s string) string {
-	index := suffixarray.New([]byte(s))
-	indices := index.Lookup([]byte("http"), -1)
+	var (
+		index   = suffixarray.New([]byte(s))
+		indices = index.Lookup([]byte("http"), -1)
+	)
 	if len(indices) > 1 {
 		s = s[0:indices[1]] // only use the first
 		s = strings.TrimRight(s, ":")
+		s = strings.TrimRight(s, ";")
 	}
-
 	// http://!!!:
 	// http://!
 	// http://"
 	s = patNonWordDomain.ReplaceAllString(s, `$1$3`)
-
 	// http:///en.m.wikipedia.org/ChenLong
 	s = patRepeatedHttpSlashes.ReplaceAllString(s, `$1$3`)
-
 	// http://10.1113/jphysiol.2002.026047
 	s = patHttpDOI.ReplaceAllString(s, `https://doi.org/$2`)
-
 	// .diaksestanggal27-03-2017.10.30Wib
 	// accessedon15
 	// .Accessed
@@ -45,11 +44,9 @@ func SanitizeURL(s string) string {
 	if patAccessedOn.MatchString(s) {
 		s = patAccessedOn.ReplaceAllString(s, `$1`)
 	}
-
 	// http://140.120.197.173/Ecology/Download/Timing-MSChart.zipJournalofInsectScience
 	if patFileExtraSuffix.MatchString(s) {
 		s = patFileExtraSuffix.ReplaceAllString(s, `$1`)
 	}
-
 	return s
 }
```