From 65f2156c2af3853142825d080d56650f0a1284ce Mon Sep 17 00:00:00 2001
From: Martin Czygan
Date: Sat, 10 Jul 2021 00:20:02 +0200
Subject: reduce: tweak wiki bref

---
 skate/reduce.go | 9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/skate/reduce.go b/skate/reduce.go
index 255f281..823255c 100644
--- a/skate/reduce.go
+++ b/skate/reduce.go
@@ -167,9 +167,9 @@ func ZippyExactWiki(releases, wiki io.Reader, mr MatchResult, w io.Writer) error
 					return err
 				}
 				var bref BiblioRef
-				// We use base64 w/o padding of the original PageTitle as
-				// component for the id. XXX: ok for now?
-				key := fmt.Sprintf("%s_%s",
+				// We use lowercase base32 w/o padding of the original
+				// PageTitle as component for the id. XXX: ok for now?
+				key := fmt.Sprintf("wikipedia_%s_%s",
 					strings.ToLower(b32enc.EncodeToString([]byte(wiki.PageTitle))),
 					target.Ident)
 				if seen.Contains(key) {
@@ -177,7 +177,8 @@ func ZippyExactWiki(releases, wiki io.Reader, mr MatchResult, w io.Writer) error
 				}
 				seen.Add(key)
 				bref.Key = key
-				bref.SourceWikipediaArticle = wiki.PageTitle
+				// XXX: We currently only use "en" subset.
+				bref.SourceWikipediaArticle = fmt.Sprintf("en:%s", wiki.PageTitle)
 				bref.TargetReleaseIdent = target.Ident
 				bref.TargetWorkIdent = target.WorkID
 				bref.MatchProvenance = "wikipedia"
--
cgit v1.2.3