From 7a131adfb89ef6e54a55cbfccf1ff3cb11a4f491 Mon Sep 17 00:00:00 2001
From: Carl Kittelberger
Date: Sun, 3 Jul 2016 18:57:04 +0200
Subject: [PATCH] parsers/wikipedia: Fix handling of www.wikipedia.org and wikipedia.org links.

---
Review note: the host guard has to AND the two negated checks. The bare
"wikipedia.org" host never carries the ".wikipedia.org" suffix, so the
previous `!HasSuffix(...) || EqualFold(...)` form marked it as Ignored and
the en.wikipedia.org fallback in the second hunk could never run for it.
"www.wikipedia.org" already passes the suffix check and is unaffected.

 parsers/wikipedia/parser.go | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/parsers/wikipedia/parser.go b/parsers/wikipedia/parser.go
index 40b751f..77b285d 100644
--- a/parsers/wikipedia/parser.go
+++ b/parsers/wikipedia/parser.go
@@ -23,7 +23,8 @@ func (p *Parser) Init() error {
 }
 
 func (p *Parser) Parse(u *url.URL, referer *url.URL) (result parsers.ParseResult) {
-	if !strings.HasSuffix(strings.ToLower(u.Host), ".wikipedia.org") {
+	if !strings.HasSuffix(strings.ToLower(u.Host), ".wikipedia.org") &&
+		!strings.EqualFold(u.Host, "wikipedia.org") {
 		result.Ignored = true
 		return
 	}
@@ -37,6 +38,11 @@ func (p *Parser) Parse(u *url.URL, referer *url.URL) (result parsers.ParseResult
 	}
 
 	// We're using the original host for link localization
+	// or en.wikipedia.org for (www.)wikipedia.org
+	if strings.EqualFold(u.Host, "wikipedia.org") ||
+		strings.EqualFold(u.Host, "www.wikipedia.org") {
+		u.Host = "en.wikipedia.org"
+	}
 	r, err := http.Get("https://" + u.Host + "/api/rest_v1/page/summary/" + titleEscaped)
 	if err != nil {
 		result.Error = err