From 97d10e1764cfb2e5c4dc0009e1bcb5139bce0eaa Mon Sep 17 00:00:00 2001 From: Aevann Date: Fri, 1 Dec 2023 22:20:56 +0200 Subject: [PATCH] better fix than 64c3a79522809453c1c967cf8db5a6accfebe33f that doesnt cause a litany of other issues --- files/helpers/sanitize.py | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/files/helpers/sanitize.py b/files/helpers/sanitize.py index 5c530b62f..2e72f79cf 100644 --- a/files/helpers/sanitize.py +++ b/files/helpers/sanitize.py @@ -732,6 +732,9 @@ def is_whitelisted(domain, k): def normalize_url(url): + if 'wikipedia.org/wiki/' not in url: + url = unquote(url) + url = url.replace("reddit.com/user/", "reddit.com/u/") url = reddit_domain_regex.sub(r'\1https://old.reddit.com/\5', url) @@ -799,9 +802,10 @@ def normalize_url(url): url = imgur_regex.sub(r'\1_d.webp?maxwidth=9999&fidelity=grand', url) - url = url.rstrip('=') + if 'wikipedia.org/wiki/' not in url: + url = unquote(url) - return url + return url.rstrip('=') def normalize_url_gevent(url): url = requests.get(url, headers=HEADERS, timeout=2).url