rDrama/files/helpers/regex.py

import random
import re
from typing import List, Literal, Optional, Union
from .const import *
from random import choice, choices

# Patterns that contain regex escapes such as `\-`, `\s` or `\$` are written as
# raw strings so the backslashes reach the regex engine untouched and Python
# does not warn about invalid string escape sequences.

# Character-class body (without the surrounding brackets) listing the
# characters allowed in a username; reused by the emoji patterns in this module.
valid_username_chars = r'a-zA-Z0-9_\-'
# An entire string made of 3 to 25 username characters.
valid_username_regex = re.compile(r"^[a-zA-Z0-9_\-]{3,25}$", flags=re.A)
# "@name" (1-30 username characters) at the start of the input, after
# whitespace or after ">"; group 2 is the name. The trailing lookahead rejects
# a mention that is followed by a closing code/pre/a tag with no "<" in between.
mention_regex = re.compile(r'(^|\s|>)@(([a-zA-Z0-9_\-]){1,30})(?![^<]*<\/(code|pre|a)>)', flags=re.A)

# 8 to 100 characters, none of them a newline.
valid_password_regex = re.compile("^.{8,100}$", flags=re.A)

# Either ">" followed by a character that is not "<", whitespace or "+", or
# such a character followed by "<".
# NOTE(review): the "+" is inside the brackets, so it is a literal plus sign
# rather than a quantifier - confirm that is intended.
marseyaward_body_regex = re.compile(r">[^<\s+]|[^>\s+]<", flags=re.A)

# One or more <img ...> tags, each optionally preceded by spaces.
marseyaward_title_regex = re.compile("( *<img[^>]+>)+", flags=re.A)


# "marsey" followed by 1-24 lowercase letters or digits.
marsey_regex = re.compile("marsey[a-z0-9]{1,24}", flags=re.A)
# 1-200 lowercase letters, digits, colons or spaces.
tags_regex = re.compile("[a-z0-9: ]{1,200}", flags=re.A)
# 1-50 letters, digits, hyphens, parentheses, spaces, commas or underscores.
hat_regex = re.compile(r"[a-zA-Z0-9\-() ,_]{1,50}", flags=re.A)
# 1-300 characters excluding "<", ">", "&", newline and tab.
description_regex = re.compile("[^<>&\n\t]{1,300}", flags=re.A)


# Same shape as valid_username_regex: an entire string of 3-25 such characters.
valid_sub_regex = re.compile(r"^[a-zA-Z0-9_\-]{3,25}$", flags=re.A)

# "key:value" pairs; group 1 is the key (word characters), group 2 the value
# (everything up to the next whitespace).
query_regex = re.compile(r"(\w+):(\S+)", flags=re.A)

# Text wrapped in $$...$$, $$$...$$$ and &&...&& respectively, together with
# any surrounding whitespace. Group 1 is the wrapped text, which may contain
# neither "$" nor a newline (this holds for choice_regex as well).
poll_regex = re.compile(r"\s*\$\$([^\$\n]+)\$\$\s*", flags=re.A)
bet_regex = re.compile(r"\s*\$\$\$([^\$\n]+)\$\$\$\s*", flags=re.A)
choice_regex = re.compile(r"\s*&&([^\$\n]+)&&\s*", flags=re.A)

# A single HTML comment. The match is non-greedy so that two comments on one
# line are matched separately and the text between them is left alone.
html_comment_regex = re.compile("<!--.*?-->", flags=re.A)

# Patterns containing regex escapes are raw strings so the backslashes are not
# treated as (invalid) Python string escapes.

# Any single character that is neither a word character nor a space.
title_regex = re.compile(r"[^\w ]", flags=re.A)

# "based and <x>-pilled" or "based and <x> pilled", case-insensitive;
# group 1 is <x> (1-20 characters, matched lazily).
based_regex = re.compile("based and (.{1,20}?)(-| )pilled", flags=re.I|re.A)

# An old.reddit.com comments link delimited on both sides by a quote, an angle
# bracket or a space; group 1 is the URL.
controversial_regex = re.compile(r'["> ](https:\/\/old\.reddit\.com/r/[a-zA-Z0-9_]{3,20}\/comments\/[\w\-.#&/=\?@%+]{5,250})["< ]', flags=re.A)

# Any http(s) URL, up to the next whitespace.
fishylinks_regex = re.compile(r"https?://\S+", flags=re.A)

# ||spoiler text||; group 1 is the text between the double bars.
spoiler_regex = re.compile(r'''\|\|(.+)\|\|''', flags=re.A)
# r/name or u/name (optional leading slash, name of 3-25 word characters or
# hyphens) at the start of the input, after whitespace or after <p>; group 2 is
# the reference. The lookahead rejects a reference that is followed by a
# closing code/pre/a tag with no "<" in between.
reddit_regex = re.compile(r'(^|\s|<p>)\/?((r|u)\/(\w|-){3,25})(?![^<]*<\/(code|pre|a)>)', flags=re.A)
# Same shape as reddit_regex, for h/name.
sub_regex = re.compile(r'(^|\s|<p>)\/?(h\/(\w|-){3,25})(?![^<]*<\/(code|pre|a)>)', flags=re.A)

# ~text~ or ~~text~~ at the start of the input, after whitespace or after ">";
# group 2 is the text between the tildes.
strikethrough_regex = re.compile(r'(^|\s|>)~{1,2}([^~]+)~{1,2}', flags=re.A)

# "/mute @name N", case-insensitive; group 1 is the name, group 2 the number.
mute_regex = re.compile(r"\/mute @([a-z0-9_\-]{3,30}) ([0-9]+)", flags=re.A|re.I)

# A paragraph consisting only of :emoji: codes (each optionally prefixed with up
# to three of "!", "#", "@") separated by optional whitespace. Written as a raw
# f-string so `\s` and `\/` are not treated as invalid Python string escapes.
emoji_regex = re.compile(rf"<p>\s*(:[!#@]{{0,3}}[{valid_username_chars}]+:\s*)+<\/p>", flags=re.A)
# A single :code: not immediately preceded by a double quote; group 1 is the
# code (1-36 characters, modifiers "!", "#", "@" included), matched lazily.
emoji_regex2 = re.compile(f'(?<!"):([!#@{valid_username_chars}]{{1,36}}?):', flags=re.A)
# As emoji_regex2, but without "#" among the accepted characters and limited to
# 35 characters.
emoji_regex3 = re.compile(f'(?<!"):([!@{valid_username_chars}]{{1,35}}?):', flags=re.A)

# An <a> element with an http(s) href; group 1 is the URL, group 2 the link
# text. Raw string so `\/` is not treated as an invalid Python string escape.
snappy_url_regex = re.compile(r'<a href="(https?:\/\/.+?)".*?>(.+?)<\/a>', flags=re.A)
# A <lite-youtube> element whose params start with autoplay=1; group 1 is the
# videoid attribute value.
snappy_youtube_regex = re.compile('<lite-youtube videoid="(.+?)" params="autoplay=1', flags=re.A)

# Email pattern; EMAIL_REGEX_PATTERN is not defined in this file (it arrives
# through the star import at the top of the module).
email_regex = re.compile(EMAIL_REGEX_PATTERN, flags=re.A)

# utm_* tracking parameters: utm_regex matches "utm_name=value&" (trailing
# ampersand included), utm_regex2 matches "?utm_name=value" / "&utm_name=value".
# NOTE(review): "[0-z]" is the ASCII range from "0" to "z", which besides
# digits and letters also covers : ; < = > ? @ [ \ ] ^ _ and the backtick, but
# not "-", "." or "%" - confirm this is the intended set of characters.
utm_regex = re.compile('utm_[0-z]+=[0-z_]+&', flags=re.A)
utm_regex2 = re.compile('[?&]utm_[0-z]+=[0-z_]+', flags=re.A)

# Each pattern matches either a whole "<...>" tag or one of the filtered words.
# The tag alternative exists so sub_matcher can hand tags back unchanged.
# The *_upper variants are case-sensitive and built from the upper-cased word
# list; the others are case-insensitive.
# slur_single_words / profanity_single_words come from outside this file;
# presumably "|"-joined word alternations - TODO confirm.
slur_regex = re.compile(f"<[^>]*>|{slur_single_words}", flags=re.I|re.A)
slur_regex_upper = re.compile(f"<[^>]*>|{slur_single_words.upper()}", flags=re.A)
profanity_regex = re.compile(f"<[^>]*>|{profanity_single_words}", flags=re.I|re.A)
profanity_regex_upper = re.compile(f"<[^>]*>|{profanity_single_words.upper()}", flags=re.A)

# Used by torture_ap. Raw strings so `\s` is not treated as an invalid Python
# string escape.
# "i " or "me " (case-insensitive) at the start of the input or after
# whitespace; group 1 is that leading boundary.
torture_regex = re.compile(r'(^|\s)(i|me) ', flags=re.I|re.A)
# "i'm " (case-insensitive) at the start of the input or after whitespace.
torture_regex2 = re.compile(r"(^|\s)i'm ", flags=re.I|re.A)
# A line whose first non-whitespace character is ">"; torture_ap skips these.
torture_regex_exclude = re.compile(r'^\s*>', flags=re.A)


# The f-string patterns below are raw (rf"...") so regex escapes such as `\/`,
# `\.` and `\s` are not treated as invalid Python string escapes.
# `hosts` and the *_FORMATS sequences are defined outside this file.

# A Markdown image with empty alt text, ![](target), whose target starts with
# neither "https://<optional subdomains><one of hosts>/" nor "/"; group 1 is
# the target.
image_check_regex = re.compile(rf'!\[\]\(((?!(https:\/\/([a-z0-9-]+\.)*({hosts})\/|\/)).*?)\)', flags=re.A)

# "<p>" plus any text without "<" (group 1), followed by an https URL on one of
# `hosts` that ends in a video extension (group 2).
video_regex_extensions = '|'.join(VIDEO_FORMATS)
video_sub_regex = re.compile(rf'(<p>[^<]*)(https:\/\/([a-z0-9-]+\.)*({hosts})\/[\w:~,()\-.#&\/=?@%;+]*?\.({video_regex_extensions}))', flags=re.A)

# Same shape as video_sub_regex, for audio extensions.
audio_regex_extensions = '|'.join(AUDIO_FORMATS)
audio_sub_regex = re.compile(rf'(<p>[^<]*)(https:\/\/([a-z0-9-]+\.)*({hosts})\/[\w:~,()\-.#&\/=?@%;+]*?\.({audio_regex_extensions}))', flags=re.A)

# A standalone https URL (bounded by start/whitespace and end/whitespace) that
# ends in an image extension, optionally followed by a query string; group 2 is
# the URL. Case-insensitive.
image_regex_extensions = '|'.join(IMAGE_FORMATS)
image_regex = re.compile(rf"(^|\s)(https:\/\/[\w\-.#&/=\?@%;+,:]{{5,250}}\.({image_regex_extensions})(\?[\w\-.#&/=\?@%;+,:]*)?)($|\s)", flags=re.I|re.A)
# imgur_regex covers every image extension except gif. The extension list is
# filtered element by element rather than by deleting "|gif" from the joined
# string, which would miss a leading "gif" and would truncate any extension
# that merely starts with "gif".
image_regex_extensions = '|'.join(ext for ext in IMAGE_FORMATS if ext != 'gif')
# An i.imgur.com image URL; group 1 is the URL without its extension, group 2
# the extension. Case-insensitive.
imgur_regex = re.compile(rf'(https:\/\/i\.imgur\.com\/[a-z0-9]+)\.({image_regex_extensions})', flags=re.I|re.A)

# Patterns below are raw strings so regex escapes are not treated as (invalid)
# Python string escapes.

# A media.giphy.com ".../giphy.gif" URL; group 1 is the URL without ".gif".
# Case-insensitive.
giphy_regex = re.compile(r'(https:\/\/media\.giphy\.com\/media\/[a-z0-9]+\/giphy)\.gif', flags=re.I|re.A)

# "<p>" plus any text without "<" (group 1), followed by a youtube.com watch
# URL (group 2); group 3 is the video id. Case-insensitive.
youtube_regex = re.compile(r'(<p>[^<]*)(https:\/\/youtube\.com\/watch\?v\=([a-z0-9-_]{5,20})[\w\-.#&/=\?@%+]*)', flags=re.I|re.A)
# 5-20 letters, digits, hyphens or underscores - the same id shape used in
# group 3 of youtube_regex.
yt_id_regex = re.compile('[a-z0-9-_]{5,20}', flags=re.I|re.A)

# A Markdown link whose target starts with neither "http" nor "/"; group 1 is
# "[text](" and group 2 is the target together with the closing parenthesis.
link_fix_regex = re.compile(r"(\[.*?\]\()(?!http|/)(.*?\))", flags=re.A)

# A CSS url(...) expression with optional quotes around its argument; group 1
# is the argument. Case-insensitive.
css_url_regex = re.compile(r"""url\(\s*['"]?(.*?)['"]?\s*\)""", flags=re.I|re.A)

# NOTE(review): nothing in this file reads this tuple, so its meaning is not
# visible here; presumably per-tier coin amounts - confirm against its users.
procoins_li = (0,2500,5000,10000,25000,50000,100000,250000)

# A lone newline: group 1 is the preceding character (neither a newline nor a
# space), group 2 the following character (not a newline).
linefeeds_regex = re.compile("([^\n ])\n([^\n])", flags=re.A)

# A line that starts with ">" whose next character is neither a space nor
# another ">"; group 1 is the line boundary, group 2 the rest of the line.
greentext_regex = re.compile("(\n|^)>([^ >][^\n]*)", flags=re.A)

# A run of printable ASCII characters (space through "~").
ascii_only_regex = re.compile("[ -~]+", flags=re.A)

# An old.reddit.com /r/ or /u/ link at the start of the input or right after
# ">" or a double quote. The dots in the host name are escaped so they only
# match literal dots.
reddit_to_vreddit_regex = re.compile(r'(^|>|")https:\/\/old\.reddit\.com\/(r|u)\/', flags=re.A)
# An /r/ or /u/ link on reddit.com, on one of its listed subdomains (a
# two-letter code with an optional "-xx" suffix, or beta/i/m/pay/ssl/www/new/
# alpha), on libredd.it or on teddit.net. Group 1 is the leading boundary,
# group 2 the host, group 3 "r" or "u". The two-letter codes use [A-Za-z]
# rather than [A-z], which would also accept "[", "\", "]", "^", "_" and "`".
reddit_domain_regex = re.compile(r"(^|\s|\()https?:\/\/(reddit\.com|(?:(?:[A-Za-z]{2})(?:-[A-Za-z]{2})?|beta|i|m|pay|ssl|www|new|alpha)\.reddit\.com|libredd\.it|teddit\.net)\/(r|u)\/", flags=re.A)

# Six lowercase hexadecimal digits.
color_regex = re.compile("[a-f0-9]{6}", flags=re.A)

# lazy match on the {}?, only match if there is trailing stuff
# Specifically match Snappy's way of formatting, this might break some losers' comments.
# Group 1 is at least 3000 characters ending in </p> (optionally followed by
# </li></ul>); group 2 is everything after it, starting at the next <p>.
showmore_regex = re.compile(r"^(.{3000,}?</p>(?:</li></ul>)?)(\s*<p>.*)", flags=re.A|re.DOTALL)

# Search tokens: either a double-quoted phrase (group 1, quotes stripped) or a
# run of non-whitespace (group 2). Raw string so `\S` is not treated as an
# invalid Python string escape.
search_token_regex = re.compile(r'"([^"]*)"|(\S+)', flags=re.A)

# "ref: refs/..." ; group 1 is the ref path.
git_regex = re.compile("ref: (refs/.+)", flags=re.A)

# Two or three slash-separated groups of 1-5 letters each, case-insensitive.
pronouns_regex = re.compile("([a-z]{1,5})/[a-z]{1,5}(/[a-z]{1,5})?", flags=re.A|re.I)

# One or more letters, digits, underscores or hyphens (raw string for `\-`).
knowledgebase_page_regex = re.compile(r"[a-zA-Z0-9_\-]+", flags=re.A)

def sub_matcher(match:re.Match, upper=False, replace_with:Union[dict[str, str], dict[str, List[str]]]=SLURS):
	"""Replacement callback for re.sub: swap a filtered word for its substitute.

	The filter patterns in this module also match whole "<...>" tags; those
	are returned untouched.

	:param match: the match handed over by re.sub.
	:param upper: when true, the substitute is upper-cased, unless it contains
		an "<img" tag, which is left as is.
	:param replace_with: lookup table keyed by the lower-cased word. A value
		is either one substitute string or a list of candidate strings, from
		which one is picked at random.
	:return: the text to insert in place of the match. The matched text
		itself is returned when the table has no (usable) entry for it.
	"""
	match_str = match.group(0)
	if match_str.startswith('<'):
		return match_str

	# A word missing from the table is left alone instead of raising KeyError.
	repl = replace_with.get(match_str.lower())
	if repl is None:
		return match_str

	# The annotation allows a list of candidates; re.sub needs one string.
	if isinstance(repl, (list, tuple)):
		if not repl:
			return match_str
		repl = choice(repl)

	return repl if not upper or "<img" in repl else repl.upper()

def sub_matcher_upper(match, replace_with:Union[dict[str, str], dict[str, List[str]]]=SLURS):
	"""Call sub_matcher with upper-casing switched on, for the same table."""
	return sub_matcher(match, True, replace_with)


# TODO: make censoring a bit better
def sub_matcher_slurs(match, upper=False):
	"""re.sub callback that looks the matched word up in SLURS."""
	return sub_matcher(match, upper=upper, replace_with=SLURS)

def sub_matcher_slurs_upper(match):
	"""Upper-casing counterpart of sub_matcher_slurs."""
	return sub_matcher_slurs(match, True)

def sub_matcher_profanities(match, upper=False):
	"""re.sub callback that looks the matched word up in PROFANITIES."""
	return sub_matcher(match, upper=upper, replace_with=PROFANITIES)

def sub_matcher_profanities_upper(match):
	"""Upper-casing counterpart of sub_matcher_profanities."""
	return sub_matcher_profanities(match, True)

def censor_slurs(body:Optional[str], logged_user):
	"""Return `body` with the slur and profanity replacements applied.

	:param body: text to filter; a falsy value (None or "") yields "".
	:param logged_user: the viewer. A falsy value or the string 'chat' always
		gets filtered text; otherwise the viewer's `slurreplacer` and
		`profanityreplacer` attributes decide which filters run.
	:return: the filtered text.
	"""
	if not body:
		return ""

	# Viewers without a user object (and 'chat') have no preferences to read.
	always_filter = not logged_user or logged_user == 'chat'

	if always_filter or logged_user.slurreplacer:
		# Case-sensitive upper-case pass first, then the case-insensitive pass.
		body = slur_regex_upper.sub(sub_matcher_slurs_upper, body)
		body = slur_regex.sub(sub_matcher_slurs, body)

	# The profanity filter only runs on the rDrama site.
	if SITE_NAME == 'rDrama' and (always_filter or logged_user.profanityreplacer):
		body = profanity_regex_upper.sub(sub_matcher_profanities_upper, body)
		body = profanity_regex.sub(sub_matcher_profanities, body)

	return body

def torture_ap(body, username):
	"""Rewrite first-person wording in `body` so that it names `username`.

	Lines matching torture_regex_exclude (those starting with ">") are kept as
	they are. Every other line first gets the plain AJ_REPLACEMENTS
	substitutions, then "i"/"me" become "@username" and "i'm" becomes
	"@username is".

	:return: the rewritten text with leading and trailing whitespace stripped.
	"""
	def rewrite(line):
		if torture_regex_exclude.match(line):
			return line
		for old, new in AJ_REPLACEMENTS.items():
			line = line.replace(old, new)
		line = torture_regex.sub(rf'\1@{username} ', line)
		return torture_regex2.sub(rf'\1@{username} is ', line)

	# keepends=True preserves each line's own terminator when re-joining.
	rewritten = (rewrite(line) for line in body.splitlines(keepends=True))
	return ''.join(rewritten).strip()


# Maps each "#command" keyword (lower case) to the sequence from which
# command_regex_matcher draws a random reply. The *_REPLIES sequences are
# defined outside this file.
commands = {
	"fortune": FORTUNE_REPLIES,
	"factcheck": FACTCHECK_REPLIES,
	"8ball": EIGHTBALL_REPLIES,
	"roll": range(1, 9999)  # range() excludes its end, so rolls are 1..9998
}

# "#fortune", "#factcheck", "#8ball" or "#roll" (case-insensitive) at the start
# of the input or right after whitespace; group 1 is that leading boundary,
# group 2 the command keyword as typed. Raw string so `\s` is not treated as
# an invalid Python string escape.
command_regex = re.compile(r"(\s|\n|^)#(fortune|factcheck|8ball|roll)", flags=re.A|re.I)

def command_regex_matcher(match, upper=False):
	"""Replacement callback for command_regex: expand a "#command" into a reply.

	:param match: a command_regex match; group 1 is the leading boundary and
		group 2 the command keyword as the user typed it.
	:param upper: unused; kept so existing callers keep working.
	:return: group 1 followed by a randomly drawn reply. A roll is wrapped in
		a <b> element with a random rgb colour.
	"""
	# command_regex is case-insensitive, so normalise once and use the result
	# for both the table lookup and the roll check ("#ROLL" is a roll too).
	command = match.group(2).lower()
	result = str(choice(commands[command]))
	if command == 'roll':
		# A 3-tuple formats as "(r, g, b)", which completes "rgb(...)".
		color = tuple(choices(range(256), k=3))
		result = f'<b style="color:rgb{color}">Your roll: {result}</b>'
	return match.group(1) + result
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00			`import random`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00			`import re`
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00			`from typing import List, Literal, Optional, Union`
move all env-getting to .const 2022-07-08 16:21:13 +00:00			`from .const import *`
make roll command neater 2022-07-14 14:43:05 +00:00			`from random import choice, choices`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
fix multipinging (hopefully this doesnt break other shit) 2022-08-17 19:41:09 +00:00			`valid_username_chars = 'a-zA-Z0-9_\-'`
			`valid_username_regex = re.compile("^[a-zA-Z0-9_\-]{3,25}$", flags=re.A)`
marsey UI stuff 2022-09-09 09:39:03 +00:00			`mention_regex = re.compile('(^\|\s\|>)@(([a-zA-Z0-9_\-]){1,30})(?![^<]*<\/(code\|pre\|a)>)', flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
			`valid_password_regex = re.compile("^.{8,100}$", flags=re.A)`

			`marseyaward_body_regex = re.compile(">[^<\s+]\|[^>\s+]<", flags=re.A)`

			`marseyaward_title_regex = re.compile("( *<img[^>]+>)+", flags=re.A)`


hat submission UI 2022-09-10 05:37:11 +00:00			`marsey_regex = re.compile("marsey[a-z0-9]{1,24}", flags=re.A)`
			`tags_regex = re.compile("[a-z0-9: ]{1,200}", flags=re.A)`
fix hat name regex 2022-09-03 01:57:03 +00:00			`hat_regex = re.compile("[a-zA-Z0-9\-() ,_]{1,50}", flags=re.A)`
hat submission UI 2022-09-10 05:37:11 +00:00			`description_regex = re.compile("[^<>&\n\t]{1,300}", flags=re.A)`
Hats (#348) * hat * hats * hats 2 * hats * hats 4 * hats 5 * hats 2022-09-02 23:58:55 +00:00
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
increase hole max char limit from 20 to 25 2022-08-11 13:34:56 +00:00			`valid_sub_regex = re.compile("^[a-zA-Z0-9_\-]{3,25}$", flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
			`query_regex = re.compile("(\w+):(\S+)", flags=re.A)`

			`poll_regex = re.compile("\s\$\$([^\$\n]+)\$\$\s", flags=re.A)`
			`bet_regex = re.compile("\s\$\$\$([^\$\n]+)\$\$\$\s", flags=re.A)`
			`choice_regex = re.compile("\s&&([^\$\n]+)&&\s", flags=re.A)`

sanitize: strip out html comments they're unnecessary and never get rendered 2022-10-20 23:06:55 +00:00			`html_comment_regex = re.compile("<!--.*-->", flags=re.A)`

move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00			`title_regex = re.compile("[^\w ]", flags=re.A)`

			`based_regex = re.compile("based and (.{1,20}?)(-\| )pilled", flags=re.I\|re.A)`

			`controversial_regex = re.compile('["> ](https:\/\/old\.reddit\.com/r/[a-zA-Z0-9_]{3,20}\/comments\/[\w\-.#&/=\?@%+]{5,250})["< ]', flags=re.A)`

			`fishylinks_regex = re.compile("https?://\S+", flags=re.A)`

			`spoiler_regex = re.compile('''\\|\\|(.+)\\|\\|''', flags=re.A)`
			`reddit_regex = re.compile('(^\|\s\|<p>)\/?((r\|u)\/(\w\|-){3,25})(?![^<]*<\/(code\|pre\|a)>)', flags=re.A)`
			`sub_regex = re.compile('(^\|\s\|<p>)\/?(h\/(\w\|-){3,25})(?![^<]*<\/(code\|pre\|a)>)', flags=re.A)`

fix strikethrough regex 2022-06-28 06:05:49 +00:00			`strikethrough_regex = re.compile('(^\|\s\|>)~{1,2}([^~]+)~{1,2}', flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
marsey UI stuff 2022-09-09 09:39:03 +00:00			`mute_regex = re.compile("\/mute @([a-z0-9_\-]{3,30}) ([0-9]+)", flags=re.A\|re.I)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
			`emoji_regex = re.compile(f"<p>\s(:[!#@]{{0,3}}[{valid_username_chars}]+:\s)+<\/p>", flags=re.A)`
fix long emojis 2022-07-03 08:00:42 +00:00			`emoji_regex2 = re.compile(f'(?<!"):([!#@{valid_username_chars}]{{1,36}}?):', flags=re.A)`
			`emoji_regex3 = re.compile(f'(?<!"):([!@{valid_username_chars}]{{1,35}}?):', flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
fix this https://chapotraphouse.club/post/79771/workaholics-are-worse-for-society-than/2183396?context=8#context 2022-06-24 14:45:19 +00:00			`snappy_url_regex = re.compile('<a href="(https?:\/\/.+?)".*?>(.+?)<\/a>', flags=re.A)`
make snappy archive youtube videos too 2022-07-11 17:45:07 +00:00			`snappy_youtube_regex = re.compile('<lite-youtube videoid="(.+?)" params="autoplay=1', flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
unify email regex 2022-10-19 10:39:03 +00:00			`email_regex = re.compile(EMAIL_REGEX_PATTERN, flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
fix utm regex (#357) 2022-09-17 21:13:14 +00:00			`utm_regex = re.compile('utm_[0-z]+=[0-z_]+&', flags=re.A)`
			`utm_regex2 = re.compile('[?&]utm_[0-z]+=[0-z_]+', flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00			`slur_regex = re.compile(f"<[^>]*>\|{slur_single_words}", flags=re.I\|re.A)`
			`slur_regex_upper = re.compile(f"<[^>]*>\|{slur_single_words.upper()}", flags=re.A)`
			`profanity_regex = re.compile(f"<[^>]*>\|{profanity_single_words}", flags=re.I\|re.A)`
			`profanity_regex_upper = re.compile(f"<[^>]*>\|{profanity_single_words.upper()}", flags=re.A)`

move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00			`torture_regex = re.compile('(^\|\s)(i\|me) ', flags=re.I\|re.A)`
			`torture_regex2 = re.compile("(^\|\s)i'm ", flags=re.I\|re.A)`
			`torture_regex_exclude = re.compile('^\s*>', flags=re.A)`


			`image_check_regex = re.compile(f'!\[\]\(((?!(https:\/\/([a-z0-9-]+\.)({hosts})\/\|\/)).?)\)', flags=re.A)`

constantify file extensions 2022-10-30 14:55:43 +00:00			`video_regex_extensions = '\|'.join(VIDEO_FORMATS)`
			`video_sub_regex = re.compile(f'(<p>[^<])(https:\/\/([a-z0-9-]+\.)({hosts})\/[\w:~,()\-.#&\/=?@%;+]*?\.({video_regex_extensions}))', flags=re.A)`

			`audio_regex_extensions = '\|'.join(AUDIO_FORMATS)`
			`audio_sub_regex = re.compile(f'(<p>[^<])(https:\/\/([a-z0-9-]+\.)({hosts})\/[\w:~,()\-.#&\/=?@%;+]*?\.({audio_regex_extensions}))', flags=re.A)`

			`image_regex_extensions = '\|'.join(IMAGE_FORMATS)`
constantify image extensions and fix imgur .gif bug 2022-11-05 21:01:23 +00:00			`image_regex = re.compile(f"(^\|\s)(https:\/\/[\w\-.#&/=\?@%;+,:]{{5,250}}\.({image_regex_extensions})(\?[\w\-.#&/=\?@%;+,:]*)?)($\|\s)", flags=re.I\|re.A)`
			`image_regex_extensions = image_regex_extensions.replace('\|gif', '')`
constantify file extensions 2022-10-30 14:55:43 +00:00			`imgur_regex = re.compile(f'(https:\/\/i\.imgur\.com\/[a-z0-9]+)\.({image_regex_extensions})', flags=re.I\|re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
			`giphy_regex = re.compile('(https:\/\/media\.giphy\.com\/media\/[a-z0-9]+\/giphy)\.gif', flags=re.I\|re.A)`

			`youtube_regex = re.compile('(<p>[^<])(https:\/\/youtube\.com\/watch\?v\=([a-z0-9-_]{5,20})[\w\-.#&/=\?@%+])', flags=re.I\|re.A)`
			`yt_id_regex = re.compile('[a-z0-9-_]{5,20}', flags=re.I\|re.A)`

Fix timeout in sanitize from link_fix_regex. h/t to @official-techsupport for finding and help fixing this bug. When given certain pathological input, `sanitize` would time out (notably only on posts, rather than comments, perhaps due to the longer maximum length of input). For example, using as input the result of: with open("test.txt", "w") as f: for i in range(26): f.write(f":{chr(ord('a') + i)}: ") f.write('x' * 20_000) We believe this to be because of some combination of the greedy quantifiers and the negative lookahead before the match. The regex was rewritten to (in theory) have much more linear performance. 2022-06-25 05:28:43 +00:00			`link_fix_regex = re.compile("(\[.?\]\()(?!http\|/)(.?\))", flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
Check URI approved embed in all CSS contexts. 2022-08-05 17:09:41 +00:00			`css_url_regex = re.compile('url\(\s[\'"]?(.?)[\'"]?\s*\)', flags=re.I\|re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
add jigsaw tier 2022-10-05 22:47:12 +00:00			`procoins_li = (0,2500,5000,10000,25000,50000,100000,250000)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
allow poetrysperg to skip the linefeeds thing 2022-11-01 00:04:37 +00:00			`linefeeds_regex = re.compile("([^\n ])\n([^\n])", flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
			`greentext_regex = re.compile("(\n\|^)>([^ >][^\n]*)", flags=re.A)`

			`ascii_only_regex = re.compile("[ -~]+", flags=re.A)`

fix reddit replacing (fr this time) 2022-08-14 03:14:36 +00:00			`reddit_to_vreddit_regex = re.compile('(^\|>\|")https:\/\/old.reddit.com\/(r\|u)\/', flags=re.A)`
fix regex capturing groups 2022-10-05 00:45:58 +00:00			`reddit_domain_regex = re.compile("(^\|\s\|\()https?:\/\/(reddit\.com\|(?:(?:[A-z]{2})(?:-[A-z]{2})" "?\|beta\|i\|m\|pay\|ssl\|www\|new\|alpha)\.reddit\.com\|libredd\.it\|teddit\.net)\/(r\|u)\/", flags=re.A)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
colors: filter properly 2022-11-07 00:19:13 +00:00			`color_regex = re.compile("[a-f0-9]{6}", flags=re.A)`
validate colors 2022-06-24 17:32:31 +00:00
showmore works in the presence of pre tags (#344) 2022-08-30 22:11:45 +00:00			`# lazy match on the {}?, only match if there is trailing stuff`
Re-enable showmore_regex for Snappy (#389) * Re-enable showmore_regex for Snappy * showmore a bit more aggressively 2022-10-06 06:17:28 +00:00			`# Specifically match Snappy's way of formatting, this might break some losers' comments.`
			`showmore_regex = re.compile(r"^(.{3000,}?</p>(?:</li></ul>)?)(\s<p>.)", flags=re.A\|re.DOTALL)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
compile regext outside of routes 2022-07-06 11:49:13 +00:00			`search_token_regex = re.compile('"([^"]*)"\|(\S+)', flags=re.A)`

			`git_regex = re.compile("ref: (refs/.+)", flags=re.A)`

refine pronouns 2022-07-23 13:35:45 +00:00			`pronouns_regex = re.compile("([a-z]{1,5})/[a-z]{1,5}(/[a-z]{1,5})?", flags=re.A\|re.I)`
add pronouns 2022-07-11 16:46:08 +00:00
LGB: Add static /kb/ route; two static pages. 2022-07-18 08:39:21 +00:00			`knowledgebase_page_regex = re.compile("[a-zA-Z0-9_\-]+", flags=re.A)`

fix 500... again 2022-11-03 23:05:11 +00:00			`def sub_matcher(match:re.Match, upper=False, replace_with:Union[dict[str, str], dict[str, List[str]]]=SLURS):`
don't use regex in the slur filters for now it doesn't work 2022-11-03 23:33:56 +00:00			`group_num = 0`
handle case where is None 2022-11-03 23:14:55 +00:00			`match_str = match.group(group_num)`
			`if match_str.startswith('<'):`
don't use regex in the slur filters for now it doesn't work 2022-11-03 23:33:56 +00:00			`return match_str`
revert what I did with the slur regex 2022-07-17 19:17:46 +00:00			`else:`
handle case where is None 2022-11-03 23:14:55 +00:00			`repl = replace_with[match_str.lower()]`
fix images in slur replacer (#359) doesn't work with ALL CAPS TEXT, there's prolly a better way for this 2022-09-18 10:19:37 +00:00			`return repl if not upper or "<img" in repl else repl.upper()`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00			`def sub_matcher_upper(match, replace_with:Union[dict[str, str], dict[str, List[str]]]=SLURS):`
			`return sub_matcher(match, upper=True, replace_with=replace_with)`
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00
			`# TODO: make censoring a bit better`
			`def sub_matcher_slurs(match, upper=False):`
			`return sub_matcher(match, upper, replace_with=SLURS)`

			`def sub_matcher_slurs_upper(match):`
			`return sub_matcher_slurs(match, upper=True)`

			`def sub_matcher_profanities(match, upper=False):`
			`return sub_matcher(match, upper, replace_with=PROFANITIES)`

			`def sub_matcher_profanities_upper(match):`
			`return sub_matcher_profanities(match, upper=True)`

fix prev commit 2022-11-03 23:01:12 +00:00			`def censor_slurs(body:Optional[str], logged_user):`
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00			`if not body: return ""`
			`def replace_re(body:str, regex:re.Pattern, regex_upper:re.Pattern, sub_func, sub_func_upper):`
			`body = regex_upper.sub(sub_func_upper, body)`
			`return regex.sub(sub_func, body)`

move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00			`if not logged_user or logged_user == 'chat' or logged_user.slurreplacer:`
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00			`body = replace_re(body, slur_regex, slur_regex_upper, sub_matcher_slurs, sub_matcher_slurs_upper)`
profanity: per fish request disable profanity filter everywhere but rdrama feel free to revert this or whatever if discussed 2022-11-04 13:43:59 +00:00			`if SITE_NAME == 'rDrama':`
			`if not logged_user or logged_user == 'chat' or logged_user.profanityreplacer:`
			`body = replace_re(body, profanity_regex, profanity_regex_upper, sub_matcher_profanities, sub_matcher_profanities_upper)`
users: add profanity filter to censor our gosh darned potty mouthes 2022-11-03 22:59:18 +00:00
move regex from helpers.const into its own helper file 2022-06-24 14:30:59 +00:00			`return body`

			`def torture_ap(body, username):`
			`lines = body.splitlines(keepends=True)`

			`for i in range(len(lines)):`
			`if torture_regex_exclude.match(lines[i]):`
			`continue`
			`for k, l in AJ_REPLACEMENTS.items():`
			`lines[i] = lines[i].replace(k, l)`
			`lines[i] = torture_regex.sub(rf'\1@{username} ', lines[i])`
			`lines[i] = torture_regex2.sub(rf'\1@{username} is ', lines[i])`

refactor torture_ap 2022-09-05 20:05:04 +00:00			`return ''.join(lines).strip()`
refactor comment commands 2022-07-11 12:14:18 +00:00

			`commands = {`
			`"fortune": FORTUNE_REPLIES,`
			`"factcheck": FACTCHECK_REPLIES,`
add #roll 2022-07-13 13:06:59 +00:00			`"8ball": EIGHTBALL_REPLIES,`
			`"roll": range(1, 9999)`
refactor comment commands 2022-07-11 12:14:18 +00:00			`}`

add #roll 2022-07-13 13:06:59 +00:00			`command_regex = re.compile("(\s\|\n\|^)#(fortune\|factcheck\|8ball\|roll)", flags=re.A\|re.I)`
refactor comment commands 2022-07-11 12:14:18 +00:00
			`def command_regex_matcher(match, upper=False):`
make roll command neater 2022-07-14 14:43:05 +00:00			`result = str(choice(commands[match.group(2).lower()]))`
			`if match.group(2) == 'roll':`
			`color = tuple(choices(range(256), k=3))`
			`result = f'<b style="color:rgb{color}">Your roll: {result}</b>'`
fix showmore quadratic behavior (#343) 2022-08-30 21:19:53 +00:00			`return match.group(1) + result`