MarseyWorld/files/helpers/owoify.py

from owoify.structures.word import Word
from owoify.utility.interleave_arrays import interleave_arrays
from owoify.utility.presets import *

from files.helpers.regex import *

# Includes, excerpts, and modifies some functions from:
# https://github.com/deadshot465/owoify-py @ owoify/owoify.py


# Patterns that exempt a token from owoification: owoify_map_token_custom()
# returns the token unchanged as soon as any of these matches anywhere inside
# it (pattern.search). The names are not defined in this file; presumably they
# come from the `files.helpers.regex` star import -- confirm there.
OWO_EXCLUDE_PATTERNS = [
	owo_ignore_links_images_regex, # markdown links []() and images ![]()
		# NB: May not be effective when the URL part contains literal spaces
		# instead of %20.
		# Also relies on owoify replacements currently not affecting symbols.
	owo_ignore_emojis_regex, # emojis
	owo_ignore_the_Regex, # keep 'the' as-is (would otherwise become 'teh')
	sanitize_url_regex, # bare links
	mention_regex, # user mentions
	group_mention_regex, # ping-group mentions
	command_regex, # markup commands
]

def owoify(source, chud_phrase):
	"""Return `source` with every non-exempt word owoified.

	The text is split into word tokens (`owo_word_regex`) and separator
	tokens (`owo_space_regex`); each word is passed through
	owoify_map_token_custom() and the two sequences are interleaved back
	together.

	Parameters:
		source: the text to transform.
		chud_phrase: optional phrase whose whitespace-separated words must
			be left untouched; any falsy value (None, '') means no phrase.

	Returns:
		The transformed text, or `source` itself, unmodified, when it
		contains a backtick, '<pre>' or '<code>'.
	"""
	# Anything that looks like it contains code is returned verbatim.
	if '`' in source or '<pre>' in source or '<code>' in source:
		return source

	# owoify_map_token_custom() looks tokens up by their lower-cased text, so
	# the phrase has to be lower-cased as well or a phrase containing capital
	# letters would never match. A set keeps the per-token lookup O(1).
	ignored_words = set(chud_phrase.lower().split()) if chud_phrase else set()

	# Every word inside a poll/choice/bet match is exempt too. The patterns
	# are run against the lower-cased text, computed once for all three.
	lowered_source = source.lower()
	for pattern in (poll_regex, choice_regex, bet_regex):
		for match in pattern.finditer(lowered_source):
			ignored_words.update(match.group(0).split())

	words = [
		owoify_map_token_custom(Word(s), ignored_words)
		for s in owo_word_regex.findall(source)
	]
	spaces = [Word(s) for s in owo_space_regex.findall(source)]

	# Re-assemble the text by alternating words and separators.
	return ''.join(str(token) for token in interleave_arrays(words, spaces))

def owoify_map_token_custom(token, ignored_words):
	"""Owoify a single word token unless it is exempt.

	Parameters:
		token: object exposing the word text as `token.word`.
		ignored_words: container of lower-case words to leave untouched.

	Returns:
		`token` itself when its lower-cased text is in `ignored_words` or
		when any pattern in OWO_EXCLUDE_PATTERNS matches somewhere inside
		it; otherwise the result of feeding it through every function in
		SPECIFIC_WORD_MAPPING_LIST and then every function in
		OWO_MAPPING_LIST, in that order.
	"""
	text = token.word

	# Explicitly ignored words are returned as-is.
	if text.lower() in ignored_words:
		return token

	# A pattern appearing anywhere in the token means: do not owoify.
	if any(pattern.search(text) for pattern in OWO_EXCLUDE_PATTERNS):
		return token

	# Original owoification logic (sans cases for higher owo levels):
	# word-specific mappings first, then the general owo mappings.
	for transform in (*SPECIFIC_WORD_MAPPING_LIST, *OWO_MAPPING_LIST):
		token = transform(token)

	return token
[DO NOT MERGE] import detanglation (#442) * move Base definition to files.classes.__init__.py * fix ImportError * move userpage listing to users.py * don't import the app from classes * consts: set default values to avoid crashes consts: warn if the secret key is the default config value * card view: sneed (user db schema) * cloudflare: use DEFAULT_CONFIG_VALUE * const: set default values * decouple media.py from __main__ * pass database to avoid imports * import cleanup and import request not in const, but in the requests mega import * move asset_submissions site check to __init__ * asset submissions feature flag * flag * g.is_tor * don't import request where it's not needed * i think this is fine * mail: move to own routes and helper * wrappers * required wrappers move * unfuck wrappers a bit * move snappy quotes and marseys to stateful consts * marsify * :pepodrool: * fix missing import * import cache * ...and settings.py * and static.py * static needs cache * route * lmao all of the jinja shit was in feeds.py amazing * classes should only import what they need from flask * import Response * hdjbjdhbhjf * ... 
* dfdfdfdf * make get a non-required import * isort imports (mostly) * but actually * configs * reload config on import * fgfgfgfg * config * config * initialize snappy and test * cookie of doom debug * edfjnkf * xikscdfd * debug config * set session cookie domain, i think this fixes the can't login bug * sdfbgnhvfdsghbnjfbdvvfghnn * hrsfxgf * dump the entire config on a request * kyskyskyskyskyskyskyskyskys * duifhdskfjdfd * dfdfdfdfdfdfdfdfdfdfdfdf * dfdfdfdf * imoprt all of the consts beacuse fuck it * 😭 * dfdfdfdfdfdfsdasdf * print the entire session * rffdfdfjkfksj * fgbhffh * not the secret keys * minor bug fixes * be helpful in the warning * gfgfgfg * move warning lower * isort main imports (i hope this doesn't fuck something up) * test * session cookie domain redux * dfdfdfd * try only importing Flask * formkeys fix * y * :pepodrool: * route helper * remove before flight * dfdfdfdfdf * isort classes * isort helpers * move check_for_alts to routehelpers and also sort imports and get rid of unused ones * that previous commit but actkally * readd the cache in a dozen places they were implicitly imported * use g.is_tor instead of request.headers. bla bla bla * upgrade streamers to their own route file * get rid of unused imports in __main__ * fgfgf * don't pull in the entire ORM where we don't need it * features * explicit imports for the get helper * explicit imports for the get helper redux * testing allroutes * remove unused import * decouple flask from classes * syntax fix also remember these have side fx for some reason (why?) 
* move side effects out of the class * posts * testing on devrama * settings * reloading * settingssdsdsds * streamer features * site settings * testing settings on devrama * import * fix modlog * remove debug stuff * revert commit 67275b21ab6e2f2520819e84d10bfc1c746a15b6 * archiveorg to _archiveorg * skhudkfkjfd * fix cron for PCM * fix bugs that snekky wants me to * Fix call to realbody passing db, standardize kwarg * test * import check_for_alts from the right place * cloudflare * testing on devrama * fix cron i think * shadow properly * tasks * Remove print which will surely be annoying in prod. * v and create new session * use files.classes * make errors import little and fix rare 500 in /allow_nsfw * Revert "use files.classes" This reverts commit 98c10b876cf86ce058b7fb955cf1ec0bfb9996c6. * pass v to media functions rather than using g * fix * dfdfdfdfd * cleanup, py type checking is dumb so don't use it where it causes issues * Fix some merge bugs, add DEFAULT_RATELIMIT to main. * Fix imports on sqlalchemy expressions. * `from random import random` is an error. * Fix replies db param. * errors: fix missing import * fix rare 500: only send to GIFT_NOTIF_ID if it exists, and send them the right text * Fix signup formkey. * fix 2 500s * propagate db to submissions * fix replies * dfdfdfdf * Fix verifiedcolor. * is_manual * can't use getters outside of an app context * don't attempt to do gumroad on sites where it's not enabled * don't attempt to do gumraod on sites's where it's unnecessary * Revert "don't attempt to do gumroad on sites where it's not enabled" This reverts commit 6f8a6331878655492dfaf1907b27f8be513c14d3. * fix 500 * validate media type Co-authored-by: TLSM <duolsm@outlook.com> 2022-11-15 09:19:08 +00:00			`from owoify.structures.word import Word`
Fix owoify award affecting links, emoji, markup. 2022-08-27 04:48:44 +00:00			`from owoify.utility.interleave_arrays import interleave_arrays`
			`from owoify.utility.presets import *`

move some regex to regex.py for consistency 2023-10-07 14:58:45 +00:00			`from files.helpers.regex import *`
Fix owoify award affecting links, emoji, markup. 2022-08-27 04:48:44 +00:00
			`# Includes, excerpts, and modifies some functions from:`
			`# https://github.com/deadshot465/owoify-py @ owoify/owoify.py`


			`OWO_EXCLUDE_PATTERNS = [`
move some regex to regex.py for consistency 2023-10-07 14:58:45 +00:00			`owo_ignore_links_images_regex, # links []() and images ![]()`
Fix owoify award affecting links, emoji, markup. 2022-08-27 04:48:44 +00:00			`# NB: May not be effective when URL part contains literal spaces vs %20`
			`# Also relies on owoify replacements currently not affecting symbols.`
move some regex to regex.py for consistency 2023-10-07 14:58:45 +00:00			`owo_ignore_emojis_regex, #emojis`
			`owo_ignore_the_Regex, # exclude: 'the' ↦ 'teh'`
			`sanitize_url_regex, # bare links`
			`mention_regex, # mentions`
			`group_mention_regex, #ping group mentions`
			`command_regex, # markup commands`
Fix owoify award affecting links, emoji, markup. 2022-08-27 04:48:44 +00:00			`]`

make chud award work with owoify award 2023-10-13 18:56:48 +00:00			`def owoify(source, chud_phrase):`
exempt codeblocks from owoify award 2023-08-15 20:16:51 +00:00			if '`' in source or '<pre>' in source or '<code>' in source:
			`return source`

move some regex to regex.py for consistency 2023-10-07 14:58:45 +00:00			`word_matches = owo_word_regex.findall(source)`
			`space_matches = owo_space_regex.findall(source)`
Fix owoify award affecting links, emoji, markup. 2022-08-27 04:48:44 +00:00
			`words = [Word(s) for s in word_matches]`
			`spaces = [Word(s) for s in space_matches]`

fix this https://rdrama.net/notification/5408283 2024-02-14 17:11:41 +00:00			`ignored_words = chud_phrase.split() if chud_phrase else []`
make chud award work with owoify award 2023-10-13 18:56:48 +00:00
fix this https://rdrama.net/notification/5408283 2024-02-14 17:11:41 +00:00			`for pattern in (poll_regex, choice_regex, bet_regex):`
			`matches = [x.group(0) for x in pattern.finditer(source.lower())]`
			`for match in matches:`
			`ignored_words += match.split()`

			`words = list(map(lambda w: owoify_map_token_custom(w, ignored_words), words))`
Fix owoify award affecting links, emoji, markup. 2022-08-27 04:48:44 +00:00
			`result = interleave_arrays(words, spaces)`
			`result_strings = list(map(lambda w: str(w), result))`
			`return ''.join(result_strings)`

fix this https://rdrama.net/notification/5408283 2024-02-14 17:11:41 +00:00			`def owoify_map_token_custom(token, ignored_words):`
			`if token.word.lower() in ignored_words:`
make chud award work with owoify award 2023-10-13 18:56:48 +00:00			`return token`

Fix owoify award affecting links, emoji, markup. 2022-08-27 04:48:44 +00:00			`for pattern in OWO_EXCLUDE_PATTERNS:`
			`# if pattern appears anywhere in token, do not owoify.`
			`if pattern.search(token.word):`
			`return token`

			`# Original Owoification Logic (sans cases for higher owo levels)`
			`for func in SPECIFIC_WORD_MAPPING_LIST:`
			`token = func(token)`

			`for func in OWO_MAPPING_LIST:`
			`token = func(token)`
			`# End Original Owoification Logic`

			`return token`