make thumbnail_thread not fail bc of idle_in_transaction_session_timeout

2023-07-30 04:35:09 +03:00 · 2023-07-30 04:35:09 +03:00 · bd3a672c2d
parent b1d0e7bb6f
commit bd3a672c2d
2 changed files with 37 additions and 58 deletions
--- a/files/helpers/media.py
+++ b/files/helpers/media.py
@@ -180,7 +180,7 @@ def process_image(filename, v, resize=0, trim=False, uploader_id=None, db=None):
 	# to avoid this, we'll simply return None instead
 	has_request = has_request_context()
 	size = os.stat(filename).st_size
-	patron = bool(v.patron)
+	patron = bool(v and v.patron)
 	if size > MAX_IMAGE_AUDIO_SIZE_MB_PATRON * 1024 * 1024 or not patron and size > MAX_IMAGE_AUDIO_SIZE_MB * 1024 * 1024:
 		os.remove(filename)
--- a/files/routes/posts.py
+++ b/files/routes/posts.py
@@ -290,69 +290,49 @@ def thumbnail_thread(pid, vid):
 		else:
 			return f"{post_url}/{fragment_url}"
-	p = db.query(Post).filter_by(id=pid).options(load_only(Post.url)).one_or_none()
+def expand_url(post_url, fragment_url):
-
+	if fragment_url.startswith("https://"):
-	if not p or not p.url:
+		return fragment_url
-		time.sleep(5)
+	elif fragment_url.startswith("https://"):
-		p = db.query(Post).filter_by(id=pid).options(load_only(Post.url)).one_or_none()
+		return f"https://{fragment_url.split('https://')[1]}"
-
+	elif fragment_url.startswith('//'):
-	if not p or not p.url: return
+		return f"https:{fragment_url}"
-
+	elif fragment_url.startswith('/') and '\\' not in fragment_url:
-	fetch_url = p.url
+		parsed_url = urlparse(post_url)
 		return f"https://{parsed_url.netloc}{fragment_url}"
 	else:
 		return f"{post_url}/{fragment_url}"
 def thumbnail_thread(fetch_url, pid):
 	if fetch_url.startswith('/') and '\\' not in fetch_url:
 		fetch_url = f"{SITE_FULL}{fetch_url}"
 	try:
-		x=requests.get(fetch_url, headers=HEADERS, timeout=5, proxies=proxies)
+		x = requests.get(fetch_url, headers=HEADERS, timeout=5, proxies=proxies)
 	except:
 		db.close()
 		return
 	if x.status_code != 200:
 		db.close()
 		return
 	if x.headers.get("Content-Type","").startswith("text/html"):
-		soup=BeautifulSoup(x.content, 'lxml')
+		soup = BeautifulSoup(x.content, 'lxml')
-		thumb_candidate_urls=[]
+		thumb_candidate_urls = []
-		meta_tags = [
+		for tag_name in ("twitter:image", "og:image", "thumbnail"):
-			"drama:thumbnail",
+			tag = soup.find('meta', attrs={"name": tag_name, "content": True})
 			"twitter:image",
 			"og:image",
 			"thumbnail"
 			]
 		for tag_name in meta_tags:
 			tag = soup.find(
 				'meta',
 				attrs={
 					"name": tag_name,
 					"content": True
 					}
 				)
 			if not tag:
-				tag = soup.find(
+				tag = soup.find('meta', attrs={"property": tag_name, "content": True})
 					'meta',
 					attrs={
 						'property': tag_name,
 						'content': True
 						}
 					)
 			if tag:
-				thumb_candidate_urls.append(expand_url(p.url, tag['content']))
+				thumb_candidate_urls.append(expand_url(fetch_url, tag['content']))
 		for tag in soup.find_all("img", attrs={'src':True}):
 			thumb_candidate_urls.append(expand_url(p.url, tag['src']))
 		for tag in soup.find_all("img", attrs={'src': True}):
 			thumb_candidate_urls.append(expand_url(fetch_url, tag['src']))
 		for url in thumb_candidate_urls:
 			try:
-				image_req=requests.get(url, headers=HEADERS, timeout=5, proxies=proxies)
+				image_req = requests.get(url, headers=HEADERS, timeout=5, proxies=proxies)
 			except:
 				continue
@@ -370,19 +350,14 @@ def thumbnail_thread(pid, vid):
 					continue
 			break
 		else:
 			db.close()
 			return
 	elif x.headers.get("Content-Type","").startswith("image/"):
-		image_req=x
+		image_req = x
 		with Image.open(BytesIO(x.content)) as i:
 			size = len(i.fp.read())
 			if size > 8 * 1024 * 1024:
 				db.close()
 				return
 	else:
 		db.close()
 		return
 	name = f'/images/{time.time()}'.replace('.','') + '.webp'
@@ -391,13 +366,17 @@ def thumbnail_thread(pid, vid):
 		for chunk in image_req.iter_content(1024):
 			file.write(chunk)
-	v = db.query(User).filter_by(id=vid).options(load_only(User.id, User.patron)).one()
+	db = db_session()
-	url = process_image(name, v, resize=99, uploader_id=p.author_id, db=db)
+	p = db.query(Post).filter_by(id=pid).options(load_only(Post.author_id)).one_or_none()
-	if url:
+
-		p.thumburl = url
+	thumburl = process_image(name, None, resize=99, uploader_id=p.author_id, db=db)
 	if thumburl:
 		p.thumburl = thumburl
 		db.add(p)
 		db.commit()
 	db.close()
 	stdout.flush()
@@ -678,9 +657,6 @@ def submit_post(v, sub=None):
 		else:
 			abort(415)
 	if not p.thumburl and p.url and p.domain != SITE:
 		gevent.spawn(thumbnail_thread, p.id, v.id)
 	if not p.private:
 		notify_users = NOTIFY_USERS(f'{title} {body}', v, ghost=p.ghost, log_cost=p)
@@ -752,7 +728,10 @@ def submit_post(v, sub=None):
 	if not p.private:
 		execute_snappy(p, v)
-	g.db.flush() #Necessary, do NOT remove
+	g.db.commit() #Necessary, do NOT remove
 	if not p.thumburl and p.url and p.domain != SITE:
 		gevent.spawn(thumbnail_thread, p.url, p.id)
 	if v.client: return p.json
 	else: