2023-09-09 01:46:40 -07:00
|
|
|
import random
|
2023-10-10 02:25:37 -07:00
|
|
|
import markdown2
|
|
|
|
import math
|
2023-09-16 00:09:04 -07:00
|
|
|
from urllib.parse import urlparse
|
2023-10-20 20:20:13 -07:00
|
|
|
import requests
|
2023-10-22 17:03:35 -07:00
|
|
|
from functools import wraps
|
2023-09-16 00:09:04 -07:00
|
|
|
import flask
|
|
|
|
from bs4 import BeautifulSoup
|
2023-08-29 03:01:06 -07:00
|
|
|
import requests
|
|
|
|
import os
|
2023-11-27 01:05:35 -08:00
|
|
|
import imghdr
|
2023-11-29 23:57:51 -08:00
|
|
|
from flask import current_app, json, redirect, url_for, request
|
2023-10-20 19:49:01 -07:00
|
|
|
from flask_login import current_user
|
|
|
|
from sqlalchemy import text
|
|
|
|
|
2023-09-16 00:09:04 -07:00
|
|
|
from app import db, cache
|
2023-12-03 01:41:15 -08:00
|
|
|
from app.models import Settings, Domain, Instance, BannedInstances, User, Community
|
2023-09-16 00:09:04 -07:00
|
|
|
|
|
|
|
|
|
|
|
# Flask's render_template function, with support for themes added
|
|
|
|
def render_template(template_name: str, **context) -> str:
|
|
|
|
theme = get_setting('theme', '')
|
|
|
|
if theme != '':
|
|
|
|
return flask.render_template(f'themes/{theme}/{template_name}', **context)
|
|
|
|
else:
|
|
|
|
return flask.render_template(template_name, **context)
|
2023-08-29 03:01:06 -07:00
|
|
|
|
|
|
|
|
|
|
|
# Jinja: when a file was modified. Useful for cache-busting
|
|
|
|
def getmtime(filename):
|
|
|
|
return os.path.getmtime('static/' + filename)
|
|
|
|
|
|
|
|
|
|
|
|
# do a GET request to a uri, return the result
|
|
|
|
def get_request(uri, params=None, headers=None) -> requests.Response:
|
2023-11-16 01:31:14 -08:00
|
|
|
if headers is None:
|
|
|
|
headers = {'User-Agent': 'PieFed/1.0'}
|
|
|
|
else:
|
|
|
|
headers.update({'User-Agent': 'PieFed/1.0'})
|
2023-08-29 03:01:06 -07:00
|
|
|
try:
|
2023-11-16 01:31:14 -08:00
|
|
|
response = requests.get(uri, params=params, headers=headers, timeout=5, allow_redirects=True)
|
2023-08-29 03:01:06 -07:00
|
|
|
except requests.exceptions.SSLError as invalid_cert:
|
|
|
|
# Not our problem if the other end doesn't have proper SSL
|
|
|
|
current_app.logger.info(f"{uri} {invalid_cert}")
|
|
|
|
raise requests.exceptions.SSLError from invalid_cert
|
|
|
|
except ValueError as ex:
|
|
|
|
# Convert to a more generic error we handle
|
|
|
|
raise requests.exceptions.RequestException(f"InvalidCodepoint: {str(ex)}") from None
|
|
|
|
|
|
|
|
return response
|
2023-09-02 21:30:20 -07:00
|
|
|
|
|
|
|
|
2023-09-16 00:09:04 -07:00
|
|
|
# saves an arbitrary object into a persistent key-value store. cached.
|
2023-09-17 02:19:51 -07:00
|
|
|
@cache.memoize(timeout=50)
|
2023-09-02 21:30:20 -07:00
|
|
|
def get_setting(name: str, default=None):
|
|
|
|
setting = Settings.query.filter_by(name=name).first()
|
|
|
|
if setting is None:
|
|
|
|
return default
|
|
|
|
else:
|
|
|
|
return json.loads(setting.value)
|
|
|
|
|
|
|
|
|
2023-09-09 01:46:40 -07:00
|
|
|
# retrieves arbitrary object from persistent key-value store
|
2023-09-02 21:30:20 -07:00
|
|
|
def set_setting(name: str, value):
|
|
|
|
setting = Settings.query.filter_by(name=name).first()
|
|
|
|
if setting is None:
|
2023-09-17 02:19:51 -07:00
|
|
|
db.session.add(Settings(name=name, value=json.dumps(value)))
|
2023-09-02 21:30:20 -07:00
|
|
|
else:
|
|
|
|
setting.value = json.dumps(value)
|
|
|
|
db.session.commit()
|
2023-09-16 00:09:04 -07:00
|
|
|
cache.delete_memoized(get_setting)
|
2023-09-05 01:25:10 -07:00
|
|
|
|
|
|
|
|
|
|
|
# Return the contents of a file as a string. Inspired by PHP's function of the same name.
|
|
|
|
def file_get_contents(filename):
|
|
|
|
with open(filename, 'r') as file:
|
|
|
|
contents = file.read()
|
|
|
|
return contents
|
2023-09-09 01:46:40 -07:00
|
|
|
|
|
|
|
|
|
|
|
random_chars = '0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ'
|
|
|
|
|
|
|
|
|
|
|
|
def gibberish(length: int = 10) -> str:
|
|
|
|
return "".join([random.choice(random_chars) for x in range(length)])
|
2023-09-16 00:09:04 -07:00
|
|
|
|
|
|
|
|
|
|
|
def is_image_url(url):
|
|
|
|
parsed_url = urlparse(url)
|
|
|
|
path = parsed_url.path.lower()
|
|
|
|
common_image_extensions = ['.jpg', '.jpeg', '.png', '.gif', '.bmp', '.tiff', '.webp']
|
|
|
|
return any(path.endswith(extension) for extension in common_image_extensions)
|
|
|
|
|
|
|
|
|
|
|
|
# sanitise HTML using an allow list
|
|
|
|
def allowlist_html(html: str) -> str:
|
2023-10-10 02:25:37 -07:00
|
|
|
allowed_tags = ['p', 'strong', 'a', 'ul', 'ol', 'li', 'em', 'blockquote', 'cite', 'br', 'h3', 'h4', 'h5', 'pre',
|
|
|
|
'code']
|
2023-09-16 00:09:04 -07:00
|
|
|
# Parse the HTML using BeautifulSoup
|
|
|
|
soup = BeautifulSoup(html, 'html.parser')
|
|
|
|
|
|
|
|
# Find all tags in the parsed HTML
|
|
|
|
for tag in soup.find_all():
|
|
|
|
# If the tag is not in the allowed_tags list, remove it and its contents
|
|
|
|
if tag.name not in allowed_tags:
|
|
|
|
tag.extract()
|
|
|
|
else:
|
|
|
|
# Filter and sanitize attributes
|
|
|
|
for attr in list(tag.attrs):
|
|
|
|
if attr not in ['href', 'src']: # Add allowed attributes here
|
|
|
|
del tag[attr]
|
|
|
|
|
|
|
|
# Encode the HTML to prevent script execution
|
2023-10-10 02:25:37 -07:00
|
|
|
return str(soup)
|
2023-09-16 00:09:04 -07:00
|
|
|
|
|
|
|
|
|
|
|
# convert basic HTML to Markdown
|
|
|
|
def html_to_markdown(html: str) -> str:
|
|
|
|
soup = BeautifulSoup(html, 'html.parser')
|
|
|
|
return html_to_markdown_worker(soup)
|
|
|
|
|
|
|
|
|
|
|
|
def html_to_markdown_worker(element, indent_level=0):
|
|
|
|
formatted_text = ''
|
|
|
|
for item in element.contents:
|
|
|
|
if isinstance(item, str):
|
|
|
|
formatted_text += item
|
|
|
|
elif item.name == 'p':
|
|
|
|
formatted_text += '\n\n'
|
|
|
|
elif item.name == 'br':
|
|
|
|
formatted_text += ' \n' # Double space at the end for line break
|
|
|
|
elif item.name == 'strong':
|
|
|
|
formatted_text += '**' + html_to_markdown_worker(item) + '**'
|
|
|
|
elif item.name == 'ul':
|
|
|
|
formatted_text += '\n'
|
|
|
|
formatted_text += html_to_markdown_worker(item, indent_level + 1)
|
|
|
|
formatted_text += '\n'
|
|
|
|
elif item.name == 'ol':
|
|
|
|
formatted_text += '\n'
|
|
|
|
formatted_text += html_to_markdown_worker(item, indent_level + 1)
|
|
|
|
formatted_text += '\n'
|
|
|
|
elif item.name == 'li':
|
|
|
|
bullet = '-' if item.find_parent(['ul', 'ol']) and item.find_previous_sibling() is None else ''
|
|
|
|
formatted_text += ' ' * indent_level + bullet + ' ' + html_to_markdown_worker(item).strip() + '\n'
|
|
|
|
elif item.name == 'blockquote':
|
|
|
|
formatted_text += ' ' * indent_level + '> ' + html_to_markdown_worker(item).strip() + '\n'
|
|
|
|
elif item.name == 'code':
|
|
|
|
formatted_text += '`' + html_to_markdown_worker(item) + '`'
|
|
|
|
return formatted_text
|
|
|
|
|
|
|
|
|
2023-10-10 02:25:37 -07:00
|
|
|
def markdown_to_html(markdown_text) -> str:
|
2023-10-20 19:49:01 -07:00
|
|
|
if markdown_text:
|
|
|
|
return allowlist_html(markdown2.markdown(markdown_text, safe_mode=True))
|
|
|
|
else:
|
|
|
|
return ''
|
2023-10-10 02:25:37 -07:00
|
|
|
|
|
|
|
|
2023-10-23 00:18:46 -07:00
|
|
|
def markdown_to_text(markdown_text) -> str:
|
|
|
|
return markdown_text.replace("# ", '')
|
|
|
|
|
|
|
|
|
2023-11-21 23:48:27 -08:00
|
|
|
def domain_from_url(url: str, create=True) -> Domain:
|
2023-11-28 23:32:07 -08:00
|
|
|
parsed_url = urlparse(url.lower().replace('www.', ''))
|
2023-09-16 00:09:04 -07:00
|
|
|
domain = Domain.query.filter_by(name=parsed_url.hostname.lower()).first()
|
2023-10-23 02:54:11 -07:00
|
|
|
if create and domain is None:
|
|
|
|
domain = Domain(name=parsed_url.hostname.lower())
|
|
|
|
db.session.add(domain)
|
|
|
|
db.session.commit()
|
2023-09-16 00:09:04 -07:00
|
|
|
return domain
|
|
|
|
|
2023-10-02 02:16:44 -07:00
|
|
|
|
|
|
|
def shorten_string(input_str, max_length=50):
|
|
|
|
if len(input_str) <= max_length:
|
|
|
|
return input_str
|
|
|
|
else:
|
|
|
|
return input_str[:max_length - 3] + '…'
|
|
|
|
|
|
|
|
|
|
|
|
def shorten_url(input: str, max_length=20):
|
|
|
|
return shorten_string(input.replace('https://', '').replace('http://', ''))
|
2023-10-10 02:25:37 -07:00
|
|
|
|
|
|
|
|
|
|
|
# the number of digits in a number. e.g. 1000 would be 4
|
|
|
|
def digits(input: int) -> int:
|
|
|
|
if input == 0:
|
|
|
|
return 1 # Special case: 0 has 1 digit
|
|
|
|
else:
|
|
|
|
return math.floor(math.log10(abs(input))) + 1
|
2023-10-20 19:49:01 -07:00
|
|
|
|
|
|
|
|
|
|
|
@cache.memoize(timeout=50)
|
|
|
|
def user_access(permission: str, user_id: int) -> bool:
|
|
|
|
has_access = db.session.execute(text('SELECT * FROM "role_permission" as rp ' +
|
|
|
|
'INNER JOIN user_role ur on rp.role_id = ur.role_id ' +
|
|
|
|
'WHERE ur.user_id = :user_id AND rp.permission = :permission'),
|
|
|
|
{'user_id': user_id, 'permission': permission}).first()
|
2023-10-20 20:20:13 -07:00
|
|
|
return has_access is not None
|
|
|
|
|
|
|
|
|
2023-12-03 01:41:15 -08:00
|
|
|
@cache.memoize(timeout=10)
|
|
|
|
def community_membership(user: User, community: Community) -> int:
|
|
|
|
# @cache.memoize works with User.subscribed but cache.delete_memoized does not, making it bad to use on class methods.
|
|
|
|
# however cache.memoize and cache.delete_memoized works fine with normal functions
|
|
|
|
if community is None:
|
|
|
|
return False
|
|
|
|
return user.subscribed(community.id)
|
|
|
|
|
|
|
|
|
2023-10-20 20:20:13 -07:00
|
|
|
def retrieve_block_list():
|
|
|
|
try:
|
|
|
|
response = requests.get('https://github.com/rimu/no-qanon/blob/master/domains.txt', timeout=1)
|
|
|
|
except:
|
|
|
|
return None
|
|
|
|
if response and response.status_code == 200:
|
2023-10-22 17:03:35 -07:00
|
|
|
return response.text
|
|
|
|
|
|
|
|
|
2023-11-27 01:05:35 -08:00
|
|
|
def validate_image(stream):
|
|
|
|
header = stream.read(512)
|
|
|
|
stream.seek(0)
|
|
|
|
format = imghdr.what(None, header)
|
|
|
|
if not format:
|
|
|
|
return None
|
|
|
|
return '.' + (format if format != 'jpeg' else 'jpg')
|
|
|
|
|
|
|
|
|
2023-10-22 17:03:35 -07:00
|
|
|
def validation_required(func):
|
|
|
|
@wraps(func)
|
|
|
|
def decorated_view(*args, **kwargs):
|
|
|
|
if current_user.verified:
|
|
|
|
return func(*args, **kwargs)
|
|
|
|
else:
|
|
|
|
return redirect(url_for('auth.validation_required'))
|
2023-11-03 01:59:48 -07:00
|
|
|
return decorated_view
|
|
|
|
|
|
|
|
|
|
|
|
def permission_required(permission):
|
|
|
|
def decorator(func):
|
|
|
|
@wraps(func)
|
|
|
|
def decorated_view(*args, **kwargs):
|
|
|
|
if user_access(permission, current_user.id):
|
|
|
|
return func(*args, **kwargs)
|
|
|
|
else:
|
|
|
|
# Handle the case where the user doesn't have the required permission
|
|
|
|
return redirect(url_for('auth.permission_denied'))
|
|
|
|
|
|
|
|
return decorated_view
|
|
|
|
|
|
|
|
return decorator
|
2023-11-29 23:57:51 -08:00
|
|
|
|
|
|
|
|
|
|
|
# sends the user back to where they came from
|
|
|
|
def back(default_url):
|
|
|
|
# Get the referrer from the request headers
|
|
|
|
referrer = request.referrer
|
|
|
|
|
|
|
|
# If the referrer exists and is not the same as the current request URL, redirect to the referrer
|
|
|
|
if referrer and referrer != request.url:
|
|
|
|
return redirect(referrer)
|
|
|
|
|
|
|
|
# If referrer is not available or is the same as the current request URL, redirect to the default URL
|
|
|
|
return redirect(default_url)
|