2023-11-30 06:36:08 +13:00
|
|
|
from typing import List
|
2024-06-16 17:55:08 +08:00
|
|
|
from urllib.parse import urlparse
|
2023-11-30 06:36:08 +13:00
|
|
|
|
2024-03-12 20:06:24 +13:00
|
|
|
from flask_login import current_user
|
|
|
|
from sqlalchemy import desc, text, or_
|
2023-11-30 06:36:08 +13:00
|
|
|
|
|
|
|
from app import db
|
2024-05-12 13:02:45 +12:00
|
|
|
from app.models import PostReply, Post
|
2024-04-14 08:57:46 +12:00
|
|
|
from app.utils import blocked_instances, blocked_users
|
2023-11-30 06:36:08 +13:00
|
|
|
|
|
|
|
|
|
|
|
# replies to a post, in a tree, sorted by a variety of methods
|
|
|
|
def post_replies(post_id: int, sort_by: str, show_first: int = 0) -> List[PostReply]:
|
2024-06-02 16:45:21 +12:00
|
|
|
comments = PostReply.query.filter_by(post_id=post_id).filter(PostReply.deleted == False)
|
2024-03-12 20:06:24 +13:00
|
|
|
if current_user.is_authenticated:
|
|
|
|
instance_ids = blocked_instances(current_user.id)
|
|
|
|
if instance_ids:
|
|
|
|
comments = comments.filter(or_(PostReply.instance_id.not_in(instance_ids), PostReply.instance_id == None))
|
2024-03-21 21:50:25 +13:00
|
|
|
if current_user.ignore_bots:
|
|
|
|
comments = comments.filter(PostReply.from_bot == False)
|
2024-04-14 08:57:46 +12:00
|
|
|
blocked_accounts = blocked_users(current_user.id)
|
|
|
|
if blocked_accounts:
|
|
|
|
comments = comments.filter(PostReply.user_id.not_in(blocked_accounts))
|
2024-06-28 18:34:54 +08:00
|
|
|
if current_user.reply_hide_threshold:
|
|
|
|
comments = comments.filter(PostReply.score > current_user.reply_hide_threshold)
|
|
|
|
else:
|
|
|
|
comments.filter(PostReply.score > -20)
|
|
|
|
|
2023-11-30 06:36:08 +13:00
|
|
|
if sort_by == 'hot':
|
|
|
|
comments = comments.order_by(desc(PostReply.ranking))
|
|
|
|
elif sort_by == 'top':
|
|
|
|
comments = comments.order_by(desc(PostReply.score))
|
|
|
|
elif sort_by == 'new':
|
|
|
|
comments = comments.order_by(desc(PostReply.posted_at))
|
|
|
|
|
2023-12-15 17:35:11 +13:00
|
|
|
comments = comments.limit(2000) # paginating indented replies is too hard so just get the first 2000.
|
|
|
|
|
2023-11-30 06:36:08 +13:00
|
|
|
comments_dict = {comment.id: {'comment': comment, 'replies': []} for comment in comments.all()}
|
|
|
|
|
|
|
|
for comment in comments:
|
|
|
|
if comment.parent_id is not None:
|
|
|
|
parent_comment = comments_dict.get(comment.parent_id)
|
|
|
|
if parent_comment:
|
|
|
|
parent_comment['replies'].append(comments_dict[comment.id])
|
|
|
|
|
|
|
|
return [comment for comment in comments_dict.values() if comment['comment'].parent_id is None]
|
|
|
|
|
|
|
|
|
|
|
|
def get_comment_branch(post_id: int, comment_id: int, sort_by: str) -> List[PostReply]:
|
|
|
|
# Fetch the specified parent comment and its replies
|
|
|
|
parent_comment = PostReply.query.get(comment_id)
|
|
|
|
if parent_comment is None:
|
|
|
|
return []
|
|
|
|
|
2024-06-02 16:45:21 +12:00
|
|
|
comments = PostReply.query.filter(PostReply.post_id == post_id, PostReply.deleted == False)
|
2024-03-12 20:06:24 +13:00
|
|
|
if current_user.is_authenticated:
|
|
|
|
instance_ids = blocked_instances(current_user.id)
|
|
|
|
if instance_ids:
|
|
|
|
comments = comments.filter(or_(PostReply.instance_id.not_in(instance_ids), PostReply.instance_id == None))
|
2023-11-30 06:36:08 +13:00
|
|
|
if sort_by == 'hot':
|
|
|
|
comments = comments.order_by(desc(PostReply.ranking))
|
|
|
|
elif sort_by == 'top':
|
|
|
|
comments = comments.order_by(desc(PostReply.score))
|
|
|
|
elif sort_by == 'new':
|
|
|
|
comments = comments.order_by(desc(PostReply.posted_at))
|
|
|
|
|
|
|
|
comments_dict = {comment.id: {'comment': comment, 'replies': []} for comment in comments.all()}
|
|
|
|
|
|
|
|
for comment in comments:
|
|
|
|
if comment.parent_id is not None:
|
|
|
|
parent_comment = comments_dict.get(comment.parent_id)
|
|
|
|
if parent_comment:
|
|
|
|
parent_comment['replies'].append(comments_dict[comment.id])
|
|
|
|
|
|
|
|
return [comment for comment in comments_dict.values() if comment['comment'].id == comment_id]
|
|
|
|
|
|
|
|
|
|
|
|
# The number of replies a post has
|
|
|
|
def post_reply_count(post_id) -> int:
|
2024-06-02 16:45:21 +12:00
|
|
|
return db.session.execute(text('SELECT COUNT(id) as c FROM "post_reply" WHERE post_id = :post_id AND deleted is false'),
|
2023-11-30 06:36:08 +13:00
|
|
|
{'post_id': post_id}).scalar()
|
2024-05-12 13:02:45 +12:00
|
|
|
|
|
|
|
|
|
|
|
def tags_to_string(post: Post) -> str:
|
|
|
|
if post.tags.count() > 0:
|
|
|
|
return ', '.join([tag.name for tag in post.tags])
|
2024-06-16 17:55:08 +08:00
|
|
|
|
|
|
|
|
2024-06-16 21:21:58 +08:00
|
|
|
def body_has_no_archive_link(body):
|
2024-06-16 19:09:56 +08:00
|
|
|
if body:
|
|
|
|
return 'https://archive.' not in body and 'https://12ft.io' not in body
|
|
|
|
else:
|
|
|
|
return True
|
2024-06-16 19:03:23 +08:00
|
|
|
|
|
|
|
|
2024-06-16 21:21:58 +08:00
|
|
|
def url_needs_archive(url) -> bool:
|
2024-06-16 19:07:19 +08:00
|
|
|
paywalled_sites = ['washingtonpost.com', 'nytimes.com', 'wsj.com', 'economist.com', 'ft.com', 'telegraph.co.uk',
|
2024-06-16 19:03:23 +08:00
|
|
|
'bild.de', 'theatlantic.com', 'lemonde.fr', 'nzherald.co.nz']
|
2024-06-16 17:55:08 +08:00
|
|
|
if url:
|
|
|
|
try:
|
|
|
|
parsed_url = urlparse(url.replace('www.', ''))
|
|
|
|
hostname = parsed_url.hostname.lower()
|
|
|
|
except:
|
|
|
|
return False
|
|
|
|
return hostname in paywalled_sites
|
|
|
|
else:
|
|
|
|
return False
|
|
|
|
|
|
|
|
|
2024-06-16 21:21:58 +08:00
|
|
|
def generate_archive_link(url) -> bool:
|
2024-06-16 17:55:08 +08:00
|
|
|
return 'https://archive.ph/' + url
|