2023-12-22 15:34:45 +13:00
from __future__ import annotations
2024-01-18 15:15:10 +13:00
import html
2023-08-05 21:24:10 +12:00
import os
2023-12-27 15:47:17 +13:00
from datetime import timedelta
2023-12-24 16:20:18 +13:00
from random import randint
2023-09-16 19:09:04 +12:00
from typing import Union , Tuple
2024-04-04 21:36:03 +13:00
import redis
2024-01-06 11:01:44 +13:00
from flask import current_app , request , g , url_for
2024-02-10 19:58:34 +13:00
from flask_babel import _
2024-02-09 14:58:51 +13:00
from sqlalchemy import text , func
2023-12-24 16:20:18 +13:00
from app import db , cache , constants , celery
2023-12-22 14:05:39 +13:00
from app . models import User , Post , Community , BannedInstances , File , PostReply , AllowedInstances , Instance , utcnow , \
2024-04-16 21:49:05 +12:00
PostVote , PostReplyVote , ActivityPubLog , Notification , Site , CommunityMember , InstanceRole , Report , Conversation , \
Language
2023-08-10 21:13:37 +12:00
import time
import base64
import requests
from cryptography . hazmat . primitives import serialization , hashes
from cryptography . hazmat . primitives . asymmetric import padding
from app . constants import *
2024-04-04 21:36:03 +13:00
from urllib . parse import urlparse , parse_qs
2023-12-24 16:20:18 +13:00
from PIL import Image , ImageOps
from io import BytesIO
2024-01-13 18:18:32 +13:00
import pytesseract
2023-08-05 21:24:10 +12:00
2024-03-27 16:02:04 +13:00
from app . utils import get_request , allowlist_html , get_setting , ap_datetime , markdown_to_html , \
2024-01-06 11:01:44 +13:00
is_image_url , domain_from_url , gibberish , ensure_directory_exists , markdown_to_text , head_request , post_ranking , \
2024-03-22 12:22:19 +13:00
shorten_string , reply_already_exists , reply_is_just_link_to_gif_reaction , confidence , remove_tracking_from_link , \
2024-04-29 16:03:00 +12:00
blocked_phrases , microblog_content_to_title , generate_image_from_video_url , is_video_url , reply_is_stupid , \
notification_subscribers , communities_banned_from
2023-09-08 20:04:01 +12:00
2023-08-05 21:24:10 +12:00
def public_key ( ) :
if not os . path . exists ( ' ./public.pem ' ) :
os . system ( ' openssl genrsa -out private.pem 2048 ' )
os . system ( ' openssl rsa -in private.pem -outform PEM -pubout -out public.pem ' )
else :
publicKey = open ( ' ./public.pem ' , ' r ' ) . read ( )
PUBLICKEY = publicKey . replace ( ' \n ' , ' \\ n ' ) # JSON-LD doesn't want to work with linebreaks,
# but needs the \n character to know where to break the line ;)
return PUBLICKEY
2023-08-10 21:13:37 +12:00
2023-12-27 14:38:41 +13:00
def community_members ( community_id ) :
sql = ' SELECT COUNT(id) as c FROM " user " as u '
sql + = ' INNER JOIN community_member cm on u.id = cm.user_id '
sql + = ' WHERE u.banned is false AND u.deleted is false AND cm.is_banned is false and cm.community_id = :community_id '
return db . session . execute ( text ( sql ) , { ' community_id ' : community_id } ) . scalar ( )
2023-08-10 21:13:37 +12:00
def users_total ( ) :
return db . session . execute ( text (
' SELECT COUNT(id) as c FROM " user " WHERE ap_id is null AND verified is true AND banned is false AND deleted is false ' ) ) . scalar ( )
def active_half_year ( ) :
return db . session . execute ( text (
" SELECT COUNT(id) as c FROM \" user \" WHERE last_seen >= CURRENT_DATE - INTERVAL ' 6 months ' AND ap_id is null AND verified is true AND banned is false AND deleted is false " ) ) . scalar ( )
def active_month ( ) :
return db . session . execute ( text (
" SELECT COUNT(id) as c FROM \" user \" WHERE last_seen >= CURRENT_DATE - INTERVAL ' 1 month ' AND ap_id is null AND verified is true AND banned is false AND deleted is false " ) ) . scalar ( )
2024-02-14 14:38:55 +13:00
def active_week ( ) :
return db . session . execute ( text (
" SELECT COUNT(id) as c FROM \" user \" WHERE last_seen >= CURRENT_DATE - INTERVAL ' 1 week ' AND ap_id is null AND verified is true AND banned is false AND deleted is false " ) ) . scalar ( )
def active_day ( ) :
return db . session . execute ( text (
" SELECT COUNT(id) as c FROM \" user \" WHERE last_seen >= CURRENT_DATE - INTERVAL ' 1 day ' AND ap_id is null AND verified is true AND banned is false AND deleted is false " ) ) . scalar ( )
2023-08-10 21:13:37 +12:00
def local_posts ( ) :
2024-02-08 12:46:41 +13:00
return db . session . execute ( text ( ' SELECT COUNT(id) as c FROM " post " WHERE instance_id = 1 ' ) ) . scalar ( )
2023-08-10 21:13:37 +12:00
def local_comments ( ) :
2024-02-08 12:46:41 +13:00
return db . session . execute ( text ( ' SELECT COUNT(id) as c FROM " post_reply " WHERE instance_id = 1 ' ) ) . scalar ( )
2023-08-10 21:13:37 +12:00
2024-02-14 14:38:55 +13:00
def local_communities ( ) :
return db . session . execute ( text ( ' SELECT COUNT(id) as c FROM " community " WHERE instance_id = 1 ' ) ) . scalar ( )
2023-08-10 21:13:37 +12:00
def send_activity ( sender : User , host : str , content : str ) :
date = time . strftime ( ' %a , %d % b % Y % H: % M: % S UTC ' , time . gmtime ( ) )
private_key = serialization . load_pem_private_key ( sender . private_key , password = None )
# todo: look up instance details to set host_inbox
host_inbox = ' /inbox '
signed_string = f " (request-target): post { host_inbox } \n host: { host } \n date: " + date
signature = private_key . sign ( signed_string . encode ( ' utf-8 ' ) , padding . PKCS1v15 ( ) , hashes . SHA256 ( ) )
encoded_signature = base64 . b64encode ( signature ) . decode ( ' utf-8 ' )
# Construct the Signature header
header = f ' keyId= " https:// { current_app . config [ " SERVER_NAME " ] } /u/ { sender . user_name } " ,headers= " (request-target) host date " ,signature= " { encoded_signature } " '
# Create headers for the request
headers = {
' Host ' : host ,
' Date ' : date ,
' Signature ' : header
}
# Make the HTTP request
try :
response = requests . post ( f ' https:// { host } { host_inbox } ' , headers = headers , data = content ,
timeout = REQUEST_TIMEOUT )
except requests . exceptions . RequestException :
time . sleep ( 1 )
response = requests . post ( f ' https:// { host } { host_inbox } ' , headers = headers , data = content ,
timeout = REQUEST_TIMEOUT / 2 )
return response . status_code
def post_to_activity ( post : Post , community : Community ) :
2024-03-09 19:13:15 +13:00
# local PieFed posts do not have a create or announce id
create_id = post . ap_create_id if post . ap_create_id else f " https:// { current_app . config [ ' SERVER_NAME ' ] } /activities/create/ { gibberish ( 15 ) } "
announce_id = post . ap_announce_id if post . ap_announce_id else f " https:// { current_app . config [ ' SERVER_NAME ' ] } /activities/announce/ { gibberish ( 15 ) } "
2023-08-10 21:13:37 +12:00
activity_data = {
" actor " : f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } " ,
" to " : [
" https://www.w3.org/ns/activitystreams#Public "
] ,
" object " : {
2024-03-09 19:13:15 +13:00
" id " : create_id ,
2024-03-18 21:00:17 +00:00
" actor " : post . author . ap_public_url ,
2023-08-10 21:13:37 +12:00
" to " : [
" https://www.w3.org/ns/activitystreams#Public "
] ,
" object " : {
" type " : " Page " ,
2024-03-18 21:00:17 +00:00
" id " : post . ap_id ,
" attributedTo " : post . author . ap_public_url ,
2023-08-10 21:13:37 +12:00
" to " : [
f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } " ,
" https://www.w3.org/ns/activitystreams#Public "
] ,
" name " : post . title ,
" cc " : [ ] ,
2024-03-18 21:00:17 +00:00
" content " : post . body_html if post . body_html else ' ' ,
2023-08-10 21:13:37 +12:00
" mediaType " : " text/html " ,
" source " : {
2024-03-18 21:00:17 +00:00
" content " : post . body if post . body else ' ' ,
2023-08-10 21:13:37 +12:00
" mediaType " : " text/markdown "
} ,
" attachment " : [ ] ,
2024-02-06 17:40:03 +13:00
" commentsEnabled " : post . comments_enabled ,
2023-08-10 21:13:37 +12:00
" sensitive " : post . nsfw or post . nsfl ,
2023-12-09 22:14:16 +13:00
" published " : ap_datetime ( post . created_at ) ,
2024-02-11 20:29:58 +13:00
" stickied " : post . sticky ,
2023-08-10 21:13:37 +12:00
" audience " : f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } "
} ,
" cc " : [
f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } "
] ,
" type " : " Create " ,
" audience " : f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } "
} ,
" cc " : [
f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } /followers "
] ,
" type " : " Announce " ,
2024-03-09 19:13:15 +13:00
" id " : announce_id
2023-08-10 21:13:37 +12:00
}
if post . edited_at is not None :
2024-02-03 10:36:19 +13:00
activity_data [ " object " ] [ " object " ] [ " updated " ] = ap_datetime ( post . edited_at )
2023-08-10 21:13:37 +12:00
if post . language is not None :
activity_data [ " object " ] [ " object " ] [ " language " ] = { " identifier " : post . language }
2024-04-16 20:59:58 +12:00
if ( post . type == POST_TYPE_LINK or post . type == POST_TYPE_VIDEO ) and post . url is not None :
2024-03-09 18:19:03 +13:00
activity_data [ " object " ] [ " object " ] [ " attachment " ] = [ { " href " : post . url , " type " : " Link " } ]
2023-08-10 21:13:37 +12:00
if post . image_id is not None :
2024-02-23 20:23:59 +13:00
activity_data [ " object " ] [ " object " ] [ " image " ] = { " url " : post . image . view_url ( ) , " type " : " Image " }
2024-01-26 17:15:43 +13:00
if post . image . alt_text :
activity_data [ " object " ] [ " object " ] [ " image " ] [ ' altText ' ] = post . image . alt_text
2023-08-10 21:13:37 +12:00
return activity_data
2023-08-22 21:24:11 +12:00
2024-03-24 22:10:41 +00:00
def post_to_page ( post : Post , community : Community ) :
activity_data = {
" type " : " Page " ,
" id " : post . ap_id ,
" attributedTo " : post . author . ap_public_url ,
" to " : [
f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } " ,
" https://www.w3.org/ns/activitystreams#Public "
] ,
" name " : post . title ,
" cc " : [ ] ,
" content " : post . body_html if post . body_html else ' ' ,
" mediaType " : " text/html " ,
" source " : {
" content " : post . body if post . body else ' ' ,
" mediaType " : " text/markdown "
} ,
" attachment " : [ ] ,
" commentsEnabled " : post . comments_enabled ,
" sensitive " : post . nsfw or post . nsfl ,
" published " : ap_datetime ( post . created_at ) ,
" stickied " : post . sticky ,
" audience " : f " https:// { current_app . config [ ' SERVER_NAME ' ] } /c/ { community . name } "
}
if post . edited_at is not None :
activity_data [ " updated " ] = ap_datetime ( post . edited_at )
if post . language is not None :
activity_data [ " language " ] = { " identifier " : post . language }
2024-04-16 20:59:58 +12:00
if ( post . type == POST_TYPE_LINK or post . type == POST_TYPE_VIDEO ) and post . url is not None :
2024-03-24 22:10:41 +00:00
activity_data [ " attachment " ] = [ { " href " : post . url , " type " : " Link " } ]
if post . image_id is not None :
activity_data [ " image " ] = { " url " : post . image . view_url ( ) , " type " : " Image " }
if post . image . alt_text :
activity_data [ " image " ] [ ' altText ' ] = post . image . alt_text
return activity_data
2023-08-22 21:24:11 +12:00
def banned_user_agents ( ) :
2023-09-08 20:04:01 +12:00
return [ ] # todo: finish this function
2023-08-22 21:24:11 +12:00
2023-09-17 21:19:51 +12:00
@cache.memoize ( 150 )
2024-01-03 16:29:58 +13:00
def instance_blocked ( host : str ) - > bool : # see also utils.instance_banned()
2024-04-09 19:23:19 +12:00
if host is None or host == ' ' :
return True
2023-09-16 19:09:04 +12:00
host = host . lower ( )
if ' https:// ' in host or ' http:// ' in host :
host = urlparse ( host ) . hostname
2023-08-22 21:24:11 +12:00
instance = BannedInstances . query . filter_by ( domain = host . strip ( ) ) . first ( )
return instance is not None
2023-11-03 20:32:12 +13:00
@cache.memoize ( 150 )
def instance_allowed ( host : str ) - > bool :
2024-04-09 19:23:19 +12:00
if host is None or host == ' ' :
return True
2023-11-03 20:32:12 +13:00
host = host . lower ( )
if ' https:// ' in host or ' http:// ' in host :
host = urlparse ( host ) . hostname
instance = AllowedInstances . query . filter_by ( domain = host . strip ( ) ) . first ( )
return instance is not None
2024-03-02 10:20:15 +13:00
def find_actor_or_create ( actor : str , create_if_not_found = True , community_only = False ) - > Union [ User , Community , None ] :
2024-03-16 20:17:24 +00:00
actor_url = actor . strip ( )
2024-02-10 16:29:03 +13:00
actor = actor . strip ( ) . lower ( )
2023-09-08 20:04:01 +12:00
user = None
# actor parameter must be formatted as https://server/u/actor or https://server/c/actor
2023-12-21 22:14:43 +13:00
# Initially, check if the user exists in the local DB already
2023-08-22 21:24:11 +12:00
if current_app . config [ ' SERVER_NAME ' ] + ' /c/ ' in actor :
2024-02-10 16:29:03 +13:00
return Community . query . filter ( Community . ap_profile_id == actor ) . first ( ) # finds communities formatted like https://localhost/c/*
2023-09-08 20:04:01 +12:00
if current_app . config [ ' SERVER_NAME ' ] + ' /u/ ' in actor :
2024-02-10 16:29:03 +13:00
user = User . query . filter ( func . lower ( User . user_name ) == actor . split ( ' / ' ) [ - 1 ] ) . filter_by ( ap_id = None , banned = False ) . first ( ) # finds local users
2023-09-08 20:04:01 +12:00
if user is None :
return None
elif actor . startswith ( ' https:// ' ) :
server , address = extract_domain_and_actor ( actor )
2023-11-03 20:32:12 +13:00
if get_setting ( ' use_allowlist ' , False ) :
if not instance_allowed ( server ) :
return None
else :
if instance_blocked ( server ) :
return None
2024-02-10 16:29:03 +13:00
user = User . query . filter ( User . ap_profile_id == actor ) . first ( ) # finds users formatted like https://kbin.social/u/tables
2023-12-29 20:14:29 +13:00
if ( user and user . banned ) or ( user and user . deleted ) :
2023-10-21 15:49:01 +13:00
return None
2023-09-08 20:04:01 +12:00
if user is None :
2024-02-10 16:29:03 +13:00
user = Community . query . filter ( Community . ap_profile_id == actor ) . first ( )
2024-03-25 13:30:09 +13:00
if user and user . banned :
# Try to find a non-banned copy of the community. Sometimes duplicates happen and one copy is banned.
user = Community . query . filter ( Community . ap_profile_id == actor ) . filter ( Community . banned == False ) . first ( )
if user is None : # no un-banned version of this community exists, only the banned one. So it was banned for being bad, not for being a duplicate.
return None
2023-12-21 22:14:43 +13:00
if user is not None :
2024-02-14 12:31:44 +13:00
if not user . is_local ( ) and ( user . ap_fetched_at is None or user . ap_fetched_at < utcnow ( ) - timedelta ( days = 7 ) ) :
2023-12-27 16:58:30 +13:00
# To reduce load on remote servers, refreshing the user profile happens after a delay of 1 to 10 seconds. Meanwhile, subsequent calls to
# find_actor_or_create() which happen to be for the same actor might queue up refreshes of the same user. To avoid this, set a flag to
# indicate that user is currently being refreshed.
refresh_in_progress = cache . get ( f ' refreshing_ { user . id } ' )
if not refresh_in_progress :
2023-12-28 20:00:42 +13:00
cache . set ( f ' refreshing_ { user . id } ' , True , timeout = 300 )
2024-02-14 12:31:44 +13:00
if isinstance ( user , User ) :
refresh_user_profile ( user . id )
elif isinstance ( user , Community ) :
2024-02-27 05:19:52 +13:00
refresh_community_profile ( user . id )
2024-02-14 12:31:44 +13:00
refresh_instance_profile ( user . instance_id )
2023-08-22 21:24:11 +12:00
return user
2023-12-21 22:14:43 +13:00
else : # User does not exist in the DB, it's going to need to be created from it's remote home instance
2024-02-25 15:31:16 +13:00
if create_if_not_found :
if actor . startswith ( ' https:// ' ) :
try :
2024-03-16 20:17:24 +00:00
actor_data = get_request ( actor_url , headers = { ' Accept ' : ' application/activity+json ' } )
2024-02-25 15:31:16 +13:00
except requests . exceptions . ReadTimeout :
time . sleep ( randint ( 3 , 10 ) )
2024-03-16 20:33:48 +00:00
try :
actor_data = get_request ( actor_url , headers = { ' Accept ' : ' application/activity+json ' } )
except requests . exceptions . ReadTimeout :
return None
except requests . exceptions . ConnectionError :
return None
2024-02-25 15:31:16 +13:00
if actor_data . status_code == 200 :
actor_json = actor_data . json ( )
actor_data . close ( )
2024-03-02 10:20:15 +13:00
actor_model = actor_json_to_model ( actor_json , address , server )
if community_only and not isinstance ( actor_model , Community ) :
return None
return actor_model
2024-02-25 15:31:16 +13:00
else :
# retrieve user details via webfinger, etc
try :
webfinger_data = get_request ( f " https:// { server } /.well-known/webfinger " ,
params = { ' resource ' : f " acct: { address } @ { server } " } )
except requests . exceptions . ReadTimeout :
time . sleep ( randint ( 3 , 10 ) )
webfinger_data = get_request ( f " https:// { server } /.well-known/webfinger " ,
params = { ' resource ' : f " acct: { address } @ { server } " } )
if webfinger_data . status_code == 200 :
webfinger_json = webfinger_data . json ( )
webfinger_data . close ( )
for links in webfinger_json [ ' links ' ] :
if ' rel ' in links and links [ ' rel ' ] == ' self ' : # this contains the URL of the activitypub profile
type = links [ ' type ' ] if ' type ' in links else ' application/activity+json '
# retrieve the activitypub profile
try :
actor_data = get_request ( links [ ' href ' ] , headers = { ' Accept ' : type } )
except requests . exceptions . ReadTimeout :
time . sleep ( randint ( 3 , 10 ) )
actor_data = get_request ( links [ ' href ' ] , headers = { ' Accept ' : type } )
# to see the structure of the json contained in actor_data, do a GET to https://lemmy.world/c/technology with header Accept: application/activity+json
if actor_data . status_code == 200 :
actor_json = actor_data . json ( )
actor_data . close ( )
2024-03-02 10:20:15 +13:00
actor_model = actor_json_to_model ( actor_json , address , server )
if community_only and not isinstance ( actor_model , Community ) :
return None
return actor_model
2023-12-21 22:14:43 +13:00
return None
2023-09-08 20:04:01 +12:00
2024-04-16 21:49:05 +12:00
def find_language_or_create ( code : str , name : str ) - > Language :
existing_language = Language . query . filter ( Language . code == code ) . first ( )
if existing_language :
return existing_language
else :
new_language = Language ( code = code , name = name )
db . session . add ( new_language )
return new_language
2023-09-08 20:04:01 +12:00
def extract_domain_and_actor ( url_string : str ) :
# Parse the URL
parsed_url = urlparse ( url_string )
# Extract the server domain name
server_domain = parsed_url . netloc
# Extract the part of the string after the last '/' character
actor = parsed_url . path . split ( ' / ' ) [ - 1 ]
return server_domain , actor
2023-12-29 17:32:35 +13:00
def user_removed_from_remote_server ( actor_url , is_piefed = False ) :
result = False
response = None
try :
if is_piefed :
response = head_request ( actor_url , headers = { ' Accept ' : ' application/activity+json ' } )
else :
response = get_request ( actor_url , headers = { ' Accept ' : ' application/activity+json ' } )
if response . status_code == 404 or response . status_code == 410 :
result = True
else :
result = False
except :
result = True
finally :
if response :
response . close ( )
return result
2023-12-27 15:47:17 +13:00
def refresh_user_profile ( user_id ) :
if current_app . debug :
refresh_user_profile_task ( user_id )
else :
2023-12-29 17:32:35 +13:00
refresh_user_profile_task . apply_async ( args = ( user_id , ) , countdown = randint ( 1 , 10 ) )
2023-12-27 15:47:17 +13:00
@celery.task
def refresh_user_profile_task ( user_id ) :
user = User . query . get ( user_id )
if user :
2024-01-05 11:00:16 +13:00
try :
actor_data = get_request ( user . ap_profile_id , headers = { ' Accept ' : ' application/activity+json ' } )
except requests . exceptions . ReadTimeout :
time . sleep ( randint ( 3 , 10 ) )
2024-04-20 17:33:04 +12:00
try :
actor_data = get_request ( user . ap_profile_id , headers = { ' Accept ' : ' application/activity+json ' } )
except requests . exceptions . ReadTimeout :
return
2023-12-27 15:47:17 +13:00
if actor_data . status_code == 200 :
activity_json = actor_data . json ( )
actor_data . close ( )
2024-03-12 20:58:47 +13:00
# update indexible state on their posts, if necessary
new_indexable = activity_json [ ' indexable ' ] if ' indexable ' in activity_json else True
if new_indexable != user . indexable :
db . session . execute ( text ( ' UPDATE " post " set indexable = :indexable WHERE user_id = :user_id ' ) ,
{ ' user_id ' : user . id ,
' indexable ' : new_indexable } )
2023-12-27 15:47:17 +13:00
user . user_name = activity_json [ ' preferredUsername ' ]
user . about_html = parse_summary ( activity_json )
user . ap_fetched_at = utcnow ( )
2024-03-12 20:58:47 +13:00
user . public_key = activity_json [ ' publicKey ' ] [ ' publicKeyPem ' ]
user . indexable = new_indexable
2023-12-27 15:47:17 +13:00
avatar_changed = cover_changed = False
if ' icon ' in activity_json :
2024-01-03 16:29:58 +13:00
if user . avatar_id and activity_json [ ' icon ' ] [ ' url ' ] != user . avatar . source_url :
2023-12-27 15:47:17 +13:00
user . avatar . delete_from_disk ( )
2024-01-03 16:29:58 +13:00
avatar = File ( source_url = activity_json [ ' icon ' ] [ ' url ' ] )
user . avatar = avatar
db . session . add ( avatar )
avatar_changed = True
2023-12-27 15:47:17 +13:00
if ' image ' in activity_json :
2024-01-03 16:29:58 +13:00
if user . cover_id and activity_json [ ' image ' ] [ ' url ' ] != user . cover . source_url :
2023-12-27 15:47:17 +13:00
user . cover . delete_from_disk ( )
2024-01-03 16:29:58 +13:00
cover = File ( source_url = activity_json [ ' image ' ] [ ' url ' ] )
user . cover = cover
db . session . add ( cover )
cover_changed = True
2023-12-27 15:47:17 +13:00
db . session . commit ( )
if user . avatar_id and avatar_changed :
make_image_sizes ( user . avatar_id , 40 , 250 , ' users ' )
if user . cover_id and cover_changed :
make_image_sizes ( user . cover_id , 700 , 1600 , ' users ' )
2024-02-27 05:19:52 +13:00
def refresh_community_profile ( community_id ) :
if current_app . debug :
2024-02-27 05:26:06 +13:00
refresh_community_profile_task ( community_id )
2024-02-27 05:19:52 +13:00
else :
2024-02-27 05:26:06 +13:00
refresh_community_profile_task . apply_async ( args = ( community_id , ) , countdown = randint ( 1 , 10 ) )
2024-02-27 05:19:52 +13:00
@celery.task
def refresh_community_profile_task ( community_id ) :
community = Community . query . get ( community_id )
if community and not community . is_local ( ) :
try :
actor_data = get_request ( community . ap_profile_id , headers = { ' Accept ' : ' application/activity+json ' } )
except requests . exceptions . ReadTimeout :
time . sleep ( randint ( 3 , 10 ) )
2024-04-20 17:33:04 +12:00
try :
actor_data = get_request ( community . ap_profile_id , headers = { ' Accept ' : ' application/activity+json ' } )
except Exception as e :
return
2024-02-27 05:19:52 +13:00
if actor_data . status_code == 200 :
activity_json = actor_data . json ( )
actor_data . close ( )
if ' attributedTo ' in activity_json : # lemmy and mbin
mods_url = activity_json [ ' attributedTo ' ]
elif ' moderators ' in activity_json : # kbin
mods_url = activity_json [ ' moderators ' ]
else :
mods_url = None
community . nsfw = activity_json [ ' sensitive ' ]
if ' nsfl ' in activity_json and activity_json [ ' nsfl ' ] :
community . nsfl = activity_json [ ' nsfl ' ]
community . title = activity_json [ ' name ' ]
community . description = activity_json [ ' summary ' ] if ' summary ' in activity_json else ' '
community . rules = activity_json [ ' rules ' ] if ' rules ' in activity_json else ' '
community . rules_html = markdown_to_html ( activity_json [ ' rules ' ] if ' rules ' in activity_json else ' ' )
community . restricted_to_mods = activity_json [ ' postingRestrictedToMods ' ]
community . new_mods_wanted = activity_json [ ' newModsWanted ' ] if ' newModsWanted ' in activity_json else False
community . private_mods = activity_json [ ' privateMods ' ] if ' privateMods ' in activity_json else False
community . ap_moderators_url = mods_url
community . ap_fetched_at = utcnow ( )
community . public_key = activity_json [ ' publicKey ' ] [ ' publicKeyPem ' ]
if ' source ' in activity_json and \
activity_json [ ' source ' ] [ ' mediaType ' ] == ' text/markdown ' :
community . description = activity_json [ ' source ' ] [ ' content ' ]
community . description_html = markdown_to_html ( community . description )
elif ' content ' in activity_json :
community . description_html = allowlist_html ( activity_json [ ' content ' ] )
2024-03-27 16:02:04 +13:00
community . description = ' '
2024-02-27 05:19:52 +13:00
icon_changed = cover_changed = False
if ' icon ' in activity_json :
if community . icon_id and activity_json [ ' icon ' ] [ ' url ' ] != community . icon . source_url :
community . icon . delete_from_disk ( )
icon = File ( source_url = activity_json [ ' icon ' ] [ ' url ' ] )
community . icon = icon
db . session . add ( icon )
icon_changed = True
if ' image ' in activity_json :
if community . image_id and activity_json [ ' image ' ] [ ' url ' ] != community . image . source_url :
community . image . delete_from_disk ( )
image = File ( source_url = activity_json [ ' image ' ] [ ' url ' ] )
community . image = image
db . session . add ( image )
cover_changed = True
2024-04-18 13:57:33 +12:00
if ' language ' in activity_json and isinstance ( activity_json [ ' language ' ] , list ) :
for ap_language in activity_json [ ' language ' ] :
new_language = find_language_or_create ( ap_language [ ' identifier ' ] , ap_language [ ' name ' ] )
2024-04-19 20:05:27 +12:00
if new_language not in community . languages :
2024-04-18 13:57:33 +12:00
community . languages . append ( new_language )
2024-02-27 05:19:52 +13:00
db . session . commit ( )
if community . icon_id and icon_changed :
make_image_sizes ( community . icon_id , 60 , 250 , ' communities ' )
if community . image_id and cover_changed :
make_image_sizes ( community . image_id , 700 , 1600 , ' communities ' )
if community . ap_moderators_url :
mods_request = get_request ( community . ap_moderators_url , headers = { ' Accept ' : ' application/activity+json ' } )
if mods_request . status_code == 200 :
mods_data = mods_request . json ( )
mods_request . close ( )
if mods_data and mods_data [ ' type ' ] == ' OrderedCollection ' and ' orderedItems ' in mods_data :
for actor in mods_data [ ' orderedItems ' ] :
time . sleep ( 0.5 )
user = find_actor_or_create ( actor )
if user :
existing_membership = CommunityMember . query . filter_by ( community_id = community . id ,
user_id = user . id ) . first ( )
if existing_membership :
existing_membership . is_moderator = True
db . session . commit ( )
else :
new_membership = CommunityMember ( community_id = community . id , user_id = user . id ,
is_moderator = True )
db . session . add ( new_membership )
db . session . commit ( )
# Remove people who are no longer mods
for member in CommunityMember . query . filter_by ( community_id = community . id , is_moderator = True ) . all ( ) :
member_user = User . query . get ( member . user_id )
is_mod = False
for actor in mods_data [ ' orderedItems ' ] :
if actor . lower ( ) == member_user . profile_id ( ) . lower ( ) :
is_mod = True
break
if not is_mod :
db . session . query ( CommunityMember ) . filter_by ( community_id = community . id ,
user_id = member_user . id ,
is_moderator = True ) . delete ( )
db . session . commit ( )
2023-12-21 22:14:43 +13:00
def actor_json_to_model ( activity_json , address , server ) :
2024-03-20 11:34:25 +00:00
if activity_json [ ' type ' ] == ' Person ' or activity_json [ ' type ' ] == ' Service ' :
2024-02-29 17:10:38 +13:00
try :
user = User ( user_name = activity_json [ ' preferredUsername ' ] ,
title = activity_json [ ' name ' ] if ' name ' in activity_json else None ,
email = f " { address } @ { server } " ,
about_html = parse_summary ( activity_json ) ,
matrix_user_id = activity_json [ ' matrixUserId ' ] if ' matrixUserId ' in activity_json else ' ' ,
indexable = activity_json [ ' indexable ' ] if ' indexable ' in activity_json else False ,
searchable = activity_json [ ' discoverable ' ] if ' discoverable ' in activity_json else True ,
created = activity_json [ ' published ' ] if ' published ' in activity_json else utcnow ( ) ,
2024-04-23 21:28:58 +12:00
ap_id = f " { address . lower ( ) } @ { server . lower ( ) } " ,
2024-02-29 17:10:38 +13:00
ap_public_url = activity_json [ ' id ' ] ,
ap_profile_id = activity_json [ ' id ' ] . lower ( ) ,
2024-03-02 10:20:15 +13:00
ap_inbox_url = activity_json [ ' endpoints ' ] [ ' sharedInbox ' ] if ' endpoints ' in activity_json else activity_json [ ' inbox ' ] if ' inbox ' in activity_json else ' ' ,
2024-02-29 17:10:38 +13:00
ap_followers_url = activity_json [ ' followers ' ] if ' followers ' in activity_json else None ,
ap_preferred_username = activity_json [ ' preferredUsername ' ] ,
ap_manually_approves_followers = activity_json [ ' manuallyApprovesFollowers ' ] if ' manuallyApprovesFollowers ' in activity_json else False ,
ap_fetched_at = utcnow ( ) ,
ap_domain = server ,
public_key = activity_json [ ' publicKey ' ] [ ' publicKeyPem ' ] ,
2024-03-20 11:34:25 +00:00
bot = True if activity_json [ ' type ' ] == ' Service ' else False ,
2024-02-29 17:10:38 +13:00
instance_id = find_instance_id ( server )
# language=community_json['language'][0]['identifier'] # todo: language
)
except KeyError as e :
current_app . logger . error ( f ' KeyError for { address } @ { server } while parsing ' + str ( activity_json ) )
return None
2024-04-09 10:29:55 +12:00
if ' icon ' in activity_json and activity_json [ ' icon ' ] is not None and ' url ' in activity_json [ ' icon ' ] :
2023-12-21 22:14:43 +13:00
avatar = File ( source_url = activity_json [ ' icon ' ] [ ' url ' ] )
user . avatar = avatar
db . session . add ( avatar )
2024-04-09 10:29:55 +12:00
if ' image ' in activity_json and activity_json [ ' image ' ] is not None and ' url ' in activity_json [ ' image ' ] :
2023-12-21 22:14:43 +13:00
cover = File ( source_url = activity_json [ ' image ' ] [ ' url ' ] )
user . cover = cover
db . session . add ( cover )
db . session . add ( user )
db . session . commit ( )
2023-12-24 16:20:18 +13:00
if user . avatar_id :
make_image_sizes ( user . avatar_id , 40 , 250 , ' users ' )
if user . cover_id :
2024-02-10 06:41:24 +13:00
make_image_sizes ( user . cover_id , 878 , None , ' users ' )
2023-12-21 22:14:43 +13:00
return user
elif activity_json [ ' type ' ] == ' Group ' :
if ' attributedTo ' in activity_json : # lemmy and mbin
mods_url = activity_json [ ' attributedTo ' ]
elif ' moderators ' in activity_json : # kbin
mods_url = activity_json [ ' moderators ' ]
else :
mods_url = None
2024-01-21 21:04:48 +13:00
# only allow nsfw communities if enabled for this instance
site = Site . query . get ( 1 ) # can't use g.site because actor_json_to_model can be called from celery
if activity_json [ ' sensitive ' ] and not site . enable_nsfw :
return None
if ' nsfl ' in activity_json and activity_json [ ' nsfl ' ] and not site . enable_nsfl :
return None
2023-12-21 22:14:43 +13:00
community = Community ( name = activity_json [ ' preferredUsername ' ] ,
title = activity_json [ ' name ' ] ,
description = activity_json [ ' summary ' ] if ' summary ' in activity_json else ' ' ,
rules = activity_json [ ' rules ' ] if ' rules ' in activity_json else ' ' ,
rules_html = markdown_to_html ( activity_json [ ' rules ' ] if ' rules ' in activity_json else ' ' ) ,
nsfw = activity_json [ ' sensitive ' ] ,
restricted_to_mods = activity_json [ ' postingRestrictedToMods ' ] ,
2024-01-02 19:41:00 +13:00
new_mods_wanted = activity_json [ ' newModsWanted ' ] if ' newModsWanted ' in activity_json else False ,
private_mods = activity_json [ ' privateMods ' ] if ' privateMods ' in activity_json else False ,
2023-12-21 22:14:43 +13:00
created_at = activity_json [ ' published ' ] if ' published ' in activity_json else utcnow ( ) ,
last_active = activity_json [ ' updated ' ] if ' updated ' in activity_json else utcnow ( ) ,
2024-04-23 21:28:58 +12:00
ap_id = f " { address [ 1 : ] . lower ( ) } @ { server . lower ( ) } " if address . startswith ( ' ! ' ) else f " { address } @ { server } " ,
2023-12-21 22:14:43 +13:00
ap_public_url = activity_json [ ' id ' ] ,
2024-02-10 11:42:18 +13:00
ap_profile_id = activity_json [ ' id ' ] . lower ( ) ,
2023-12-21 22:14:43 +13:00
ap_followers_url = activity_json [ ' followers ' ] ,
ap_inbox_url = activity_json [ ' endpoints ' ] [ ' sharedInbox ' ] ,
2024-02-21 08:36:47 +13:00
ap_outbox_url = activity_json [ ' outbox ' ] ,
2024-03-24 00:15:10 +00:00
ap_featured_url = activity_json [ ' featured ' ] if ' featured ' in activity_json else ' ' ,
2023-12-21 22:14:43 +13:00
ap_moderators_url = mods_url ,
ap_fetched_at = utcnow ( ) ,
ap_domain = server ,
public_key = activity_json [ ' publicKey ' ] [ ' publicKeyPem ' ] ,
# language=community_json['language'][0]['identifier'] # todo: language
instance_id = find_instance_id ( server ) ,
low_quality = ' memes ' in activity_json [ ' preferredUsername ' ]
)
# parse markdown and overwrite html field with result
if ' source ' in activity_json and \
activity_json [ ' source ' ] [ ' mediaType ' ] == ' text/markdown ' :
community . description = activity_json [ ' source ' ] [ ' content ' ]
community . description_html = markdown_to_html ( community . description )
elif ' content ' in activity_json :
community . description_html = allowlist_html ( activity_json [ ' content ' ] )
2024-03-27 16:02:04 +13:00
community . description = ' '
2024-04-09 10:29:55 +12:00
if ' icon ' in activity_json and activity_json [ ' icon ' ] is not None and ' url ' in activity_json [ ' icon ' ] :
2023-12-21 22:14:43 +13:00
icon = File ( source_url = activity_json [ ' icon ' ] [ ' url ' ] )
community . icon = icon
db . session . add ( icon )
2024-04-09 10:29:55 +12:00
if ' image ' in activity_json and activity_json [ ' image ' ] is not None and ' url ' in activity_json [ ' image ' ] :
2023-12-21 22:14:43 +13:00
image = File ( source_url = activity_json [ ' image ' ] [ ' url ' ] )
community . image = image
db . session . add ( image )
2024-04-16 21:49:05 +12:00
if ' language ' in activity_json and isinstance ( activity_json [ ' language ' ] , list ) :
for ap_language in activity_json [ ' language ' ] :
community . languages . append ( find_language_or_create ( ap_language [ ' identifier ' ] , ap_language [ ' name ' ] ) )
2023-12-21 22:14:43 +13:00
db . session . add ( community )
db . session . commit ( )
2023-12-24 16:20:18 +13:00
if community . icon_id :
2023-12-24 17:41:34 +13:00
make_image_sizes ( community . icon_id , 60 , 250 , ' communities ' )
2023-12-24 16:20:18 +13:00
if community . image_id :
make_image_sizes ( community . image_id , 700 , 1600 , ' communities ' )
2023-12-21 22:14:43 +13:00
return community
2024-03-15 22:32:48 +00:00
def post_json_to_model ( activity_log , post_json , user , community ) - > Post :
2024-03-09 12:15:58 +13:00
try :
2024-03-15 23:47:21 +00:00
nsfl_in_title = ' [NSFL] ' in post_json [ ' name ' ] . upper ( ) or ' (NSFL) ' in post_json [ ' name ' ] . upper ( )
2024-03-09 12:15:58 +13:00
post = Post ( user_id = user . id , community_id = community . id ,
title = html . unescape ( post_json [ ' name ' ] ) ,
2024-03-15 23:47:21 +00:00
comments_enabled = post_json [ ' commentsEnabled ' ] if ' commentsEnabled ' in post_json else True ,
2024-03-09 12:15:58 +13:00
sticky = post_json [ ' stickied ' ] if ' stickied ' in post_json else False ,
nsfw = post_json [ ' sensitive ' ] ,
2024-03-15 23:47:21 +00:00
nsfl = post_json [ ' nsfl ' ] if ' nsfl ' in post_json else nsfl_in_title ,
2024-03-09 12:15:58 +13:00
ap_id = post_json [ ' id ' ] ,
type = constants . POST_TYPE_ARTICLE ,
posted_at = post_json [ ' published ' ] ,
last_active = post_json [ ' published ' ] ,
2024-03-15 23:47:21 +00:00
instance_id = user . instance_id ,
indexable = user . indexable
2024-03-09 12:15:58 +13:00
)
if ' source ' in post_json and \
post_json [ ' source ' ] [ ' mediaType ' ] == ' text/markdown ' :
post . body = post_json [ ' source ' ] [ ' content ' ]
post . body_html = markdown_to_html ( post . body )
elif ' content ' in post_json :
post . body_html = allowlist_html ( post_json [ ' content ' ] )
2024-03-27 16:02:04 +13:00
post . body = ' '
2024-03-09 18:19:03 +13:00
if ' attachment ' in post_json and len ( post_json [ ' attachment ' ] ) > 0 and ' type ' in post_json [ ' attachment ' ] [ 0 ] :
2024-03-09 12:15:58 +13:00
if post_json [ ' attachment ' ] [ 0 ] [ ' type ' ] == ' Link ' :
post . url = post_json [ ' attachment ' ] [ 0 ] [ ' href ' ]
if is_image_url ( post . url ) :
post . type = POST_TYPE_IMAGE
2024-03-15 23:47:21 +00:00
if ' image ' in post_json and ' url ' in post_json [ ' image ' ] :
image = File ( source_url = post_json [ ' image ' ] [ ' url ' ] )
else :
image = File ( source_url = post . url )
db . session . add ( image )
post . image = image
2024-03-09 12:15:58 +13:00
else :
post . type = POST_TYPE_LINK
2024-03-15 23:47:21 +00:00
post . url = remove_tracking_from_link ( post . url )
2024-03-09 12:15:58 +13:00
domain = domain_from_url ( post . url )
# notify about links to banned websites.
already_notified = set ( ) # often admins and mods are the same people - avoid notifying them twice
if domain :
if domain . notify_mods :
for community_member in post . community . moderators ( ) :
notify = Notification ( title = ' Suspicious content ' , url = post . ap_id , user_id = community_member . user_id , author_id = user . id )
2024-02-23 16:52:17 +13:00
db . session . add ( notify )
2024-03-09 12:15:58 +13:00
already_notified . add ( community_member . user_id )
if domain . notify_admins :
for admin in Site . admins ( ) :
if admin . id not in already_notified :
notify = Notification ( title = ' Suspicious content ' , url = post . ap_id , user_id = admin . id , author_id = user . id )
db . session . add ( notify )
admin . unread_notifications + = 1
if domain . banned :
post = None
2024-03-15 22:32:48 +00:00
activity_log . exception_message = domain . name + ' is blocked by admin '
2024-03-09 12:15:58 +13:00
if not domain . banned :
domain . post_count + = 1
post . domain = domain
if post is not None :
2024-04-09 19:27:42 +12:00
if ' image ' in post_json and post . image is None :
image = File ( source_url = post_json [ ' image ' ] [ ' url ' ] )
db . session . add ( image )
post . image = image
2024-03-09 12:15:58 +13:00
db . session . add ( post )
community . post_count + = 1
2024-03-15 22:32:48 +00:00
activity_log . result = ' success '
2024-03-09 12:15:58 +13:00
db . session . commit ( )
2024-03-15 23:47:21 +00:00
if post . image_id :
make_image_sizes ( post . image_id , 150 , 512 , ' posts ' ) # the 512 sized image is for masonry view
2024-03-09 12:15:58 +13:00
return post
except KeyError as e :
current_app . logger . error ( f ' KeyError in post_json_to_model: ' + str ( post_json ) )
return None
2023-12-21 22:14:43 +13:00
2023-12-24 16:20:18 +13:00
# Save two different versions of a File, after downloading it from file.source_url. Set a width parameter to None to avoid generating one of that size
def make_image_sizes ( file_id , thumbnail_width = 50 , medium_width = 120 , directory = ' posts ' ) :
if current_app . debug :
make_image_sizes_async ( file_id , thumbnail_width , medium_width , directory )
else :
make_image_sizes_async . apply_async ( args = ( file_id , thumbnail_width , medium_width , directory ) , countdown = randint ( 1 , 10 ) ) # Delay by up to 10 seconds so servers do not experience a stampede of requests all in the same second
@celery.task
def make_image_sizes_async ( file_id , thumbnail_width , medium_width , directory ) :
file = File . query . get ( file_id )
if file and file . source_url :
2024-04-16 16:35:12 +12:00
# Videos
if file . source_url . endswith ( ' .mp4 ' ) or file . source_url . endswith ( ' .webm ' ) :
new_filename = gibberish ( 15 )
# set up the storage directory
directory = f ' app/static/media/ { directory } / ' + new_filename [ 0 : 2 ] + ' / ' + new_filename [ 2 : 4 ]
ensure_directory_exists ( directory )
# file path and names to store the resized images on disk
final_place = os . path . join ( directory , new_filename + ' .jpg ' )
final_place_thumbnail = os . path . join ( directory , new_filename + ' _thumbnail.webp ' )
2024-04-20 16:47:27 +12:00
try :
generate_image_from_video_url ( file . source_url , final_place )
except Exception as e :
return
if final_place :
image = Image . open ( final_place )
img_width = image . width
# Resize the image to medium
if medium_width :
if img_width > medium_width :
image . thumbnail ( ( medium_width , medium_width ) )
image . save ( final_place )
file . file_path = final_place
file . width = image . width
file . height = image . height
# Resize the image to a thumbnail (webp)
if thumbnail_width :
if img_width > thumbnail_width :
image . thumbnail ( ( thumbnail_width , thumbnail_width ) )
image . save ( final_place_thumbnail , format = " WebP " , quality = 93 )
file . thumbnail_path = final_place_thumbnail
file . thumbnail_width = image . width
file . thumbnail_height = image . height
db . session . commit ( )
2024-04-16 16:35:12 +12:00
# Images
2023-12-24 16:20:18 +13:00
else :
2024-04-16 16:35:12 +12:00
try :
source_image_response = get_request ( file . source_url )
except :
pass
else :
if source_image_response . status_code == 200 :
content_type = source_image_response . headers . get ( ' content-type ' )
if content_type and content_type . startswith ( ' image ' ) :
source_image = source_image_response . content
source_image_response . close ( )
file_ext = os . path . splitext ( file . source_url ) [ 1 ]
# fall back to parsing the http content type if the url does not contain a file extension
if file_ext == ' ' :
content_type_parts = content_type . split ( ' / ' )
if content_type_parts :
file_ext = ' . ' + content_type_parts [ - 1 ]
else :
if ' ? ' in file_ext :
file_ext = file_ext . split ( ' ? ' ) [ 0 ]
new_filename = gibberish ( 15 )
# set up the storage directory
directory = f ' app/static/media/ { directory } / ' + new_filename [ 0 : 2 ] + ' / ' + new_filename [ 2 : 4 ]
ensure_directory_exists ( directory )
# file path and names to store the resized images on disk
final_place = os . path . join ( directory , new_filename + file_ext )
final_place_thumbnail = os . path . join ( directory , new_filename + ' _thumbnail.webp ' )
# Load image data into Pillow
Image . MAX_IMAGE_PIXELS = 89478485
image = Image . open ( BytesIO ( source_image ) )
image = ImageOps . exif_transpose ( image )
img_width = image . width
img_height = image . height
# Resize the image to medium
if medium_width :
if img_width > medium_width :
image . thumbnail ( ( medium_width , medium_width ) )
image . save ( final_place )
file . file_path = final_place
file . width = image . width
file . height = image . height
# Resize the image to a thumbnail (webp)
if thumbnail_width :
if img_width > thumbnail_width :
image . thumbnail ( ( thumbnail_width , thumbnail_width ) )
image . save ( final_place_thumbnail , format = " WebP " , quality = 93 )
file . thumbnail_path = final_place_thumbnail
file . thumbnail_width = image . width
file . thumbnail_height = image . height
db . session . commit ( )
# Alert regarding fascist meme content
if img_width < 2000 : # images > 2000px tend to be real photos instead of 4chan screenshots.
try :
image_text = pytesseract . image_to_string ( Image . open ( BytesIO ( source_image ) ) . convert ( ' L ' ) , timeout = 30 )
2024-04-20 20:17:58 +12:00
except Exception as e :
2024-04-20 17:01:36 +12:00
image_text = ' '
2024-04-16 16:35:12 +12:00
if ' Anonymous ' in image_text and ( ' No. ' in image_text or ' N0 ' in image_text ) : # chan posts usually contain the text 'Anonymous' and ' No.12345'
post = Post . query . filter_by ( image_id = file . id ) . first ( )
notification = Notification ( title = ' Review this ' ,
user_id = 1 ,
author_id = post . user_id ,
url = url_for ( ' activitypub.post_ap ' , post_id = post . id ) )
db . session . add ( notification )
db . session . commit ( )
2023-12-24 16:20:18 +13:00
2023-09-08 20:04:01 +12:00
# create a summary from markdown if present, otherwise use html if available
def parse_summary ( user_json ) - > str :
if ' source ' in user_json and user_json [ ' source ' ] . get ( ' mediaType ' ) == ' text/markdown ' :
# Convert Markdown to HTML
markdown_text = user_json [ ' source ' ] [ ' content ' ]
2024-03-27 16:02:04 +13:00
html_content = allowlist_html ( markdown_to_html ( markdown_text ) )
2023-09-08 20:04:01 +12:00
return html_content
elif ' summary ' in user_json :
2023-09-16 19:09:04 +12:00
return allowlist_html ( user_json [ ' summary ' ] )
2023-09-08 20:04:01 +12:00
else :
return ' '
2023-09-16 19:09:04 +12:00
def default_context ( ) :
context = [
" https://www.w3.org/ns/activitystreams " ,
" https://w3id.org/security/v1 " ,
]
if current_app . config [ ' FULL_AP_CONTEXT ' ] :
context . append ( {
" lemmy " : " https://join-lemmy.org/ns# " ,
" litepub " : " http://litepub.social/ns# " ,
" pt " : " https://joinpeertube.org/ns# " ,
" sc " : " http://schema.org/ " ,
" ChatMessage " : " litepub:ChatMessage " ,
" commentsEnabled " : " pt:commentsEnabled " ,
" sensitive " : " as:sensitive " ,
" matrixUserId " : " lemmy:matrixUserId " ,
" postingRestrictedToMods " : " lemmy:postingRestrictedToMods " ,
" removeData " : " lemmy:removeData " ,
" stickied " : " lemmy:stickied " ,
" moderators " : {
" @type " : " @id " ,
" @id " : " lemmy:moderators "
} ,
" expires " : " as:endTime " ,
" distinguished " : " lemmy:distinguished " ,
" language " : " sc:inLanguage " ,
" identifier " : " sc:identifier "
} )
return context
def find_reply_parent ( in_reply_to : str ) - > Tuple [ int , int , int ] :
if ' comment ' in in_reply_to :
parent_comment = PostReply . get_by_ap_id ( in_reply_to )
2023-12-22 14:05:39 +13:00
if not parent_comment :
return ( None , None , None )
2023-09-16 19:09:04 +12:00
parent_comment_id = parent_comment . id
post_id = parent_comment . post_id
root_id = parent_comment . root_id
elif ' post ' in in_reply_to :
parent_comment_id = None
post = Post . get_by_ap_id ( in_reply_to )
2023-12-22 14:05:39 +13:00
if not post :
return ( None , None , None )
2023-09-16 19:09:04 +12:00
post_id = post . id
root_id = None
else :
parent_comment_id = None
root_id = None
post_id = None
post = Post . get_by_ap_id ( in_reply_to )
if post :
post_id = post . id
else :
parent_comment = PostReply . get_by_ap_id ( in_reply_to )
if parent_comment :
parent_comment_id = parent_comment . id
post_id = parent_comment . post_id
root_id = parent_comment . root_id
2023-12-22 14:05:39 +13:00
else :
return ( None , None , None )
2023-09-16 19:09:04 +12:00
return post_id , parent_comment_id , root_id
def find_liked_object ( ap_id ) - > Union [ Post , PostReply , None ] :
post = Post . get_by_ap_id ( ap_id )
if post :
return post
else :
post_reply = PostReply . get_by_ap_id ( ap_id )
if post_reply :
return post_reply
return None
2023-11-23 15:10:44 +13:00
2024-04-06 16:29:47 +13:00
def find_reported_object ( ap_id ) - > Union [ User , Post , PostReply , None ] :
post = Post . get_by_ap_id ( ap_id )
if post :
return post
else :
post_reply = PostReply . get_by_ap_id ( ap_id )
if post_reply :
return post_reply
else :
user = find_actor_or_create ( ap_id , create_if_not_found = False )
if user :
return user
return None
2023-12-21 22:14:43 +13:00
def find_instance_id ( server ) :
server = server . strip ( )
instance = Instance . query . filter_by ( domain = server ) . first ( )
if instance :
return instance . id
else :
2023-12-28 20:00:42 +13:00
# Our instance does not know about {server} yet. Initially, create a sparse row in the 'instance' table and spawn a background
# task to update the row with more details later
2024-02-23 16:52:17 +13:00
new_instance = Instance ( domain = server , software = ' unknown ' , created_at = utcnow ( ) , trusted = server == ' piefed.social ' )
2023-12-28 20:00:42 +13:00
db . session . add ( new_instance )
db . session . commit ( )
2023-12-30 11:36:24 +13:00
# Spawn background task to fill in more details
2023-12-28 20:00:42 +13:00
refresh_instance_profile ( new_instance . id )
return new_instance . id
def refresh_instance_profile ( instance_id : int ) :
2024-02-14 12:31:44 +13:00
if instance_id :
if current_app . debug :
refresh_instance_profile_task ( instance_id )
else :
refresh_instance_profile_task . apply_async ( args = ( instance_id , ) , countdown = randint ( 1 , 10 ) )
2023-12-28 20:00:42 +13:00
@celery.task
def refresh_instance_profile_task ( instance_id : int ) :
instance = Instance . query . get ( instance_id )
2024-03-17 19:32:35 +00:00
if instance . inbox is None or instance . updated_at < utcnow ( ) - timedelta ( days = 7 ) :
2023-12-22 16:18:44 +13:00
try :
2024-02-14 12:31:44 +13:00
instance_data = get_request ( f " https:// { instance . domain } " , headers = { ' Accept ' : ' application/activity+json ' } )
except :
return
if instance_data . status_code == 200 :
try :
instance_json = instance_data . json ( )
instance_data . close ( )
except requests . exceptions . JSONDecodeError as ex :
instance_json = { }
if ' type ' in instance_json and instance_json [ ' type ' ] == ' Application ' :
2024-03-24 15:35:45 +13:00
# 'name' is unreliable as the admin can change it to anything. todo: find better way
2024-02-14 12:31:44 +13:00
if instance_json [ ' name ' ] . lower ( ) == ' kbin ' :
software = ' Kbin '
elif instance_json [ ' name ' ] . lower ( ) == ' mbin ' :
software = ' Mbin '
2024-02-25 15:31:16 +13:00
elif instance_json [ ' name ' ] . lower ( ) == ' piefed ' :
software = ' PieFed '
2024-03-24 15:35:45 +13:00
elif instance_json [ ' name ' ] . lower ( ) == ' system account ' :
software = ' Friendica '
2024-02-14 12:31:44 +13:00
else :
software = ' Lemmy '
instance . inbox = instance_json [ ' inbox ' ]
instance . outbox = instance_json [ ' outbox ' ]
instance . software = software
if instance . inbox . endswith ( ' /site_inbox ' ) : # Lemmy provides a /site_inbox but it always returns 400 when trying to POST to it. wtf.
instance . inbox = instance . inbox . replace ( ' /site_inbox ' , ' /inbox ' )
else : # it's pretty much always /inbox so just assume that it is for whatever this instance is running (mostly likely Mastodon)
instance . inbox = f " https:// { instance . domain } /inbox "
instance . updated_at = utcnow ( )
db . session . commit ( )
# retrieve list of Admins from /api/v3/site, update InstanceRole
try :
response = get_request ( f ' https:// { instance . domain } /api/v3/site ' )
except :
response = None
if response and response . status_code == 200 :
try :
instance_data = response . json ( )
except :
instance_data = None
finally :
response . close ( )
if instance_data :
if ' admins ' in instance_data :
admin_profile_ids = [ ]
for admin in instance_data [ ' admins ' ] :
admin_profile_ids . append ( admin [ ' person ' ] [ ' actor_id ' ] . lower ( ) )
user = find_actor_or_create ( admin [ ' person ' ] [ ' actor_id ' ] )
if user and not instance . user_is_admin ( user . id ) :
new_instance_role = InstanceRole ( instance_id = instance . id , user_id = user . id , role = ' admin ' )
db . session . add ( new_instance_role )
db . session . commit ( )
# remove any InstanceRoles that are no longer part of instance-data['admins']
for instance_admin in InstanceRole . query . filter_by ( instance_id = instance . id ) :
if instance_admin . user . profile_id ( ) not in admin_profile_ids :
db . session . query ( InstanceRole ) . filter (
InstanceRole . user_id == instance_admin . user . id ,
InstanceRole . instance_id == instance . id ,
InstanceRole . role == ' admin ' ) . delete ( )
db . session . commit ( )
2024-03-18 16:37:45 +13:00
elif instance_data . status_code == 406 : # Mastodon does this
instance . software = ' Mastodon '
instance . inbox = f " https:// { instance . domain } /inbox "
instance . updated_at = utcnow ( )
db . session . commit ( )
2023-12-21 22:14:43 +13:00
2023-11-24 22:52:42 +13:00
# alter the effect of upvotes based on their instance. Default to 1.0
@cache.memoize ( timeout = 50 )
def instance_weight ( domain ) :
if domain :
instance = Instance . query . filter_by ( domain = domain ) . first ( )
if instance :
return instance . vote_weight
return 1.0
2023-12-10 15:10:09 +13:00
def is_activitypub_request ( ) :
return ' application/ld+json ' in request . headers . get ( ' Accept ' , ' ' ) or ' application/activity+json ' in request . headers . get ( ' Accept ' , ' ' )
2023-12-22 14:05:39 +13:00
def downvote_post ( post , user ) :
user . last_seen = utcnow ( )
2023-12-27 19:51:07 +13:00
user . recalculate_attitude ( )
2023-12-22 14:05:39 +13:00
existing_vote = PostVote . query . filter_by ( user_id = user . id , post_id = post . id ) . first ( )
if not existing_vote :
effect = - 1.0
post . down_votes + = 1
2024-04-14 07:59:24 +12:00
# Make 'hot' sort more spicy by amplifying the effect of early downvotes
if post . up_votes + post . down_votes < = 30 :
2024-04-15 12:08:04 +12:00
post . score - = current_app . config [ ' SPICY_UNDER_30 ' ]
2024-04-14 07:59:24 +12:00
elif post . up_votes + post . down_votes < = 60 :
2024-04-15 12:08:04 +12:00
post . score - = current_app . config [ ' SPICY_UNDER_60 ' ]
2024-04-14 07:59:24 +12:00
else :
post . score - = 1.0
2023-12-22 14:05:39 +13:00
vote = PostVote ( user_id = user . id , post_id = post . id , author_id = post . author . id ,
effect = effect )
post . author . reputation + = effect
db . session . add ( vote )
else :
# remove previously cast upvote
if existing_vote . effect > 0 :
post . author . reputation - = existing_vote . effect
post . up_votes - = 1
post . score - = existing_vote . effect
db . session . delete ( existing_vote )
# apply down vote
effect = - 1.0
post . down_votes + = 1
post . score - = 1.0
vote = PostVote ( user_id = user . id , post_id = post . id , author_id = post . author . id ,
effect = effect )
post . author . reputation + = effect
db . session . add ( vote )
else :
pass # they have already downvoted this post
2024-01-03 20:14:39 +13:00
post . ranking = post_ranking ( post . score , post . posted_at )
db . session . commit ( )
2023-12-22 14:05:39 +13:00
def downvote_post_reply ( comment , user ) :
user . last_seen = utcnow ( )
2023-12-27 19:51:07 +13:00
user . recalculate_attitude ( )
2023-12-22 14:05:39 +13:00
existing_vote = PostReplyVote . query . filter_by ( user_id = user . id ,
post_reply_id = comment . id ) . first ( )
if not existing_vote :
effect = - 1.0
comment . down_votes + = 1
comment . score - = 1.0
vote = PostReplyVote ( user_id = user . id , post_reply_id = comment . id ,
author_id = comment . author . id , effect = effect )
comment . author . reputation + = effect
db . session . add ( vote )
else :
# remove previously cast upvote
if existing_vote . effect > 0 :
comment . author . reputation - = existing_vote . effect
comment . up_votes - = 1
comment . score - = existing_vote . effect
db . session . delete ( existing_vote )
# apply down vote
effect = - 1.0
comment . down_votes + = 1
comment . score - = 1.0
vote = PostReplyVote ( user_id = user . id , post_reply_id = comment . id ,
author_id = comment . author . id , effect = effect )
comment . author . reputation + = effect
db . session . add ( vote )
else :
pass # they have already downvoted this reply
2024-01-07 21:36:04 +13:00
comment . ranking = confidence ( comment . up_votes , comment . down_votes )
2023-12-22 14:05:39 +13:00
def upvote_post_reply ( comment , user ) :
user . last_seen = utcnow ( )
2023-12-27 19:51:07 +13:00
user . recalculate_attitude ( )
2023-12-22 14:05:39 +13:00
effect = instance_weight ( user . ap_domain )
existing_vote = PostReplyVote . query . filter_by ( user_id = user . id ,
post_reply_id = comment . id ) . first ( )
if not existing_vote :
comment . up_votes + = 1
comment . score + = effect
vote = PostReplyVote ( user_id = user . id , post_reply_id = comment . id ,
author_id = comment . author . id , effect = effect )
2023-12-27 13:02:52 +13:00
if comment . community . low_quality and effect > 0 :
effect = 0
2023-12-22 14:05:39 +13:00
comment . author . reputation + = effect
db . session . add ( vote )
else :
# remove previously cast downvote
if existing_vote . effect < 0 :
comment . author . reputation - = existing_vote . effect
comment . down_votes - = 1
comment . score - = existing_vote . effect
db . session . delete ( existing_vote )
# apply up vote
comment . up_votes + = 1
comment . score + = effect
vote = PostReplyVote ( user_id = user . id , post_reply_id = comment . id ,
author_id = comment . author . id , effect = effect )
2023-12-27 13:02:52 +13:00
if comment . community . low_quality and effect > 0 :
effect = 0
2023-12-22 14:05:39 +13:00
comment . author . reputation + = effect
db . session . add ( vote )
else :
pass # they have already upvoted this reply
2024-01-07 21:36:04 +13:00
comment . ranking = confidence ( comment . up_votes , comment . down_votes )
2023-12-22 14:05:39 +13:00
def upvote_post ( post , user ) :
user . last_seen = utcnow ( )
2023-12-27 19:51:07 +13:00
user . recalculate_attitude ( )
2023-12-22 14:05:39 +13:00
effect = instance_weight ( user . ap_domain )
2024-04-14 07:59:24 +12:00
# Make 'hot' sort more spicy by amplifying the effect of early upvotes
spicy_effect = effect
if post . up_votes + post . down_votes < = 10 :
2024-04-15 12:08:04 +12:00
spicy_effect = effect * current_app . config [ ' SPICY_UNDER_10 ' ]
2024-04-14 07:59:24 +12:00
elif post . up_votes + post . down_votes < = 30 :
2024-04-15 12:08:04 +12:00
spicy_effect = effect * current_app . config [ ' SPICY_UNDER_30 ' ]
2024-04-14 07:59:24 +12:00
elif post . up_votes + post . down_votes < = 60 :
2024-04-15 12:08:04 +12:00
spicy_effect = effect * current_app . config [ ' SPICY_UNDER_60 ' ]
2023-12-22 14:05:39 +13:00
existing_vote = PostVote . query . filter_by ( user_id = user . id , post_id = post . id ) . first ( )
if not existing_vote :
post . up_votes + = 1
2024-04-14 07:59:24 +12:00
post . score + = spicy_effect
2023-12-22 14:05:39 +13:00
vote = PostVote ( user_id = user . id , post_id = post . id , author_id = post . author . id ,
effect = effect )
2023-12-27 13:02:52 +13:00
if post . community . low_quality and effect > 0 :
effect = 0
2023-12-22 14:05:39 +13:00
post . author . reputation + = effect
db . session . add ( vote )
else :
# remove previous cast downvote
if existing_vote . effect < 0 :
post . author . reputation - = existing_vote . effect
post . down_votes - = 1
post . score - = existing_vote . effect
db . session . delete ( existing_vote )
# apply up vote
post . up_votes + = 1
post . score + = effect
vote = PostVote ( user_id = user . id , post_id = post . id , author_id = post . author . id ,
effect = effect )
2023-12-27 13:02:52 +13:00
if post . community . low_quality and effect > 0 :
effect = 0
2023-12-22 14:05:39 +13:00
post . author . reputation + = effect
db . session . add ( vote )
2024-01-03 20:14:39 +13:00
post . ranking = post_ranking ( post . score , post . posted_at )
db . session . commit ( )
2023-12-22 14:05:39 +13:00
2023-12-26 12:36:20 +13:00
def delete_post_or_comment ( user_ap_id , community_ap_id , to_be_deleted_ap_id ) :
if current_app . debug :
delete_post_or_comment_task ( user_ap_id , community_ap_id , to_be_deleted_ap_id )
else :
delete_post_or_comment_task . delay ( user_ap_id , community_ap_id , to_be_deleted_ap_id )
@celery.task
def delete_post_or_comment_task ( user_ap_id , community_ap_id , to_be_deleted_ap_id ) :
deletor = find_actor_or_create ( user_ap_id )
2024-03-02 10:20:15 +13:00
community = find_actor_or_create ( community_ap_id , community_only = True )
2023-12-26 12:36:20 +13:00
to_delete = find_liked_object ( to_be_deleted_ap_id )
if deletor and community and to_delete :
2024-02-14 12:31:44 +13:00
if deletor . is_admin ( ) or community . is_moderator ( deletor ) or community . is_instance_admin ( deletor ) or to_delete . author . id == deletor . id :
2023-12-26 12:36:20 +13:00
if isinstance ( to_delete , Post ) :
to_delete . delete_dependencies ( )
db . session . delete ( to_delete )
2024-01-05 10:36:55 +13:00
community . post_count - = 1
2023-12-26 12:36:20 +13:00
db . session . commit ( )
elif isinstance ( to_delete , PostReply ) :
2024-01-05 10:36:55 +13:00
to_delete . post . reply_count - = 1
2023-12-26 12:36:20 +13:00
if to_delete . has_replies ( ) :
to_delete . body = ' Deleted by author ' if to_delete . author . id == deletor . id else ' Deleted by moderator '
to_delete . body_html = markdown_to_html ( to_delete . body )
else :
to_delete . delete_dependencies ( )
db . session . delete ( to_delete )
2024-01-05 10:36:55 +13:00
2023-12-26 12:36:20 +13:00
db . session . commit ( )
2023-12-30 13:23:12 +13:00
def create_post_reply ( activity_log : ActivityPubLog , community : Community , in_reply_to , request_json : dict , user : User , announce_id = None ) - > Union [ Post , None ] :
2024-01-27 12:22:35 +13:00
if community . local_only :
activity_log . exception_message = ' Community is local only, reply discarded '
activity_log . result = ' ignored '
return None
2023-12-30 13:23:12 +13:00
post_id , parent_comment_id , root_id = find_reply_parent ( in_reply_to )
if post_id or parent_comment_id or root_id :
2024-01-18 15:34:55 +13:00
# set depth to +1 of the parent depth
if parent_comment_id :
parent_comment = PostReply . query . get ( parent_comment_id )
depth = parent_comment . depth + 1
else :
depth = 0
2023-12-30 13:23:12 +13:00
post_reply = PostReply ( user_id = user . id , community_id = community . id ,
post_id = post_id , parent_id = parent_comment_id ,
root_id = root_id ,
nsfw = community . nsfw ,
nsfl = community . nsfl ,
2024-03-21 21:50:25 +13:00
from_bot = user . bot ,
2023-12-30 13:23:12 +13:00
up_votes = 1 ,
2024-01-18 15:34:55 +13:00
depth = depth ,
2023-12-30 13:23:12 +13:00
score = instance_weight ( user . ap_domain ) ,
ap_id = request_json [ ' object ' ] [ ' id ' ] ,
ap_create_id = request_json [ ' id ' ] ,
ap_announce_id = announce_id ,
instance_id = user . instance_id )
2024-02-29 11:26:45 +13:00
# Get comment content. Lemmy and Kbin put this in different places.
if ' source ' in request_json [ ' object ' ] and isinstance ( request_json [ ' object ' ] [ ' source ' ] , dict ) and \
2024-03-17 02:53:00 +13:00
' mediaType ' in request_json [ ' object ' ] [ ' source ' ] and \
2023-12-30 13:23:12 +13:00
request_json [ ' object ' ] [ ' source ' ] [ ' mediaType ' ] == ' text/markdown ' :
post_reply . body = request_json [ ' object ' ] [ ' source ' ] [ ' content ' ]
post_reply . body_html = markdown_to_html ( post_reply . body )
2024-02-29 11:26:45 +13:00
elif ' content ' in request_json [ ' object ' ] : # Kbin
2023-12-30 13:23:12 +13:00
post_reply . body_html = allowlist_html ( request_json [ ' object ' ] [ ' content ' ] )
2024-03-27 16:02:04 +13:00
post_reply . body = ' '
2023-12-30 13:23:12 +13:00
if post_id is not None :
2024-03-22 12:22:19 +13:00
# Discard post_reply if it contains certain phrases. Good for stopping spam floods.
if post_reply . body :
for blocked_phrase in blocked_phrases ( ) :
if blocked_phrase in post_reply . body :
return None
2023-12-30 13:23:12 +13:00
post = Post . query . get ( post_id )
if post . comments_enabled :
2024-01-06 11:01:44 +13:00
anchor = None
if not parent_comment_id :
notification_target = post
else :
notification_target = PostReply . query . get ( parent_comment_id )
if notification_target . author . has_blocked_user ( post_reply . user_id ) :
activity_log . exception_message = ' Replier blocked, reply discarded '
activity_log . result = ' ignored '
return None
2024-01-06 14:54:10 +13:00
if reply_already_exists ( user_id = user . id , post_id = post . id , parent_id = post_reply . parent_id , body = post_reply . body ) :
activity_log . exception_message = ' Duplicate reply '
activity_log . result = ' ignored '
return None
if reply_is_just_link_to_gif_reaction ( post_reply . body ) :
user . reputation - = 1
activity_log . exception_message = ' gif comment ignored '
activity_log . result = ' ignored '
return None
2024-04-22 15:25:37 +12:00
if reply_is_stupid ( post_reply . body ) :
activity_log . exception_message = ' Stupid reply '
activity_log . result = ' ignored '
return None
2023-12-30 13:23:12 +13:00
db . session . add ( post_reply )
2024-04-19 21:17:21 +12:00
if not user . bot :
post . reply_count + = 1
community . post_reply_count + = 1
community . last_active = post . last_active = utcnow ( )
2023-12-30 13:23:12 +13:00
activity_log . result = ' success '
2024-01-18 15:34:55 +13:00
post_reply . ranking = confidence ( post_reply . up_votes , post_reply . down_votes )
2023-12-30 13:23:12 +13:00
db . session . commit ( )
2024-01-06 11:01:44 +13:00
# send notification to the post/comment being replied to
2024-04-29 21:43:37 +12:00
if parent_comment_id :
notify_about_post_reply ( parent_comment , post_reply )
else :
notify_about_post_reply ( None , post_reply )
2024-01-06 11:01:44 +13:00
2024-01-02 16:07:41 +13:00
if user . reputation > 100 :
post_reply . up_votes + = 1
post_reply . score + = 1
2024-01-07 21:36:04 +13:00
post_reply . ranking = confidence ( post_reply . up_votes , post_reply . down_votes )
2024-01-02 16:07:41 +13:00
db . session . commit ( )
2023-12-30 13:23:12 +13:00
else :
activity_log . exception_message = ' Comments disabled, reply discarded '
activity_log . result = ' ignored '
2024-02-24 11:07:06 +13:00
return None
2023-12-30 13:23:12 +13:00
return post
else :
activity_log . exception_message = ' Could not find parent post '
return None
else :
activity_log . exception_message = ' Parent not found '
def create_post ( activity_log : ActivityPubLog , community : Community , request_json : dict , user : User , announce_id = None ) - > Union [ Post , None ] :
2024-01-27 12:22:35 +13:00
if community . local_only :
activity_log . exception_message = ' Community is local only, post discarded '
activity_log . result = ' ignored '
return None
2024-03-26 22:46:15 +00:00
if ' name ' not in request_json [ ' object ' ] : # Microblog posts
if ' content ' in request_json [ ' object ' ] and request_json [ ' object ' ] [ ' content ' ] is not None :
name = " [Microblog] "
else :
return None
else :
name = request_json [ ' object ' ] [ ' name ' ]
nsfl_in_title = ' [NSFL] ' in name . upper ( ) or ' (NSFL) ' in name . upper ( )
2023-12-30 13:23:12 +13:00
post = Post ( user_id = user . id , community_id = community . id ,
2024-03-26 22:46:15 +00:00
title = html . unescape ( name ) ,
2024-02-29 12:33:34 +13:00
comments_enabled = request_json [ ' object ' ] [ ' commentsEnabled ' ] if ' commentsEnabled ' in request_json [ ' object ' ] else True ,
2023-12-30 13:23:12 +13:00
sticky = request_json [ ' object ' ] [ ' stickied ' ] if ' stickied ' in request_json [ ' object ' ] else False ,
2024-03-17 02:55:59 +13:00
nsfw = request_json [ ' object ' ] [ ' sensitive ' ] if ' sensitive ' in request_json [ ' object ' ] else False ,
2024-02-01 11:59:09 +13:00
nsfl = request_json [ ' object ' ] [ ' nsfl ' ] if ' nsfl ' in request_json [ ' object ' ] else nsfl_in_title ,
2023-12-30 13:23:12 +13:00
ap_id = request_json [ ' object ' ] [ ' id ' ] ,
ap_create_id = request_json [ ' id ' ] ,
ap_announce_id = announce_id ,
type = constants . POST_TYPE_ARTICLE ,
up_votes = 1 ,
2024-03-21 21:50:25 +13:00
from_bot = user . bot ,
2024-01-02 16:07:41 +13:00
score = instance_weight ( user . ap_domain ) ,
2024-03-12 20:58:47 +13:00
instance_id = user . instance_id ,
indexable = user . indexable
2023-12-30 13:23:12 +13:00
)
2024-02-29 11:26:45 +13:00
# Get post content. Lemmy and Kbin put this in different places.
if ' source ' in request_json [ ' object ' ] and isinstance ( request_json [ ' object ' ] [ ' source ' ] , dict ) and request_json [ ' object ' ] [ ' source ' ] [ ' mediaType ' ] == ' text/markdown ' : # Lemmy
2023-12-30 13:23:12 +13:00
post . body = request_json [ ' object ' ] [ ' source ' ] [ ' content ' ]
post . body_html = markdown_to_html ( post . body )
2024-02-29 11:26:45 +13:00
elif ' content ' in request_json [ ' object ' ] and request_json [ ' object ' ] [ ' content ' ] is not None : # Kbin
2023-12-30 13:23:12 +13:00
post . body_html = allowlist_html ( request_json [ ' object ' ] [ ' content ' ] )
2024-03-27 16:08:25 +13:00
post . body = ' '
2024-03-26 22:46:15 +00:00
if name == " [Microblog] " :
name + = ' ' + microblog_content_to_title ( post . body_html )
if ' [NSFL] ' in name . upper ( ) or ' (NSFL) ' in name . upper ( ) :
post . nsfl = True
post . title = name
2024-03-22 12:22:19 +13:00
# Discard post if it contains certain phrases. Good for stopping spam floods.
blocked_phrases_list = blocked_phrases ( )
for blocked_phrase in blocked_phrases_list :
if blocked_phrase in post . title :
return None
if post . body :
for blocked_phrase in blocked_phrases_list :
if blocked_phrase in post . body :
return None
2023-12-30 13:23:12 +13:00
if ' attachment ' in request_json [ ' object ' ] and len ( request_json [ ' object ' ] [ ' attachment ' ] ) > 0 and \
' type ' in request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] :
if request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' type ' ] == ' Link ' :
2024-03-26 22:46:15 +00:00
post . url = request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' href ' ] # Lemmy
if request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' type ' ] == ' Document ' :
post . url = request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' url ' ] # Mastodon
if post . url :
2023-12-30 13:23:12 +13:00
if is_image_url ( post . url ) :
post . type = POST_TYPE_IMAGE
2024-03-12 09:53:34 +13:00
if ' image ' in request_json [ ' object ' ] and ' url ' in request_json [ ' object ' ] [ ' image ' ] :
image = File ( source_url = request_json [ ' object ' ] [ ' image ' ] [ ' url ' ] )
else :
image = File ( source_url = post . url )
2024-03-04 10:56:17 +13:00
db . session . add ( image )
post . image = image
2024-04-16 20:59:58 +12:00
elif is_video_url ( post . url ) :
post . type = POST_TYPE_VIDEO
image = File ( source_url = post . url )
db . session . add ( image )
post . image = image
2023-12-30 13:23:12 +13:00
else :
post . type = POST_TYPE_LINK
2024-03-08 22:01:46 +13:00
post . url = remove_tracking_from_link ( post . url )
2023-12-30 13:23:12 +13:00
domain = domain_from_url ( post . url )
# notify about links to banned websites.
already_notified = set ( ) # often admins and mods are the same people - avoid notifying them twice
if domain . notify_mods :
for community_member in post . community . moderators ( ) :
notify = Notification ( title = ' Suspicious content ' , url = post . ap_id ,
user_id = community_member . user_id ,
author_id = user . id )
db . session . add ( notify )
already_notified . add ( community_member . user_id )
if domain . notify_admins :
for admin in Site . admins ( ) :
if admin . id not in already_notified :
notify = Notification ( title = ' Suspicious content ' ,
url = post . ap_id , user_id = admin . id ,
author_id = user . id )
db . session . add ( notify )
if not domain . banned :
domain . post_count + = 1
post . domain = domain
2024-03-17 02:22:33 +13:00
else :
post = None
activity_log . exception_message = domain . name + ' is blocked by admin '
2024-04-20 16:34:54 +12:00
2023-12-30 13:23:12 +13:00
if post is not None :
2024-04-20 16:34:54 +12:00
if ' language ' in request_json [ ' object ' ] and isinstance ( request_json [ ' object ' ] [ ' language ' ] , dict ) :
language = find_language_or_create ( request_json [ ' object ' ] [ ' language ' ] [ ' identifier ' ] ,
request_json [ ' object ' ] [ ' language ' ] [ ' name ' ] )
post . language_id = language . id
2024-03-17 02:21:16 +13:00
if ' image ' in request_json [ ' object ' ] and post . image is None :
image = File ( source_url = request_json [ ' object ' ] [ ' image ' ] [ ' url ' ] )
db . session . add ( image )
post . image = image
2023-12-30 13:23:12 +13:00
db . session . add ( post )
2024-01-03 20:14:39 +13:00
post . ranking = post_ranking ( post . score , post . posted_at )
2023-12-30 13:23:12 +13:00
community . post_count + = 1
community . last_active = utcnow ( )
activity_log . result = ' success '
db . session . commit ( )
if post . image_id :
2024-02-19 09:02:12 +13:00
make_image_sizes ( post . image_id , 150 , 512 , ' posts ' ) # the 512 sized image is for masonry view
2024-01-07 12:47:06 +13:00
2024-04-03 07:44:59 +13:00
# Update list of cross posts
2024-04-02 18:01:24 +01:00
if post . url :
other_posts = Post . query . filter ( Post . id != post . id , Post . url == post . url ,
Post . posted_at > post . posted_at - timedelta ( days = 6 ) ) . all ( )
for op in other_posts :
if op . cross_posts is None :
op . cross_posts = [ post . id ]
else :
op . cross_posts . append ( post . id )
if post . cross_posts is None :
post . cross_posts = [ op . id ]
else :
post . cross_posts . append ( op . id )
db . session . commit ( )
2024-04-29 16:03:00 +12:00
if post . community_id not in communities_banned_from ( user . id ) :
notify_about_post ( post )
2024-01-07 12:47:06 +13:00
2024-01-02 16:07:41 +13:00
if user . reputation > 100 :
post . up_votes + = 1
post . score + = 1
2024-01-03 20:14:39 +13:00
post . ranking = post_ranking ( post . score , post . posted_at )
2024-01-02 16:07:41 +13:00
db . session . commit ( )
2023-12-30 13:23:12 +13:00
return post
2024-01-07 12:49:25 +13:00
def notify_about_post ( post : Post ) :
2024-04-22 20:53:03 +12:00
# todo: eventually this function could trigger a lot of DB activity. This function will need to be a celery task.
2024-04-19 20:13:02 +12:00
2024-04-29 16:03:00 +12:00
# Send notifications based on subscriptions
2024-04-19 20:13:02 +12:00
notifications_sent_to = set ( )
2024-04-30 11:33:43 +12:00
send_notifs_to = set ( notification_subscribers ( post . user_id , NOTIF_USER ) +
2024-04-29 16:03:00 +12:00
notification_subscribers ( post . community_id , NOTIF_COMMUNITY ) +
notification_subscribers ( post . community . topic_id , NOTIF_TOPIC ) )
for notify_id in send_notifs_to :
2024-04-22 20:53:03 +12:00
if notify_id != post . user_id and notify_id not in notifications_sent_to :
new_notification = Notification ( title = shorten_string ( post . title , 50 ) , url = f " /post/ { post . id } " ,
user_id = notify_id , author_id = post . user_id )
2024-01-07 12:49:25 +13:00
db . session . add ( new_notification )
2024-04-22 20:53:03 +12:00
user = User . query . get ( notify_id )
2024-01-07 12:49:25 +13:00
user . unread_notifications + = 1
db . session . commit ( )
2024-04-29 16:03:00 +12:00
notifications_sent_to . add ( notify_id )
2024-01-07 12:49:25 +13:00
2024-04-29 21:43:37 +12:00
def notify_about_post_reply ( parent_reply : Union [ PostReply , None ] , new_reply : PostReply ) :
if parent_reply is None : # This happens when a new_reply is a top-level comment, not a comment on a comment
send_notifs_to = notification_subscribers ( new_reply . post . id , NOTIF_POST )
for notify_id in send_notifs_to :
if new_reply . user_id != notify_id :
new_notification = Notification ( title = shorten_string ( _ ( ' Reply to %(post_title)s ' ,
post_title = new_reply . post . title ) , 50 ) ,
url = f " /post/ { new_reply . post . id } #comment_ { new_reply . id } " ,
user_id = notify_id , author_id = new_reply . user_id )
db . session . add ( new_notification )
user = User . query . get ( notify_id )
user . unread_notifications + = 1
db . session . commit ( )
else :
# Send notifications based on subscriptions
send_notifs_to = set ( notification_subscribers ( parent_reply . id , NOTIF_REPLY ) )
for notify_id in send_notifs_to :
if new_reply . user_id != notify_id :
new_notification = Notification ( title = shorten_string ( _ ( ' Reply to comment on %(post_title)s ' ,
post_title = parent_reply . post . title ) , 50 ) ,
url = f " /post/ { parent_reply . post . id } #comment_ { new_reply . id } " ,
user_id = notify_id , author_id = new_reply . user_id )
db . session . add ( new_notification )
user = User . query . get ( notify_id )
user . unread_notifications + = 1
db . session . commit ( )
2023-12-30 13:23:12 +13:00
def update_post_reply_from_activity ( reply : PostReply , request_json : dict ) :
2024-02-29 17:10:38 +13:00
if ' source ' in request_json [ ' object ' ] and \
isinstance ( request_json [ ' object ' ] [ ' source ' ] , dict ) and \
request_json [ ' object ' ] [ ' source ' ] [ ' mediaType ' ] == ' text/markdown ' :
2023-12-30 13:23:12 +13:00
reply . body = request_json [ ' object ' ] [ ' source ' ] [ ' content ' ]
reply . body_html = markdown_to_html ( reply . body )
elif ' content ' in request_json [ ' object ' ] :
reply . body_html = allowlist_html ( request_json [ ' object ' ] [ ' content ' ] )
2024-03-27 16:02:04 +13:00
reply . body = ' '
2023-12-30 13:23:12 +13:00
reply . edited_at = utcnow ( )
db . session . commit ( )
def update_post_from_activity ( post : Post , request_json : dict ) :
2024-04-01 23:44:58 +01:00
if ' name ' not in request_json [ ' object ' ] : # Microblog posts
name = " [Microblog] "
else :
name = request_json [ ' object ' ] [ ' name ' ]
nsfl_in_title = ' [NSFL] ' in name . upper ( ) or ' (NSFL) ' in name . upper ( )
post . title = name
2024-02-29 17:10:38 +13:00
if ' source ' in request_json [ ' object ' ] and \
isinstance ( request_json [ ' object ' ] [ ' source ' ] , dict ) and \
request_json [ ' object ' ] [ ' source ' ] [ ' mediaType ' ] == ' text/markdown ' :
2023-12-30 13:23:12 +13:00
post . body = request_json [ ' object ' ] [ ' source ' ] [ ' content ' ]
post . body_html = markdown_to_html ( post . body )
2024-04-01 23:44:58 +01:00
elif ' content ' in request_json [ ' object ' ] and request_json [ ' object ' ] [ ' content ' ] is not None : # Kbin
2023-12-30 13:23:12 +13:00
post . body_html = allowlist_html ( request_json [ ' object ' ] [ ' content ' ] )
2024-03-27 16:02:04 +13:00
post . body = ' '
2024-04-01 23:44:58 +01:00
if name == " [Microblog] " :
name + = ' ' + microblog_content_to_title ( post . body_html )
nsfl_in_title = ' [NSFL] ' in name . upper ( ) or ' (NSFL) ' in name . upper ( )
post . title = name
2024-04-16 21:49:05 +12:00
# Language
if ' language ' in request_json [ ' object ' ] and isinstance ( request_json [ ' object ' ] [ ' language ' ] , dict ) :
language = find_language_or_create ( request_json [ ' object ' ] [ ' language ' ] [ ' identifier ' ] , request_json [ ' object ' ] [ ' language ' ] [ ' name ' ] )
post . language_id = language . id
# Links
2024-04-01 23:44:58 +01:00
old_url = post . url
old_image_id = post . image_id
post . url = ' '
if ' attachment ' in request_json [ ' object ' ] and len ( request_json [ ' object ' ] [ ' attachment ' ] ) > 0 and \
' type ' in request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] :
if request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' type ' ] == ' Link ' :
post . url = request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' href ' ] # Lemmy
if request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' type ' ] == ' Document ' :
post . url = request_json [ ' object ' ] [ ' attachment ' ] [ 0 ] [ ' url ' ] # Mastodon
if post . url == ' ' :
post . type = POST_TYPE_ARTICLE
if ( post . url and post . url != old_url ) or ( post . url == ' ' and old_url != ' ' ) :
if post . image_id :
old_image = File . query . get ( post . image_id )
post . image_id = None
old_image . delete_from_disk ( )
File . query . filter_by ( id = old_image_id ) . delete ( )
post . image = None
if ( post . url and post . url != old_url ) :
if is_image_url ( post . url ) :
post . type = POST_TYPE_IMAGE
if ' image ' in request_json [ ' object ' ] and ' url ' in request_json [ ' object ' ] [ ' image ' ] :
image = File ( source_url = request_json [ ' object ' ] [ ' image ' ] [ ' url ' ] )
else :
image = File ( source_url = post . url )
db . session . add ( image )
post . image = image
2024-04-16 20:59:58 +12:00
elif is_video_url ( post . url ) :
post . type == POST_TYPE_VIDEO
image = File ( source_url = post . url )
db . session . add ( image )
post . image = image
2024-04-01 23:44:58 +01:00
else :
post . type = POST_TYPE_LINK
post . url = remove_tracking_from_link ( post . url )
domain = domain_from_url ( post . url )
# notify about links to banned websites.
already_notified = set ( ) # often admins and mods are the same people - avoid notifying them twice
if domain . notify_mods :
for community_member in post . community . moderators ( ) :
notify = Notification ( title = ' Suspicious content ' , url = post . ap_id ,
user_id = community_member . user_id ,
2024-04-02 12:38:59 +13:00
author_id = 1 )
2024-04-01 23:44:58 +01:00
db . session . add ( notify )
already_notified . add ( community_member . user_id )
if domain . notify_admins :
for admin in Site . admins ( ) :
if admin . id not in already_notified :
notify = Notification ( title = ' Suspicious content ' ,
url = post . ap_id , user_id = admin . id ,
2024-04-02 12:38:59 +13:00
author_id = 1 )
2024-04-01 23:44:58 +01:00
db . session . add ( notify )
if not domain . banned :
domain . post_count + = 1
post . domain = domain
else :
post . url = old_url # don't change if url changed from non-banned domain to banned domain
2024-04-02 18:01:24 +01:00
2024-04-16 21:49:05 +12:00
# Posts which link to the same url as other posts
2024-04-02 18:01:24 +01:00
new_cross_posts = Post . query . filter ( Post . id != post . id , Post . url == post . url ,
Post . posted_at > utcnow ( ) - timedelta ( days = 6 ) ) . all ( )
for ncp in new_cross_posts :
if ncp . cross_posts is None :
ncp . cross_posts = [ post . id ]
else :
ncp . cross_posts . append ( post . id )
if post . cross_posts is None :
post . cross_posts = [ ncp . id ]
else :
post . cross_posts . append ( ncp . id )
if post . url != old_url :
if post . cross_posts is not None :
old_cross_posts = Post . query . filter ( Post . id . in_ ( post . cross_posts ) ) . all ( )
post . cross_posts . clear ( )
for ocp in old_cross_posts :
2024-04-09 19:16:11 +12:00
if ocp . cross_posts is not None and post . id in ocp . cross_posts :
2024-04-02 18:01:24 +01:00
ocp . cross_posts . remove ( post . id )
2024-04-01 23:44:58 +01:00
if post is not None :
if ' image ' in request_json [ ' object ' ] and post . image is None :
image = File ( source_url = request_json [ ' object ' ] [ ' image ' ] [ ' url ' ] )
db . session . add ( image )
post . image = image
db . session . add ( post )
db . session . commit ( )
if post . image_id and post . image_id != old_image_id :
make_image_sizes ( post . image_id , 150 , 512 , ' posts ' ) # the 512 sized image is for masonry view
2024-03-17 02:55:59 +13:00
if ' sensitive ' in request_json [ ' object ' ] :
post . nsfw = request_json [ ' object ' ] [ ' sensitive ' ]
2024-04-01 10:12:31 +13:00
if nsfl_in_title :
post . nsfl = True
elif ' nsfl ' in request_json [ ' object ' ] :
2024-02-16 06:17:13 +13:00
post . nsfl = request_json [ ' object ' ] [ ' nsfl ' ]
2024-04-01 23:44:58 +01:00
post . comments_enabled = request_json [ ' object ' ] [ ' commentsEnabled ' ] if ' commentsEnabled ' in request_json [ ' object ' ] else True
2023-12-30 13:23:12 +13:00
post . edited_at = utcnow ( )
db . session . commit ( )
def undo_downvote ( activity_log , comment , post , target_ap_id , user ) :
if ' /comment/ ' in target_ap_id :
comment = PostReply . query . filter_by ( ap_id = target_ap_id ) . first ( )
if ' /post/ ' in target_ap_id :
post = Post . query . filter_by ( ap_id = target_ap_id ) . first ( )
if ( user and not user . is_local ( ) ) and post :
existing_vote = PostVote . query . filter_by ( user_id = user . id , post_id = post . id ) . first ( )
if existing_vote :
post . author . reputation - = existing_vote . effect
post . down_votes - = 1
post . score - = existing_vote . effect
db . session . delete ( existing_vote )
activity_log . result = ' success '
if ( user and not user . is_local ( ) ) and comment :
existing_vote = PostReplyVote . query . filter_by ( user_id = user . id ,
post_reply_id = comment . id ) . first ( )
if existing_vote :
comment . author . reputation - = existing_vote . effect
comment . down_votes - = 1
comment . score - = existing_vote . effect
db . session . delete ( existing_vote )
activity_log . result = ' success '
if user is None :
activity_log . exception_message = ' Blocked or unfound user '
if user and user . is_local ( ) :
activity_log . exception_message = ' Activity about local content which is already present '
activity_log . result = ' ignored '
return post
def undo_vote ( activity_log , comment , post , target_ap_id , user ) :
2024-01-05 09:39:20 +13:00
voted_on = find_liked_object ( target_ap_id )
if ( user and not user . is_local ( ) ) and isinstance ( voted_on , Post ) :
post = voted_on
2023-12-30 13:23:12 +13:00
user . last_seen = utcnow ( )
existing_vote = PostVote . query . filter_by ( user_id = user . id , post_id = post . id ) . first ( )
if existing_vote :
post . author . reputation - = existing_vote . effect
if existing_vote . effect < 0 : # Lemmy sends 'like' for upvote and 'dislike' for down votes. Cool! When it undoes an upvote it sends an 'Undo Like'. Fine. When it undoes a downvote it sends an 'Undo Like' - not 'Undo Dislike'?!
post . down_votes - = 1
else :
post . up_votes - = 1
post . score - = existing_vote . effect
db . session . delete ( existing_vote )
activity_log . result = ' success '
2024-01-05 09:39:20 +13:00
if ( user and not user . is_local ( ) ) and isinstance ( voted_on , PostReply ) :
comment = voted_on
2023-12-30 13:23:12 +13:00
existing_vote = PostReplyVote . query . filter_by ( user_id = user . id , post_reply_id = comment . id ) . first ( )
if existing_vote :
comment . author . reputation - = existing_vote . effect
if existing_vote . effect < 0 : # Lemmy sends 'like' for upvote and 'dislike' for down votes. Cool! When it undoes an upvote it sends an 'Undo Like'. Fine. When it undoes a downvote it sends an 'Undo Like' - not 'Undo Dislike'?!
comment . down_votes - = 1
else :
comment . up_votes - = 1
comment . score - = existing_vote . effect
db . session . delete ( existing_vote )
activity_log . result = ' success '
2024-04-17 15:10:04 +01:00
if user is None or ( post is None and comment is None ) :
activity_log . exception_message = ' Blocked or unfound user or comment '
if user and user . is_local ( ) :
activity_log . exception_message = ' Activity about local content which is already present '
activity_log . result = ' ignored '
if post :
return post
if comment :
return comment
return None
2023-12-30 13:23:12 +13:00
2024-04-06 16:29:47 +13:00
def process_report ( user , reported , request_json , activity_log ) :
if len ( request_json [ ' summary ' ] ) < 15 :
reasons = request_json [ ' summary ' ]
description = ' '
else :
reasons = request_json [ ' summary ' ] [ : 15 ]
description = request_json [ ' summary ' ] [ 15 : ]
if isinstance ( reported , User ) :
if reported . reports == - 1 :
return
type = 0
report = Report ( reasons = reasons , description = description ,
type = type , reporter_id = user . id , suspect_user_id = reported . id , source_instance_id = user . instance_id )
db . session . add ( report )
# Notify site admin
already_notified = set ( )
for admin in Site . admins ( ) :
if admin . id not in already_notified :
notify = Notification ( title = ' Reported user ' , url = ' /admin/reports ' , user_id = admin . id ,
author_id = user . id )
db . session . add ( notify )
admin . unread_notifications + = 1
reported . reports + = 1
db . session . commit ( )
elif isinstance ( reported , Post ) :
if reported . reports == - 1 :
return
type = 1
report = Report ( reasons = reasons , description = description , type = type , reporter_id = user . id ,
suspect_user_id = reported . author . id , suspect_post_id = reported . id ,
suspect_community_id = reported . community . id , in_community_id = reported . community . id ,
source_instance_id = user . instance_id )
db . session . add ( report )
already_notified = set ( )
for mod in reported . community . moderators ( ) :
notification = Notification ( user_id = mod . user_id , title = _ ( ' A post has been reported ' ) ,
url = f " https:// { current_app . config [ ' SERVER_NAME ' ] } /post/ { reported . id } " ,
author_id = user . id )
db . session . add ( notification )
already_notified . add ( mod . user_id )
reported . reports + = 1
db . session . commit ( )
elif isinstance ( reported , PostReply ) :
if reported . reports == - 1 :
return
type = 2
post = Post . query . get ( reported . post_id )
report = Report ( reasons = reasons , description = description , type = type , reporter_id = user . id , suspect_post_id = post . id ,
suspect_community_id = post . community . id ,
suspect_user_id = reported . author . id , suspect_post_reply_id = reported . id ,
in_community_id = post . community . id ,
source_instance_id = user . instance_id )
db . session . add ( report )
# Notify moderators
already_notified = set ( )
for mod in post . community . moderators ( ) :
notification = Notification ( user_id = mod . user_id , title = _ ( ' A comment has been reported ' ) ,
url = f " https:// { current_app . config [ ' SERVER_NAME ' ] } /comment/ { reported . id } " ,
author_id = user . id )
db . session . add ( notification )
already_notified . add ( mod . user_id )
reported . reports + = 1
db . session . commit ( )
elif isinstance ( reported , Community ) :
. . .
elif isinstance ( reported , Conversation ) :
. . .
2024-04-04 21:36:03 +13:00
def get_redis_connection ( ) - > redis . Redis :
connection_string = current_app . config [ ' CACHE_REDIS_URL ' ]
if connection_string . startswith ( ' unix:// ' ) :
unix_socket_path , db , password = parse_redis_pipe_string ( connection_string )
return redis . Redis ( unix_socket_path = unix_socket_path , db = db , password = password )
else :
host , port , db , password = parse_redis_socket_string ( connection_string )
return redis . Redis ( host = host , port = port , db = db , password = password )
def parse_redis_pipe_string ( connection_string : str ) :
if connection_string . startswith ( ' unix:// ' ) :
# Parse the connection string
parsed_url = urlparse ( connection_string )
# Extract the path (Unix socket path)
unix_socket_path = parsed_url . path
# Extract query parameters (if any)
query_params = parse_qs ( parsed_url . query )
# Extract database number (default to 0 if not provided)
db = int ( query_params . get ( ' db ' , [ 0 ] ) [ 0 ] )
# Extract password (if provided)
password = query_params . get ( ' password ' , [ None ] ) [ 0 ]
return unix_socket_path , db , password
def parse_redis_socket_string ( connection_string : str ) :
# Parse the connection string
parsed_url = urlparse ( connection_string )
# Extract username (if provided) and password
if parsed_url . username :
username = parsed_url . username
else :
username = None
password = parsed_url . password
# Extract host and port
host = parsed_url . hostname
port = parsed_url . port
# Extract database number (default to 0 if not provided)
db = int ( parsed_url . path . lstrip ( ' / ' ) or 0 )
return host , port , db , password
2023-11-23 15:10:44 +13:00
def lemmy_site_data ( ) :
2023-12-23 11:32:22 +13:00
site = g . site
2023-11-23 15:10:44 +13:00
data = {
" site_view " : {
" site " : {
" id " : 1 ,
2023-12-17 00:12:49 +13:00
" name " : site . name ,
" sidebar " : site . sidebar ,
" published " : site . created_at . isoformat ( ) ,
" updated " : site . updated . isoformat ( ) ,
2024-02-14 14:53:03 +13:00
" icon " : f " https:// { current_app . config [ ' SERVER_NAME ' ] } /static/images/logo2.png " ,
" banner " : " " ,
2023-12-17 00:12:49 +13:00
" description " : site . description ,
" actor_id " : f " https:// { current_app . config [ ' SERVER_NAME ' ] } / " ,
" last_refreshed_at " : site . updated . isoformat ( ) ,
" inbox_url " : f " https:// { current_app . config [ ' SERVER_NAME ' ] } /inbox " ,
" public_key " : site . public_key ,
2023-11-23 15:10:44 +13:00
" instance_id " : 1
} ,
" local_site " : {
" id " : 1 ,
" site_id " : 1 ,
" site_setup " : True ,
2023-12-17 00:12:49 +13:00
" enable_downvotes " : site . enable_downvotes ,
" enable_nsfw " : site . enable_nsfw ,
" enable_nsfl " : site . enable_nsfl ,
" community_creation_admin_only " : site . community_creation_admin_only ,
2023-11-23 15:10:44 +13:00
" require_email_verification " : True ,
2023-12-17 00:12:49 +13:00
" application_question " : site . application_question ,
2023-11-23 15:10:44 +13:00
" private_instance " : False ,
" default_theme " : " browser " ,
" default_post_listing_type " : " All " ,
" hide_modlog_mod_names " : True ,
" application_email_admins " : True ,
" actor_name_max_length " : 20 ,
" federation_enabled " : True ,
" captcha_enabled " : True ,
" captcha_difficulty " : " medium " ,
2023-12-17 00:12:49 +13:00
" published " : site . created_at . isoformat ( ) ,
" updated " : site . updated . isoformat ( ) ,
" registration_mode " : site . registration_mode ,
" reports_email_admins " : site . reports_email_admins
2023-11-23 15:10:44 +13:00
} ,
" local_site_rate_limit " : {
" id " : 1 ,
" local_site_id " : 1 ,
" message " : 999 ,
" message_per_second " : 60 ,
" post " : 50 ,
" post_per_second " : 600 ,
" register " : 20 ,
" register_per_second " : 3600 ,
" image " : 100 ,
" image_per_second " : 3600 ,
" comment " : 100 ,
" comment_per_second " : 600 ,
" search " : 999 ,
" search_per_second " : 600 ,
2023-12-17 00:12:49 +13:00
" published " : site . created_at . isoformat ( ) ,
2023-11-23 15:10:44 +13:00
} ,
" counts " : {
" id " : 1 ,
" site_id " : 1 ,
2024-02-14 14:38:55 +13:00
" users " : users_total ( ) ,
" posts " : local_posts ( ) ,
" comments " : local_comments ( ) ,
" communities " : local_communities ( ) ,
" users_active_day " : active_day ( ) ,
" users_active_week " : active_week ( ) ,
" users_active_month " : active_month ( ) ,
" users_active_half_year " : active_half_year ( )
2023-11-23 15:10:44 +13:00
}
} ,
2024-02-14 14:38:55 +13:00
" admins " : [ ] ,
2023-11-23 15:10:44 +13:00
" version " : " 1.0.0 " ,
2024-04-22 20:10:13 +12:00
" all_languages " : [ ] ,
" discussion_languages " : [ ] ,
2024-02-14 14:38:55 +13:00
" taglines " : [ ] ,
2023-11-23 15:10:44 +13:00
" custom_emojis " : [ ]
}
2024-04-22 20:10:13 +12:00
# Languages
discussion_languages = [ ]
for language in Language . query . all ( ) :
# hardcode English as the site language, for now. This will need to be an admin setting, soon.
if language . code == ' und ' or language . code == ' en ' :
discussion_languages . append ( language . id )
data [ ' all_languages ' ] . append ( {
' id ' : language . id ,
' code ' : language . code ,
' name ' : language . name
} )
data [ ' discussion_languages ' ] = discussion_languages
# Admins
2024-02-14 14:38:55 +13:00
for admin in Site . admins ( ) :
person = {
" id " : admin . id ,
2024-04-18 14:17:27 +12:00
" name " : admin . user_name ,
" display_name " : admin . display_name ( ) ,
2024-02-14 14:53:03 +13:00
" avatar " : ' https:// ' + current_app . config [ ' SERVER_NAME ' ] + admin . avatar_image ( ) ,
2024-02-14 14:38:55 +13:00
" banned " : admin . banned ,
2024-04-18 14:23:01 +12:00
" published " : admin . created . isoformat ( ) + ' Z ' ,
" updated " : admin . created . isoformat ( ) + ' Z ' ,
2024-02-14 14:38:55 +13:00
" actor_id " : admin . profile_id ( ) ,
" local " : True ,
" deleted " : admin . deleted ,
" matrix_user_id " : admin . matrix_user_id ,
" admin " : True ,
" bot_account " : admin . bot ,
" instance_id " : 1
}
counts = {
" id " : admin . id ,
" person_id " : admin . id ,
" post_count " : 0 ,
" post_score " : 0 ,
" comment_count " : 0 ,
" comment_score " : 0
}
data [ ' admins ' ] . append ( { ' person ' : person , ' counts ' : counts } )
2023-11-23 15:10:44 +13:00
return data
2024-04-24 13:44:25 +01:00
def ensure_domains_match ( activity : dict ) - > bool :
if ' id ' in activity :
note_id = activity [ ' id ' ]
else :
note_id = None
if ' actor ' in activity :
note_actor = activity [ ' actor ' ]
elif ' attributedTo ' in activity :
note_actor = activity [ ' attributedTo ' ]
else :
note_actor = None
if note_id and note_actor :
parsed_url = urlparse ( note_id )
id_domain = parsed_url . netloc
parsed_url = urlparse ( note_actor )
actor_domain = parsed_url . netloc
if id_domain == actor_domain :
return True
return False