From b4382764f55dba5eeea4e50124ff1e5d2a6d05e3 Mon Sep 17 00:00:00 2001 From: rimu <3310831+rimu@users.noreply.github.com> Date: Mon, 23 Dec 2024 13:35:24 +1300 Subject: [PATCH] improve speed of detect post vote manipulation detection #343 --- app/utils.py | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/app/utils.py b/app/utils.py index b4377f93..c08c0a22 100644 --- a/app/utils.py +++ b/app/utils.py @@ -1251,10 +1251,16 @@ def get_task_session() -> Session: return Session(bind=db.engine) +user2_cache = {} + + def jaccard_similarity(user1_upvoted: set, user2_id: int): - user2_upvoted_posts = ['post/' + str(id) for id in recently_upvoted_posts(user2_id)] - user2_upvoted_replies = ['reply/' + str(id) for id in recently_upvoted_post_replies(user2_id)] - user2_upvoted = set(user2_upvoted_posts + user2_upvoted_replies) + if user2_id not in user2_cache: + user2_upvoted_posts = ['post/' + str(id) for id in recently_upvoted_posts(user2_id)] + user2_upvoted_replies = ['reply/' + str(id) for id in recently_upvoted_post_replies(user2_id)] + user2_cache[user2_id] = set(user2_upvoted_posts + user2_upvoted_replies) + + user2_upvoted = user2_cache[user2_id] if len(user2_upvoted) > 12: intersection = len(user1_upvoted.intersection(user2_upvoted))