Simplify regex for raw URLs in text

2025-01-23 19:36:56 -08:00 · 2024-06-17 16:54:27 +01:00 · 2024-06-17 16:54:27 +01:00 · 8137c6b4b1
commit 8137c6b4b1
parent 4f3a8b1d74
1 changed files with 1 additions and 1 deletions
--- a/app/utils.py
+++ b/app/utils.py
@ -188,7 +188,7 @@ def allowlist_html(html: str) -> str:
    soup = BeautifulSoup(html, 'html.parser')

    # Find all plain text links, convert to <a> tags
-    re_url = re.compile(r'(http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]|[!*\(\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')
+    re_url = re.compile(r'(http[s]?://[!-~]+)')   # http(s):// followed by chars in ASCII range 33 to 126
    for tag in soup.find_all(text=True):
        tags = []
        url = False