mirror of
https://github.com/django/django.git
synced 2025-10-24 14:16:09 +00:00
Fixed CVE-2024-38875 -- Mitigated potential DoS in urlize and urlizetrunc template filters.
Thank you to Elias Myllymäki for the report. Co-authored-by: Sarah Boyce <42296566+sarahboyce@users.noreply.github.com>
This commit is contained in:
@@ -9,7 +9,7 @@ from urllib.parse import parse_qsl, quote, unquote, urlencode, urlsplit, urlunsp
|
|||||||
|
|
||||||
from django.utils.deprecation import RemovedInDjango60Warning
|
from django.utils.deprecation import RemovedInDjango60Warning
|
||||||
from django.utils.encoding import punycode
|
from django.utils.encoding import punycode
|
||||||
from django.utils.functional import Promise, keep_lazy, keep_lazy_text
|
from django.utils.functional import Promise, cached_property, keep_lazy, keep_lazy_text
|
||||||
from django.utils.http import RFC3986_GENDELIMS, RFC3986_SUBDELIMS
|
from django.utils.http import RFC3986_GENDELIMS, RFC3986_SUBDELIMS
|
||||||
from django.utils.regex_helper import _lazy_re_compile
|
from django.utils.regex_helper import _lazy_re_compile
|
||||||
from django.utils.safestring import SafeData, SafeString, mark_safe
|
from django.utils.safestring import SafeData, SafeString, mark_safe
|
||||||
@@ -257,6 +257,16 @@ def smart_urlquote(url):
|
|||||||
return urlunsplit((scheme, netloc, path, query, fragment))
|
return urlunsplit((scheme, netloc, path, query, fragment))
|
||||||
|
|
||||||
|
|
||||||
|
class CountsDict(dict):
    """
    Dictionary that lazily counts occurrences of a substring in ``word``.

    Looking up a key that is not stored yet calls ``word.count(key)``, stores
    the result under that key, and returns it. Later lookups, and any explicit
    assignments to the key, use the stored value without rescanning ``word``.
    """

    def __init__(self, *args, word, **kwargs):
        """
        Initialize the mapping like ``dict`` and remember ``word``.

        ``*args`` and ``**kwargs`` are forwarded to ``dict``; ``word`` is a
        required keyword-only argument holding the string to count in.
        """
        # Forward keyword arguments as keywords. Unpacking them with a single
        # ``*`` would pass only their names as extra positional arguments,
        # which dict() rejects.
        super().__init__(*args, **kwargs)
        self.word = word

    def __missing__(self, key):
        """Count ``key`` in ``word`` on first access and store the result."""
        self[key] = self.word.count(key)
        return self[key]
|
||||||
|
|
||||||
|
|
||||||
class Urlizer:
|
class Urlizer:
|
||||||
"""
|
"""
|
||||||
Convert any URLs in text into clickable links.
|
Convert any URLs in text into clickable links.
|
||||||
@@ -362,40 +372,72 @@ class Urlizer:
|
|||||||
return x
|
return x
|
||||||
return "%s…" % x[: max(0, limit - 1)]
|
return "%s…" % x[: max(0, limit - 1)]
|
||||||
|
|
||||||
|
@cached_property
|
||||||
|
def wrapping_punctuation_openings(self):
|
||||||
|
return "".join(dict(self.wrapping_punctuation).keys())
|
||||||
|
|
||||||
|
@cached_property
|
||||||
|
def trailing_punctuation_chars_no_semicolon(self):
|
||||||
|
return self.trailing_punctuation_chars.replace(";", "")
|
||||||
|
|
||||||
|
@cached_property
|
||||||
|
def trailing_punctuation_chars_has_semicolon(self):
|
||||||
|
return ";" in self.trailing_punctuation_chars
|
||||||
|
|
||||||
def trim_punctuation(self, word):
|
def trim_punctuation(self, word):
|
||||||
"""
|
"""
|
||||||
Trim trailing and wrapping punctuation from `word`. Return the items of
|
Trim trailing and wrapping punctuation from `word`. Return the items of
|
||||||
the new state.
|
the new state.
|
||||||
"""
|
"""
|
||||||
lead, middle, trail = "", word, ""
|
# Strip all opening wrapping punctuation.
|
||||||
|
middle = word.lstrip(self.wrapping_punctuation_openings)
|
||||||
|
lead = word[: len(word) - len(middle)]
|
||||||
|
trail = ""
|
||||||
|
|
||||||
# Continue trimming until middle remains unchanged.
|
# Continue trimming until middle remains unchanged.
|
||||||
trimmed_something = True
|
trimmed_something = True
|
||||||
while trimmed_something:
|
counts = CountsDict(word=middle)
|
||||||
|
while trimmed_something and middle:
|
||||||
trimmed_something = False
|
trimmed_something = False
|
||||||
# Trim wrapping punctuation.
|
# Trim wrapping punctuation.
|
||||||
for opening, closing in self.wrapping_punctuation:
|
for opening, closing in self.wrapping_punctuation:
|
||||||
if middle.startswith(opening):
|
if counts[opening] < counts[closing]:
|
||||||
middle = middle.removeprefix(opening)
|
rstripped = middle.rstrip(closing)
|
||||||
lead += opening
|
if rstripped != middle:
|
||||||
trimmed_something = True
|
strip = counts[closing] - counts[opening]
|
||||||
# Keep parentheses at the end only if they're balanced.
|
trail = middle[-strip:]
|
||||||
if (
|
middle = middle[:-strip]
|
||||||
middle.endswith(closing)
|
trimmed_something = True
|
||||||
and middle.count(closing) == middle.count(opening) + 1
|
counts[closing] -= strip
|
||||||
):
|
|
||||||
middle = middle.removesuffix(closing)
|
rstripped = middle.rstrip(self.trailing_punctuation_chars_no_semicolon)
|
||||||
trail = closing + trail
|
if rstripped != middle:
|
||||||
trimmed_something = True
|
trail = middle[len(rstripped) :] + trail
|
||||||
# Trim trailing punctuation (after trimming wrapping punctuation,
|
middle = rstripped
|
||||||
# as encoded entities contain ';'). Unescape entities to avoid
|
|
||||||
# breaking them by removing ';'.
|
|
||||||
middle_unescaped = html.unescape(middle)
|
|
||||||
stripped = middle_unescaped.rstrip(self.trailing_punctuation_chars)
|
|
||||||
if middle_unescaped != stripped:
|
|
||||||
punctuation_count = len(middle_unescaped) - len(stripped)
|
|
||||||
trail = middle[-punctuation_count:] + trail
|
|
||||||
middle = middle[:-punctuation_count]
|
|
||||||
trimmed_something = True
|
trimmed_something = True
|
||||||
|
|
||||||
|
if self.trailing_punctuation_chars_has_semicolon and middle.endswith(";"):
|
||||||
|
# Only strip if not part of an HTML entity.
|
||||||
|
amp = middle.rfind("&")
|
||||||
|
if amp == -1:
|
||||||
|
can_strip = True
|
||||||
|
else:
|
||||||
|
potential_entity = middle[amp:]
|
||||||
|
escaped = html.unescape(potential_entity)
|
||||||
|
can_strip = (escaped == potential_entity) or escaped.endswith(";")
|
||||||
|
|
||||||
|
if can_strip:
|
||||||
|
rstripped = middle.rstrip(";")
|
||||||
|
amount_stripped = len(middle) - len(rstripped)
|
||||||
|
if amp > -1 and amount_stripped > 1:
|
||||||
|
# Leave a trailing semicolon as might be an entity.
|
||||||
|
trail = middle[len(rstripped) + 1 :] + trail
|
||||||
|
middle = rstripped + ";"
|
||||||
|
else:
|
||||||
|
trail = middle[len(rstripped) :] + trail
|
||||||
|
middle = rstripped
|
||||||
|
trimmed_something = True
|
||||||
|
|
||||||
return lead, middle, trail
|
return lead, middle, trail
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
|
@@ -7,3 +7,9 @@ Django 4.2.14 release notes
|
|||||||
Django 4.2.14 fixes two security issues with severity "moderate" and two
|
Django 4.2.14 fixes two security issues with severity "moderate" and two
|
||||||
security issues with severity "low" in 4.2.13.
|
security issues with severity "low" in 4.2.13.
|
||||||
|
|
||||||
|
CVE-2024-38875: Potential denial-of-service vulnerability in ``django.utils.html.urlize()``
|
||||||
|
===========================================================================================
|
||||||
|
|
||||||
|
:tfilter:`urlize` and :tfilter:`urlizetrunc` were subject to a potential
|
||||||
|
denial-of-service attack via certain inputs with a very large number of
|
||||||
|
brackets.
|
||||||
|
@@ -7,6 +7,13 @@ Django 5.0.7 release notes
|
|||||||
Django 5.0.7 fixes two security issues with severity "moderate", two security
|
Django 5.0.7 fixes two security issues with severity "moderate", two security
|
||||||
issues with severity "low", and several bugs in 5.0.6.
|
issues with severity "low", and several bugs in 5.0.6.
|
||||||
|
|
||||||
|
CVE-2024-38875: Potential denial-of-service vulnerability in ``django.utils.html.urlize()``
|
||||||
|
===========================================================================================
|
||||||
|
|
||||||
|
:tfilter:`urlize` and :tfilter:`urlizetrunc` were subject to a potential
|
||||||
|
denial-of-service attack via certain inputs with a very large number of
|
||||||
|
brackets.
|
||||||
|
|
||||||
Bugfixes
|
Bugfixes
|
||||||
========
|
========
|
||||||
|
|
||||||
|
@@ -352,6 +352,13 @@ class TestUtilsHtml(SimpleTestCase):
|
|||||||
"foo@.example.com",
|
"foo@.example.com",
|
||||||
"foo@localhost",
|
"foo@localhost",
|
||||||
"foo@localhost.",
|
"foo@localhost.",
|
||||||
|
# trim_punctuation catastrophic tests
|
||||||
|
"(" * 100_000 + ":" + ")" * 100_000,
|
||||||
|
"(" * 100_000 + "&:" + ")" * 100_000,
|
||||||
|
"([" * 100_000 + ":" + "])" * 100_000,
|
||||||
|
"[(" * 100_000 + ":" + ")]" * 100_000,
|
||||||
|
"([[" * 100_000 + ":" + "]])" * 100_000,
|
||||||
|
"&:" + ";" * 100_000,
|
||||||
)
|
)
|
||||||
for value in tests:
|
for value in tests:
|
||||||
with self.subTest(value=value):
|
with self.subTest(value=value):
|
||||||
|
Reference in New Issue
Block a user