django/tests/utils_tests/test_encoding.py

import datetime
import inspect
import sys
import unittest
from pathlib import Path
from unittest import mock
from urllib.parse import quote, quote_plus

from django.test import SimpleTestCase
from django.utils.encoding import (
    DjangoUnicodeDecodeError,
    escape_uri_path,
    filepath_to_uri,
    force_bytes,
    force_str,
    get_system_encoding,
    iri_to_uri,
    repercent_broken_unicode,
    smart_bytes,
    smart_str,
    uri_to_iri,
)
from django.utils.functional import SimpleLazyObject
from django.utils.translation import gettext_lazy


class TestEncodingUtils(SimpleTestCase):
    """
    Exercise the force_*/smart_* conversion helpers, get_system_encoding()
    and repercent_broken_unicode() from django.utils.encoding.
    """

    def test_force_str_exception(self):
        """
        A __str__ that hands back bytes makes force_str() raise.
        """

        class BytesReturningStr:
            def __str__(self):
                return b"\xc3\xb6\xc3\xa4\xc3\xbc"

        broken = BytesReturningStr()
        # str() rejects a non-text __str__ result with a TypeError.
        with self.assertRaises(TypeError):
            force_str(broken)

    def test_force_str_lazy(self):
        """force_str() on a SimpleLazyObject yields a plain str instance."""
        lazy_value = SimpleLazyObject(lambda: "x")
        forced = force_str(lazy_value)
        self.assertIs(type(forced), str)

    def test_force_str_DjangoUnicodeDecodeError(self):
        """Undecodable bytes raise DjangoUnicodeDecodeError with this message."""
        expected_message = (
            "'utf-8' codec can't decode byte 0xff in position 0: "
            "invalid start byte. "
            "You passed in b'\\xff' (<class 'bytes'>)"
        )
        with self.assertRaisesMessage(DjangoUnicodeDecodeError, expected_message):
            force_str(b"\xff")

    def test_force_bytes_exception(self):
        """
        An exception whose args hold non-ASCII text can be turned into bytes
        by force_bytes(), with and without an explicit encoding.
        """
        text = "This is an exception, voilà"
        error = ValueError(text)
        self.assertEqual(force_bytes(error), text.encode())

        # With errors="ignore" the non-ASCII character is simply dropped.
        ascii_only = force_bytes(error, encoding="ascii", errors="ignore")
        self.assertEqual(ascii_only, b"This is an exception, voil")

    def test_force_bytes_strings_only(self):
        """With strings_only=True a date is returned as-is."""
        current_date = datetime.date.today()
        untouched = force_bytes(current_date, strings_only=True)
        self.assertEqual(untouched, current_date)

    def test_force_bytes_encoding(self):
        """Bytes input is re-encoded to the requested target encoding."""
        utf8_payload = "This is an exception, voilà".encode()
        self.assertEqual(
            force_bytes(utf8_payload, encoding="ascii", errors="ignore"),
            b"This is an exception, voil",
        )

    def test_force_bytes_memory_view(self):
        """A memoryview is converted to a real bytes object."""
        raw = b"abc"
        converted = force_bytes(memoryview(raw))
        # memoryview(bytes) == bytes, so equality alone would not prove the
        # conversion happened; the exact type has to be checked as well.
        self.assertIs(type(converted), bytes)
        self.assertEqual(converted, raw)

    def test_smart_bytes(self):
        """smart_bytes() leaves lazy objects alone and encodes everything else."""

        class NonAsciiStr:
            def __str__(self):
                return "ŠĐĆŽćžšđ"

        lazy_text = gettext_lazy("x")
        # The very same lazy object comes back.
        self.assertIs(smart_bytes(lazy_text), lazy_text)

        expectations = (
            (
                NonAsciiStr(),
                b"\xc5\xa0\xc4\x90\xc4\x86\xc5\xbd\xc4\x87\xc5\xbe\xc5\xa1\xc4\x91",
            ),
            (1, b"1"),
            ("foo", b"foo"),
        )
        for value, encoded in expectations:
            self.assertEqual(smart_bytes(value), encoded)

    def test_smart_str(self):
        """smart_str() leaves lazy objects alone and stringifies everything else."""

        class NonAsciiStr:
            def __str__(self):
                return "ŠĐĆŽćžšđ"

        lazy_text = gettext_lazy("x")
        # The very same lazy object comes back.
        self.assertIs(smart_str(lazy_text), lazy_text)

        expectations = (
            (NonAsciiStr(), "\u0160\u0110\u0106\u017d\u0107\u017e\u0161\u0111"),
            (1, "1"),
            ("foo", "foo"),
        )
        for value, text in expectations:
            self.assertEqual(smart_str(value), text)

    def test_get_default_encoding(self):
        """get_system_encoding() answers "ascii" when locale.getlocale() fails."""
        failing_getlocale = mock.patch("locale.getlocale", side_effect=Exception)
        with failing_getlocale:
            self.assertEqual(get_system_encoding(), "ascii")

    def test_repercent_broken_unicode_recursion_error(self):
        """repercent_broken_unicode() copes with very many broken bytes."""
        # One broken byte per allowed stack level: a recursive implementation
        # would run out of stack on this input.
        limit = sys.getrecursionlimit()
        broken_bytes = b"\xfc" * limit
        try:
            self.assertEqual(repercent_broken_unicode(broken_bytes), b"%FC" * limit)
        except RecursionError:
            self.fail("Unexpected RecursionError raised.")

    def test_repercent_broken_unicode_small_fragments(self):
        """Each quote() call sees a shorter remaining ``path`` than the last."""
        payload = b"test\xfctest\xfctest\xfc"
        seen_paths = []

        def recording_quote(*args, **kwargs):
            # f_back is the frame that called quote(), i.e. the running
            # repercent_broken_unicode(); record its local ``path``.
            caller_frame = inspect.currentframe().f_back
            seen_paths.append(caller_frame.f_locals["path"])
            return quote(*args, **kwargs)

        with mock.patch("django.utils.encoding.quote", recording_quote):
            repaired = repercent_broken_unicode(payload)
            self.assertEqual(repaired, b"test%FCtest%FCtest%FC")

        # decode() is attempted on a smaller fragment of the path each time.
        expected_paths = [
            b"test\xfctest\xfctest\xfc",
            b"test\xfctest\xfc",
            b"test\xfc",
        ]
        self.assertEqual(seen_paths, expected_paths)


class TestRFC3987IEncodingUtils(unittest.TestCase):
    """
    Exercise filepath_to_uri(), iri_to_uri(), uri_to_iri() and
    escape_uri_path() from django.utils.encoding.
    """

    def test_filepath_to_uri(self):
        """None, str paths and pathlib.Path objects are all accepted."""
        self.assertIsNone(filepath_to_uri(None))

        cyrillic_uri = filepath_to_uri("upload\\чубака.mp4")
        self.assertEqual(
            cyrillic_uri,
            "upload/%D1%87%D1%83%D0%B1%D0%B0%D0%BA%D0%B0.mp4",
        )

        forward_slash_path = Path("upload/test.png")
        self.assertEqual(filepath_to_uri(forward_slash_path), "upload/test.png")

        backslash_path = Path("upload\\test.png")
        self.assertEqual(filepath_to_uri(backslash_path), "upload/test.png")

    def test_iri_to_uri(self):
        """iri_to_uri() percent-encodes non-ASCII text and is idempotent."""
        quoted_location = "locations/%s" % quote_plus("Paris & Orléans")
        pairs = [
            # Valid UTF-8 sequences are encoded.
            ("red%09rosé#red", "red%09ros%C3%A9#red"),
            ("/blog/for/Jürgen Münster/", "/blog/for/J%C3%BCrgen%20M%C3%BCnster/"),
            (quoted_location, "locations/Paris+%26+Orl%C3%A9ans"),
            # Reserved chars remain unescaped.
            ("%&", "%&"),
            ("red&♥ros%#red", "red&%E2%99%A5ros%#red"),
            (gettext_lazy("red&♥ros%#red"), "red&%E2%99%A5ros%#red"),
        ]

        for source, expected in pairs:
            with self.subTest(source):
                converted_once = iri_to_uri(source)
                self.assertEqual(converted_once, expected)

                # Converting the result again must not change it.
                converted_twice = iri_to_uri(iri_to_uri(source))
                self.assertEqual(converted_twice, expected)

    def test_uri_to_iri(self):
        """uri_to_iri() decodes valid UTF-8 escapes only and is idempotent."""
        pairs = [
            (None, None),
            # Valid UTF-8 sequences are decoded.
            ("/%e2%89%Ab%E2%99%a5%E2%89%aB/", "/≫♥≫/"),
            ("/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93", "/♥♥/?utf8=✓"),
            ("/%41%5a%6B/", "/AZk/"),
            # Reserved and non-URL valid ASCII chars are not decoded.
            ("/%25%20%02%41%7b/", "/%25%20%02A%7b/"),
            # Broken UTF-8 sequences remain escaped.
            ("/%AAd%AAj%AAa%AAn%AAg%AAo%AA/", "/%AAd%AAj%AAa%AAn%AAg%AAo%AA/"),
            ("/%E2%99%A5%E2%E2%99%A5/", "/♥%E2♥/"),
            ("/%E2%99%A5%E2%99%E2%99%A5/", "/♥%E2%99♥/"),
            ("/%E2%E2%99%A5%E2%99%A5%99/", "/%E2♥♥%99/"),
            (
                "/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93",
                "/♥♥/?utf8=%9C%93✓%9C%93",
            ),
        ]

        for source, expected in pairs:
            with self.subTest(source):
                converted_once = uri_to_iri(source)
                self.assertEqual(converted_once, expected)

                # Converting the result again must not change it.
                converted_twice = uri_to_iri(uri_to_iri(source))
                self.assertEqual(converted_twice, expected)

    def test_complementarity(self):
        """iri_to_uri() and uri_to_iri() undo each other on these pairs."""
        pairs = [
            (
                "/blog/for/J%C3%BCrgen%20M%C3%BCnster/",
                "/blog/for/J\xfcrgen%20M\xfcnster/",
            ),
            ("%&", "%&"),
            ("red&%E2%99%A5ros%#red", "red&♥ros%#red"),
            ("/%E2%99%A5%E2%99%A5/", "/♥♥/"),
            ("/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93", "/♥♥/?utf8=✓"),
            ("/%25%20%02%7b/", "/%25%20%02%7b/"),
            ("/%AAd%AAj%AAa%AAn%AAg%AAo%AA/", "/%AAd%AAj%AAa%AAn%AAg%AAo%AA/"),
            ("/%E2%99%A5%E2%E2%99%A5/", "/♥%E2♥/"),
            ("/%E2%99%A5%E2%99%E2%99%A5/", "/♥%E2%99♥/"),
            ("/%E2%E2%99%A5%E2%99%A5%99/", "/%E2♥♥%99/"),
            (
                "/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93",
                "/♥♥/?utf8=%9C%93✓%9C%93",
            ),
        ]

        for uri_form, iri_form in pairs:
            with self.subTest(uri_form):
                # URI -> IRI -> URI round trip.
                uri_round_trip = iri_to_uri(uri_to_iri(uri_form))
                self.assertEqual(uri_round_trip, uri_form)
                # IRI -> URI -> IRI round trip.
                iri_round_trip = uri_to_iri(iri_to_uri(iri_form))
                self.assertEqual(iri_round_trip, iri_form)

    def test_escape_uri_path(self):
        """escape_uri_path() escapes ";", "=", "?" and "#" as listed below."""
        pairs = [
            (
                "/;some/=awful/?path/:with/@lots/&of/+awful/chars",
                "/%3Bsome/%3Dawful/%3Fpath/:with/@lots/&of/+awful/chars",
            ),
            ("/foo#bar", "/foo%23bar"),
            ("/foo?bar", "/foo%3Fbar"),
        ]
        for raw_path, escaped_path in pairs:
            with self.subTest(raw_path):
                self.assertEqual(escape_uri_path(raw_path), escaped_path)
Fixed #18719 -- Made force_bytes more consistent with force_text. 2013-09-06 15:28:28 +00:00			`import datetime`
[4.2.x] Fixed CVE-2023-41164 -- Fixed potential DoS in django.utils.encoding.uri_to_iri(). Thanks MProgrammer (https://hackerone.com/mprogrammer) for the report. Co-authored-by: nessita <124304+nessita@users.noreply.github.com> 2023-08-22 06:53:03 +00:00			`import inspect`
Fixed CVE-2019-14235 -- Fixed potential memory exhaustion in django.utils.encoding.uri_to_iri(). Thanks to Guido Vranken for initial report. 2019-07-19 15:04:53 +00:00			`import sys`
Sorted imports with isort; refs #23860. 2015-01-28 12:35:27 +00:00			`import unittest`
Refs #28428 -- Made filepath_to_uri() support pathlib.Path. 2019-10-29 20:15:18 +00:00			`from pathlib import Path`
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`from unittest import mock`
[4.2.x] Fixed CVE-2023-41164 -- Fixed potential DoS in django.utils.encoding.uri_to_iri(). Thanks MProgrammer (https://hackerone.com/mprogrammer) for the report. Co-authored-by: nessita <124304+nessita@users.noreply.github.com> 2023-08-22 06:53:03 +00:00			`from urllib.parse import quote, quote_plus`
Stopped using django.utils.unittest in the test suite. Refs #20680. 2013-07-01 12:22:27 +00:00
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-01 20:48:53 +00:00			`from django.test import SimpleTestCase`
Fixed #18456 -- Added path escaping to HttpRequest.get_full_path(). 2014-10-31 15:43:34 +00:00			`from django.utils.encoding import (`
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-01 20:48:53 +00:00			`DjangoUnicodeDecodeError,`
			`escape_uri_path,`
			`filepath_to_uri,`
			`force_bytes,`
Fixed CVE-2019-14235 -- Fixed potential memory exhaustion in django.utils.encoding.uri_to_iri(). Thanks to Guido Vranken for initial report. 2019-07-19 15:04:53 +00:00			`force_str,`
			`get_system_encoding,`
			`iri_to_uri,`
			`repercent_broken_unicode,`
			`smart_bytes,`
			`smart_str,`
			`uri_to_iri,`
Fixed #18456 -- Added path escaping to HttpRequest.get_full_path(). 2014-10-31 15:43:34 +00:00			`)`
Fixed #24836 -- Made force_text() resolve lazy objects. 2015-05-26 20:46:13 +00:00			`from django.utils.functional import SimpleLazyObject`
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`from django.utils.translation import gettext_lazy`
Fixed #18902 -- Made force_bytes properly handle exception input Thanks Aymeric Augustin for the report and the initial patch. 2012-09-04 07:24:39 +00:00

Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-01 20:48:53 +00:00			`class TestEncodingUtils(SimpleTestCase):`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`def test_force_str_exception(self):`
Fixed #20812 -- Error out if __unicode__/__str__ doesn't return a text type. 2013-09-06 17:16:06 +00:00			`"""`
Refs #23919 -- Removed unneeded str() calls 2017-01-20 09:20:53 +00:00			`Broken __str__ actually raises an error.`
Fixed #20812 -- Error out if __unicode__/__str__ doesn't return a text type. 2013-09-06 17:16:06 +00:00			`"""`
Refs #33476 -- Reformatted code with Black. 2022-02-03 19:24:19 +00:00
Refs #23919 -- Stopped inheriting from object to define new style classes. 2017-01-19 07:39:46 +00:00			`class MyString:`
Fixed #20812 -- Error out if __unicode__/__str__ doesn't return a text type. 2013-09-06 17:16:06 +00:00			`def __str__(self):`
			`return b"\xc3\xb6\xc3\xa4\xc3\xbc"`

Refs #23919 -- Removed six.PY2/PY3 usage Thanks Tim Graham for the review. 2016-12-01 10:38:01 +00:00			`# str(s) raises a TypeError if the result is not a text type.`
			`with self.assertRaises(TypeError):`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`force_str(MyString())`
Fixed #18719 -- Made force_bytes more consistent with force_text. 2013-09-06 15:28:28 +00:00
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`def test_force_str_lazy(self):`
Fixed #24836 -- Made force_text() resolve lazy objects. 2015-05-26 20:46:13 +00:00			`s = SimpleLazyObject(lambda: "x")`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`self.assertIs(type(force_str(s)), str)`
Fixed #24836 -- Made force_text() resolve lazy objects. 2015-05-26 20:46:13 +00:00
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`def test_force_str_DjangoUnicodeDecodeError(self):`
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-01 20:48:53 +00:00			`msg = (`
			`"'utf-8' codec can't decode byte 0xff in position 0: invalid "`
			`"start byte. You passed in b'\\xff' (<class 'bytes'>)"`
			`)`
			`with self.assertRaisesMessage(DjangoUnicodeDecodeError, msg):`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`force_str(b"\xff")`
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-01 20:48:53 +00:00
Fixed #18902 -- Made force_bytes properly handle exception input Thanks Aymeric Augustin for the report and the initial patch. 2012-09-04 07:24:39 +00:00			`def test_force_bytes_exception(self):`
			`"""`
Refs #27392 -- Removed "Tests that", "Ensures that", etc. from test docstrings. 2016-10-27 07:53:39 +00:00			`force_bytes knows how to convert to bytes an exception`
Fixed #18902 -- Made force_bytes properly handle exception input Thanks Aymeric Augustin for the report and the initial patch. 2012-09-04 07:24:39 +00:00			`containing non-ASCII characters in its args.`
			`"""`
			`error_msg = "This is an exception, voilà"`
			`exc = ValueError(error_msg)`
Refs #23919 -- Removed default 'utf-8' argument for str.encode()/decode(). 2017-02-07 17:05:47 +00:00			`self.assertEqual(force_bytes(exc), error_msg.encode())`
Removed an untested and broken branch in force_bytes() (refs #6353). The new test crashed in the removed branch. It's unclear if the branch has value since c6a2bd9b962af1cdf46f964589e6023046cfa8ec didn't include tests. 2017-02-04 00:36:53 +00:00			`self.assertEqual(`
			`force_bytes(exc, encoding="ascii", errors="ignore"),`
			`b"This is an exception, voil",`
			`)`
Fixed #20108 -- Fixed filepath_to_uri decoding error This was a regression due to unicode_literals usage. Thanks Ivan Virabyan for the report and the initial patch. 2013-03-22 16:55:12 +00:00
Fixed #18719 -- Made force_bytes more consistent with force_text. 2013-09-06 15:28:28 +00:00			`def test_force_bytes_strings_only(self):`
			`today = datetime.date.today()`
			`self.assertEqual(force_bytes(today, strings_only=True), today)`

Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`def test_force_bytes_encoding(self):`
			`error_msg = "This is an exception, voilà".encode()`
			`result = force_bytes(error_msg, encoding="ascii", errors="ignore")`
			`self.assertEqual(result, b"This is an exception, voil")`

			`def test_force_bytes_memory_view(self):`
Made test for memoryview handling in force_bytes() more strict. 2018-07-09 15:01:42 +00:00			`data = b"abc"`
			`result = force_bytes(memoryview(data))`
			`# Type check is needed because memoryview(bytes) == bytes.`
			`self.assertIs(type(result), bytes)`
			`self.assertEqual(result, data)`
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00
			`def test_smart_bytes(self):`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 15:45:54 +00:00			`class Test:`
Refs #23919 -- Removed six.PY2/PY3 usage Thanks Tim Graham for the review. 2016-12-01 10:38:01 +00:00			`def __str__(self):`
			`return "ŠĐĆŽćžšđ"`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 15:45:54 +00:00
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`lazy_func = gettext_lazy("x")`
			`self.assertIs(smart_bytes(lazy_func), lazy_func)`
			`self.assertEqual(`
			`smart_bytes(Test()),`
			`b"\xc5\xa0\xc4\x90\xc4\x86\xc5\xbd\xc4\x87\xc5\xbe\xc5\xa1\xc4\x91",`
			`)`
			`self.assertEqual(smart_bytes(1), b"1")`
			`self.assertEqual(smart_bytes("foo"), b"foo")`

Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`def test_smart_str(self):`
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`class Test:`
Refs #23919 -- Removed six.PY2/PY3 usage Thanks Tim Graham for the review. 2016-12-01 10:38:01 +00:00			`def __str__(self):`
			`return "ŠĐĆŽćžšđ"`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 15:45:54 +00:00
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`lazy_func = gettext_lazy("x")`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 09:08:08 +00:00			`self.assertIs(smart_str(lazy_func), lazy_func)`
			`self.assertEqual(`
			`smart_str(Test()), "\u0160\u0110\u0106\u017d\u0107\u017e\u0161\u0111"`
			`)`
			`self.assertEqual(smart_str(1), "1")`
			`self.assertEqual(smart_str("foo"), "foo")`
Fixed #18456 -- Added path escaping to HttpRequest.get_full_path(). 2014-10-31 15:43:34 +00:00
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`def test_get_default_encoding(self):`
Refs #33173 -- Used locale.getlocale() instead of getdefaultlocale(). locale.getdefaultlocale() was deprecated in Python 3.11, see https://bugs.python.org/issue46659. 2022-03-08 12:17:05 +00:00			`with mock.patch("locale.getlocale", side_effect=Exception):`
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`self.assertEqual(get_system_encoding(), "ascii")`

Fixed CVE-2019-14235 -- Fixed potential memory exhaustion in django.utils.encoding.uri_to_iri(). Thanks to Guido Vranken for initial report. 2019-07-19 15:04:53 +00:00			`def test_repercent_broken_unicode_recursion_error(self):`
			`# Prepare a string long enough to force a recursion error if the tested`
			`# function uses recursion.`
			`data = b"\xfc" * sys.getrecursionlimit()`
			`try:`
			`self.assertEqual(`
			`repercent_broken_unicode(data), b"%FC" * sys.getrecursionlimit()`
Refs #33476 -- Reformatted code with Black. 2022-02-03 19:24:19 +00:00			`)`
Fixed CVE-2019-14235 -- Fixed potential memory exhaustion in django.utils.encoding.uri_to_iri(). Thanks to Guido Vranken for initial report. 2019-07-19 15:04:53 +00:00			`except RecursionError:`
			`self.fail("Unexpected RecursionError raised.")`

[4.2.x] Fixed CVE-2023-41164 -- Fixed potential DoS in django.utils.encoding.uri_to_iri(). Thanks MProgrammer (https://hackerone.com/mprogrammer) for the report. Co-authored-by: nessita <124304+nessita@users.noreply.github.com> 2023-08-22 06:53:03 +00:00			`def test_repercent_broken_unicode_small_fragments(self):`
			`data = b"test\xfctest\xfctest\xfc"`
			`decoded_paths = []`

			`def mock_quote(*args, **kwargs):`
			`# The second frame is the call to repercent_broken_unicode().`
			`decoded_paths.append(inspect.currentframe().f_back.f_locals["path"])`
			`return quote(*args, **kwargs)`

			`with mock.patch("django.utils.encoding.quote", mock_quote):`
			`self.assertEqual(repercent_broken_unicode(data), b"test%FCtest%FCtest%FC")`

			`# decode() is called on smaller fragment of the path each time.`
			`self.assertEqual(`
			`decoded_paths,`
			`[b"test\xfctest\xfctest\xfc", b"test\xfctest\xfc", b"test\xfc"],`
			`)`

Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00
			`class TestRFC3987IEncodingUtils(unittest.TestCase):`
Fixed #20108 -- Fixed filepath_to_uri decoding error This was a regression due to unicode_literals usage. Thanks Ivan Virabyan for the report and the initial patch. 2013-03-22 16:55:12 +00:00			`def test_filepath_to_uri(self):`
Used more specific unittest assertions in tests. * assertIsNone()/assertIsNotNone() instead of comparing to None. * assertLess() for < comparisons. * assertIs() for 'is' expressions. * assertIsInstance() for isinstance() expressions. * rounding of assertAlmostEqual() for round() expressions. * assertIs(..., True/False) instead of comparing to True/False. * assertIs()/assertIsNot() for ==/!= comparisons. * assertNotEqual() for == comparisons. * assertTrue()/assertFalse() instead of comparing to True/False. 2019-10-21 08:55:05 +00:00			`self.assertIsNone(filepath_to_uri(None))`
Fixed E128 flake8 warnings in tests/. 2016-04-08 02:04:45 +00:00			`self.assertEqual(`
			`filepath_to_uri("upload\\чубака.mp4"),`
			`"upload/%D1%87%D1%83%D0%B1%D0%B0%D0%BA%D0%B0.mp4",`
			`)`
Refs #28428 -- Made filepath_to_uri() support pathlib.Path. 2019-10-29 20:15:18 +00:00			`self.assertEqual(filepath_to_uri(Path("upload/test.png")), "upload/test.png")`
			`self.assertEqual(filepath_to_uri(Path("upload\\test.png")), "upload/test.png")`
Fixed #21198 -- Prevented invalid use of @python_2_unicode_compatible. Thanks jpic for the report and chmodas for working on a patch. Reverts 2ea80b94. Refs #19362. 2013-10-13 16:06:58 +00:00
Consolidated some text utils into the utils_tests test package. 2014-09-23 12:45:59 +00:00			`def test_iri_to_uri(self):`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`cases = [`
			`# Valid UTF-8 sequences are encoded.`
			`("red%09rosé#red", "red%09ros%C3%A9#red"),`
			`("/blog/for/Jürgen Münster/", "/blog/for/J%C3%BCrgen%20M%C3%BCnster/"),`
Refs #23919 -- Replaced usage of django.utils.http utilities with Python equivalents Thanks Tim Graham for the review. 2017-01-26 13:25:15 +00:00			`(`
			`"locations/%s" % quote_plus("Paris & Orléans"),`
			`"locations/Paris+%26+Orl%C3%A9ans",`
			`),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`# Reserved chars remain unescaped.`
			`("%&", "%&"),`
			`("red&♥ros%#red", "red&%E2%99%A5ros%#red"),`
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`(gettext_lazy("red&♥ros%#red"), "red&%E2%99%A5ros%#red"),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`]`

			`for iri, uri in cases:`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 09:58:06 +00:00			`with self.subTest(iri):`
			`self.assertEqual(iri_to_uri(iri), uri)`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 09:58:06 +00:00			`# Test idempotency.`
			`self.assertEqual(iri_to_uri(iri_to_uri(iri)), uri)`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00
			`def test_uri_to_iri(self):`
			`cases = [`
Completed test coverage for django.utils.encoding. 2017-02-23 01:54:55 +00:00			`(None, None),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`# Valid UTF-8 sequences are decoded.`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 13:55:44 +00:00			`("/%e2%89%Ab%E2%99%a5%E2%89%aB/", "/≫♥≫/"),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`("/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93", "/♥♥/?utf8=✓"),`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 13:55:44 +00:00			`("/%41%5a%6B/", "/AZk/"),`
			`# Reserved and non-URL valid ASCII chars are not decoded.`
			`("/%25%20%02%41%7b/", "/%25%20%02A%7b/"),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`# Broken UTF-8 sequences remain escaped.`
			`("/%AAd%AAj%AAa%AAn%AAg%AAo%AA/", "/%AAd%AAj%AAa%AAn%AAg%AAo%AA/"),`
			`("/%E2%99%A5%E2%E2%99%A5/", "/♥%E2♥/"),`
			`("/%E2%99%A5%E2%99%E2%99%A5/", "/♥%E2%99♥/"),`
			`("/%E2%E2%99%A5%E2%99%A5%99/", "/%E2♥♥%99/"),`
			`(`
			`"/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93",`
			`"/♥♥/?utf8=%9C%93✓%9C%93",`
			`),`
			`]`
Consolidated some text utils into the utils_tests test package. 2014-09-23 12:45:59 +00:00
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`for uri, iri in cases:`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 09:58:06 +00:00			`with self.subTest(uri):`
			`self.assertEqual(uri_to_iri(uri), iri)`
Consolidated some text utils into the utils_tests test package. 2014-09-23 12:45:59 +00:00
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 09:58:06 +00:00			`# Test idempotency.`
			`self.assertEqual(uri_to_iri(uri_to_iri(uri)), iri)`
Consolidated some text utils into the utils_tests test package. 2014-09-23 12:45:59 +00:00
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`def test_complementarity(self):`
			`cases = [`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 13:55:44 +00:00			`(`
			`"/blog/for/J%C3%BCrgen%20M%C3%BCnster/",`
			`"/blog/for/J\xfcrgen%20M\xfcnster/",`
			`),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`("%&", "%&"),`
			`("red&%E2%99%A5ros%#red", "red&♥ros%#red"),`
			`("/%E2%99%A5%E2%99%A5/", "/♥♥/"),`
			`("/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93", "/♥♥/?utf8=✓"),`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 13:55:44 +00:00			`("/%25%20%02%7b/", "/%25%20%02%7b/"),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`("/%AAd%AAj%AAa%AAn%AAg%AAo%AA/", "/%AAd%AAj%AAa%AAn%AAg%AAo%AA/"),`
			`("/%E2%99%A5%E2%E2%99%A5/", "/♥%E2♥/"),`
			`("/%E2%99%A5%E2%99%E2%99%A5/", "/♥%E2%99♥/"),`
			`("/%E2%E2%99%A5%E2%99%A5%99/", "/%E2♥♥%99/"),`
			`(`
			`"/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93",`
			`"/♥♥/?utf8=%9C%93✓%9C%93",`
			`),`
			`]`
Consolidated some text utils into the utils_tests test package. 2014-09-23 12:45:59 +00:00
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 12:25:22 +00:00			`for uri, iri in cases:`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 09:58:06 +00:00			`with self.subTest(uri):`
			`self.assertEqual(iri_to_uri(uri_to_iri(uri)), uri)`
			`self.assertEqual(uri_to_iri(iri_to_uri(iri)), iri)`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 15:45:54 +00:00
			`def test_escape_uri_path(self):`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 09:58:06 +00:00			`cases = [`
			`(`
			`"/;some/=awful/?path/:with/@lots/&of/+awful/chars",`
			`"/%3Bsome/%3Dawful/%3Fpath/:with/@lots/&of/+awful/chars",`
			`),`
			`("/foo#bar", "/foo%23bar"),`
			`("/foo?bar", "/foo%3Fbar"),`
			`]`
			`for uri, expected in cases:`
			`with self.subTest(uri):`
			`self.assertEqual(escape_uri_path(uri), expected)`