django/tests/utils_tests/test_text.py

# -*- coding: utf-8 -*-
from __future__ import unicode_literals

import json
import warnings
from unittest import skipUnless

from django.test import SimpleTestCase, ignore_warnings
from django.test.utils import reset_warning_registry
from django.utils import six, text
from django.utils.deprecation import RemovedInDjango19Warning
from django.utils.encoding import force_text
from django.utils.functional import lazy
from django.utils.translation import override

# Lazy variant of force_text() whose declared result class is six.text_type;
# used below to feed a lazy string into smart_split().
lazystr = lazy(force_text, six.text_type)

# True when a code point outside the Basic Multilingual Plane occupies a
# single element of a text string; tests needing that are skipped otherwise.
IS_WIDE_BUILD = len('\U0001F4A9') == 1


class TestUtilsText(SimpleTestCase):

    def test_get_text_list(self):
        """get_text_list() joins items with commas and a final conjunction."""
        # Each entry is (positional arguments, expected result).
        english_cases = (
            ((['a', 'b', 'c', 'd'],), 'a, b, c or d'),
            ((['a', 'b', 'c'], 'and'), 'a, b and c'),
            ((['a', 'b'], 'and'), 'a and b'),
            ((['a'],), 'a'),
            (([],), ''),
        )
        for call_args, expected in english_cases:
            self.assertEqual(text.get_text_list(*call_args), expected)

        # With Arabic activated, the separator and the default conjunction
        # are expected in their translated forms.
        with override('ar'):
            joined = text.get_text_list(['a', 'b', 'c'])
            self.assertEqual(joined, "a، b أو c")

    def test_smart_split(self):
        """smart_split() splits on whitespace while keeping quoted phrases whole."""
        # Each pair is (input, expected list of tokens).
        cases = (
            ('This is "a person" test.',
             ['This', 'is', '"a person"', 'test.']),
            ('This is "a person\'s" test.',
             ['This', 'is', '"a person\'s"', 'test.']),
            ('This is "a person\\"s" test.',
             ['This', 'is', '"a person\\"s"', 'test.']),
            ('"a \'one',
             ['"a', "'one"]),
            ('all friends\' tests',
             ['all', 'friends\'', 'tests']),
            ('url search_page words="something else"',
             ['url', 'search_page', 'words="something else"']),
            ("url search_page words='something else'",
             ['url', 'search_page', "words='something else'"]),
            ('url search_page words "something else"',
             ['url', 'search_page', 'words', '"something else"']),
            ('url search_page words-"something else"',
             ['url', 'search_page', 'words-"something else"']),
            ('url search_page words=hello',
             ['url', 'search_page', 'words=hello']),
            # An unterminated quote does not group the words after it.
            ('url search_page words="something else',
             ['url', 'search_page', 'words="something', 'else']),
            ("cut:','|cut:' '",
             ["cut:','|cut:' '"]),
            # Lazy strings must be accepted as well (#20231).
            (lazystr("a b c d"),
             ['a', 'b', 'c', 'd']),
        )
        for source, tokens in cases:
            pieces = list(text.smart_split(source))
            self.assertEqual(pieces, tokens)

    def test_truncate_chars(self):
        """
        Truncator.chars() shortens text to a character budget that includes
        the truncation text and counts a combining sequence as one character.
        """
        truncator = text.Truncator(
            'The quick brown fox jumped over the lazy dog.'
        )
        # A limit above the text length leaves the text unchanged.
        self.assertEqual('The quick brown fox jumped over the lazy dog.',
                         truncator.chars(100))
        self.assertEqual('The quick brown fox ...',
                         truncator.chars(23))
        self.assertEqual('The quick brown fo.....',
                         truncator.chars(23, '.....'))

        # Ensure that we normalize our unicode data first: the precomposed
        # and decomposed spellings must truncate to the same result.
        nfc = text.Truncator('o\xfco\xfco\xfco\xfc')
        nfd = text.Truncator('ou\u0308ou\u0308ou\u0308ou\u0308')
        self.assertEqual('oüoüoüoü', nfc.chars(8))
        self.assertEqual('oüoüoüoü', nfd.chars(8))
        self.assertEqual('oü...', nfc.chars(5))
        self.assertEqual('oü...', nfd.chars(5))

        # Ensure the final length is calculated correctly when there are
        # combining characters with no precomposed form, and that combining
        # characters are not split up.
        truncator = text.Truncator('-B\u030AB\u030A----8')
        self.assertEqual('-B\u030A...', truncator.chars(5))
        self.assertEqual('-B\u030AB\u030A-...', truncator.chars(7))
        self.assertEqual('-B\u030AB\u030A----8', truncator.chars(8))

        # Ensure the length of the end text is correctly calculated when it
        # contains combining characters with no precomposed form.
        truncator = text.Truncator('-----')
        self.assertEqual('---B\u030A', truncator.chars(4, 'B\u030A'))
        self.assertEqual('-----', truncator.chars(5, 'B\u030A'))

        # Make a best effort to shorten to the desired length, but requesting
        # a length shorter than the ellipsis shouldn't break
        self.assertEqual('...', text.Truncator('asdf').chars(1))

    def test_truncate_words(self):
        """Truncator.words() keeps whole words and appends the truncation text."""
        sentence = 'The quick brown fox jumped over the lazy dog.'
        truncator = text.Truncator(sentence)

        # A limit above the number of words returns the sentence unchanged.
        untouched = truncator.words(10)
        self.assertEqual(sentence, untouched)

        default_suffix = truncator.words(4)
        self.assertEqual('The quick brown fox...', default_suffix)

        custom_suffix = truncator.words(4, '[snip]')
        self.assertEqual('The quick brown fox[snip]', custom_suffix)

    def test_truncate_html_words(self):
        """
        Truncator.words(html=True) counts only words, leaves tags in place
        and closes any element still open at the cut.
        """
        def truncated(markup, *word_args):
            # Truncate ``markup`` in HTML mode with the given positional args.
            return text.Truncator(markup).words(*word_args, html=True)

        nested = (
            '<p id="par"><strong><em>The quick brown fox jumped over the lazy'
            ' dog.</em></strong></p>'
        )
        self.assertEqual(nested, truncated(nested, 10))
        self.assertEqual(
            '<p id="par"><strong><em>The quick brown fox...</em></strong></p>',
            truncated(nested, 4))
        self.assertEqual(
            '<p id="par"><strong><em>The quick brown fox....</em></strong></p>',
            truncated(nested, 4, '....'))
        self.assertEqual(
            '<p id="par"><strong><em>The quick brown fox</em></strong></p>',
            truncated(nested, 4, ''))

        # Test with new line inside tag
        multiline_tag = (
            '<p>The quick <a href="xyz.html"\n'
            'id="mylink">brown fox</a> jumped over the lazy dog.</p>'
        )
        self.assertEqual(
            '<p>The quick <a href="xyz.html"\n'
            'id="mylink">brown...</a></p>',
            truncated(multiline_tag, 3, '...'))

        # Test self-closing tags
        self.assertEqual(
            '<br/>The <hr />quick brown...',
            truncated('<br/>The <hr />quick brown fox jumped over the lazy dog.',
                      3, '...'))
        self.assertEqual(
            '<br>The <hr/>quick <em>brown...</em>',
            truncated('<br>The <hr/>quick <em>brown fox</em> '
                      'jumped over the lazy dog.', 3, '...'))

        # Test html entities
        self.assertEqual(
            '<i>Buenos d&iacute;as! &#x00bf;C&oacute;mo...</i>',
            truncated('<i>Buenos d&iacute;as!'
                      ' &#x00bf;C&oacute;mo est&aacute;?</i>', 3, '...'))
        self.assertEqual(
            '<p>I &lt;3 python...</p>',
            truncated('<p>I &lt;3 python, what about you?</p>', 3, '...'))

    def test_wrap(self):
        """wrap() breaks lines at spaces and never splits a single word."""
        digits = '1234 67 9'
        width_cases = (
            (100, '1234 67 9'),
            (9, '1234 67 9'),
            (8, '1234 67\n9'),
        )
        for width, wrapped in width_cases:
            self.assertEqual(text.wrap(digits, width), wrapped)

        # Newlines already present in the input are kept.
        rewrapped = text.wrap('short\na long line', 7)
        self.assertEqual(rewrapped, 'short\na long\nline')

        # A word longer than the width stays on a line of its own, unbroken.
        hyphenated = text.wrap('do-not-break-long-words please? ok', 8)
        self.assertEqual(hyphenated, 'do-not-break-long-words\nplease?\nok')

        long_word = 'l' + 'o' * 20 + 'ng'
        self.assertEqual(text.wrap(long_word, 20), long_word)
        self.assertEqual(text.wrap('a ' + long_word + ' word', 10),
                         'a\n' + long_word + '\nword')

    def test_normalize_newlines(self):
        """CR and CRLF line endings are converted to LF; other text is kept."""
        # Each pair is (input, expected normalized text).
        cases = (
            ("abc\ndef\rghi\r\n", "abc\ndef\nghi\n"),
            ("\n\r\r\n\r", "\n\n\n\n"),
            ("abcdefghi", "abcdefghi"),
            ("", ""),
        )
        for raw, normalized in cases:
            self.assertEqual(text.normalize_newlines(raw), normalized)

    def test_normalize_newlines_bytes(self):
        """Bytes input is accepted and the normalized result is text."""
        raw = b"abc\ndef\rghi\r\n"
        result = text.normalize_newlines(raw)
        self.assertEqual(result, "abc\ndef\nghi\n")
        # The return value must be a text string, not bytes.
        self.assertIsInstance(result, six.text_type)

    def test_slugify(self):
        """slugify() lowercases, drops punctuation and hyphenates spaces."""
        # Each pair is (input, expected slug).
        for raw, slug in [('Hello, World!', 'hello-world'),
                          ('spam & eggs', 'spam-eggs')]:
            self.assertEqual(text.slugify(raw), slug)

    def test_unescape_entities(self):
        """Named, hexadecimal and decimal entities are replaced by their character."""
        # Each pair is (escaped input, expected unescaped text).
        cases = (
            ('', ''),
            ('foo', 'foo'),
            ('&amp;', '&'),
            ('&#x26;', '&'),
            ('&#38;', '&'),
            ('foo &amp; bar', 'foo & bar'),
            # A bare ampersand that is not part of an entity is left alone.
            ('foo & bar', 'foo & bar'),
        )
        for escaped, plain in cases:
            self.assertEqual(text.unescape_entities(escaped), plain)

    def test_get_valid_filename(self):
        """Only the dash, underscore, digits, dot and letters of the sample survive."""
        cleaned = text.get_valid_filename("^&'@{}[],$=!-#()%+~_123.txt")
        self.assertEqual(cleaned, "-_123.txt")

    def test_compress_sequence(self):
        """The joined output of compress_sequence() is smaller than its joined input."""
        data = [{'key': i} for i in range(10)]
        # Feed the JSON document as the encoder's stream of UTF-8 chunks.
        seq = [s.encode('utf-8') for s in json.JSONEncoder().iterencode(data)]
        actual_length = len(b''.join(seq))
        out = text.compress_sequence(seq)
        compressed_length = len(b''.join(out))
        # assertLess reports both lengths on failure, unlike assertTrue(a < b).
        self.assertLess(compressed_length, actual_length)

    @ignore_warnings(category=RemovedInDjango19Warning)
    def test_javascript_quote(self):
        """
        javascript_quote() escapes quotes, backslashes, control characters
        and closing script tags; double quotes only on request.
        """
        # Local names avoid shadowing the ``input`` builtin.
        source = "<script>alert('Hello \\xff.\n Welcome\there\r');</script>"
        expected = r"<script>alert(\'Hello \\xff.\n Welcome\there\r\');<\/script>"
        self.assertEqual(text.javascript_quote(source), expected)

        # Exercising quote_double_quotes keyword argument
        source = '"Text"'
        self.assertEqual(text.javascript_quote(source), '"Text"')
        self.assertEqual(text.javascript_quote(source, quote_double_quotes=True),
                         '&quot;Text&quot;')

    @ignore_warnings(category=RemovedInDjango19Warning)
    @skipUnless(IS_WIDE_BUILD, 'Not running in a wide build of Python')
    def test_javascript_quote_unicode(self):
        """javascript_quote() passes a character outside the BMP through unchanged."""
        # Local names avoid shadowing the ``input`` builtin.
        source = "<script>alert('Hello \\xff.\n Wel𝕃come\there\r');</script>"
        expected = r"<script>alert(\'Hello \\xff.\n Wel𝕃come\there\r\');<\/script>"
        self.assertEqual(text.javascript_quote(source), expected)

    def test_deprecation(self):
        """javascript_quote() emits exactly one warning that mentions escapejs()."""
        # NOTE(review): presumably clears the warning registries so a warning
        # already raised elsewhere is recorded again - confirm against
        # django.test.utils.reset_warning_registry.
        reset_warning_registry()
        with warnings.catch_warnings(record=True) as caught:
            warnings.simplefilter("always")
            text.javascript_quote('thingy')
        self.assertEqual(len(caught), 1)
        message = caught[0].message
        self.assertIn('escapejs()', repr(message))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								# -*- coding: utf-8 -*-
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								from __future__ import unicode_literals
-												[1.8.x] Fixed #24242 -- Improved efficiency of utils.text.compress_sequence()

The function no longer flushes zfile after each write as doing so can
lead to the gzipped streamed content being larger than the original
content; each flush adds a 5/6 byte type 0 block. Removing this means
buf.read() may return nothing, so only yield if that has some data.
Testing shows without the flush() the buffer is being flushed every 17k
or so and compresses the same as if it had been done as a whole string.

Backport of caa3562d5bec1196502352a715a539bdb0f73c2d from master

											
										
										
											2015-01-29 07:59:41 +00:00
+								import json
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 13:46:23 +00:00
+								import warnings
-												[1.8.x] Fixed #24242 -- Improved efficiency of utils.text.compress_sequence()

The function no longer flushes zfile after each write as doing so can
lead to the gzipped streamed content being larger than the original
content; each flush adds a 5/6 byte type 0 block. Removing this means
buf.read() may return nothing, so only yield if that has some data.
Testing shows without the flush() the buffer is being flushed every 17k
or so and compresses the same as if it had been done as a whole string.

Backport of caa3562d5bec1196502352a715a539bdb0f73c2d from master

											
										
										
											2015-01-29 07:59:41 +00:00
+								from unittest import skipUnless
-												Fixed test failures when running in a narrow Python build.

											
										
										
											2014-02-18 17:07:07 +00:00
-												Applied ignore_warnings to Django tests

											
										
										
											2014-12-21 20:19:05 +00:00
+								from django.test import SimpleTestCase, ignore_warnings
-												Refs #23947 -- Worked around a bug in Python that prevents deprecation warnings from appearing in tests.

											
										
										
											2014-12-05 20:14:20 +00:00
+								from django.test.utils import reset_warning_registry
-												Fixed #21574 -- Handle bytes consistently in utils.text.normalize_newlines.

All input is now coerced to text before being normalized.
This changes nothing under Python 2 but it allows bytes
to be passed to the function without a TypeError under Python3
(bytes are assumed to be utf-8 encoded text).

Thanks to trac user vajrasky for the report.

											
										
										
											2013-12-12 14:58:14 +00:00
+								from django.utils import six, text
-												Fixed #21188 -- Introduced subclasses for to-be-removed-in-django-XX warnings

Thanks Anssi Kääriäinen for the idea and Simon Charette for the
review.

											
										
										
											2014-02-26 21:48:20 +00:00
+								from django.utils.deprecation import RemovedInDjango19Warning
-												Consolidated some text utils into the utils_tests test package.

											
										
										
											2014-09-23 12:45:59 +00:00
+								from django.utils.encoding import force_text
 								from django.utils.functional import lazy
 								from django.utils.translation import override
 								lazystr = lazy(force_text, six.text_type)
-												Reorganized utils tests so it's all in separate modules. Thanks to Stephan Jaekel.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@13889 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-09-27 15:15:04 +00:00
-												Fixed test failures when running in a narrow Python build.

											
										
										
											2014-02-18 17:07:07 +00:00
+								IS_WIDE_BUILD = (len('\U0001F4A9') == 1)
-												Fixing E302 Errors

Signed-off-by: Jason Myers <jason@jasonamyers.com>

											
										
										
											2013-11-02 21:34:05 +00:00
-												Fixed #18042 -- Advanced deprecation warnings.

Thanks Ramiro for the patch.

											
										
										
											2012-05-03 13:27:01 +00:00
+								class TestUtilsText(SimpleTestCase):
-												Consolidated some text utils into the utils_tests test package.

											
										
										
											2014-09-23 12:45:59 +00:00
+								    def test_get_text_list(self):
 								        self.assertEqual(text.get_text_list(['a', 'b', 'c', 'd']), 'a, b, c or d')
 								        self.assertEqual(text.get_text_list(['a', 'b', 'c'], 'and'), 'a, b and c')
 								        self.assertEqual(text.get_text_list(['a', 'b'], 'and'), 'a and b')
 								        self.assertEqual(text.get_text_list(['a']), 'a')
 								        self.assertEqual(text.get_text_list([]), '')
 								        with override('ar'):
 								            self.assertEqual(text.get_text_list(['a', 'b', 'c']), "a، b أو c")
 								    def test_smart_split(self):
 								        testdata = [
 								            ('This is "a person" test.',
 								                ['This', 'is', '"a person"', 'test.']),
 								            ('This is "a person\'s" test.',
 								                ['This', 'is', '"a person\'s"', 'test.']),
 								            ('This is "a person\\"s" test.',
 								                ['This', 'is', '"a person\\"s"', 'test.']),
 								            ('"a \'one',
 								                ['"a', "'one"]),
 								            ('all friends\' tests',
 								                ['all', 'friends\'', 'tests']),
 								            ('url search_page words="something else"',
 								                ['url', 'search_page', 'words="something else"']),
 								            ("url search_page words='something else'",
 								                ['url', 'search_page', "words='something else'"]),
 								            ('url search_page words "something else"',
 								                ['url', 'search_page', 'words', '"something else"']),
 								            ('url search_page words-"something else"',
 								                ['url', 'search_page', 'words-"something else"']),
 								            ('url search_page words=hello',
 								                ['url', 'search_page', 'words=hello']),
 								            ('url search_page words="something else',
 								                ['url', 'search_page', 'words="something', 'else']),
 								            ("cut:','|cut:' '",
 								                ["cut:','|cut:' '"]),
 								            (lazystr("a b c d"),  # Test for #20231
 								                ['a', 'b', 'c', 'd']),
 								        ]
 								        for test, expected in testdata:
 								            self.assertEqual(list(text.smart_split(test)), expected)
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								    def test_truncate_chars(self):
 								        truncator = text.Truncator(
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								            'The quick brown fox jumped over the lazy dog.'
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								        )
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual('The quick brown fox jumped over the lazy dog.',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            truncator.chars(100)),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual('The quick brown fox ...',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            truncator.chars(23)),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual('The quick brown fo.....',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            truncator.chars(23, '.....')),
 								        # Ensure that we normalize our unicode data first
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        nfc = text.Truncator('o\xfco\xfco\xfco\xfc')
 								        nfd = text.Truncator('ou\u0308ou\u0308ou\u0308ou\u0308')
 								        self.assertEqual('oüoüoüoü', nfc.chars(8))
 								        self.assertEqual('oüoüoüoü', nfd.chars(8))
 								        self.assertEqual('oü...', nfc.chars(5))
 								        self.assertEqual('oü...', nfd.chars(5))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
 								        # Ensure the final length is calculated correctly when there are
 								        # combining characters with no precomposed form, and that combining
 								        # characters are not split up.
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        truncator = text.Truncator('-B\u030AB\u030A----8')
 								        self.assertEqual('-B\u030A...', truncator.chars(5))
 								        self.assertEqual('-B\u030AB\u030A-...', truncator.chars(7))
 								        self.assertEqual('-B\u030AB\u030A----8', truncator.chars(8))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
 								        # Ensure the length of the end text is correctly calculated when it
 								        # contains combining characters with no precomposed form.
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        truncator = text.Truncator('-----')
 								        self.assertEqual('---B\u030A', truncator.chars(4, 'B\u030A'))
 								        self.assertEqual('-----', truncator.chars(5, 'B\u030A'))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
 								        # Make a best effort to shorten to the desired length, but requesting
 								        # a length shorter than the ellipsis shouldn't break
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual('...', text.Truncator('asdf').chars(1))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
-												Reorganized utils tests so it's all in separate modules. Thanks to Stephan Jaekel.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@13889 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-09-27 15:15:04 +00:00
+								    def test_truncate_words(self):
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        truncator = text.Truncator('The quick brown fox jumped over the lazy '
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            'dog.')
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual('The quick brown fox jumped over the lazy dog.',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            truncator.words(10))
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual('The quick brown fox...', truncator.words(4))
 								        self.assertEqual('The quick brown fox[snip]',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            truncator.words(4, '[snip]'))
 								    def test_truncate_html_words(self):
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-13 17:24:49 +00:00
+								        truncator = text.Truncator('<p id="par"><strong><em>The quick brown fox'
 								            ' jumped over the lazy dog.</em></strong></p>')
 								        self.assertEqual('<p id="par"><strong><em>The quick brown fox jumped over'
 								            ' the lazy dog.</em></strong></p>', truncator.words(10, html=True))
 								        self.assertEqual('<p id="par"><strong><em>The quick brown fox...</em>'
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            '</strong></p>', truncator.words(4, html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-13 17:24:49 +00:00
+								        self.assertEqual('<p id="par"><strong><em>The quick brown fox....</em>'
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
+								            '</strong></p>', truncator.words(4, '....', html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-13 17:24:49 +00:00
+								        self.assertEqual('<p id="par"><strong><em>The quick brown fox</em>'
 								            '</strong></p>', truncator.words(4, '', html=True))
-												Fixed #10931 -- Made `Truncator` handle newlines properly. Thanks to gsong and Claude Paroz.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@17329 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2012-01-02 18:47:18 +00:00
+								        # Test with new line inside tag
 								        truncator = text.Truncator('<p>The quick <a href="xyz.html"\n'
 								            'id="mylink">brown fox</a> jumped over the lazy dog.</p>')
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual('<p>The quick <a href="xyz.html"\n'
-												Fixed #10931 -- Made `Truncator` handle newlines properly. Thanks to gsong and Claude Paroz.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@17329 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2012-01-02 18:47:18 +00:00
+								            'id="mylink">brown...</a></p>', truncator.words(3, '...', html=True))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 13:47:10 +00:00
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-13 17:24:49 +00:00
+								        # Test self-closing tags
 								        truncator = text.Truncator('<br/>The <hr />quick brown fox jumped over'
 								            ' the lazy dog.')
 								        self.assertEqual('<br/>The <hr />quick brown...',
-												Fixed #21266 -- Fixed E201,E202 pep8 warnings.

											
										
										
											2013-10-14 19:13:14 +00:00
+								            truncator.words(3, '...', html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-13 17:24:49 +00:00
+								        truncator = text.Truncator('<br>The <hr/>quick <em>brown fox</em> '
 								            'jumped over the lazy dog.')
 								        self.assertEqual('<br>The <hr/>quick <em>brown...</em>',
-												Fixed #21266 -- Fixed E201,E202 pep8 warnings.

											
										
										
											2013-10-14 19:13:14 +00:00
+								            truncator.words(3, '...', html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-13 17:24:49 +00:00
-												Fixed #20568 -- truncatewords_html no longer splits words containing HTML entities.

Thanks yann0 at hotmail.com for the report.

											
										
										
											2013-07-18 08:45:34 +00:00
+								        # Test html entities
 								        truncator = text.Truncator('<i>Buenos d&iacute;as!'
 								            ' &#x00bf;C&oacute;mo est&aacute;?</i>')
 								        self.assertEqual('<i>Buenos d&iacute;as! &#x00bf;C&oacute;mo...</i>',
 								            truncator.words(3, '...', html=True))
 								        truncator = text.Truncator('<p>I &lt;3 python, what about you?</p>')
 								        self.assertEqual('<p>I &lt;3 python...</p>',
 								            truncator.words(3, '...', html=True))
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-11-30 21:21:37 +00:00
+								    def test_wrap(self):
 								        # These assertions check that text.wrap breaks lines at spaces so they
 								        # fit the requested width, keeps newlines already present in the
 								        # input, and never splits a single word that is wider than the width.
 								        digits = '1234 67 9'
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								        self.assertEqual(text.wrap(digits, 100), '1234 67 9')
 								        self.assertEqual(text.wrap(digits, 9), '1234 67 9')
 								        self.assertEqual(text.wrap(digits, 8), '1234 67\n9')
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-11-30 21:21:37 +00:00
 								        self.assertEqual(text.wrap('short\na long line', 7),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								                         'short\na long\nline')
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-11-30 21:21:37 +00:00
 								        self.assertEqual(text.wrap('do-not-break-long-words please? ok', 8),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								                         'do-not-break-long-words\nplease?\nok')
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-11-30 21:21:37 +00:00
 								        # A single word longer than the width must come back intact.
 								        long_word = 'l%sng' % ('o' * 20)
 								        self.assertEqual(text.wrap(long_word, 20), long_word)
 								        self.assertEqual(text.wrap('a %s word' % long_word, 10),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-07 16:08:47 +00:00
+								                         'a\n%s\nword' % long_word)
-												Fixed #14516 -- Extract methods from removetags and slugify template filters

Patch by @jphalip updated to apply, documentation and release notes
added.

I've documented strip_tags as well as remove_tags as the difference
between the two wouldn't be immediately obvious.

											
										
										
											2012-08-18 12:53:22 +00:00
-												Fixed #21572 -- Added unit test for django.utils.text.normalize_newlines.

											
										
										
											2013-12-07 08:28:22 +00:00
+								    def test_normalize_newlines(self):
 								        self.assertEqual(text.normalize_newlines("abc\ndef\rghi\r\n"),
 								                         "abc\ndef\nghi\n")
 								        self.assertEqual(text.normalize_newlines("\n\r\r\n\r"), "\n\n\n\n")
 								        self.assertEqual(text.normalize_newlines("abcdefghi"), "abcdefghi")
 								        self.assertEqual(text.normalize_newlines(""), "")
-												Fixed #21574 -- Handle bytes consistently in utils.text.normalize_newlines.

All input is now coerced to text before being normalized.
This changes nothing under Python 2 but it allows bytes
to be passed to the function without a TypeError under Python3
(bytes are assumed to be utf-8 encoded text).

Thanks to trac user vajrasky for the report.

											
										
										
											2013-12-12 14:58:14 +00:00
+								    def test_normalize_newlines_bytes(self):
 								        """normalize_newlines should be able to handle bytes too"""
 								        normalized = text.normalize_newlines(b"abc\ndef\rghi\r\n")
 								        self.assertEqual(normalized, "abc\ndef\nghi\n")
 								        self.assertIsInstance(normalized, six.text_type)
-												Fixed #14516 -- Extract methods from removetags and slugify template filters

Patch by @jphalip updated to apply, documentation and release notes
added.

I've documented strip_tags as well as remove_tags as the difference
between the two wouldn't be immediately obvious.

											
										
										
											2012-08-18 12:53:22 +00:00
+								    def test_slugify(self):
 								        # Each pair is (input, expected slug): the expected values are
 								        # lower-cased, with punctuation dropped and spaces turned into hyphens.
 								        items = (
-												[py3] Made 212b9826bd Python 3-friendly

											
										
										
											2012-08-18 15:47:21 +00:00
+								            ('Hello, World!', 'hello-world'),
 								            ('spam & eggs', 'spam-eggs'),
-												Fixed #14516 -- Extract methods from removetags and slugify template filters

Patch by @jphalip updated to apply, documentation and release notes
added.

I've documented strip_tags as well as remove_tags as the difference
between the two wouldn't be immediately obvious.

											
										
										
											2012-08-18 12:53:22 +00:00
+								        )
 								        for value, output in items:
 								            self.assertEqual(text.slugify(value), output)
-												Fix #21185: Added tests for unescape_entities.

Also fixed a py3 incompatibility.
Thanks to brutasse for the report.

											
										
										
											2013-09-27 15:00:42 +00:00
 								    def test_unescape_entities(self):
 								        """Named, hex and decimal ampersand entities decode to '&'."""
 								        cases = (
 								            ('', ''),
 								            ('foo', 'foo'),
 								            ('&amp;', '&'),
 								            ('&#x26;', '&'),
 								            ('&#38;', '&'),
 								            ('foo &amp; bar', 'foo & bar'),
 								            # A bare ampersand is not an entity and must pass through.
 								            ('foo & bar', 'foo & bar'),
 								        )
 								        for escaped, expected in cases:
 								            self.assertEqual(text.unescape_entities(escaped), expected)
-												Fixed #21505 -- Added unit test for django.utils.text.get_valid_filename.

											
										
										
											2013-11-24 08:10:21 +00:00
 								    def test_get_valid_filename(self):
 								        """The punctuation-heavy sample name is reduced to '-_123.txt'."""
 								        cleaned = text.get_valid_filename("^&'@{}[],$=!-#()%+~_123.txt")
 								        self.assertEqual(cleaned, "-_123.txt")
-												Fixed #21731 -- Made javascript_quote escapes '</'.

											
										
										
											2014-01-04 04:57:50 +00:00
-												[1.8.x] Fixed #24242 -- Improved efficiency of utils.text.compress_sequence()

The function no longer flushes zfile after each write as doing so can
lead to the gzipped streamed content being larger than the original
content; each flush adds a 5/6 byte type 0 block. Removing this means
buf.read() may return nothing, so only yield if that has some data.
Testing shows without the flush() the buffer is being flushed every 17k
or so and compresses the same as if it had been done as a whole string.

Backport of caa3562d5bec1196502352a715a539bdb0f73c2d from master

											
										
										
											2015-01-29 07:59:41 +00:00
+								    def test_compress_sequence(self):
 								        data = [{'key': i} for i in range(10)]
 								        seq = list(json.JSONEncoder().iterencode(data))
 								        seq = [s.encode('utf-8') for s in seq]
 								        actual_length = len(b''.join(seq))
 								        out = text.compress_sequence(seq)
 								        compressed_length = len(b''.join(out))
 								        self.assertTrue(compressed_length < actual_length)
-												Applied ignore_warnings to Django tests

											
										
										
											2014-12-21 20:19:05 +00:00
+								    @ignore_warnings(category=RemovedInDjango19Warning)
-												Fixed #21731 -- Made javascript_quote escapes '</'.

											
										
										
											2014-01-04 04:57:50 +00:00
+								    def test_javascript_quote(self):
 								        # The expected value (a raw string) shows single quotes and the
 								        # backslash gaining a backslash, the newline/tab/carriage-return
 								        # characters becoming \n, \t, \r escapes, and '</' becoming '<\/'.
 								        # NOTE(review): the local name `input` shadows the builtin; consider
 								        # renaming it if this test is touched again.
 								        input = "<script>alert('Hello \\xff.\n Welcome\there\r');</script>"
 								        output = r"<script>alert(\'Hello \\xff.\n Welcome\there\r\');<\/script>"
-												Applied ignore_warnings to Django tests

											
										
										
											2014-12-21 20:19:05 +00:00
+								        self.assertEqual(text.javascript_quote(input), output)
-												Fixed #21731 -- Made javascript_quote escapes '</'.

											
										
										
											2014-01-04 04:57:50 +00:00
-												Applied ignore_warnings to Django tests

											
										
										
											2014-12-21 20:19:05 +00:00
+								        # Exercising quote_double_quotes keyword argument
 								        # By default double quotes are returned unchanged; with
 								        # quote_double_quotes=True they are expected as &quot;.
 								        input = '"Text"'
 								        self.assertEqual(text.javascript_quote(input), '"Text"')
 								        self.assertEqual(text.javascript_quote(input, quote_double_quotes=True),
 								                         '&quot;Text&quot;')
-												Fixed #21725 -- Fixed JavaScript quoting encoding.

Thanks to nedbatchelder for the report.

											
										
										
											2014-02-15 17:55:33 +00:00
-												Applied ignore_warnings to Django tests

											
										
										
											2014-12-21 20:19:05 +00:00
+								    @ignore_warnings(category=RemovedInDjango19Warning)
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 13:46:23 +00:00
+								    @skipUnless(IS_WIDE_BUILD, 'Not running in a wide build of Python')
-												Fixed #21725 -- Fixed JavaScript quoting encoding.

Thanks to nedbatchelder for the report.

											
										
										
											2014-02-15 17:55:33 +00:00
+								    def test_javascript_quote_unicode(self):
 								        # Same input as test_javascript_quote, plus one character outside
 								        # the Basic Multilingual Plane, which is expected to come through
 								        # unchanged. Skipped unless IS_WIDE_BUILD is true.
 								        input = "<script>alert('Hello \\xff.\n Wel𝕃come\there\r');</script>"
 								        output = r"<script>alert(\'Hello \\xff.\n Wel𝕃come\there\r\');<\/script>"
-												Applied ignore_warnings to Django tests

											
										
										
											2014-12-21 20:19:05 +00:00
+								        self.assertEqual(text.javascript_quote(input), output)
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 13:46:23 +00:00
 								    def test_deprecation(self):
 								        # Calling text.javascript_quote must emit exactly one warning whose
 								        # message mentions escapejs().
-												Refs #23947 -- Worked around a bug in Python that prevents deprecation warnings from appearing in tests.

											
										
										
											2014-12-05 20:14:20 +00:00
+								        reset_warning_registry()
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 13:46:23 +00:00
+								        with warnings.catch_warnings(record=True) as w:
 								            # "always" ensures the warning is recorded into `w` rather than
 								            # being suppressed by an existing filter.
 								            warnings.simplefilter("always")
 								            text.javascript_quote('thingy')
 								            self.assertEqual(len(w), 1)
 								            self.assertIn('escapejs()', repr(w[0].message))