django/tests/utils_tests/test_text.py

# -*- coding: utf-8 -*-
from __future__ import unicode_literals

from unittest import skipUnless
import warnings

from django.test import SimpleTestCase
from django.test.utils import reset_warning_registry
from django.utils import six, text
from django.utils.deprecation import RemovedInDjango19Warning
from django.utils.encoding import force_text
from django.utils.functional import lazy
from django.utils.translation import override

# force_text wrapped with django.utils.functional.lazy (declared result type:
# six.text_type). test_smart_split passes lazystr("a b c d") to smart_split()
# as its regression case for ticket #20231.
lazystr = lazy(force_text, six.text_type)

# True when a single code point outside the Basic Multilingual Plane has
# length 1; tests decorated with skipUnless(IS_WIDE_BUILD, ...) are skipped
# otherwise.
IS_WIDE_BUILD = len('\U0001F4A9') == 1


class TestUtilsText(SimpleTestCase):

    def test_get_text_list(self):
        """get_text_list() joins items with ', ' and a final joining word."""
        # Each entry: (positional arguments, expected rendering). The joining
        # word is 'or' unless one is passed explicitly.
        cases = [
            ((['a', 'b', 'c', 'd'],), 'a, b, c or d'),
            ((['a', 'b', 'c'], 'and'), 'a, b and c'),
            ((['a', 'b'], 'and'), 'a and b'),
            ((['a'],), 'a'),
            (([],), ''),
        ]
        for args, expected in cases:
            self.assertEqual(text.get_text_list(*args), expected)

        # With the 'ar' translation active, the separator and the default
        # joining word are expected in their Arabic form.
        with override('ar'):
            localized = text.get_text_list(['a', 'b', 'c'])
            self.assertEqual(localized, "a، b أو c")

    def test_smart_split(self):
        """smart_split() splits on whitespace but keeps balanced quoted runs whole."""
        # Each entry: (input, expected list of tokens).
        cases = [
            (
                'This is "a person" test.',
                ['This', 'is', '"a person"', 'test.'],
            ),
            (
                'This is "a person\'s" test.',
                ['This', 'is', '"a person\'s"', 'test.'],
            ),
            (
                'This is "a person\\"s" test.',
                ['This', 'is', '"a person\\"s"', 'test.'],
            ),
            (
                '"a \'one',
                ['"a', "'one"],
            ),
            (
                'all friends\' tests',
                ['all', 'friends\'', 'tests'],
            ),
            (
                'url search_page words="something else"',
                ['url', 'search_page', 'words="something else"'],
            ),
            (
                "url search_page words='something else'",
                ['url', 'search_page', "words='something else'"],
            ),
            (
                'url search_page words "something else"',
                ['url', 'search_page', 'words', '"something else"'],
            ),
            (
                'url search_page words-"something else"',
                ['url', 'search_page', 'words-"something else"'],
            ),
            (
                'url search_page words=hello',
                ['url', 'search_page', 'words=hello'],
            ),
            (
                # An unterminated quote does not glue the following words.
                'url search_page words="something else',
                ['url', 'search_page', 'words="something', 'else'],
            ),
            (
                "cut:','|cut:' '",
                ["cut:','|cut:' '"],
            ),
            (
                lazystr("a b c d"),  # Test for #20231
                ['a', 'b', 'c', 'd'],
            ),
        ]
        for source, tokens in cases:
            self.assertEqual(list(text.smart_split(source)), tokens)

    def test_truncate_chars(self):
        """Truncator.chars() caps the length, truncation text included."""
        truncator = text.Truncator(
            'The quick brown fox jumped over the lazy dog.'
        )
        # A limit above the text length leaves the text unchanged; otherwise
        # the result, truncation text included, is exactly the requested
        # length (23 characters in both cases below).
        self.assertEqual('The quick brown fox jumped over the lazy dog.',
            truncator.chars(100))
        self.assertEqual('The quick brown fox ...',
            truncator.chars(23))
        self.assertEqual('The quick brown fo.....',
            truncator.chars(23, '.....'))

        # Ensure that we normalize our unicode data first
        nfc = text.Truncator('o\xfco\xfco\xfco\xfc')
        nfd = text.Truncator('ou\u0308ou\u0308ou\u0308ou\u0308')
        self.assertEqual('oüoüoüoü', nfc.chars(8))
        self.assertEqual('oüoüoüoü', nfd.chars(8))
        self.assertEqual('oü...', nfc.chars(5))
        self.assertEqual('oü...', nfd.chars(5))

        # Ensure the final length is calculated correctly when there are
        # combining characters with no precomposed form, and that combining
        # characters are not split up.
        truncator = text.Truncator('-B\u030AB\u030A----8')
        self.assertEqual('-B\u030A...', truncator.chars(5))
        self.assertEqual('-B\u030AB\u030A-...', truncator.chars(7))
        self.assertEqual('-B\u030AB\u030A----8', truncator.chars(8))

        # Ensure the length of the end text is correctly calculated when it
        # contains combining characters with no precomposed form.
        truncator = text.Truncator('-----')
        self.assertEqual('---B\u030A', truncator.chars(4, 'B\u030A'))
        self.assertEqual('-----', truncator.chars(5, 'B\u030A'))

        # Make a best effort to shorten to the desired length, but requesting
        # a length shorter than the ellipsis shouldn't break
        self.assertEqual('...', text.Truncator('asdf').chars(1))

    def test_truncate_words(self):
        """Truncator.words() keeps the first N words and appends the truncation text."""
        sentence = 'The quick brown fox jumped over the lazy dog.'
        truncator = text.Truncator(sentence)

        # A limit above the word count returns the text unchanged.
        self.assertEqual(sentence, truncator.words(10))

        # Default truncation text, then a custom one.
        self.assertEqual('The quick brown fox...', truncator.words(4))
        snipped = truncator.words(4, '[snip]')
        self.assertEqual('The quick brown fox[snip]', snipped)

    def test_truncate_html_words(self):
        """Truncator.words(html=True) counts words outside tags and closes open tags."""
        markup = (
            '<p id="par"><strong><em>'
            'The quick brown fox jumped over the lazy dog.'
            '</em></strong></p>'
        )
        truncator = text.Truncator(markup)

        # A limit above the word count returns the markup unchanged.
        self.assertEqual(markup, truncator.words(10, html=True))

        # Default, custom and empty truncation text; the tags left open at
        # the cut are closed in every case.
        self.assertEqual(
            '<p id="par"><strong><em>The quick brown fox...</em></strong></p>',
            truncator.words(4, html=True)
        )
        self.assertEqual(
            '<p id="par"><strong><em>The quick brown fox....</em></strong></p>',
            truncator.words(4, '....', html=True)
        )
        self.assertEqual(
            '<p id="par"><strong><em>The quick brown fox</em></strong></p>',
            truncator.words(4, '', html=True)
        )

        # Remaining cases all keep three words with '...' as truncation text.
        # Each entry: (markup, expected result).
        three_word_cases = [
            # Test with new line inside tag
            (
                '<p>The quick <a href="xyz.html"\n'
                'id="mylink">brown fox</a> jumped over the lazy dog.</p>',
                '<p>The quick <a href="xyz.html"\n'
                'id="mylink">brown...</a></p>',
            ),
            # Test self-closing tags
            (
                '<br/>The <hr />quick brown fox jumped over the lazy dog.',
                '<br/>The <hr />quick brown...',
            ),
            (
                '<br>The <hr/>quick <em>brown fox</em> jumped over the lazy dog.',
                '<br>The <hr/>quick <em>brown...</em>',
            ),
            # Test html entities
            (
                '<i>Buenos d&iacute;as! &#x00bf;C&oacute;mo est&aacute;?</i>',
                '<i>Buenos d&iacute;as! &#x00bf;C&oacute;mo...</i>',
            ),
            (
                '<p>I &lt;3 python, what about you?</p>',
                '<p>I &lt;3 python...</p>',
            ),
        ]
        for source, expected in three_word_cases:
            truncator = text.Truncator(source)
            self.assertEqual(expected, truncator.words(3, '...', html=True))

    def test_wrap(self):
        """wrap() breaks lines at spaces to fit the width and never splits a word."""
        digits = '1234 67 9'
        # Each entry: (width, expected output for `digits`).
        by_width = [
            (100, '1234 67 9'),
            (9, '1234 67 9'),
            (8, '1234 67\n9'),
        ]
        for width, wrapped in by_width:
            self.assertEqual(text.wrap(digits, width), wrapped)

        # A newline already present in the input is kept.
        rewrapped = text.wrap('short\na long line', 7)
        self.assertEqual(rewrapped, 'short\na long\nline')

        # A word wider than the limit stays in one piece on its own line.
        hyphenated = text.wrap('do-not-break-long-words please? ok', 8)
        self.assertEqual(hyphenated, 'do-not-break-long-words\nplease?\nok')

        long_word = 'l%sng' % ('o' * 20)
        self.assertEqual(text.wrap(long_word, 20), long_word)
        sentence = 'a %s word' % long_word
        self.assertEqual(text.wrap(sentence, 10), 'a\n%s\nword' % long_word)

    def test_normalize_newlines(self):
        """normalize_newlines() turns CRLF and lone CR line endings into LF."""
        # Each entry: (raw input, expected normalized text).
        cases = [
            ("abc\ndef\rghi\r\n", "abc\ndef\nghi\n"),
            ("\n\r\r\n\r", "\n\n\n\n"),
            ("abcdefghi", "abcdefghi"),
            ("", ""),
        ]
        for raw, normalized in cases:
            self.assertEqual(text.normalize_newlines(raw), normalized)

    def test_normalize_newlines_bytes(self):
        """Bytes input is accepted by normalize_newlines() and comes back as text."""
        result = text.normalize_newlines(b"abc\ndef\rghi\r\n")
        # The value is normalized, and its type is the text type, not bytes.
        self.assertEqual(result, "abc\ndef\nghi\n")
        self.assertIsInstance(result, six.text_type)

    def test_slugify(self):
        """slugify() lowercases the text and joins the words with hyphens."""
        # Each entry: (raw text, expected slug). Punctuation and '&' do not
        # appear in the slugs.
        expectations = [
            ('Hello, World!', 'hello-world'),
            ('spam & eggs', 'spam-eggs'),
        ]
        for raw, slug in expectations:
            self.assertEqual(text.slugify(raw), slug)

    def test_unescape_entities(self):
        """unescape_entities() decodes named, hex and decimal HTML entities."""
        # Each entry: (escaped text, expected unescaped text). Text without
        # entities, including a bare '&', is returned unchanged.
        expectations = [
            ('', ''),
            ('foo', 'foo'),
            ('&amp;', '&'),
            ('&#x26;', '&'),
            ('&#38;', '&'),
            ('foo &amp; bar', 'foo & bar'),
            ('foo & bar', 'foo & bar'),
        ]
        for escaped, plain in expectations:
            self.assertEqual(text.unescape_entities(escaped), plain)

    def test_get_valid_filename(self):
        """get_valid_filename() drops the punctuation it does not allow in a name."""
        unsafe = "^&'@{}[],$=!-#()%+~_123.txt"
        cleaned = text.get_valid_filename(unsafe)
        # Only '-', '_', the digits and the '.txt' suffix remain.
        self.assertEqual(cleaned, "-_123.txt")

    def test_javascript_quote(self):
        """javascript_quote() escapes quotes, backslashes, control characters and '</'."""
        source = "<script>alert('Hello \\xff.\n Welcome\there\r');</script>"
        expected = r"<script>alert(\'Hello \\xff.\n Welcome\there\r\');<\/script>"
        # Every call below is made with RemovedInDjango19Warning ignored.
        with warnings.catch_warnings():
            warnings.simplefilter("ignore", RemovedInDjango19Warning)
            self.assertEqual(text.javascript_quote(source), expected)

            # Exercising quote_double_quotes keyword argument: double quotes
            # pass through by default and become &quot; when it is True.
            double_quoted = '"Text"'
            self.assertEqual(text.javascript_quote(double_quoted), '"Text"')
            self.assertEqual(
                text.javascript_quote(double_quoted, quote_double_quotes=True),
                '&quot;Text&quot;')

    @skipUnless(IS_WIDE_BUILD, 'Not running in a wide build of Python')
    def test_javascript_quote_unicode(self):
        """javascript_quote() leaves a character outside the BMP untouched."""
        source = "<script>alert('Hello \\xff.\n Wel𝕃come\there\r');</script>"
        expected = r"<script>alert(\'Hello \\xff.\n Wel𝕃come\there\r\');<\/script>"
        # The call below is made with RemovedInDjango19Warning ignored.
        with warnings.catch_warnings():
            warnings.simplefilter("ignore", RemovedInDjango19Warning)
            self.assertEqual(text.javascript_quote(source), expected)

    def test_deprecation(self):
        """Calling javascript_quote() emits exactly one warning that names escapejs()."""
        # Reset the warning registries before recording.
        reset_warning_registry()
        with warnings.catch_warnings(record=True) as recorded:
            # "always" keeps the filter from dropping the warning.
            warnings.simplefilter("always")
            text.javascript_quote('thingy')
            self.assertEqual(len(recorded), 1)
            first_message = repr(recorded[0].message)
            self.assertIn('escapejs()', first_message)
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								# -*- coding: utf-8 -*-
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								from __future__ import unicode_literals
-												Fixed test failures when running in a narrow Python build.

											
										
										
											2014-02-19 01:07:07 +08:00
+								from unittest import skipUnless
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
+								import warnings
-												Fixed test failures when running in a narrow Python build.

											
										
										
											2014-02-19 01:07:07 +08:00
-												Fixed #18042 -- Advanced deprecation warnings.

Thanks Ramiro for the patch.

											
										
										
											2012-05-03 21:27:01 +08:00
+								from django.test import SimpleTestCase
-												Refs #23947 -- Worked around a bug in Python that prevents deprecation warnings from appearing in tests.

											
										
										
											2014-12-06 04:14:20 +08:00
+								from django.test.utils import reset_warning_registry
-												Fixed #21574 -- Handle bytes consistently in utils.text.normalize_newlines.

All input is now coerced to text before being normalized.
This changes nothing under Python 2 but it allows bytes
to be passed to the function without a TypeError under Python3
(bytes are assumed to be utf-8 encoded text).

Thanks to trac user vajrasky for the report.

											
										
										
											2013-12-12 22:58:14 +08:00
+								from django.utils import six, text
-												Fixed #21188 -- Introduced subclasses for to-be-removed-in-django-XX warnings

Thanks Anssi Kääriäinen for the idea and Simon Charette for the
review.

											
										
										
											2014-02-27 05:48:20 +08:00
+								from django.utils.deprecation import RemovedInDjango19Warning
-												Consolidated some text utils into the utils_tests test package.

											
										
										
											2014-09-23 20:45:59 +08:00
+								from django.utils.encoding import force_text
 								from django.utils.functional import lazy
 								from django.utils.translation import override
 								lazystr = lazy(force_text, six.text_type)
-												Reorganized utils tests so it's all in separate modules. Thanks to Stephan Jaekel.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@13889 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-09-27 23:15:04 +08:00
-												Fixed test failures when running in a narrow Python build.

											
										
										
											2014-02-19 01:07:07 +08:00
+								IS_WIDE_BUILD = (len('\U0001F4A9') == 1)
-												Fixing E302 Errors

Signed-off-by: Jason Myers <jason@jasonamyers.com>

											
										
										
											2013-11-03 05:34:05 +08:00
-												Fixed #18042 -- Advanced deprecation warnings.

Thanks Ramiro for the patch.

											
										
										
											2012-05-03 21:27:01 +08:00
+								class TestUtilsText(SimpleTestCase):
-												Consolidated some text utils into the utils_tests test package.

											
										
										
											2014-09-23 20:45:59 +08:00
+								    def test_get_text_list(self):
 								        self.assertEqual(text.get_text_list(['a', 'b', 'c', 'd']), 'a, b, c or d')
 								        self.assertEqual(text.get_text_list(['a', 'b', 'c'], 'and'), 'a, b and c')
 								        self.assertEqual(text.get_text_list(['a', 'b'], 'and'), 'a and b')
 								        self.assertEqual(text.get_text_list(['a']), 'a')
 								        self.assertEqual(text.get_text_list([]), '')
 								        with override('ar'):
 								            self.assertEqual(text.get_text_list(['a', 'b', 'c']), "a، b أو c")
 								    def test_smart_split(self):
 								        testdata = [
 								            ('This is "a person" test.',
 								                ['This', 'is', '"a person"', 'test.']),
 								            ('This is "a person\'s" test.',
 								                ['This', 'is', '"a person\'s"', 'test.']),
 								            ('This is "a person\\"s" test.',
 								                ['This', 'is', '"a person\\"s"', 'test.']),
 								            ('"a \'one',
 								                ['"a', "'one"]),
 								            ('all friends\' tests',
 								                ['all', 'friends\'', 'tests']),
 								            ('url search_page words="something else"',
 								                ['url', 'search_page', 'words="something else"']),
 								            ("url search_page words='something else'",
 								                ['url', 'search_page', "words='something else'"]),
 								            ('url search_page words "something else"',
 								                ['url', 'search_page', 'words', '"something else"']),
 								            ('url search_page words-"something else"',
 								                ['url', 'search_page', 'words-"something else"']),
 								            ('url search_page words=hello',
 								                ['url', 'search_page', 'words=hello']),
 								            ('url search_page words="something else',
 								                ['url', 'search_page', 'words="something', 'else']),
 								            ("cut:','|cut:' '",
 								                ["cut:','|cut:' '"]),
 								            (lazystr("a b c d"),  # Test for #20231
 								                ['a', 'b', 'c', 'd']),
 								        ]
 								        for test, expected in testdata:
 								            self.assertEqual(list(text.smart_split(test)), expected)
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								    def test_truncate_chars(self):
 								        truncator = text.Truncator(
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								            'The quick brown fox jumped over the lazy dog.'
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								        )
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual('The quick brown fox jumped over the lazy dog.',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            truncator.chars(100)),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual('The quick brown fox ...',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            truncator.chars(23)),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual('The quick brown fo.....',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            truncator.chars(23, '.....')),
 								        # Ensure that we normalize our unicode data first
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        nfc = text.Truncator('o\xfco\xfco\xfco\xfc')
 								        nfd = text.Truncator('ou\u0308ou\u0308ou\u0308ou\u0308')
 								        self.assertEqual('oüoüoüoü', nfc.chars(8))
 								        self.assertEqual('oüoüoüoü', nfd.chars(8))
 								        self.assertEqual('oü...', nfc.chars(5))
 								        self.assertEqual('oü...', nfd.chars(5))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
 								        # Ensure the final length is calculated correctly when there are
 								        # combining characters with no precomposed form, and that combining
 								        # characters are not split up.
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        truncator = text.Truncator('-B\u030AB\u030A----8')
 								        self.assertEqual('-B\u030A...', truncator.chars(5))
 								        self.assertEqual('-B\u030AB\u030A-...', truncator.chars(7))
 								        self.assertEqual('-B\u030AB\u030A----8', truncator.chars(8))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
 								        # Ensure the length of the end text is correctly calculated when it
 								        # contains combining characters with no precomposed form.
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        truncator = text.Truncator('-----')
 								        self.assertEqual('---B\u030A', truncator.chars(4, 'B\u030A'))
 								        self.assertEqual('-----', truncator.chars(5, 'B\u030A'))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
 								        # Make a best effort to shorten to the desired length, but requesting
 								        # a length shorter than the ellipsis shouldn't break
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual('...', text.Truncator('asdf').chars(1))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
-												Reorganized utils tests so it's all in separate modules. Thanks to Stephan Jaekel.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@13889 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-09-27 23:15:04 +08:00
+								    def test_truncate_words(self):
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        truncator = text.Truncator('The quick brown fox jumped over the lazy '
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            'dog.')
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual('The quick brown fox jumped over the lazy dog.',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            truncator.words(10))
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual('The quick brown fox...', truncator.words(4))
 								        self.assertEqual('The quick brown fox[snip]',
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            truncator.words(4, '[snip]'))
 								    def test_truncate_html_words(self):
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-14 01:24:49 +08:00
+								        truncator = text.Truncator('<p id="par"><strong><em>The quick brown fox'
 								            ' jumped over the lazy dog.</em></strong></p>')
 								        self.assertEqual('<p id="par"><strong><em>The quick brown fox jumped over'
 								            ' the lazy dog.</em></strong></p>', truncator.words(10, html=True))
 								        self.assertEqual('<p id="par"><strong><em>The quick brown fox...</em>'
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            '</strong></p>', truncator.words(4, html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-14 01:24:49 +08:00
+								        self.assertEqual('<p id="par"><strong><em>The quick brown fox....</em>'
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
+								            '</strong></p>', truncator.words(4, '....', html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-14 01:24:49 +08:00
+								        self.assertEqual('<p id="par"><strong><em>The quick brown fox</em>'
 								            '</strong></p>', truncator.words(4, '', html=True))
-												Fixed #10931 -- Made `Truncator` handle newlines properly. Thanks to gsong and Claude Paroz.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@17329 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2012-01-03 02:47:18 +08:00
+								        # Test with new line inside tag
 								        truncator = text.Truncator('<p>The quick <a href="xyz.html"\n'
 								            'id="mylink">brown fox</a> jumped over the lazy dog.</p>')
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual('<p>The quick <a href="xyz.html"\n'
-												Fixed #10931 -- Made `Truncator` handle newlines properly. Thanks to gsong and Claude Paroz.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@17329 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2012-01-03 02:47:18 +08:00
+								            'id="mylink">brown...</a></p>', truncator.words(3, '...', html=True))
-												Fixed #5025 -- Add a "truncatechars" template filter. Many thanks to Chris Beaven.

git-svn-id: http://code.djangoproject.com/svn/django/trunk@16542 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2011-07-14 21:47:10 +08:00
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-14 01:24:49 +08:00
+								        # Test self-closing tags
 								        truncator = text.Truncator('<br/>The <hr />quick brown fox jumped over'
 								            ' the lazy dog.')
 								        self.assertEqual('<br/>The <hr />quick brown...',
-												Fixed #21266 -- Fixed E201,E202 pep8 warnings.

											
										
										
											2013-10-15 03:13:14 +08:00
+								            truncator.words(3, '...', html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-14 01:24:49 +08:00
+								        truncator = text.Truncator('<br>The <hr/>quick <em>brown fox</em> '
 								            'jumped over the lazy dog.')
 								        self.assertEqual('<br>The <hr/>quick <em>brown...</em>',
-												Fixed #21266 -- Fixed E201,E202 pep8 warnings.

											
										
										
											2013-10-15 03:13:14 +08:00
+								            truncator.words(3, '...', html=True))
-												Fixed #19693 -- Made truncatewords_html handle self-closing tags

Thanks sneawo for the report and Jonathan Loy for the patch.

											
										
										
											2013-02-14 01:24:49 +08:00
-												Fixed #20568 -- truncatewords_html no longer splits words containing HTML entities.

Thanks yann0 at hotmail.com for the report.

											
										
										
											2013-07-18 16:45:34 +08:00
+								        # Test html entities
 								        truncator = text.Truncator('<i>Buenos d&iacute;as!'
 								            ' &#x00bf;C&oacute;mo est&aacute;?</i>')
 								        self.assertEqual('<i>Buenos d&iacute;as! &#x00bf;C&oacute;mo...</i>',
 								            truncator.words(3, '...', html=True))
 								        truncator = text.Truncator('<p>I &lt;3 python, what about you?</p>')
 								        self.assertEqual('<p>I &lt;3 python...</p>',
 								            truncator.words(3, '...', html=True))
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-12-01 05:21:37 +08:00
+								    def test_wrap(self):
 								        # text.wrap(value, width) is expected to break lines at spaces so
 								        # that each output line fits within `width` characters.
 								        digits = '1234 67 9'
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								        self.assertEqual(text.wrap(digits, 100), '1234 67 9')
 								        self.assertEqual(text.wrap(digits, 9), '1234 67 9')
 								        self.assertEqual(text.wrap(digits, 8), '1234 67\n9')
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-12-01 05:21:37 +08:00
 								        # A newline already present in the input is kept; only the
 								        # over-long second line gets an extra break.
 								        self.assertEqual(text.wrap('short\na long line', 7),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								                         'short\na long\nline')
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-12-01 05:21:37 +08:00
 								        # A word longer than the width is left whole on its own line.
 								        self.assertEqual(text.wrap('do-not-break-long-words please? ok', 8),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								                         'do-not-break-long-words\nplease?\nok')
-												Tests for utils.text.wrap

git-svn-id: http://code.djangoproject.com/svn/django/trunk@14752 bcc190cf-cafb-0310-a4f2-bffc1f526a37

											
										
										
											2010-12-01 05:21:37 +08:00
 								        # Same rule with a 23-character word that contains no hyphens.
 								        long_word = 'l%sng' % ('o' * 20)
 								        self.assertEqual(text.wrap(long_word, 20), long_word)
 								        self.assertEqual(text.wrap('a %s word' % long_word, 10),
-												Fixed #18269 -- Applied unicode_literals for Python 3 compatibility.

Thanks Vinay Sajip for the support of his django3 branch and
Jannis Leidel for the review.

											
										
										
											2012-06-08 00:08:47 +08:00
+								                         'a\n%s\nword' % long_word)
-												Fixed #14516 -- Extract methods from removetags and slugify template filters

Patch by @jphalip updated to apply, documentation and release notes
added.

I've documented strip_tags as well as remove_tags as the difference
between the two wouldn't be immediately obvious.

											
										
										
											2012-08-18 20:53:22 +08:00
-												Fixed #21572 -- Added unit test for django.utils.text.normalize_newlines.

											
										
										
											2013-12-07 16:28:22 +08:00
+								    def test_normalize_newlines(self):
 								        # "\r\n" and a bare "\r" are each expected to become a single "\n".
 								        self.assertEqual(text.normalize_newlines("abc\ndef\rghi\r\n"),
 								                         "abc\ndef\nghi\n")
 								        # "\n", "\r", "\r\n", "\r" -> four "\n" (the "\r\n" pair counts once).
 								        self.assertEqual(text.normalize_newlines("\n\r\r\n\r"), "\n\n\n\n")
 								        # Input without any line break, and the empty string, come back as is.
 								        self.assertEqual(text.normalize_newlines("abcdefghi"), "abcdefghi")
 								        self.assertEqual(text.normalize_newlines(""), "")
-												Fixed #21574 -- Handle bytes consistently in utils.text.normalize_newlines.

All input is now coerced to text before being normalized.
This changes nothing under Python 2 but it allows bytes
to be passed to the function without a TypeError under Python3
(bytes are assumed to be utf-8 encoded text).

Thanks to trac user vajrasky for the report.

											
										
										
											2013-12-12 22:58:14 +08:00
+								    def test_normalize_newlines_bytes(self):
 								        """normalize_newlines should be able to handle bytes too"""
 								        normalized = text.normalize_newlines(b"abc\ndef\rghi\r\n")
 								        # The newlines are normalized exactly as for text input ...
 								        self.assertEqual(normalized, "abc\ndef\nghi\n")
 								        # ... and the result is text (six.text_type), not bytes.
 								        self.assertIsInstance(normalized, six.text_type)
-												Fixed #14516 -- Extract methods from removetags and slugify template filters

Patch by @jphalip updated to apply, documentation and release notes
added.

I've documented strip_tags as well as remove_tags as the difference
between the two wouldn't be immediately obvious.

											
										
										
											2012-08-18 20:53:22 +08:00
+								    def test_slugify(self):
 								        # Each entry is (input, expected slug). In these cases punctuation
 								        # is dropped, letters are lowercased and the remaining words are
 								        # joined by a single hyphen.
 								        items = (
-												[py3] Made 212b9826bd Python 3-friendly

											
										
										
											2012-08-18 23:47:21 +08:00
+								            ('Hello, World!', 'hello-world'),
 								            ('spam & eggs', 'spam-eggs'),
-												Fixed #14516 -- Extract methods from removetags and slugify template filters

Patch by @jphalip updated to apply, documentation and release notes
added.

I've documented strip_tags as well as remove_tags as the difference
between the two wouldn't be immediately obvious.

											
										
										
											2012-08-18 20:53:22 +08:00
+								        )
 								        for value, output in items:
 								            self.assertEqual(text.slugify(value), output)
-												Fix #21185: Added tests for unescape_entities.

Also fixed a py3 incompatibility.
Thanks to brutasse for the report.

											
										
										
											2013-09-27 23:00:42 +08:00
 								    def test_unescape_entities(self):
 								        # Each entry is (input, expected output). The named (&amp;),
 								        # hexadecimal (&#x26;) and decimal (&#38;) references must all
 								        # decode to '&'; plain text and a bare '&' are left untouched.
 								        items = [
 								            ('', ''),
 								            ('foo', 'foo'),
 								            ('&amp;', '&'),
 								            ('&#x26;', '&'),
 								            ('&#38;', '&'),
 								            ('foo &amp; bar', 'foo & bar'),
 								            ('foo & bar', 'foo & bar'),
 								        ]
 								        for value, output in items:
 								            self.assertEqual(text.unescape_entities(value), output)
-												Fixed #21505 -- Added unit test for django.utils.text.get_valid_filename.

											
										
										
											2013-11-24 16:10:21 +08:00
 								    def test_get_valid_filename(self):
 								        # Of the leading run of punctuation only '-' and '_' are expected
 								        # to survive; the digits and the '.txt' suffix are kept.
 								        filename = "^&'@{}[],$=!-#()%+~_123.txt"
 								        self.assertEqual(text.get_valid_filename(filename), "-_123.txt")
-												Fixed #21731 -- Made javascript_quote escapes '</'.

											
										
										
											2014-01-04 12:57:50 +08:00
 								    def test_javascript_quote(self):
 								        # The input holds a literal backslash plus real newline, tab and
 								        # carriage-return characters. The expected output (a raw string)
 								        # has the single quotes, the backslash and the '/' of '</'
 								        # backslash-escaped, and the control characters spelled out as
 								        # the two-character sequences \n, \t and \r.
 								        input = "<script>alert('Hello \\xff.\n Welcome\there\r');</script>"
 								        output = r"<script>alert(\'Hello \\xff.\n Welcome\there\r\');<\/script>"
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
+								        with warnings.catch_warnings():
-												Fixed #21188 -- Introduced subclasses for to-be-removed-in-django-XX warnings

Thanks Anssi Kääriäinen for the idea and Simon Charette for the
review.

											
										
										
											2014-02-27 05:48:20 +08:00
 								            # Silence RemovedInDjango19Warning inside this block only; the
 								            # previous filters are restored when the `with` exits.
+								            warnings.simplefilter("ignore", RemovedInDjango19Warning)
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
+								            self.assertEqual(text.javascript_quote(input), output)
-												Fixed #21731 -- Made javascript_quote escapes '</'.

											
										
										
											2014-01-04 12:57:50 +08:00
-												Really hidden warnings in javascript_quote tests

Refs #21725.

											
										
										
											2014-03-05 15:57:13 +08:00
+								            # Exercising quote_double_quotes keyword argument
 								            # By default double quotes pass through unchanged; with
 								            # quote_double_quotes=True each one becomes &quot;.
 								            input = '"Text"'
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
+								            self.assertEqual(text.javascript_quote(input), '"Text"')
 								            self.assertEqual(text.javascript_quote(input, quote_double_quotes=True),
 								                             '&quot;Text&quot;')
-												Fixed #21725 -- Fixed JavaScript quoting encoding.

Thanks to nedbatchelder for the report.

											
										
										
											2014-02-16 01:55:33 +08:00
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
+								    @skipUnless(IS_WIDE_BUILD, 'Not running in a wide build of Python')
-												Fixed #21725 -- Fixed JavaScript quoting encoding.

Thanks to nedbatchelder for the report.

											
										
										
											2014-02-16 01:55:33 +08:00
+								    def test_javascript_quote_unicode(self):
 								        # The input contains U+1D543, a character outside the Basic
 								        # Multilingual Plane; the expected output shows it passing through
 								        # unchanged while quotes, backslash, control characters and '</'
 								        # are escaped. Skipped unless IS_WIDE_BUILD is true.
 								        input = "<script>alert('Hello \\xff.\n Wel𝕃come\there\r');</script>"
 								        output = r"<script>alert(\'Hello \\xff.\n Wel𝕃come\there\r\');<\/script>"
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
+								        with warnings.catch_warnings():
-												Fixed #21188 -- Introduced subclasses for to-be-removed-in-django-XX warnings

Thanks Anssi Kääriäinen for the idea and Simon Charette for the
review.

											
										
										
											2014-02-27 05:48:20 +08:00
 								            # Silence RemovedInDjango19Warning inside this block only.
+								            warnings.simplefilter("ignore", RemovedInDjango19Warning)
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
+								            self.assertEqual(text.javascript_quote(input), output)
 								    def test_deprecation(self):
 								        # Checks that calling text.javascript_quote() emits exactly one
 								        # warning whose message mentions escapejs().
-												Refs #23947 -- Worked around a bug in Python that prevents deprecation warnings from appearing in tests.

											
										
										
											2014-12-06 04:14:20 +08:00
 								        # NOTE(review): presumably clears the "already warned" registries so
 								        # a warning raised by an earlier test is reported again -- confirm
 								        # against django.test.utils.reset_warning_registry.
+								        reset_warning_registry()
-												Deprecated django.utils.text.javascript_quote.

Refs #21725.

											
										
										
											2014-02-21 21:46:23 +08:00
 								        # record=True collects the warnings in `w` instead of printing them;
 								        # the "always" filter stops duplicates from being suppressed.
+								        with warnings.catch_warnings(record=True) as w:
 								            warnings.simplefilter("always")
 								            text.javascript_quote('thingy')
 								            self.assertEqual(len(w), 1)
 								            self.assertIn('escapejs()', repr(w[0].message))