django1/tests/utils_tests/test_encoding.py

import datetime
import sys
import unittest
from unittest import mock
from urllib.parse import quote_plus

from django.test import SimpleTestCase
from django.utils.encoding import (
    DjangoUnicodeDecodeError, escape_uri_path, filepath_to_uri, force_bytes,
    force_str, get_system_encoding, iri_to_uri, repercent_broken_unicode,
    smart_bytes, smart_str, uri_to_iri,
)
from django.utils.functional import SimpleLazyObject
from django.utils.translation import gettext_lazy


class TestEncodingUtils(SimpleTestCase):
    """Tests for force_str(), force_bytes(), smart_str(), smart_bytes(),
    get_system_encoding() and repercent_broken_unicode()."""

    def test_force_str_exception(self):
        """
        A __str__ that returns bytes makes force_str() raise TypeError.
        """
        class BrokenStr:
            def __str__(self):
                return b'\xc3\xb6\xc3\xa4\xc3\xbc'

        broken = BrokenStr()
        # str() refuses any __str__ result that is not text, and force_str()
        # is expected to let that TypeError through.
        with self.assertRaises(TypeError):
            force_str(broken)

    def test_force_str_lazy(self):
        # The lazy wrapper must be resolved to a plain str, not a proxy.
        lazy_value = SimpleLazyObject(lambda: 'x')
        resolved = force_str(lazy_value)
        self.assertIs(type(resolved), str)

    def test_force_str_DjangoUnicodeDecodeError(self):
        # Undecodable bytes are reported together with the offending input.
        expected_message = (
            "'utf-8' codec can't decode byte 0xff in position 0: invalid "
            "start byte. You passed in b'\\xff' (<class 'bytes'>)"
        )
        with self.assertRaisesMessage(DjangoUnicodeDecodeError, expected_message):
            force_str(b'\xff')

    def test_force_bytes_exception(self):
        """
        force_bytes() converts an exception whose args contain non-ASCII
        characters.
        """
        text = "This is an exception, voilà"
        error = ValueError(text)
        self.assertEqual(force_bytes(error), text.encode())
        # With errors='ignore' the non-ASCII character is dropped.
        ascii_only = force_bytes(error, encoding='ascii', errors='ignore')
        self.assertEqual(ascii_only, b'This is an exception, voil')

    def test_force_bytes_strings_only(self):
        # strings_only=True hands a date back unchanged.
        a_date = datetime.date.today()
        self.assertEqual(force_bytes(a_date, strings_only=True), a_date)

    def test_force_bytes_encoding(self):
        # Bytes input is re-encoded to the requested target encoding.
        utf8_payload = 'This is an exception, voilà'.encode()
        self.assertEqual(
            force_bytes(utf8_payload, encoding='ascii', errors='ignore'),
            b'This is an exception, voil',
        )

    def test_force_bytes_memory_view(self):
        raw = b'abc'
        converted = force_bytes(memoryview(raw))
        # Equality alone proves nothing here: a memoryview over bytes compares
        # equal to those bytes, so the concrete type is checked as well.
        self.assertIs(type(converted), bytes)
        self.assertEqual(converted, raw)

    def test_smart_bytes(self):
        class NonAscii:
            def __str__(self):
                return 'ŠĐĆŽćžšđ'

        # Lazy translation objects are returned as the very same object.
        lazy_text = gettext_lazy('x')
        self.assertIs(smart_bytes(lazy_text), lazy_text)

        expectations = (
            (NonAscii(), b'\xc5\xa0\xc4\x90\xc4\x86\xc5\xbd\xc4\x87\xc5\xbe\xc5\xa1\xc4\x91'),
            (1, b'1'),
            ('foo', b'foo'),
        )
        for value, expected in expectations:
            self.assertEqual(smart_bytes(value), expected)

    def test_smart_str(self):
        class NonAscii:
            def __str__(self):
                return 'ŠĐĆŽćžšđ'

        # Lazy translation objects are returned as the very same object.
        lazy_text = gettext_lazy('x')
        self.assertIs(smart_str(lazy_text), lazy_text)

        expectations = (
            (NonAscii(), '\u0160\u0110\u0106\u017d\u0107\u017e\u0161\u0111'),
            (1, '1'),
            ('foo', 'foo'),
        )
        for value, expected in expectations:
            self.assertEqual(smart_str(value), expected)

    def test_get_default_encoding(self):
        # When the locale lookup blows up, 'ascii' is the expected answer.
        failing_locale = mock.patch('locale.getdefaultlocale', side_effect=Exception)
        with failing_locale:
            self.assertEqual(get_system_encoding(), 'ascii')

    def test_repercent_broken_unicode_recursion_error(self):
        # One invalid byte per permitted stack frame: an implementation that
        # recursed once per byte would exceed the recursion limit.
        depth = sys.getrecursionlimit()
        invalid_bytes = b'\xfc' * depth
        try:
            self.assertEqual(repercent_broken_unicode(invalid_bytes), b'%FC' * depth)
        except RecursionError:
            self.fail('Unexpected RecursionError raised.')


class TestRFC3987IEncodingUtils(unittest.TestCase):
    """Tests for filepath_to_uri(), iri_to_uri(), uri_to_iri() and
    escape_uri_path()."""

    def test_filepath_to_uri(self):
        # None passes through untouched.
        self.assertIsNone(filepath_to_uri(None))
        # Backslashes become forward slashes and non-ASCII text is quoted.
        backslash_path = 'upload\\чубака.mp4'
        self.assertEqual(filepath_to_uri(backslash_path), 'upload/%D1%87%D1%83%D0%B1%D0%B0%D0%BA%D0%B0.mp4')

    def test_iri_to_uri(self):
        iri_uri_pairs = [
            # Non-ASCII characters are percent-encoded as UTF-8.
            ('red%09rosé#red', 'red%09ros%C3%A9#red'),
            ('/blog/for/Jürgen Münster/', '/blog/for/J%C3%BCrgen%20M%C3%BCnster/'),
            ('locations/%s' % quote_plus('Paris & Orléans'), 'locations/Paris+%26+Orl%C3%A9ans'),

            # Reserved characters are left alone.
            ('%&', '%&'),
            ('red&♥ros%#red', 'red&%E2%99%A5ros%#red'),
            (gettext_lazy('red&♥ros%#red'), 'red&%E2%99%A5ros%#red'),
        ]

        for source, expected in iri_uri_pairs:
            with self.subTest(source):
                self.assertEqual(iri_to_uri(source), expected)

                # Converting an already converted value must change nothing.
                converted_twice = iri_to_uri(iri_to_uri(source))
                self.assertEqual(converted_twice, expected)

    def test_uri_to_iri(self):
        uri_iri_pairs = [
            (None, None),
            # Well-formed UTF-8 escapes are turned back into characters.
            ('/%e2%89%Ab%E2%99%a5%E2%89%aB/', '/≫♥≫/'),
            ('/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93', '/♥♥/?utf8=✓'),
            ('/%41%5a%6B/', '/AZk/'),
            # Reserved and non-URL-valid ASCII escapes stay encoded.
            ('/%25%20%02%41%7b/', '/%25%20%02A%7b/'),
            # Malformed UTF-8 escapes stay encoded.
            ('/%AAd%AAj%AAa%AAn%AAg%AAo%AA/', '/%AAd%AAj%AAa%AAn%AAg%AAo%AA/'),
            ('/%E2%99%A5%E2%E2%99%A5/', '/♥%E2♥/'),
            ('/%E2%99%A5%E2%99%E2%99%A5/', '/♥%E2%99♥/'),
            ('/%E2%E2%99%A5%E2%99%A5%99/', '/%E2♥♥%99/'),
            ('/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93', '/♥♥/?utf8=%9C%93✓%9C%93'),
        ]

        for source, expected in uri_iri_pairs:
            with self.subTest(source):
                self.assertEqual(uri_to_iri(source), expected)

                # Converting an already converted value must change nothing.
                converted_twice = uri_to_iri(uri_to_iri(source))
                self.assertEqual(converted_twice, expected)

    def test_complementarity(self):
        # Each pair is (uri, iri); a round trip through both converters is
        # expected to give back the starting value.
        uri_iri_pairs = [
            ('/blog/for/J%C3%BCrgen%20M%C3%BCnster/', '/blog/for/J\xfcrgen%20M\xfcnster/'),
            ('%&', '%&'),
            ('red&%E2%99%A5ros%#red', 'red&♥ros%#red'),
            ('/%E2%99%A5%E2%99%A5/', '/♥♥/'),
            ('/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93', '/♥♥/?utf8=✓'),
            ('/%25%20%02%7b/', '/%25%20%02%7b/'),
            ('/%AAd%AAj%AAa%AAn%AAg%AAo%AA/', '/%AAd%AAj%AAa%AAn%AAg%AAo%AA/'),
            ('/%E2%99%A5%E2%E2%99%A5/', '/♥%E2♥/'),
            ('/%E2%99%A5%E2%99%E2%99%A5/', '/♥%E2%99♥/'),
            ('/%E2%E2%99%A5%E2%99%A5%99/', '/%E2♥♥%99/'),
            ('/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93', '/♥♥/?utf8=%9C%93✓%9C%93'),
        ]

        for uri, iri in uri_iri_pairs:
            with self.subTest(uri):
                uri_round_trip = iri_to_uri(uri_to_iri(uri))
                self.assertEqual(uri_round_trip, uri)
                iri_round_trip = uri_to_iri(iri_to_uri(iri))
                self.assertEqual(iri_round_trip, iri)

    def test_escape_uri_path(self):
        path_expectations = [
            (
                '/;some/=awful/?path/:with/@lots/&of/+awful/chars',
                '/%3Bsome/%3Dawful/%3Fpath/:with/@lots/&of/+awful/chars',
            ),
            ('/foo#bar', '/foo%23bar'),
            ('/foo?bar', '/foo%3Fbar'),
        ]
        for raw_path, escaped_path in path_expectations:
            with self.subTest(raw_path):
                self.assertEqual(escape_uri_path(raw_path), escaped_path)
Fixed #18719 -- Made force_bytes more consistent with force_text. 2013-09-06 23:28:28 +08:00			`import datetime`
Fixed CVE-2019-14235 -- Fixed potential memory exhaustion in django.utils.encoding.uri_to_iri(). Thanks to Guido Vranken for initial report. 2019-07-19 23:04:53 +08:00			`import sys`
Sorted imports with isort; refs #23860. 2015-01-28 20:35:27 +08:00			`import unittest`
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`from unittest import mock`
Refs #23919 -- Replaced usage of django.utils.http utilities with Python equivalents Thanks Tim Graham for the review. 2017-01-26 21:25:15 +08:00			`from urllib.parse import quote_plus`
Stopped using django.utils.unittest in the test suite. Refs #20680. 2013-07-01 20:22:27 +08:00
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-02 04:48:53 +08:00			`from django.test import SimpleTestCase`
Fixed #18456 -- Added path escaping to HttpRequest.get_full_path(). 2014-10-31 23:43:34 +08:00			`from django.utils.encoding import (`
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-02 04:48:53 +08:00			`DjangoUnicodeDecodeError, escape_uri_path, filepath_to_uri, force_bytes,`
Fixed CVE-2019-14235 -- Fixed potential memory exhaustion in django.utils.encoding.uri_to_iri(). Thanks to Guido Vranken for initial report. 2019-07-19 23:04:53 +08:00			`force_str, get_system_encoding, iri_to_uri, repercent_broken_unicode,`
			`smart_bytes, smart_str, uri_to_iri,`
Fixed #18456 -- Added path escaping to HttpRequest.get_full_path(). 2014-10-31 23:43:34 +08:00			`)`
Fixed #24836 -- Made force_text() resolve lazy objects. 2015-05-27 04:46:13 +08:00			`from django.utils.functional import SimpleLazyObject`
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`from django.utils.translation import gettext_lazy`
Fixed #18902 -- Made force_bytes properly handle exception input Thanks Aymeric Augustin for the report and the initial patch. 2012-09-04 15:24:39 +08:00

Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-02 04:48:53 +08:00			`class TestEncodingUtils(SimpleTestCase):`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`def test_force_str_exception(self):`
Fixed #20812 -- Error out if __unicode__/__str__ doesn't return a text type. 2013-09-07 01:16:06 +08:00			`"""`
Refs #23919 -- Removed unneeded str() calls 2017-01-20 17:20:53 +08:00			`Broken __str__ actually raises an error.`
Fixed #20812 -- Error out if __unicode__/__str__ doesn't return a text type. 2013-09-07 01:16:06 +08:00			`"""`
Refs #23919 -- Stopped inheriting from object to define new style classes. 2017-01-19 15:39:46 +08:00			`class MyString:`
Fixed #20812 -- Error out if __unicode__/__str__ doesn't return a text type. 2013-09-07 01:16:06 +08:00			`def __str__(self):`
			`return b'\xc3\xb6\xc3\xa4\xc3\xbc'`

Refs #23919 -- Removed six.PY2/PY3 usage Thanks Tim Graham for the review. 2016-12-01 18:38:01 +08:00			`# str(s) raises a TypeError if the result is not a text type.`
			`with self.assertRaises(TypeError):`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`force_str(MyString())`
Fixed #18719 -- Made force_bytes more consistent with force_text. 2013-09-06 23:28:28 +08:00
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`def test_force_str_lazy(self):`
Fixed #24836 -- Made force_text() resolve lazy objects. 2015-05-27 04:46:13 +08:00			`s = SimpleLazyObject(lambda: 'x')`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`self.assertIs(type(force_str(s)), str)`
Fixed #24836 -- Made force_text() resolve lazy objects. 2015-05-27 04:46:13 +08:00
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`def test_force_str_DjangoUnicodeDecodeError(self):`
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-02 04:48:53 +08:00			`msg = (`
			`"'utf-8' codec can't decode byte 0xff in position 0: invalid "`
			`"start byte. You passed in b'\\xff' (<class 'bytes'>)"`
			`)`
			`with self.assertRaisesMessage(DjangoUnicodeDecodeError, msg):`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`force_str(b'\xff')`
Added a test for force_text()'s DjangoUnicodeDecodeError path. 2017-02-02 04:48:53 +08:00
Fixed #18902 -- Made force_bytes properly handle exception input Thanks Aymeric Augustin for the report and the initial patch. 2012-09-04 15:24:39 +08:00			`def test_force_bytes_exception(self):`
			`"""`
Refs #27392 -- Removed "Tests that", "Ensures that", etc. from test docstrings. 2016-10-27 15:53:39 +08:00			`force_bytes knows how to convert to bytes an exception`
Fixed #18902 -- Made force_bytes properly handle exception input Thanks Aymeric Augustin for the report and the initial patch. 2012-09-04 15:24:39 +08:00			`containing non-ASCII characters in its args.`
			`"""`
			`error_msg = "This is an exception, voilà"`
			`exc = ValueError(error_msg)`
Refs #23919 -- Removed default 'utf-8' argument for str.encode()/decode(). 2017-02-08 01:05:47 +08:00			`self.assertEqual(force_bytes(exc), error_msg.encode())`
Removed an untested and broken branch in force_bytes() (refs #6353). The new test crashed in the removed branch. It's unclear if the branch has value since c6a2bd9b962af1cdf46f964589e6023046cfa8ec didn't include tests. 2017-02-04 08:36:53 +08:00			`self.assertEqual(force_bytes(exc, encoding='ascii', errors='ignore'), b'This is an exception, voil')`
Fixed #20108 -- Fixed filepath_to_uri decoding error This was a regression due to unicode_literals usage. Thanks Ivan Virabyan for the report and the initial patch. 2013-03-23 00:55:12 +08:00
Fixed #18719 -- Made force_bytes more consistent with force_text. 2013-09-06 23:28:28 +08:00			`def test_force_bytes_strings_only(self):`
			`today = datetime.date.today()`
			`self.assertEqual(force_bytes(today, strings_only=True), today)`

Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`def test_force_bytes_encoding(self):`
			`error_msg = 'This is an exception, voilà'.encode()`
			`result = force_bytes(error_msg, encoding='ascii', errors='ignore')`
			`self.assertEqual(result, b'This is an exception, voil')`

			`def test_force_bytes_memory_view(self):`
Made test for memoryview handling in force_bytes() more strict. 2018-07-09 23:01:42 +08:00			`data = b'abc'`
			`result = force_bytes(memoryview(data))`
			`# Type check is needed because memoryview(bytes) == bytes.`
			`self.assertIs(type(result), bytes)`
			`self.assertEqual(result, data)`
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00
			`def test_smart_bytes(self):`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 23:45:54 +08:00			`class Test:`
Refs #23919 -- Removed six.PY2/PY3 usage Thanks Tim Graham for the review. 2016-12-01 18:38:01 +08:00			`def __str__(self):`
			`return 'ŠĐĆŽćžšđ'`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 23:45:54 +08:00
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`lazy_func = gettext_lazy('x')`
			`self.assertIs(smart_bytes(lazy_func), lazy_func)`
			`self.assertEqual(smart_bytes(Test()), b'\xc5\xa0\xc4\x90\xc4\x86\xc5\xbd\xc4\x87\xc5\xbe\xc5\xa1\xc4\x91')`
			`self.assertEqual(smart_bytes(1), b'1')`
			`self.assertEqual(smart_bytes('foo'), b'foo')`

Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`def test_smart_str(self):`
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`class Test:`
Refs #23919 -- Removed six.PY2/PY3 usage Thanks Tim Graham for the review. 2016-12-01 18:38:01 +08:00			`def __str__(self):`
			`return 'ŠĐĆŽćžšđ'`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 23:45:54 +08:00
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`lazy_func = gettext_lazy('x')`
Refs #27753 -- Favored force/smart_str() over force/smart_text(). 2017-01-26 17:08:08 +08:00			`self.assertIs(smart_str(lazy_func), lazy_func)`
			`self.assertEqual(smart_str(Test()), '\u0160\u0110\u0106\u017d\u0107\u017e\u0161\u0111')`
			`self.assertEqual(smart_str(1), '1')`
			`self.assertEqual(smart_str('foo'), 'foo')`
Fixed #18456 -- Added path escaping to HttpRequest.get_full_path(). 2014-10-31 23:43:34 +08:00
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`def test_get_default_encoding(self):`
			`with mock.patch('locale.getdefaultlocale', side_effect=Exception):`
			`self.assertEqual(get_system_encoding(), 'ascii')`

Fixed CVE-2019-14235 -- Fixed potential memory exhaustion in django.utils.encoding.uri_to_iri(). Thanks to Guido Vranken for initial report. 2019-07-19 23:04:53 +08:00			`def test_repercent_broken_unicode_recursion_error(self):`
			`# Prepare a string long enough to force a recursion error if the tested`
			`# function uses recursion.`
			`data = b'\xfc' * sys.getrecursionlimit()`
			`try:`
			`self.assertEqual(repercent_broken_unicode(data), b'%FC' * sys.getrecursionlimit())`
			`except RecursionError:`
			`self.fail('Unexpected RecursionError raised.')`

Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00
			`class TestRFC3987IEncodingUtils(unittest.TestCase):`

Fixed #20108 -- Fixed filepath_to_uri decoding error This was a regression due to unicode_literals usage. Thanks Ivan Virabyan for the report and the initial patch. 2013-03-23 00:55:12 +08:00			`def test_filepath_to_uri(self):`
Used more specific unittest assertions in tests. * assertIsNone()/assertIsNotNone() instead of comparing to None. * assertLess() for < comparisons. * assertIs() for 'is' expressions. * assertIsInstance() for isinstance() expressions. * rounding of assertAlmostEqual() for round() expressions. * assertIs(..., True/False) instead of comparing to True/False. * assertIs()/assertIsNot() for ==/!= comparisons. * assertNotEqual() for == comparisons. * assertTrue()/assertFalse() instead of comparing to True/False. 2019-10-21 16:55:05 +08:00			`self.assertIsNone(filepath_to_uri(None))`
Fixed E128 flake8 warnings in tests/. 2016-04-08 10:04:45 +08:00			`self.assertEqual(filepath_to_uri('upload\\чубака.mp4'), 'upload/%D1%87%D1%83%D0%B1%D0%B0%D0%BA%D0%B0.mp4')`
Fixed #21198 -- Prevented invalid use of @python_2_unicode_compatible. Thanks jpic for the report and chmodas for working on a patch. Reverts 2ea80b94. Refs #19362. 2013-10-14 00:06:58 +08:00
Consolidated some text utils into the utils_tests test package. 2014-09-23 20:45:59 +08:00			`def test_iri_to_uri(self):`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`cases = [`
			`# Valid UTF-8 sequences are encoded.`
			`('red%09rosé#red', 'red%09ros%C3%A9#red'),`
			`('/blog/for/Jürgen Münster/', '/blog/for/J%C3%BCrgen%20M%C3%BCnster/'),`
Refs #23919 -- Replaced usage of django.utils.http utilities with Python equivalents Thanks Tim Graham for the review. 2017-01-26 21:25:15 +08:00			`('locations/%s' % quote_plus('Paris & Orléans'), 'locations/Paris+%26+Orl%C3%A9ans'),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00
			`# Reserved chars remain unescaped.`
			`('%&', '%&'),`
			`('red&♥ros%#red', 'red&%E2%99%A5ros%#red'),`
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`(gettext_lazy('red&♥ros%#red'), 'red&%E2%99%A5ros%#red'),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`]`

			`for iri, uri in cases:`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 17:58:06 +08:00			`with self.subTest(iri):`
			`self.assertEqual(iri_to_uri(iri), uri)`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 17:58:06 +08:00			`# Test idempotency.`
			`self.assertEqual(iri_to_uri(iri_to_uri(iri)), uri)`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00
			`def test_uri_to_iri(self):`
			`cases = [`
Completed test coverage for django.utils.encoding. 2017-02-23 09:54:55 +08:00			`(None, None),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`# Valid UTF-8 sequences are decoded.`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 21:55:44 +08:00			`('/%e2%89%Ab%E2%99%a5%E2%89%aB/', '/≫♥≫/'),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`('/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93', '/♥♥/?utf8=✓'),`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 21:55:44 +08:00			`('/%41%5a%6B/', '/AZk/'),`
			`# Reserved and non-URL valid ASCII chars are not decoded.`
			`('/%25%20%02%41%7b/', '/%25%20%02A%7b/'),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`# Broken UTF-8 sequences remain escaped.`
			`('/%AAd%AAj%AAa%AAn%AAg%AAo%AA/', '/%AAd%AAj%AAa%AAn%AAg%AAo%AA/'),`
			`('/%E2%99%A5%E2%E2%99%A5/', '/♥%E2♥/'),`
			`('/%E2%99%A5%E2%99%E2%99%A5/', '/♥%E2%99♥/'),`
			`('/%E2%E2%99%A5%E2%99%A5%99/', '/%E2♥♥%99/'),`
			`('/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93', '/♥♥/?utf8=%9C%93✓%9C%93'),`
			`]`
Consolidated some text utils into the utils_tests test package. 2014-09-23 20:45:59 +08:00
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`for uri, iri in cases:`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 17:58:06 +08:00			`with self.subTest(uri):`
			`self.assertEqual(uri_to_iri(uri), iri)`
Consolidated some text utils into the utils_tests test package. 2014-09-23 20:45:59 +08:00
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 17:58:06 +08:00			`# Test idempotency.`
			`self.assertEqual(uri_to_iri(uri_to_iri(uri)), iri)`
Consolidated some text utils into the utils_tests test package. 2014-09-23 20:45:59 +08:00
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`def test_complementarity(self):`
			`cases = [`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 21:55:44 +08:00			`('/blog/for/J%C3%BCrgen%20M%C3%BCnster/', '/blog/for/J\xfcrgen%20M\xfcnster/'),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`('%&', '%&'),`
			`('red&%E2%99%A5ros%#red', 'red&♥ros%#red'),`
			`('/%E2%99%A5%E2%99%A5/', '/♥♥/'),`
			`('/%E2%99%A5%E2%99%A5/?utf8=%E2%9C%93', '/♥♥/?utf8=✓'),`
Fixed #26005 -- Fixed some percent decoding cases in uri_to_iri(). 2017-02-07 21:55:44 +08:00			`('/%25%20%02%7b/', '/%25%20%02%7b/'),`
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`('/%AAd%AAj%AAa%AAn%AAg%AAo%AA/', '/%AAd%AAj%AAa%AAn%AAg%AAo%AA/'),`
			`('/%E2%99%A5%E2%E2%99%A5/', '/♥%E2♥/'),`
			`('/%E2%99%A5%E2%99%E2%99%A5/', '/♥%E2%99♥/'),`
			`('/%E2%E2%99%A5%E2%99%A5%99/', '/%E2♥♥%99/'),`
			`('/%E2%99%A5%E2%99%A5/?utf8=%9C%93%E2%9C%93%9C%93', '/♥♥/?utf8=%9C%93✓%9C%93'),`
			`]`
Consolidated some text utils into the utils_tests test package. 2014-09-23 20:45:59 +08:00
Fixed #19508 -- Implemented uri_to_iri as per RFC. Thanks Loic Bistuer for helping in shaping the patch and Claude Paroz for the review. 2014-07-22 20:25:22 +08:00			`for uri, iri in cases:`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 17:58:06 +08:00			`with self.subTest(uri):`
			`self.assertEqual(iri_to_uri(uri_to_iri(uri)), uri)`
			`self.assertEqual(uri_to_iri(iri_to_uri(iri)), iri)`
Cleaned up some forms tests. Thanks Berker Peksag and Tim Graham for the reviews. Refs #24219. 2015-01-25 23:45:54 +08:00
			`def test_escape_uri_path(self):`
Refs #27804 -- Used subTest() in utils_tests/test_encoding.py. 2019-08-26 17:58:06 +08:00			`cases = [`
			`(`
			`'/;some/=awful/?path/:with/@lots/&of/+awful/chars',`
			`'/%3Bsome/%3Dawful/%3Fpath/:with/@lots/&of/+awful/chars',`
			`),`
			`('/foo#bar', '/foo%23bar'),`
			`('/foo?bar', '/foo%3Fbar'),`
			`]`
			`for uri, expected in cases:`
			`with self.subTest(uri):`
			`self.assertEqual(escape_uri_path(uri), expected)`