django1/django/utils/http.py

import re
import urllib
from email.Utils import formatdate

from django.utils.encoding import smart_str, force_unicode
from django.utils.functional import allow_lazy

ETAG_MATCH = re.compile(r'(?:W/)?"((?:\\.|[^"])*)"')

def urlquote(url, safe='/'):
    """
    A version of Python's urllib.quote() function that can operate on unicode
    strings. The url is first UTF-8 encoded before quoting. The returned string
    can safely be used as part of an argument to a subsequent iri_to_uri() call
    without double-quoting occurring.
    """
    return force_unicode(urllib.quote(smart_str(url), smart_str(safe)))

urlquote = allow_lazy(urlquote, unicode)

def urlquote_plus(url, safe=''):
    """
    A version of Python's urllib.quote_plus() function that can operate on
    unicode strings. The url is first UTF-8 encoded before quoting. The
    returned string can safely be used as part of an argument to a subsequent
    iri_to_uri() call without double-quoting occurring.
    """
    return force_unicode(urllib.quote_plus(smart_str(url), smart_str(safe)))
urlquote_plus = allow_lazy(urlquote_plus, unicode)

def urlencode(query, doseq=0):
    """
    A version of Python's urllib.urlencode() function that can operate on
    unicode strings. The parameters are first case to UTF-8 encoded strings and
    then encoded as per normal.
    """
    if hasattr(query, 'items'):
        query = query.items()
    return urllib.urlencode(
        [(smart_str(k),
         isinstance(v, (list,tuple)) and [smart_str(i) for i in v] or smart_str(v))
            for k, v in query],
        doseq)

def cookie_date(epoch_seconds=None):
    """
    Formats the time to ensure compatibility with Netscape's cookie standard.

    Accepts a floating point number expressed in seconds since the epoch, in
    UTC - such as that outputted by time.time(). If set to None, defaults to
    the current time.

    Outputs a string in the format 'Wdy, DD-Mon-YYYY HH:MM:SS GMT'.
    """
    rfcdate = formatdate(epoch_seconds)
    return '%s-%s-%s GMT' % (rfcdate[:7], rfcdate[8:11], rfcdate[12:25])

def http_date(epoch_seconds=None):
    """
    Formats the time to match the RFC1123 date format as specified by HTTP
    RFC2616 section 3.3.1.

    Accepts a floating point number expressed in seconds since the epoch, in
    UTC - such as that outputted by time.time(). If set to None, defaults to
    the current time.

    Outputs a string in the format 'Wdy, DD Mon YYYY HH:MM:SS GMT'.
    """
    rfcdate = formatdate(epoch_seconds)
    return '%s GMT' % rfcdate[:25]

# Base 36 functions: useful for generating compact URLs

def base36_to_int(s):
    """
    Converts a base 36 string to an ``int``. To prevent
    overconsumption of server resources, raises ``ValueError` if the
    input is longer than 13 base36 digits (13 digits is sufficient to
    base36-encode any 64-bit integer).
    """
    if len(s) > 13:
        raise ValueError("Base36 input too large")
    return int(s, 36)

def int_to_base36(i):
    """
    Converts an integer to a base36 string
    """
    digits = "0123456789abcdefghijklmnopqrstuvwxyz"
    factor = 0
    # Find starting factor
    while True:
        factor += 1
        if i < 36 ** factor:
            factor -= 1
            break
    base36 = []
    # Construct base36 representation
    while factor >= 0:
        j = 36 ** factor
        base36.append(digits[i / j])
        i = i % j
        factor -= 1
    return ''.join(base36)

def parse_etags(etag_str):
    """
    Parses a string with one or several etags passed in If-None-Match and
    If-Match headers by the rules in RFC 2616. Returns a list of etags
    without surrounding double quotes (") and unescaped from \<CHAR>.
    """
    etags = ETAG_MATCH.findall(etag_str)
    if not etags:
        # etag_str has wrong format, treat it as an opaque string then
        return [etag_str]
    etags = [e.decode('string_escape') for e in etags]
    return etags

def quote_etag(etag):
    """
    Wraps a string in double quotes escaping contents as necesary.
    """
    return '"%s"' % etag.replace('\\', '\\\\').replace('"', '\\"')
Fixed #5791 -- Added early-bailout support for views (ETags and Last-modified). This provides support for views that can have their ETag and/or Last-modified values computed much more quickly than the view itself. Supports all HTTP verbs (not just GET). Documentation and tests need a little more fleshing out (I'm not happy with the documentation at the moment, since it's a bit backwards), but the functionality is correct. git-svn-id: http://code.djangoproject.com/svn/django/trunk@10114 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2009-03-22 15:58:29 +08:00			`import re`
Merged Unicode branch into trunk (r4952:5608). This should be fully backwards compatible for all practical purposes. Fixed #2391, #2489, #2996, #3322, #3344, #3370, #3406, #3432, #3454, #3492, #3582, #3690, #3878, #3891, #3937, #4039, #4141, #4227, #4286, #4291, #4300, #4452, #4702 git-svn-id: http://code.djangoproject.com/svn/django/trunk@5609 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-07-04 20:11:04 +08:00			`import urllib`
Fixed #5816 -- Fixed a regression from [6333] that generates incorrect cookie "expires" dates when using a locale other than English. Introduced `http_date` and `cookie_date` utility functions. Thanks for the report Michael Lemaire. Thanks for the patch Karen Tracey and `SmileyChris`. git-svn-id: http://code.djangoproject.com/svn/django/trunk@6634 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-10-31 11:59:40 +08:00			`from email.Utils import formatdate`

Merged Unicode branch into trunk (r4952:5608). This should be fully backwards compatible for all practical purposes. Fixed #2391, #2489, #2996, #3322, #3344, #3370, #3406, #3432, #3454, #3492, #3582, #3690, #3878, #3891, #3937, #4039, #4141, #4227, #4286, #4291, #4300, #4452, #4702 git-svn-id: http://code.djangoproject.com/svn/django/trunk@5609 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-07-04 20:11:04 +08:00			`from django.utils.encoding import smart_str, force_unicode`
			`from django.utils.functional import allow_lazy`

Fixed #5791 -- Added early-bailout support for views (ETags and Last-modified). This provides support for views that can have their ETag and/or Last-modified values computed much more quickly than the view itself. Supports all HTTP verbs (not just GET). Documentation and tests need a little more fleshing out (I'm not happy with the documentation at the moment, since it's a bit backwards), but the functionality is correct. git-svn-id: http://code.djangoproject.com/svn/django/trunk@10114 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2009-03-22 15:58:29 +08:00			`ETAG_MATCH = re.compile(r'(?:W/)?"((?:\\.\|[^"])*)"')`

Merged Unicode branch into trunk (r4952:5608). This should be fully backwards compatible for all practical purposes. Fixed #2391, #2489, #2996, #3322, #3344, #3370, #3406, #3432, #3454, #3492, #3582, #3690, #3878, #3891, #3937, #4039, #4141, #4227, #4286, #4291, #4300, #4452, #4702 git-svn-id: http://code.djangoproject.com/svn/django/trunk@5609 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-07-04 20:11:04 +08:00			`def urlquote(url, safe='/'):`
			`"""`
			`A version of Python's urllib.quote() function that can operate on unicode`
			`strings. The url is first UTF-8 encoded before quoting. The returned string`
			`can safely be used as part of an argument to a subsequent iri_to_uri() call`
			`without double-quoting occurring.`
			`"""`
Fixed #13765 - 'safe' parameter for urlencode filter Thanks to KyleMac for the suggestion and SmileyChris for the patch git-svn-id: http://code.djangoproject.com/svn/django/trunk@13849 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2010-09-14 07:01:34 +08:00			`return force_unicode(urllib.quote(smart_str(url), smart_str(safe)))`
Fixed #5734 -- Fixed an omission where we weren't passing the "safe" argument upstream in django.utils.http.urlquote(). Thanks, Thomas Güttler. git-svn-id: http://code.djangoproject.com/svn/django/trunk@6554 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-10-20 16:38:59 +08:00
Merged Unicode branch into trunk (r4952:5608). This should be fully backwards compatible for all practical purposes. Fixed #2391, #2489, #2996, #3322, #3344, #3370, #3406, #3432, #3454, #3492, #3582, #3690, #3878, #3891, #3937, #4039, #4141, #4227, #4286, #4291, #4300, #4452, #4702 git-svn-id: http://code.djangoproject.com/svn/django/trunk@5609 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-07-04 20:11:04 +08:00			`urlquote = allow_lazy(urlquote, unicode)`

			`def urlquote_plus(url, safe=''):`
			`"""`
			`A version of Python's urllib.quote_plus() function that can operate on`
			`unicode strings. The url is first UTF-8 encoded before quoting. The`
			`returned string can safely be used as part of an argument to a subsequent`
			`iri_to_uri() call without double-quoting occurring.`
			`"""`
Fixed #13765 - 'safe' parameter for urlencode filter Thanks to KyleMac for the suggestion and SmileyChris for the patch git-svn-id: http://code.djangoproject.com/svn/django/trunk@13849 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2010-09-14 07:01:34 +08:00			`return force_unicode(urllib.quote_plus(smart_str(url), smart_str(safe)))`
Merged Unicode branch into trunk (r4952:5608). This should be fully backwards compatible for all practical purposes. Fixed #2391, #2489, #2996, #3322, #3344, #3370, #3406, #3432, #3454, #3492, #3582, #3690, #3878, #3891, #3937, #4039, #4141, #4227, #4286, #4291, #4300, #4452, #4702 git-svn-id: http://code.djangoproject.com/svn/django/trunk@5609 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-07-04 20:11:04 +08:00			`urlquote_plus = allow_lazy(urlquote_plus, unicode)`

			`def urlencode(query, doseq=0):`
			`"""`
			`A version of Python's urllib.urlencode() function that can operate on`
			`unicode strings. The parameters are first case to UTF-8 encoded strings and`
			`then encoded as per normal.`
			`"""`
			`if hasattr(query, 'items'):`
			`query = query.items()`
Fixed #4402 -- Modified test client to allow multi-valued inputs on GET requests. Thanks for the suggestion, eddymul@gmail.com. git-svn-id: http://code.djangoproject.com/svn/django/trunk@5741 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-07-21 13:17:20 +08:00			`return urllib.urlencode(`
			`[(smart_str(k),`
			`isinstance(v, (list,tuple)) and [smart_str(i) for i in v] or smart_str(v))`
			`for k, v in query],`
			`doseq)`
Merged Unicode branch into trunk (r4952:5608). This should be fully backwards compatible for all practical purposes. Fixed #2391, #2489, #2996, #3322, #3344, #3370, #3406, #3432, #3454, #3492, #3582, #3690, #3878, #3891, #3937, #4039, #4141, #4227, #4286, #4291, #4300, #4452, #4702 git-svn-id: http://code.djangoproject.com/svn/django/trunk@5609 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-07-04 20:11:04 +08:00
Fixed #5816 -- Fixed a regression from [6333] that generates incorrect cookie "expires" dates when using a locale other than English. Introduced `http_date` and `cookie_date` utility functions. Thanks for the report Michael Lemaire. Thanks for the patch Karen Tracey and `SmileyChris`. git-svn-id: http://code.djangoproject.com/svn/django/trunk@6634 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2007-10-31 11:59:40 +08:00			`def cookie_date(epoch_seconds=None):`
			`"""`
			`Formats the time to ensure compatibility with Netscape's cookie standard.`

			`Accepts a floating point number expressed in seconds since the epoch, in`
			`UTC - such as that outputted by time.time(). If set to None, defaults to`
			`the current time.`

			`Outputs a string in the format 'Wdy, DD-Mon-YYYY HH:MM:SS GMT'.`
			`"""`
			`rfcdate = formatdate(epoch_seconds)`
			`return '%s-%s-%s GMT' % (rfcdate[:7], rfcdate[8:11], rfcdate[12:25])`

			`def http_date(epoch_seconds=None):`
			`"""`
			`Formats the time to match the RFC1123 date format as specified by HTTP`
			`RFC2616 section 3.3.1.`

			`Accepts a floating point number expressed in seconds since the epoch, in`
			`UTC - such as that outputted by time.time(). If set to None, defaults to`
			`the current time.`

			`Outputs a string in the format 'Wdy, DD Mon YYYY HH:MM:SS GMT'.`
			`"""`
			`rfcdate = formatdate(epoch_seconds)`
			`return '%s GMT' % rfcdate[:25]`
Fixed #7723 - implemented a secure password reset form that uses a token and prompts user for new password. git-svn-id: http://code.djangoproject.com/svn/django/trunk@8162 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2008-08-01 04:47:53 +08:00
			`# Base 36 functions: useful for generating compact URLs`

			`def base36_to_int(s):`
			`"""`
Fix a security issue in the auth system. Disclosure and new release forthcoming. git-svn-id: http://code.djangoproject.com/svn/django/trunk@15032 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2010-12-23 11:45:08 +08:00			Converts a base 36 string to an ``int``. To prevent
			overconsumption of server resources, raises ``ValueError` if the
			`input is longer than 13 base36 digits (13 digits is sufficient to`
			`base36-encode any 64-bit integer).`
Fixed #7723 - implemented a secure password reset form that uses a token and prompts user for new password. git-svn-id: http://code.djangoproject.com/svn/django/trunk@8162 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2008-08-01 04:47:53 +08:00			`"""`
Fix a security issue in the auth system. Disclosure and new release forthcoming. git-svn-id: http://code.djangoproject.com/svn/django/trunk@15032 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2010-12-23 11:45:08 +08:00			`if len(s) > 13:`
			`raise ValueError("Base36 input too large")`
Fixed #7723 - implemented a secure password reset form that uses a token and prompts user for new password. git-svn-id: http://code.djangoproject.com/svn/django/trunk@8162 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2008-08-01 04:47:53 +08:00			`return int(s, 36)`

			`def int_to_base36(i):`
			`"""`
			`Converts an integer to a base36 string`
			`"""`
			`digits = "0123456789abcdefghijklmnopqrstuvwxyz"`
			`factor = 0`
			`# Find starting factor`
			`while True:`
			`factor += 1`
			`if i < 36 ** factor:`
			`factor -= 1`
			`break`
			`base36 = []`
			`# Construct base36 representation`
			`while factor >= 0:`
			`j = 36 ** factor`
			`base36.append(digits[i / j])`
			`i = i % j`
			`factor -= 1`
			`return ''.join(base36)`
Fixed #5791 -- Added early-bailout support for views (ETags and Last-modified). This provides support for views that can have their ETag and/or Last-modified values computed much more quickly than the view itself. Supports all HTTP verbs (not just GET). Documentation and tests need a little more fleshing out (I'm not happy with the documentation at the moment, since it's a bit backwards), but the functionality is correct. git-svn-id: http://code.djangoproject.com/svn/django/trunk@10114 bcc190cf-cafb-0310-a4f2-bffc1f526a37 2009-03-22 15:58:29 +08:00
			`def parse_etags(etag_str):`
			`"""`
			`Parses a string with one or several etags passed in If-None-Match and`
			`If-Match headers by the rules in RFC 2616. Returns a list of etags`
			`without surrounding double quotes (") and unescaped from \<CHAR>.`
			`"""`
			`etags = ETAG_MATCH.findall(etag_str)`
			`if not etags:`
			`# etag_str has wrong format, treat it as an opaque string then`
			`return [etag_str]`
			`etags = [e.decode('string_escape') for e in etags]`
			`return etags`

			`def quote_etag(etag):`
			`"""`
			`Wraps a string in double quotes escaping contents as necesary.`
			`"""`
			`return '"%s"' % etag.replace('\\', '\\\\').replace('"', '\\"')`