2010-10-11 22:34:42 +08:00
from django . contrib . sites . models import Site , get_current_site
2008-07-26 13:07:16 +08:00
from django . core import urlresolvers , paginator
2010-10-11 22:34:42 +08:00
from django . core . exceptions import ImproperlyConfigured
2006-09-01 07:13:59 +08:00
import urllib
2007-05-21 04:47:18 +08:00
# Endpoint that ping_google() requests (with a ``sitemap`` query parameter)
# to announce an updated sitemap. No surrounding whitespace: the value is
# interpolated directly into the request URL.
PING_URL = "http://www.google.com/webmasters/tools/ping"
2006-09-01 07:13:59 +08:00
class SitemapNotFound(Exception):
    """Raised by ping_google() when no sitemap URL was given or could be reversed."""
def ping_google(sitemap_url=None, ping_url=PING_URL):
    """
    Alerts Google that the sitemap for the current site has been updated.

    If sitemap_url is provided, it should be an absolute path to the sitemap
    for this site -- e.g., '/sitemap.xml'. If sitemap_url is not provided, this
    function will attempt to deduce it by using urlresolvers.reverse().

    ping_url is the endpoint to request; the full sitemap URL is passed to it
    as the ``sitemap`` query parameter.

    Raises SitemapNotFound if sitemap_url is not given and neither the
    "index" nor the "global" sitemap view can be reversed.
    """
    if sitemap_url is None:
        # First try the "index" sitemap URL, then the "global" sitemap URL.
        candidate_views = (
            'django.contrib.sitemaps.views.index',
            'django.contrib.sitemaps.views.sitemap',
        )
        for view_name in candidate_views:
            try:
                sitemap_url = urlresolvers.reverse(view_name)
            except urlresolvers.NoReverseMatch:
                continue
            break

    if sitemap_url is None:
        raise SitemapNotFound("You didn't provide a sitemap_url, and the sitemap URL couldn't be auto-detected.")

    current_site = Site.objects.get_current()
    url = "http://%s%s" % (current_site.domain, sitemap_url)
    params = urllib.urlencode({'sitemap': url})
    # The response body is not used; close it so the connection is not leaked.
    response = urllib.urlopen("%s?%s" % (ping_url, params))
    response.close()
2008-09-17 12:56:04 +08:00
class Sitemap(object):
    """
    Base class for one section of a sitemap.

    Subclasses override items() and may define ``location``, ``lastmod``,
    ``changefreq`` and ``priority`` either as plain attributes or as methods
    taking a single item. get_urls() turns one page of items into the list of
    dicts describing each URL.
    """

    # This limit is defined by Google. See the index documentation at
    # http://sitemaps.org/protocol.php#index.
    # It is used as the page size of the paginator built over items().
    limit = 50000

    def __get(self, name, obj, default=None):
        """
        Looks up attribute ``name`` on this sitemap for the item ``obj``.

        Returns ``default`` if the attribute does not exist, the result of
        calling it with ``obj`` if it is callable, and the attribute itself
        otherwise.
        """
        try:
            attr = getattr(self, name)
        except AttributeError:
            return default
        if callable(attr):
            return attr(obj)
        return attr

    def items(self):
        """Returns the objects to list in this sitemap; empty by default."""
        return []

    def location(self, obj):
        """Returns the path for ``obj``; by default its get_absolute_url()."""
        return obj.get_absolute_url()

    def _get_paginator(self):
        """Builds the paginator over items() on first use and caches it on the instance."""
        if not hasattr(self, "_paginator"):
            self._paginator = paginator.Paginator(self.items(), self.limit)
        return self._paginator
    paginator = property(_get_paginator)

    def get_urls(self, page=1, site=None):
        """
        Returns a list of dicts, one per item on the given page, with the
        keys ``item``, ``location``, ``lastmod``, ``changefreq`` and
        ``priority``.

        ``site`` must expose a ``domain`` attribute. If it is None, the
        current Site is used when the sites framework is installed.

        Raises ImproperlyConfigured if no site was passed in and none could
        be determined.
        """
        if site is None:
            if Site._meta.installed:
                try:
                    site = Site.objects.get_current()
                except Site.DoesNotExist:
                    pass
            if site is None:
                raise ImproperlyConfigured("In order to use Sitemaps you must either use the sites framework or pass in a Site or RequestSite object in your view code.")

        urls = []
        for item in self.paginator.page(page).object_list:
            loc = "http://%s%s" % (site.domain, self.__get('location', item))
            priority = self.__get('priority', item, None)
            # Only a missing priority becomes the empty string; a priority
            # of 0 or 0.0 is a real value and must be kept.
            if priority is None:
                priority = ''
            urls.append({
                'item': item,
                'location': loc,
                'lastmod': self.__get('lastmod', item, None),
                'changefreq': self.__get('changefreq', item, None),
                'priority': str(priority),
            })
        return urls
2006-09-01 07:31:25 +08:00
class FlatPageSitemap(Sitemap):
    """Sitemap listing the current site's flat pages that do not require registration."""

    def items(self):
        # Restrict to pages attached to the current Site and drop those
        # flagged registration_required.
        return Site.objects.get_current().flatpage_set.filter(registration_required=False)
2006-09-01 07:13:59 +08:00
class GenericSitemap(Sitemap):
    """
    Sitemap built from an ``info_dict`` rather than from a subclass.

    ``info_dict`` must contain a ``queryset`` entry and may contain a
    ``date_field`` entry naming the item attribute returned by lastmod().
    ``priority`` and ``changefreq`` are stored on the instance as given.
    """
    priority = None
    changefreq = None

    def __init__(self, info_dict, priority=None, changefreq=None):
        self.queryset = info_dict['queryset']
        self.date_field = info_dict.get('date_field', None)
        self.priority = priority
        self.changefreq = changefreq

    def items(self):
        # Make sure to return a clone; we don't want premature evaluation.
        return self.queryset.filter()

    def lastmod(self, item):
        """Returns the item's ``date_field`` value, or None if no date_field was configured."""
        if self.date_field is None:
            return None
        return getattr(item, self.date_field)