You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
100 lines
3.5 KiB
100 lines
3.5 KiB
from django.core import urlresolvers, paginator |
|
import urllib |
|
|
|
# Default endpoint that ping_google() requests to announce an updated sitemap.
PING_URL = "http://www.google.com/webmasters/tools/ping"
|
|
|
class SitemapNotFound(Exception):
    """Raised when no sitemap URL was supplied and none could be auto-detected."""
|
|
|
def ping_google(sitemap_url=None, ping_url=PING_URL):
    """
    Alerts Google that the sitemap for the current site has been updated.

    If sitemap_url is provided, it should be an absolute path to the sitemap
    for this site -- e.g., '/sitemap.xml'. If sitemap_url is not provided, this
    function will attempt to deduce it by using urlresolvers.reverse().

    The ping is a request to ``ping_url`` with the full sitemap URL
    ("http://<current site domain><sitemap_url>") passed as the ``sitemap``
    query parameter. The response body is not read. Returns None.

    Raises SitemapNotFound if sitemap_url is not given and neither the
    "index" nor the "global" sitemap view can be reversed.
    """
    # urlencode/urlopen live in different modules on Python 2 and Python 3;
    # resolve them here so the function works on either.
    try:
        from urllib.parse import urlencode
        from urllib.request import urlopen
    except ImportError:  # Python 2
        from urllib import urlencode, urlopen

    if sitemap_url is None:
        # First try the "index" sitemap URL, then the "global" sitemap URL.
        candidate_views = (
            'django.contrib.sitemaps.views.index',
            'django.contrib.sitemaps.views.sitemap',
        )
        for view_name in candidate_views:
            try:
                sitemap_url = urlresolvers.reverse(view_name)
            except urlresolvers.NoReverseMatch:
                continue
            break

    if sitemap_url is None:
        raise SitemapNotFound("You didn't provide a sitemap_url, and the sitemap URL couldn't be auto-detected.")

    # Imported lazily, as in the rest of this module, so that importing the
    # module does not itself require the sites app.
    from django.contrib.sites.models import Site
    current_site = Site.objects.get_current()
    url = "http://%s%s" % (current_site.domain, sitemap_url)
    params = urlencode({'sitemap': url})
    response = urlopen("%s?%s" % (ping_url, params))
    # Only the request itself matters; close the response so the underlying
    # connection is released instead of waiting for garbage collection.
    response.close()
|
|
|
class Sitemap(object):
    """
    Base class describing a set of URLs to publish in a sitemap.

    Subclasses override items() to supply the objects to list. For each
    object, get_urls() looks up ``location``, ``lastmod``, ``changefreq`` and
    ``priority`` on the sitemap; each may be a plain attribute or a callable
    taking the object. Missing ones (other than ``location``, which this
    class defines) resolve to None.
    """

    # This limit is defined by Google. See the index documentation at
    # http://sitemaps.org/protocol.php#index.
    limit = 50000

    def __get(self, name, obj, default=None):
        """
        Resolve the sitemap attribute ``name`` for ``obj``.

        Returns ``default`` if the attribute does not exist, the result of
        calling it with ``obj`` if it is callable, and the attribute itself
        otherwise.
        """
        try:
            attr = getattr(self, name)
        except AttributeError:
            return default
        if callable(attr):
            return attr(obj)
        return attr

    def items(self):
        """Return the objects to list in the sitemap (none by default)."""
        return []

    def location(self, obj):
        """Return the path for ``obj``, taken from obj.get_absolute_url()."""
        return obj.get_absolute_url()

    def _get_paginator(self):
        """Build the paginator over items() on first use and cache it."""
        if not hasattr(self, "_paginator"):
            self._paginator = paginator.Paginator(self.items(), self.limit)
        return self._paginator
    paginator = property(_get_paginator)

    def get_urls(self, page=1, site=None, protocol=None):
        """
        Return a list of dicts describing the URLs on the given page.

        ``site`` is any object with a ``domain`` attribute; when omitted, the
        current Site is looked up. ``protocol`` is the URL scheme and
        defaults to 'http'. Each dict has the keys 'location', 'lastmod',
        'changefreq' and 'priority'.
        """
        if site is None:
            # Only touch the sites app when the caller did not supply a site.
            from django.contrib.sites.models import Site
            site = Site.objects.get_current()
        if protocol is None:
            protocol = 'http'

        urls = []
        for item in self.paginator.page(page).object_list:
            loc = "%s://%s%s" % (protocol, site.domain, self.__get('location', item))
            url_info = {
                'location': loc,
                'lastmod': self.__get('lastmod', item, None),
                'changefreq': self.__get('changefreq', item, None),
                'priority': self.__get('priority', item, None),
            }
            urls.append(url_info)
        return urls
|
|
|
class FlatPageSitemap(Sitemap):
    """Sitemap listing the flatpages attached to the current site."""

    def items(self):
        """Return ``flatpage_set.all()`` for the current Site."""
        from django.contrib.sites.models import Site
        return Site.objects.get_current().flatpage_set.all()
|
|
|
class GenericSitemap(Sitemap):
    """
    Sitemap driven by an ``info_dict`` rather than a hand-written subclass.

    ``info_dict['queryset']`` supplies the objects; the optional
    ``info_dict['date_field']`` names the attribute used as each object's
    last-modification value.
    """

    priority = None
    changefreq = None

    def __init__(self, info_dict, priority=None, changefreq=None):
        """Store the queryset, optional date field, priority and changefreq."""
        self.queryset = info_dict['queryset']
        self.date_field = info_dict.get('date_field')
        self.priority, self.changefreq = priority, changefreq

    def items(self):
        """Return the objects to list, as a clone of the stored queryset."""
        # Hand back a clone rather than the stored queryset itself, so the
        # original is not evaluated prematurely.
        return self.queryset.filter()

    def lastmod(self, item):
        """Return item's ``date_field`` value, or None if no field was set."""
        if self.date_field is None:
            return None
        return getattr(item, self.date_field)
|
|
|