From cbc3bcb0d3f14e0c4e07c832b7606816c379d703 Mon Sep 17 00:00:00 2001 From: Bastian Kleineidam Date: Sun, 23 Sep 2012 23:20:21 +0200 Subject: [PATCH] Sitemap logger fixes. --- linkcheck/logger/sitemapxml.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/linkcheck/logger/sitemapxml.py b/linkcheck/logger/sitemapxml.py index 2cd1c06e..9533d23e 100644 --- a/linkcheck/logger/sitemapxml.py +++ b/linkcheck/logger/sitemapxml.py @@ -80,6 +80,8 @@ class SitemapXmlLogger (xmllog.XMLLogger): self.prefix = url_data.url # first URL (ie. the homepage) gets priority 1.0 per default priority = 1.0 + elif url_data.url == self.prefix: + return else: # all other pages get priority 0.5 per default priority = 0.5 @@ -89,7 +91,6 @@ class SitemapXmlLogger (xmllog.XMLLogger): if (url_data.valid and url_data.url.startswith(HTTP_SCHEMES) and url_data.url.startswith(self.prefix) - and url_data.url != self.prefix and url_data.content_type in HTML_TYPES and not url_data.cached): self.log_url(url_data, priority=priority)