From 5ebd754cdbd131cfdb360ce4bfaa71b0b63d048c Mon Sep 17 00:00:00 2001 From: Bastian Kleineidam Date: Mon, 1 Oct 2012 16:11:45 +0200 Subject: [PATCH] Improved duplicate url check. --- linkcheck/url.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/linkcheck/url.py b/linkcheck/url.py index c3fad170..eaa620d7 100644 --- a/linkcheck/url.py +++ b/linkcheck/url.py @@ -588,6 +588,8 @@ def shorten_duplicate_content_url(url): url = url.split('#', 1)[0] if url.endswith('index.html'): return url[:-10] + if url.endswith('index.htm'): + return url[:-9] return url