mirror of
https://github.com/Hopiu/linkchecker.git
synced 2026-04-20 22:31:00 +00:00
added
git-svn-id: https://linkchecker.svn.sourceforge.net/svnroot/linkchecker/trunk/linkchecker@2585 e7d03fd6-7b0d-0410-9947-9c21f3af8025
This commit is contained in:
parent
1a7a771648
commit
208a7f095f
1 changed files with 48 additions and 0 deletions
48
linkcheck/checker/internpaturl.py
Normal file
48
linkcheck/checker/internpaturl.py
Normal file
|
|
@ -0,0 +1,48 @@
|
|||
# -*- coding: iso-8859-1 -*-
|
||||
# Copyright (C) 2005 Bastian Kleineidam
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
# the Free Software Foundation; either version 2 of the License, or
|
||||
# (at your option) any later version.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful,
|
||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
# GNU General Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program; if not, write to the Free Software
|
||||
# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
||||
"""
|
||||
Intern URL pattern support.
|
||||
"""
|
||||
import re
|
||||
import urlbase
|
||||
import linkcheck.checker
|
||||
|
||||
class InternPatternUrl (urlbase.UrlBase):
    """
    URL base class that can build an intern URL pattern from its own
    URL data.
    """

    def get_intern_pattern (self):
        """
        Build the regular expression used for intern URL matching.

        The URL is computed by linkcheck.checker.absolute_url() from
        base_url, base_ref and parent_url. Its scheme, its domain (as
        returned by linkcheck.url.idna_encode()) and its path are
        regex-escaped and joined into "scheme://domainpath".

        @return non-empty regex pattern or None
        @rtype String or None
        """
        url = linkcheck.checker.absolute_url(
            self.base_url, self.base_ref, self.parent_url)
        if not url:
            # no URL to build a pattern from
            return None
        parts = linkcheck.strformat.url_unicode_split(url)
        scheme = parts[0]
        # only the encoded domain is needed; the second value is unused here
        domain, _is_idn = linkcheck.url.idna_encode(parts[1])
        if not domain or not scheme:
            # both scheme and domain are required for a pattern
            return None
        path = parts[2]
        # escape each part so it is matched literally inside the regex
        escaped = [re.escape(piece) for piece in (scheme, domain, path)]
        return "%s://%s%s" % tuple(escaped)
|
||||
Loading…
Reference in a new issue