mirror of
https://github.com/Hopiu/linkchecker.git
synced 2026-04-19 05:41:00 +00:00
unicode split
git-svn-id: https://linkchecker.svn.sourceforge.net/svnroot/linkchecker/trunk/linkchecker@2090 e7d03fd6-7b0d-0410-9947-9c21f3af8025
This commit is contained in:
parent
ef0d624c0d
commit
6d99454ebf
1 changed files with 7 additions and 2 deletions
|
|
@ -353,7 +353,7 @@ def match_url (url, domainlist):
|
|||
list"""
|
||||
if not url:
|
||||
return False
|
||||
return match_host(spliturl(url)[1], domainlist)
|
||||
return match_host(url_split(url)[1], domainlist)
|
||||
|
||||
|
||||
def match_host (host, domainlist):
|
||||
|
|
@ -384,7 +384,7 @@ def url_needs_quoting (url):
|
|||
return not _safe_url_chars_ro.match(url)
|
||||
|
||||
|
||||
def spliturl (url):
|
||||
def url_split (url):
|
||||
"""Split url in a tuple (scheme, hostname, port, document) where
|
||||
hostname is always lowercased.
|
||||
Precondition: url is syntactically correct URI (eg has no whitespace)
|
||||
|
|
@ -396,3 +396,8 @@ def spliturl (url):
|
|||
host = host.lower()
|
||||
host, port = urllib.splitnport(host, port)
|
||||
return scheme, host, port, document
|
||||
|
||||
|
||||
def url_unicode_split (url):
|
||||
"""Like urlparse.urlsplit(), but always returning unicode parts."""
|
||||
return [unicode(s) for s in urlparse.urlsplit(url)]
|
||||
|
|
|
|||
Loading…
Reference in a new issue