linkchecker/tests/checker/test_http_misc.py
Marius Gedminas 0d58a39376 Fix failing test
http://www.heise.de/ now does a redirect to HTTPS instead of denying our
crawl via robots.txt.

Fixes #269.
2019-09-04 14:04:07 +03:00

68 lines
2.3 KiB
Python

# -*- coding: iso-8859-1 -*-
# Copyright (C) 2004-2014 Bastian Kleineidam
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License along
# with this program; if not, write to the Free Software Foundation, Inc.,
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
"""
Test http checking.
"""
import os
import sys
from .httpserver import HttpServerTest
from tests import need_network
from linkcheck.network import iputil
class TestHttpMisc (HttpServerTest):
"""Test http:// misc link checking."""
@need_network
def test_html (self):
self.swf_test()
self.obfuscate_test()
def swf_test (self):
url = self.get_url(u"test.swf")
resultlines = [
u"url %s" % url,
u"cache key %s" % url,
u"real url %s" % url,
u"valid",
u"url http://www.example.org/",
u"cache key http://www.example.org/",
u"real url http://www.example.org/",
u"valid",
]
self.direct(url, resultlines, recursionlevel=1)
def obfuscate_test (self):
if os.name != "posix" or sys.platform != 'linux2':
return
host = "www.heise.de"
for tentative_ip in iputil.resolve_host(host):
if iputil.is_valid_ipv4(tentative_ip):
ip = tentative_ip
break
else:
raise NotImplementedError("no IPv4 address detected for test host")
url = u"http://%s/" % iputil.obfuscate_ip(ip)
rurl = u"http://%s/" % ip
resultlines = [
u"url %s" % url,
u"cache key %s" % rurl,
u"real url https://%s/" % host,
u"info Redirected to `https://%s/'." % host,
u"warning URL %s has obfuscated IP address %s" % (url, ip),
u"valid",
]
self.direct(url, resultlines, recursionlevel=0)