mirror of
https://github.com/Hopiu/linkchecker.git
synced 2026-03-22 17:00:25 +00:00
Use Python 2.5 features and get rid of old compat code. Also some code cleanups have been made. git-svn-id: https://linkchecker.svn.sourceforge.net/svnroot/linkchecker/trunk/linkchecker@3737 e7d03fd6-7b0d-0410-9947-9c21f3af8025
118 lines
3.8 KiB
Python
118 lines
3.8 KiB
Python
# -*- coding: iso-8859-1 -*-
|
|
# Copyright (C) 2006-2008 Bastian Kleineidam
|
|
#
|
|
# This program is free software; you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation; either version 2 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with this program; if not, write to the Free Software
|
|
# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
"""
|
|
Management of checking a queue of links with several threads.
|
|
"""
|
|
import time
|
|
import os
|
|
import thread
|
|
from .. import log, LOG_CHECK
|
|
import linkcheck.cache.urlqueue
|
|
import linkcheck.cache.robots_txt
|
|
import linkcheck.cache.cookie
|
|
import linkcheck.cache.connection
|
|
import aggregator
|
|
import console
|
|
|
|
|
|
def check_urls (aggregate):
|
|
"""Main check function; checks all configured URLs until interrupted
|
|
with Ctrl-C.
|
|
@return: None
|
|
"""
|
|
try:
|
|
aggregate.logger.start_log_output()
|
|
if not aggregate.urlqueue.empty():
|
|
aggregate.start_threads()
|
|
check_url(aggregate)
|
|
aggregate.finish()
|
|
aggregate.logger.end_log_output()
|
|
except KeyboardInterrupt:
|
|
interrupt(aggregate)
|
|
except thread.error:
|
|
log.warn(LOG_CHECK,
|
|
_("Could not start a new thread. Check that the current user" \
|
|
" is allowed to start new threads."))
|
|
abort(aggregate)
|
|
except Exception:
|
|
console.internal_error()
|
|
abort(aggregate)
|
|
|
|
|
|
def check_url (aggregate):
|
|
"""Helper function waiting for URL queue."""
|
|
while True:
|
|
try:
|
|
aggregate.urlqueue.join(timeout=1)
|
|
break
|
|
except linkcheck.cache.urlqueue.Timeout:
|
|
# Since urlqueue.join() is not interruptable, add a timeout
|
|
# and a one-second slumber.
|
|
time.sleep(1)
|
|
aggregate.remove_stopped_threads()
|
|
if not aggregate.threads:
|
|
break
|
|
|
|
|
|
def interrupt (aggregate):
|
|
"""Interrupt execution and shutdown, ignoring any subsequent
|
|
interrupts."""
|
|
while True:
|
|
try:
|
|
log.warn(LOG_CHECK,
|
|
_("keyboard interrupt; waiting for active threads to finish"))
|
|
log.warn(LOG_CHECK,
|
|
_("another keyboard interrupt will exit immediately"))
|
|
print_active_threads(aggregate)
|
|
abort(aggregate)
|
|
break
|
|
except KeyboardInterrupt:
|
|
pass
|
|
|
|
|
|
def print_active_threads (aggregate):
|
|
if not aggregate.threads:
|
|
return
|
|
log.info(LOG_CHECK, _("These URLs are still active:"))
|
|
for t in aggregate.threads:
|
|
name = t.getName()
|
|
if name.startswith("Check-"):
|
|
log.info(LOG_CHECK, name[6:])
|
|
|
|
|
|
def abort (aggregate):
|
|
"""Helper function to ensure a clean shutdown."""
|
|
while True:
|
|
try:
|
|
aggregate.abort()
|
|
aggregate.finish()
|
|
aggregate.logger.end_log_output()
|
|
break
|
|
except KeyboardInterrupt:
|
|
log.warn(LOG_CHECK, _("keyboard interrupt; force shutdown"))
|
|
# forced exit without cleanup
|
|
os._exit(1)
|
|
|
|
|
|
def get_aggregate (config):
|
|
"""Get an aggregator instance with given configuration."""
|
|
urlqueue = linkcheck.cache.urlqueue.UrlQueue()
|
|
connections = linkcheck.cache.connection.ConnectionPool(wait=config["wait"])
|
|
cookies = linkcheck.cache.cookie.CookieJar()
|
|
robots_txt = linkcheck.cache.robots_txt.RobotsTxt()
|
|
return aggregator.Aggregate(config, urlqueue, connections,
|
|
cookies, robots_txt)
|