1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
|
# config.py - configuration state for webcheck
#
# Copyright (C) 1998, 1999 Albert Hopkins (marduk)
# Copyright (C) 2002 Mike Meyer
# Copyright (C) 2005, 2006, 2007, 2008, 2010, 2011 Arthur de Jong
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
#
# The files produced as output from the software do not automatically fall
# under the copyright of the software, unless explicitly stated otherwise.
"""Configuration state for webcheck.
This file contains the default configuration for webcheck. All configurable
items should be changeable from the command line."""
# Whether to treat any URL that does not start with the base URL as
# external. Holds the state of the -b command line option.
BASE_URLS_ONLY = False

# Whether to skip checking external links altogether. Holds the state of
# the -a command line option.
AVOID_EXTERNAL_LINKS = False

# I/O timeout handed to socket.setdefaulttimeout(): a float number of
# seconds, or None to disable the timeout.
IOTIMEOUT = 10.0

# Output directory. Holds the state of the -o command line option.
OUTPUT_DIR = '.'

# Whether to try reading a state file to continue from.
CONTINUE = False

# Number of seconds to wait between requests. Holds the state of the -w
# command line option.
WAIT_BETWEEN_REQUESTS = 0

# Maximum number of links to follow from the specified base URLs.
MAX_DEPTH = None

# Redirect depth: how many redirects are followed. Holds the state of the
# -r command line option.
REDIRECT_DEPTH = 5
# Plugins used to generate the report, given as dotted module names.
PLUGINS = [
    'webcheck.plugins.anchors',
    'webcheck.plugins.sitemap',
    'webcheck.plugins.urllist',
    'webcheck.plugins.images',
    'webcheck.plugins.external',
    'webcheck.plugins.notchkd',
    'webcheck.plugins.badlinks',
    'webcheck.plugins.old',
    'webcheck.plugins.new',
    'webcheck.plugins.size',
    'webcheck.plugins.notitles',
    'webcheck.plugins.problems',
    'webcheck.plugins.about',
    'webcheck.plugins.csvfile',
]
# Whether files may be overwritten without asking first. Holds the state of
# the -f command line option.
OVERWRITE_FILES = False

# Whether to add extra headers to outgoing requests that ask for caching to
# be disabled, so that a fresh page is returned.
BYPASSHTTPCACHE = False

# Number of levels the sitemap plugin should show.
REPORT_SITEMAP_LEVEL = 8

# Age in days after which a page is considered too old.
REPORT_WHATSOLD_URL_AGE = 700

# Age in days within which a page is considered new.
REPORT_WHATSNEW_URL_AGE = 7

# Size in kilobytes after which a page is considered too big.
REPORT_SLOW_URL_SIZE = 76

# Maximum number of links to show in the "referenced from:" lists.
PARENT_LISTLEN = 10

# Whether to open links in a new window (adds target="_blank").
# Disabled by default because it is not xhtml 1.1.
REPORT_LINKS_IN_NEW_WINDOW = False

# Whether to fetch robots.txt files and do checking based on the
# information present in those files (normally matching links are yanked).
USE_ROBOTS = True
# Options for tidy; set this to None to disable running tidy.
# The available options are described at
# http://tidy.sourceforge.net/docs/quickref.html
TIDY_OPTIONS = {
    'quiet': 1,
    'accessibility_check': 1,
    'show_errors': 6,
    'show_warnings': 1,
    'char_encoding': 'utf8',
}
|