Arthur de Jong

Open Source / Free Software developer

summary | refs | log | tree | commit | diff | stats
path: root/crawler.py
diff options
context:
space:
mode:
author: Arthur de Jong <arthur@arthurdejong.org>, 2006-05-07 11:12:25 +0200
committer: Arthur de Jong <arthur@arthurdejong.org>, 2006-05-07 11:12:25 +0200
commit: 2e0f32353f5e3dffcc8f29239c272f04907e06e0 (patch)
tree: 59a53842bf8a8dbed15b4d8b52945ad4120f5620 /crawler.py
parent: 76170833713c2fc72cefbefa28b8c7ef6a47ef80 (diff)
some more small code improvements thanks to pychecker
git-svn-id: http://arthurdejong.org/svn/webcheck/webcheck@252 86f53f14-5ff3-0310-afe5-9b438ce3f40c
Diffstat (limited to 'crawler.py')
-rw-r--r-- crawler.py 4
1 file changed, 3 insertions, 1 deletion
diff --git a/crawler.py b/crawler.py
index b5b68f5..902c347 100644
--- a/crawler.py
+++ b/crawler.py
@@ -383,6 +383,7 @@ class Link:
self.linkproblems = []
self.pageproblems = []
self.redirectdepth = 0
+ self.redirectlist = None
def _checkurl(self, url):
"""Check to see if the url is formatted properly, correct formatting
@@ -462,7 +463,8 @@ class Link:
def redirect(self, url):
"""Indicate that this link redirects to the specified url. Maximum
redirect counting is done as well as loop detection."""
- # figure out depth
+ # figure out depth and urls that have been visited in this
+ # redirect list
redirectdepth = 0
redirectlist = []
for parent in self.parents: