granicus.if.org Git - python/commitdiff
Process <img> and <frame> tags. Don't bother skipping second href.
author Guido van Rossum <guido@python.org>
Sat, 1 Feb 1997 05:16:08 +0000 (05:16 +0000)
committer Guido van Rossum <guido@python.org>
Sat, 1 Feb 1997 05:16:08 +0000 (05:16 +0000)
Tools/webchecker/webchecker.py

index 9e676caf0150e2cb20cf7d45b03275eea3b5963e..69e462a94c67a00f724645c4f33c3f8b299a5813 100755 (executable)
@@ -564,11 +564,21 @@ class MyHTMLParser(sgmllib.SGMLParser):
        sgmllib.SGMLParser.__init__ (self)
 
     def start_a(self, attributes):
+       self.link_attr(attributes, 'href')
+
+    def end_a(self): pass
+
+    def do_img(self, attributes):
+       self.link_attr(attributes, 'src', 'lowsrc')
+
+    def do_frame(self, attributes):
+       self.link_attr(attributes, 'src')
+
+    def link_attr(self, attributes, *args):
        for name, value in attributes:
-           if name == 'href':
+           if name in args:
                if value: value = string.strip(value)
                if value: self.links[value] = None
-               return  # match only first href
 
     def do_base(self, attributes):
        for name, value in attributes:
@@ -578,7 +588,6 @@ class MyHTMLParser(sgmllib.SGMLParser):
                    if verbose > 1:
                        print "  Base", value
                    self.base = value
-               return  # match only first href
 
     def getlinks(self):
        return self.links.keys()