Change several "raise HTMLParseError" statements into assertions, as

these are really complaints about the integrity of our own code. HTMLParseError should be raised only for invalid input. (Should we turn more unrecognized constructs into exceptions, e.g. '&' not followed by an entity or character reference?) Also added an 'r' prefix to a regex string containing a backslash.

Change several "raise HTMLParseError" statements into assertions, as
these are really complaints about the integrity of our own code. HTMLParseError should be raised only for invalid input. (Should we turn more unrecognized constructs into exceptions, e.g. '&' not followed by an entity or character reference?) Also added an 'r' prefix to a regex string containing a backslash.
fb73bb90 · Guido van Rossum · 062277d2 · fb73bb90
Commit fb73bb90 authored Mar 21, 2001 by Guido van Rossum
Hide whitespace changes
Inline Side-by-side

Showing with 5 additions and 12 deletions

lib/python/TAL/HTMLParser.py lib/python/TAL/HTMLParser.py +5 -12

No files found.
--- a/lib/python/TAL/HTMLParser.py
+++ b/lib/python/TAL/HTMLParser.py
@@ -23,7 +23,7 @@ entityref = re.compile('&([a-zA-Z][-.a-zA-Z0-9]*)[^a-zA-Z0-9]')
 charref = re.compile('&#([0-9]+)[^0-9]')
 starttagopen = re.compile('<[a-zA-Z]')
-piopen = re.compile('<\?')
+piopen = re.compile(r'<\?')
 piclose = re.compile('>')
 endtagopen = re.compile('</[a-zA-Z]')
 special = re.compile('<![^<>]*>')
@@ -147,6 +147,7 @@ class HTMLParser:
            if i < j: self.handle_data(rawdata[i:j])
            i = self.updatepos(i, j)
            if i == n: break
+            assert rawdata[i] in "<&", "interesting.search() lied"
            if rawdata[i] == '<':
                if starttagopen.match(rawdata, i):
                    if self.literal:
@@ -213,8 +214,6 @@ class HTMLParser:
                        k = k-1
                    i = self.updatepos(i, k)
                    continue
-            else:
-                raise HTMLParserError('neither < nor & ??', self.getpos())
            # We get here only if incomplete matches but
            # nothing else
            match = incomplete.match(rawdata, i)
@@ -237,9 +236,7 @@ class HTMLParser:
    # Internal -- parse comment, return length or -1 if not terminated
    def parse_comment(self, i):
        rawdata = self.rawdata
-        if rawdata[i:i+4] != '<!--':
+        assert rawdata[i:i+4] == '<!--', 'unexpected call to parse_comment()'
-            raise HTMLParseError('unexpected call to parse_comment()',
-                                 self.getpos())
        match = commentclose.search(rawdata, i+4)
        if not match:
            return -1
@@ -283,9 +280,7 @@ class HTMLParser:
    # Internal -- parse processing instr, return length or -1 if not terminated
    def parse_pi(self, i):
        rawdata = self.rawdata
-        if rawdata[i:i+2] != '<?':
+        assert rawdata[i:i+2] == '<?', 'unexpected call to parse_pi()'
-            raise HTMLParseError('unexpected call to parse_pi()',
-                                 self.getpos())
        match = piclose.search(rawdata, i+2)
        if not match:
            return -1
@@ -311,9 +306,7 @@ class HTMLParser:
        # Now parse the data between i+1 and j into a tag and attrs
        attrs = []
        match = tagfind.match(rawdata, i+1)
-        if not match:
+        assert match, 'unexpected call to parse_starttag()'
-            raise HTMLParseError('unexpected call to parse_starttag()',
-                                 self.getpos())
        k = match.end(0)
        self.lasttag = tag = string.lower(rawdata[i+1:k])