#1651995: fix _convert_ref for non-ASCII characters.
This commit is contained in:
parent
95fafec732
commit
0c7b2c9c19
|
@ -396,7 +396,7 @@ class SGMLParser(markupbase.ParserBase):
|
|||
n = int(name)
|
||||
except ValueError:
|
||||
return
|
||||
- if not 0 <= n <= 255:
|
||||
+ if not 0 <= n <= 127:
|
||||
return
|
||||
return self.convert_codepoint(n)
|
||||
|
||||
|
|
|
@ -373,6 +373,15 @@ DOCTYPE html PUBLIC '-//W3C//DTD HTML 4.01//EN'
|
|||
if len(data) != CHUNK:
|
||||
break
|
||||
|
||||
def test_only_decode_ascii(self):
|
||||
# SF bug #1651995, make sure non-ascii character references are not decoded
|
||||
s = '<signs exclamation="&#33;" copyright="&#169;" quoteleft="&#8216;">'
|
||||
self.check_events(s, [
|
||||
('starttag', 'signs',
|
||||
[('exclamation', '!'), ('copyright', '&#169;'),
|
||||
('quoteleft', '&#8216;')]),
|
||||
])
|
||||
|
||||
# XXX These tests have been disabled by prefixing their names with
|
||||
# an underscore. The first two exercise outstanding bugs in the
|
||||
# sgmllib module, and the third exhibits questionable behavior
|
||||
|
|
Loading…
Reference in New Issue