Merged revisions 70906 via svnmerge from

svn+ssh://pythondev@svn.python.org/python/trunk

........
  r70906 | georg.brandl | 2009-04-01 00:11:53 +0200 (Mi, 01 Apr 2009) | 1 line

  #1651995: fix _convert_ref for non-ASCII characters.
........
This commit is contained in:
Matthias Klose 2009-04-04 12:51:52 +00:00
parent c9da90a74e
commit ee13a2ecf4
2 changed files with 10 additions and 1 deletion

View File

@@ -396,7 +396,7 @@ class SGMLParser(markupbase.ParserBase):
n = int(name)
except ValueError:
return
-if not 0 <= n <= 255:
+if not 0 <= n <= 127:
return
return self.convert_codepoint(n)

View File

@@ -373,6 +373,15 @@ DOCTYPE html PUBLIC '-//W3C//DTD HTML 4.01//EN'
if len(data) != CHUNK:
break
def test_only_decode_ascii(self):
    """Check that only ASCII numeric character references get decoded.

    Regression test for SF bug #1651995.  The start tag carries three
    attribute values written as numeric character references: ``&#33``
    is expected to come back as ``'!'``, while ``&#169`` and
    ``&#8216;`` are expected to be reported verbatim.
    """
    markup = '<signs exclamation="&#33" copyright="&#169" quoteleft="&#8216;">'
    expected_attrs = [
        ('exclamation', '!'),      # code point 33: decoded
        ('copyright', '&#169'),    # code point 169: left as written
        ('quoteleft', '&#8216;'),  # code point 8216: left as written
    ]
    # check_events is defined elsewhere in the test class; presumably it
    # compares the events produced for the markup against the given list.
    self.check_events(markup, [('starttag', 'signs', expected_attrs)])
# XXX These tests have been disabled by prefixing their names with
# an underscore. The first two exercise outstanding bugs in the
# sgmllib module, and the third exhibits questionable behavior