mirror of https://github.com/python/cpython
merge #11584: make Header and make_header handle binary unknown-8bit input
This commit is contained in:
commit
e76ff4081a
|
@@ -275,7 +275,10 @@ class Header:
|
|||
charset = Charset(charset)
|
||||
if not isinstance(s, str):
|
||||
input_charset = charset.input_codec or 'us-ascii'
|
||||
s = s.decode(input_charset, errors)
|
||||
if input_charset == _charset.UNKNOWN8BIT:
|
||||
s = s.decode('us-ascii', 'surrogateescape')
|
||||
else:
|
||||
s = s.decode(input_charset, errors)
|
||||
# Ensure that the bytes we're storing can be decoded to the output
|
||||
# character set, otherwise an early error is thrown.
|
||||
output_charset = charset.output_codec or 'us-ascii'
|
||||
|
|
|
@@ -4330,6 +4330,21 @@ A very long line that must get split to something other than at the
|
|||
'Ynwp4dUEbay Auction Semiar- No Charge \uFFFD Earn Big')
|
||||
self.assertEqual(email.header.decode_header(h), [(x, 'unknown-8bit')])
|
||||
|
||||
def test_header_handles_binary_unknown8bit(self):
|
||||
x = b'Ynwp4dUEbay Auction Semiar- No Charge \x96 Earn Big'
|
||||
h = Header(x, charset=email.charset.UNKNOWN8BIT)
|
||||
self.assertEqual(str(h),
|
||||
'Ynwp4dUEbay Auction Semiar- No Charge \uFFFD Earn Big')
|
||||
self.assertEqual(email.header.decode_header(h), [(x, 'unknown-8bit')])
|
||||
|
||||
def test_make_header_handles_binary_unknown8bit(self):
|
||||
x = b'Ynwp4dUEbay Auction Semiar- No Charge \x96 Earn Big'
|
||||
h = Header(x, charset=email.charset.UNKNOWN8BIT)
|
||||
h2 = email.header.make_header(email.header.decode_header(h))
|
||||
self.assertEqual(str(h2),
|
||||
'Ynwp4dUEbay Auction Semiar- No Charge \uFFFD Earn Big')
|
||||
self.assertEqual(email.header.decode_header(h2), [(x, 'unknown-8bit')])
|
||||
|
||||
def test_modify_returned_list_does_not_change_header(self):
|
||||
h = Header('test')
|
||||
chunks = email.header.decode_header(h)
|
||||
|
|
|
@@ -194,7 +194,8 @@ Library
|
|||
-------
|
||||
|
||||
- Issue #11584: email.header.decode_header no longer fails if the header
|
||||
passed to it is a Header object.
|
||||
passed to it is a Header object, and Header/make_header no longer fail
|
||||
if given binary unknown-8bit input.
|
||||
|
||||
- Issue #11700: mailbox proxy object close methods can now be called multiple
|
||||
times without error.
|
||||
|
|
Loading…
Reference in New Issue