cpython/Lib/email/test/test_email_codecs.py

# Copyright (C) 2002-2006 Python Software Foundation
# Contact: email-sig@python.org
# email package unit tests for (optional) Asian codecs

import codecs
import unittest
from test.test_support import TestSkipped, run_unittest

from email.test.test_email import TestEmailBase
from email.Charset import Charset
from email.Header import Header, decode_header
from email.Message import Message

# We're compatible with Python 2.3, but it doesn't have the built-in Asian
# codecs, so we have to skip all these tests when the codec is missing.
#
# The probe asks the codec registry directly instead of decoding a sample
# string: str('foo', 'euc-jp') raises TypeError (not LookupError) once str is
# the unicode type, which would crash the import instead of skipping.
try:
    codecs.lookup('euc-jp')
except LookupError:
    raise TestSkipped('euc-jp codec is not available')


class TestEmailAsianCodecs(TestEmailBase):
    """Exercise Header and Message with the (optional) Japanese codecs.

    The input fixtures below are EUC-JP byte sequences; the encoded headers
    the assertions expect are emitted with the iso-2022-jp charset.
    """

    # NOTE: the test methods are described with comments rather than
    # docstrings so that unittest's verbose output keeps showing their names.

    def test_japanese_codecs(self):
        # Build one header out of three chunks (default charset, euc-jp and
        # iso-8859-1), then check its encoded form and what decode_header()
        # makes of that encoded form.
        eq = self.ndiffAssertEqual
        j = Charset("euc-jp")
        g = Charset("iso-8859-1")
        h = Header("Hello World!")
        jhello = '\xa5\xcf\xa5\xed\xa1\xbc\xa5\xef\xa1\xbc\xa5\xeb\xa5\xc9\xa1\xaa'
        ghello = 'Gr\xfc\xdf Gott!'
        h.append(jhello, j)
        h.append(ghello, g)
        # BAW: This used to -- and maybe should -- fold the two iso-8859-1
        # chunks into a single encoded word.  However it doesn't violate the
        # standard to have them as two encoded chunks and maybe it's
        # reasonable <wink> for each .append() call to result in a separate
        # encoded word.
        eq(h.encode(), """\
Hello World! =?iso-2022-jp?b?GyRCJU8lbSE8JW8hPCVrJUkhKhsoQg==?=
 =?iso-8859-1?q?Gr=FC=DF?= =?iso-8859-1?q?_Gott!?=""")
        eq(decode_header(h.encode()),
           [('Hello World!', None),
            ('\x1b$B%O%m!<%o!<%k%I!*\x1b(B', 'iso-2022-jp'),
            ('Gr\xfc\xdf Gott!', 'iso-8859-1')])
        # A subject long enough that the encoded header must be split over
        # two lines.  (Named `subject` so the builtin `int` is not shadowed.)
        subject = 'test-ja \xa4\xd8\xc5\xea\xb9\xc6\xa4\xb5\xa4\xec\xa4\xbf\xa5\xe1\xa1\xbc\xa5\xeb\xa4\xcf\xbb\xca\xb2\xf1\xbc\xd4\xa4\xce\xbe\xb5\xc7\xa7\xa4\xf2\xc2\xd4\xa4\xc3\xa4\xc6\xa4\xa4\xa4\xde\xa4\xb9'
        h = Header(subject, j, header_name="Subject")
        # test a very long header
        enc = h.encode()
        # TK: splitting point may differ by codec design and/or Header encoding
        eq(enc, """\
=?iso-2022-jp?b?dGVzdC1qYSAbJEIkWEVqOUYkNSRsJD8lYSE8JWskTztKGyhC?=
 =?iso-2022-jp?b?GyRCMnE8VCROPjVHJyRyQlQkQyRGJCQkXiQ5GyhC?=""")
        # TK: full decode comparison
        eq(h.__unicode__().encode('euc-jp'), subject)

    def test_payload_encoding(self):
        # Set an euc-jp payload, decode what get_payload() returns using the
        # charset the message reports, and check that re-encoding it as
        # euc-jp gives back the original bytes.
        jhello = '\xa5\xcf\xa5\xed\xa1\xbc\xa5\xef\xa1\xbc\xa5\xeb\xa5\xc9\xa1\xaa'
        jcode = 'euc-jp'
        msg = Message()
        msg.set_payload(jhello, jcode)
        ustr = str(msg.get_payload(), msg.get_content_charset())
        self.assertEqual(jhello, ustr.encode(jcode))


def suite():
    """Return a TestSuite wrapping all tests of TestEmailAsianCodecs.

    The result is a fresh outer ``unittest.TestSuite`` containing the suite
    of ``test*`` methods collected from the test case class.
    """
    # loadTestsFromTestCase() is the supported replacement for the
    # deprecated unittest.makeSuite() helper and collects the same tests.
    tests = unittest.TestSuite()
    tests.addTest(
        unittest.defaultTestLoader.loadTestsFromTestCase(TestEmailAsianCodecs))
    return tests


def test_main():
    """Run TestEmailAsianCodecs through test_support's run_unittest()."""
    run_unittest(TestEmailAsianCodecs)


# When executed directly as a script, run the tests built by suite().
if __name__ == '__main__':
    unittest.main(defaultTest='suite')
-												Port relevant patches for SF 1409455 to the trunk for email 3.0/Python 2.5.
Will port to Python 2.4.

											
										
										
											2006-02-08 10:34:21 -04:00
+								# Copyright (C) 2002-2006 Python Software Foundation
 								# Contact: email-sig@python.org
-												The email package's tests live much better in a subpackage
(i.e. email.test), so move the guts of them here from Lib/test.  The
latter directory will retain stubs to run the email.test tests using
Python's standard regression test.

test_email_torture.py is a torture tester which will not run under
Python's test suite because I don't want to commit megs of data to
that project (it will fail cleanly there).  When run under the mimelib
project it'll stress test the package with megs of message samples
collected from various locations in the wild.

											
										
										
											2002-07-19 19:31:10 -03:00
+								# email package unit tests for (optional) Asian codecs
 								import unittest
-												Get rid of relative imports in all unittests.  Now anything that
imports e.g. test_support must do so using an absolute package name
such as "import test.test_support" or "from test import test_support".

This also updates the README in Lib/test, and gets rid of the
duplicate data directory in Lib/test/data (replaced by
Lib/email/test/data).

Now Tim and Jack can have at it. :)

											
										
										
											2002-07-23 16:04:11 -03:00
+								from test.test_support import TestSkipped, run_unittest
-												The email package's tests live much better in a subpackage
(i.e. email.test), so move the guts of them here from Lib/test.  The
latter directory will retain stubs to run the email.test tests using
Python's standard regression test.

test_email_torture.py is a torture tester which will not run under
Python's test suite because I don't want to commit megs of data to
that project (it will fail cleanly there).  When run under the mimelib
project it'll stress test the package with megs of message samples
collected from various locations in the wild.

											
										
										
											2002-07-19 19:31:10 -03:00
 								from email.test.test_email import TestEmailBase
 								from email.Charset import Charset
 								from email.Header import Header, decode_header
-												Port relevant patches for SF 1409455 to the trunk for email 3.0/Python 2.5.
Will port to Python 2.4.

											
										
										
											2006-02-08 10:34:21 -04:00
+								from email.Message import Message
-												Merge p3yk branch with the trunk up to revision 45595. This breaks a fair
number of tests, all because of the codecs/_multibytecodecs issue described
here (it's not a Py3K issue, just something Py3K discovers):
http://mail.python.org/pipermail/python-dev/2006-April/064051.html

Hye-Shik Chang promised to look for a fix, so no need to fix it here. The
tests that are expected to break are:

test_codecencodings_cn
test_codecencodings_hk
test_codecencodings_jp
test_codecencodings_kr
test_codecencodings_tw
test_codecs
test_multibytecodec

This merge fixes an actual test failure (test_weakref) in this branch,
though, so I believe merging is the right thing to do anyway.

											
										
										
											2006-04-21 07:40:58 -03:00
+								# We're compatible with Python 2.3, but it doesn't have the built-in Asian
 								# codecs, so we have to skip all these tests.
 								try:
-												Rip out all the u"..." literals and calls to unicode().

											
										
										
											2007-05-02 16:09:54 -03:00
+								    str('foo', 'euc-jp')
-												Merge p3yk branch with the trunk up to revision 45595. This breaks a fair
number of tests, all because of the codecs/_multibytecodecs issue described
here (it's not a Py3K issue, just something Py3K discovers):
http://mail.python.org/pipermail/python-dev/2006-April/064051.html

Hye-Shik Chang promised to look for a fix, so no need to fix it here. The
tests that are expected to break are:

test_codecencodings_cn
test_codecencodings_hk
test_codecencodings_jp
test_codecencodings_kr
test_codecencodings_tw
test_codecs
test_multibytecodec

This merge fixes an actual test failure (test_weakref) in this branch,
though, so I believe merging is the right thing to do anyway.

											
										
										
											2006-04-21 07:40:58 -03:00
+								except LookupError:
 								    raise TestSkipped
-												The email package's tests live much better in a subpackage
(i.e. email.test), so move the guts of them here from Lib/test.  The
latter directory will retain stubs to run the email.test tests using
Python's standard regression test.

test_email_torture.py is a torture tester which will not run under
Python's test suite because I don't want to commit megs of data to
that project (it will fail cleanly there).  When run under the mimelib
project it'll stress test the package with megs of message samples
collected from various locations in the wild.

											
										
										
											2002-07-19 19:31:10 -03:00
 								class TestEmailAsianCodecs(TestEmailBase):
 								    def test_japanese_codecs(self):
 								        eq = self.ndiffAssertEqual
 								        j = Charset("euc-jp")
 								        g = Charset("iso-8859-1")
 								        h = Header("Hello World!")
 								        jhello = '\xa5\xcf\xa5\xed\xa1\xbc\xa5\xef\xa1\xbc\xa5\xeb\xa5\xc9\xa1\xaa'
 								        ghello = 'Gr\xfc\xdf Gott!'
 								        h.append(jhello, j)
 								        h.append(ghello, g)
-												Merge of the folding-reimpl-branch.  Specific changes,

Update tests for email 2.5.

											
										
										
											2003-03-06 01:41:07 -04:00
+								        # BAW: This used to -- and maybe should -- fold the two iso-8859-1
 								        # chunks into a single encoded word.  However it doesn't violate the
 								        # standard to have them as two encoded chunks and maybe it's
 								        # reasonable <wink> for each .append() call to result in a separate
 								        # encoded word.
 								        eq(h.encode(), """\
 								Hello World! =?iso-2022-jp?b?GyRCJU8lbSE8JW8hPCVrJUkhKhsoQg==?=
 								 =?iso-8859-1?q?Gr=FC=DF?= =?iso-8859-1?q?_Gott!?=""")
-												The email package's tests live much better in a subpackage
(i.e. email.test), so move the guts of them here from Lib/test.  The
latter directory will retain stubs to run the email.test tests using
Python's standard regression test.

test_email_torture.py is a torture tester which will not run under
Python's test suite because I don't want to commit megs of data to
that project (it will fail cleanly there).  When run under the mimelib
project it'll stress test the package with megs of message samples
collected from various locations in the wild.

											
										
										
											2002-07-19 19:31:10 -03:00
+								        eq(decode_header(h.encode()),
 								           [('Hello World!', None),
 								            ('\x1b$B%O%m!<%o!<%k%I!*\x1b(B', 'iso-2022-jp'),
 								            ('Gr\xfc\xdf Gott!', 'iso-8859-1')])
-												Rip out 'long' and 'L'-suffixed integer literals.
(Rough first cut.)

											
										
										
											2007-01-15 12:59:06 -04:00
+								        int = 'test-ja \xa4\xd8\xc5\xea\xb9\xc6\xa4\xb5\xa4\xec\xa4\xbf\xa5\xe1\xa1\xbc\xa5\xeb\xa4\xcf\xbb\xca\xb2\xf1\xbc\xd4\xa4\xce\xbe\xb5\xc7\xa7\xa4\xf2\xc2\xd4\xa4\xc3\xa4\xc6\xa4\xa4\xa4\xde\xa4\xb9'
 								        h = Header(int, j, header_name="Subject")
-												The email package's tests live much better in a subpackage
(i.e. email.test), so move the guts of them here from Lib/test.  The
latter directory will retain stubs to run the email.test tests using
Python's standard regression test.

test_email_torture.py is a torture tester which will not run under
Python's test suite because I don't want to commit megs of data to
that project (it will fail cleanly there).  When run under the mimelib
project it'll stress test the package with megs of message samples
collected from various locations in the wild.

											
										
										
											2002-07-19 19:31:10 -03:00
+								        # test a very long header
 								        enc = h.encode()
-												Merge of the folding-reimpl-branch.  Specific changes,

Update tests for email 2.5.

											
										
										
											2003-03-06 01:41:07 -04:00
+								        # TK: splitting point may differ by codec design and/or Header encoding
 								        eq(enc , """\
 								=?iso-2022-jp?b?dGVzdC1qYSAbJEIkWEVqOUYkNSRsJD8lYSE8JWskTztKGyhC?=
 								 =?iso-2022-jp?b?GyRCMnE8VCROPjVHJyRyQlQkQyRGJCQkXiQ5GyhC?=""")
 								        # TK: full decode comparison
-												Rip out 'long' and 'L'-suffixed integer literals.
(Rough first cut.)

											
										
										
											2007-01-15 12:59:06 -04:00
+								        eq(h.__unicode__().encode('euc-jp'), int)
-												The email package's tests live much better in a subpackage
(i.e. email.test), so move the guts of them here from Lib/test.  The
latter directory will retain stubs to run the email.test tests using
Python's standard regression test.

test_email_torture.py is a torture tester which will not run under
Python's test suite because I don't want to commit megs of data to
that project (it will fail cleanly there).  When run under the mimelib
project it'll stress test the package with megs of message samples
collected from various locations in the wild.

											
										
										
											2002-07-19 19:31:10 -03:00
-												Port relevant patches for SF 1409455 to the trunk for email 3.0/Python 2.5.
Will port to Python 2.4.

											
										
										
											2006-02-08 10:34:21 -04:00
+								    def test_payload_encoding(self):
 								        jhello = '\xa5\xcf\xa5\xed\xa1\xbc\xa5\xef\xa1\xbc\xa5\xeb\xa5\xc9\xa1\xaa'
 								        jcode  = 'euc-jp'
 								        msg = Message()
 								        msg.set_payload(jhello, jcode)
-												Rip out all the u"..." literals and calls to unicode().

											
										
										
											2007-05-02 16:09:54 -03:00
+								        ustr = str(msg.get_payload(), msg.get_content_charset())
-												Port relevant patches for SF 1409455 to the trunk for email 3.0/Python 2.5.
Will port to Python 2.4.

											
										
										
											2006-02-08 10:34:21 -04:00
+								        self.assertEqual(jhello, ustr.encode(jcode))
-												The email package's tests live much better in a subpackage
(i.e. email.test), so move the guts of them here from Lib/test.  The
latter directory will retain stubs to run the email.test tests using
Python's standard regression test.

test_email_torture.py is a torture tester which will not run under
Python's test suite because I don't want to commit megs of data to
that project (it will fail cleanly there).  When run under the mimelib
project it'll stress test the package with megs of message samples
collected from various locations in the wild.

											
										
										
											2002-07-19 19:31:10 -03:00
 								def suite():
 								    suite = unittest.TestSuite()
 								    suite.addTest(unittest.makeSuite(TestEmailAsianCodecs))
 								    return suite
 								def test_main():
 								    run_unittest(TestEmailAsianCodecs)
 								if __name__ == '__main__':
 								    unittest.main(defaultTest='suite')