2003-01-27 07:28:52 -04:00
|
|
|
from test import test_support
|
|
|
|
import unittest, sys
|
|
|
|
import codecs, _iconv_codec
|
|
|
|
from encodings import iconv_codec
|
|
|
|
from StringIO import StringIO
|
|
|
|
|
|
|
|
class IconvCodecTest(unittest.TestCase):
    """Exercise the codec functions returned by ``iconv_codec.lookup``.

    Each test unpacks the lookup result into ``self.encoder``,
    ``self.decoder``, ``self.reader`` and ``self.writer`` before use.
    """

    # u'spamspam' laid out as two bytes per character, with the byte
    # order of each pair chosen to match the host's sys.byteorder.
    if sys.byteorder == 'big':
        spam = '\x00s\x00p\x00a\x00m' * 2
    else:
        spam = 's\x00p\x00a\x00m\x00' * 2

    def test_sane(self):
        """Round-trip ``spam`` through the internal encoding (disabled)."""
        # FIXME: Commented out, because it's not clear whether
        # the internal encoding chosen requires byte swapping
        # for this iconv() implementation.
        if False:
            self.encoder, self.decoder, self.reader, self.writer = \
                codecs.lookup(_iconv_codec.internal_encoding)
            self.assertEqual(self.decoder(self.spam), (u'spamspam', 16))
            self.assertEqual(self.encoder(u'spamspam'), (self.spam, 8))
            self.assertEqual(self.reader(StringIO(self.spam)).read(),
                             u'spamspam')
            f = StringIO()
            self.writer(f).write(u'spamspam')
            self.assertEqual(f.getvalue(), self.spam)

    def test_basic_errors(self):
        """Check the 'strict', 'replace' and 'ignore' error modes."""
        self.encoder, self.decoder, self.reader, self.writer = \
            iconv_codec.lookup("ascii")

        def testencerror(errors):
            # U+FFFD cannot be represented in ASCII.
            return self.encoder(u'sp\ufffdam', errors)

        def testdecerror(errors):
            # Byte 0xFF is not valid ASCII.
            return self.decoder('sp\xffam', errors)

        self.assertRaises(UnicodeEncodeError, testencerror, 'strict')
        self.assertRaises(UnicodeDecodeError, testdecerror, 'strict')
        self.assertEqual(testencerror('replace'), ('sp?am', 5))
        self.assertEqual(testdecerror('replace'), (u'sp\ufffdam', 5))
        self.assertEqual(testencerror('ignore'), ('spam', 5))
        self.assertEqual(testdecerror('ignore'), (u'spam', 5))

    def test_pep293_errors(self):
        """Check the PEP 293 error callbacks, built-in and user-registered."""
        self.encoder, self.decoder, self.reader, self.writer = \
            iconv_codec.lookup("ascii")

        def testencerror(errors):
            return self.encoder(u'sp\ufffdam', errors)

        def testdecerror(errors):
            return self.decoder('sp\xffam', errors)

        # xmlcharrefreplace substitutes a decimal character reference;
        # U+FFFD is code point 65533.
        self.assertEqual(testencerror('xmlcharrefreplace'),
                         ('sp&#65533;am', 5))
        self.assertEqual(testencerror('backslashreplace'),
                         ('sp\\ufffdam', 5))

        def error_bomb(exc):
            # Substitute 40 asterisks and resume at the end of the input,
            # so nothing after the failing position is processed.
            return (u'*'*40, len(exc.object))

        def error_mock(exc):
            # Keep the exception for inspection and substitute the item
            # that precedes the failing position.
            error_mock.lastexc = exc
            return (unicode(exc.object[exc.start - 1]), exc.end)

        codecs.register_error('test_iconv_codec.bomb', error_bomb)
        codecs.register_error('test_iconv_codec.mock', error_mock)

        self.assertEqual(testencerror('test_iconv_codec.bomb'),
                         ('sp' + ('*'*40), 5))
        self.assertEqual(testdecerror('test_iconv_codec.bomb'),
                         (u'sp' + (u'*'*40), 5))

        self.assertEqual(testencerror('test_iconv_codec.mock'), ('sppam', 5))
        exc = error_mock.lastexc
        self.assertEqual(exc.object, u'sp\ufffdam')
        self.assertEqual(exc.start, 2)
        self.assertEqual(exc.end, 3)
        self.assert_(isinstance(exc, UnicodeEncodeError))

        self.assertEqual(testdecerror('test_iconv_codec.mock'), (u'sppam', 5))
        exc = error_mock.lastexc
        self.assertEqual(exc.object, 'sp\xffam')
        self.assertEqual(exc.start, 2)
        self.assertEqual(exc.end, 3)
        self.assert_(isinstance(exc, UnicodeDecodeError))

    def test_empty_escape_decode(self):
        """Check that empty input yields an empty result of length 0."""
        self.encoder, self.decoder, self.reader, self.writer = \
            iconv_codec.lookup("ascii")
        self.assertEqual(self.decoder(u""), ("", 0))
        self.assertEqual(self.encoder(""), (u"", 0))
|
|
|
|
|
|
|
|
def test_main():
    """Wrap the IconvCodecTest cases in a suite and run it via test_support."""
    cases = unittest.makeSuite(IconvCodecTest)
    suite = unittest.TestSuite()
    suite.addTest(cases)
    test_support.run_suite(suite)
|
|
|
|
|
|
|
|
|
|
|
|
# Run the test suite when this file is executed directly as a script.
if __name__ == "__main__":
    test_main()
|
|
|
|
|
|
|
|
# ex: ts=8 sts=4 et
|