2008-05-05 17:21:38 -03:00
|
|
|
import sys
|
2011-05-14 00:24:53 -03:00
|
|
|
from json.tests import PyTest, CTest
|
2008-05-05 17:21:38 -03:00
|
|
|
|
|
|
|
|
2011-05-14 00:24:53 -03:00
|
|
|
class TestScanstring(object):
    """Implementation-agnostic checks for ``json.decoder.scanstring``.

    Each test reaches the module under test through ``self.json``; this
    class does not set that attribute itself, so it is meant to be combined
    with a mixin that does (see the PyTest / CTest subclasses in this
    module).
    """

    def test_scanstring(self):
        # scanstring(text, start, None, True) is expected to return the
        # decoded string together with the index just past its closing
        # quote.
        scan = self.json.decoder.scanstring

        # The expected end index for the astral character depends on
        # sys.maxunicode: 6 when it is 65535, 5 otherwise (presumably
        # because the character then occupies two code units -- confirm).
        astral_end = 6 if sys.maxunicode == 65535 else 5
        self.assertEqual(
            scan(u'"z\U0001d120x"', 1, None, True),
            (u'z\U0001d120x', astral_end))

        # (text, start index, expected decoded string, expected end index),
        # checked in this order.
        cases = [
            ('"\\u007b"', 1, u'{', 8),
            ('"A JSON payload should be an object or array, not a string."',
             1,
             u'A JSON payload should be an object or array, not a string.',
             60),
            ('["Unclosed array"', 2, u'Unclosed array', 17),
            ('["extra comma",]', 2, u'extra comma', 14),
            ('["double extra comma",,]', 2, u'double extra comma', 21),
            ('["Comma after the close"],', 2, u'Comma after the close', 24),
            ('["Extra close"]]', 2, u'Extra close', 14),
            ('{"Extra comma": true,}', 2, u'Extra comma', 14),
            ('{"Extra value after close": true} "misplaced quoted value"',
             2, u'Extra value after close', 26),
            ('{"Illegal expression": 1 + 2}', 2, u'Illegal expression', 21),
            ('{"Illegal invocation": alert()}', 2,
             u'Illegal invocation', 21),
            ('{"Numbers cannot have leading zeroes": 013}', 2,
             u'Numbers cannot have leading zeroes', 37),
            ('{"Numbers cannot be hex": 0x14}', 2,
             u'Numbers cannot be hex', 24),
            ('[[[[[[[[[[[[[[[[[[[["Too deep"]]]]]]]]]]]]]]]]]]]]', 21,
             u'Too deep', 30),
            ('{"Missing colon" null}', 2, u'Missing colon', 16),
            ('{"Double colon":: null}', 2, u'Double colon', 15),
            ('{"Comma instead of colon", null}', 2,
             u'Comma instead of colon', 25),
            ('["Colon instead of comma": false]', 2,
             u'Colon instead of comma', 25),
            ('["Bad value", truth]', 2, u'Bad value', 12),
        ]
        for text, start, decoded, end in cases:
            self.assertEqual(scan(text, start, None, True), (decoded, end))

    def test_surrogates(self):
        # Covers \u escapes and literal surrogate code units, alone and in
        # pairs, inside a JSON string.
        scan = self.json.decoder.scanstring

        def check(source, decoded):
            # The whole input is one quoted string, so the end index must
            # equal the input length.
            self.assertEqual(scan(source, 1, None, True),
                             (decoded, len(source)))
            if isinstance(source, unicode):
                return
            # Byte-string inputs are scanned a second time as unicode.
            as_unicode = unicode(source)
            self.assertEqual(scan(as_unicode, 1, None, True),
                             (decoded, len(as_unicode)))

        surrogates = unichr(0xd834) + unichr(0xdd20)

        # (input, expected decoded string), checked in this order.
        cases = [
            ('"z\\ud834\\u0079x"', u'z\ud834yx'),
            ('"z\\ud834\\udd20x"', u'z\U0001d120x'),
            ('"z\\ud834\\ud834\\udd20x"', u'z\ud834\U0001d120x'),
            ('"z\\ud834x"', u'z\ud834x'),
            (u'"z\\ud834\udd20x12345"', u'z%sx12345' % surrogates),
            ('"z\\udd20x"', u'z\udd20x'),
            (u'"z\ud834\udd20x"', u'z\ud834\udd20x'),
            (u'"z\ud834\\udd20x"', u'z%sx' % surrogates),
            (u'"z\ud834x"', u'z\ud834x'),
        ]
        for source, decoded in cases:
            check(source, decoded)

    def test_bad_escapes(self):
        # Every entry is a truncated or malformed backslash escape;
        # scanning each one must raise ValueError.
        scan = self.json.decoder.scanstring
        bad_escapes = [
            '"\\"',
            '"\\x"',
            '"\\u"',
            '"\\u0"',
            '"\\u01"',
            '"\\u012"',
            '"\\uz012"',
            '"\\u0z12"',
            '"\\u01z2"',
            '"\\u012z"',
            '"\\u0x12"',
            '"\\u0X12"',
            '"\\ud834\\"',
            '"\\ud834\\u"',
            '"\\ud834\\ud"',
            '"\\ud834\\udd"',
            '"\\ud834\\udd2"',
            '"\\ud834\\uzdd2"',
            '"\\ud834\\udzd2"',
            '"\\ud834\\uddz2"',
            '"\\ud834\\udd2z"',
            '"\\ud834\\u0x20"',
            '"\\ud834\\u0X20"',
        ]
        for escape in bad_escapes:
            self.assertRaises(ValueError, scan, escape, 1, None, True)

    def test_issue3623(self):
        # Named after issue 3623: scanning b"xxx" from index 1 with "xxx"
        # as the third argument must raise ValueError, and ASCII-encoding
        # a byte string containing \xff must raise UnicodeDecodeError.
        with self.assertRaises(ValueError):
            self.json.decoder.scanstring(b"xxx", 1, "xxx")
        with self.assertRaises(UnicodeDecodeError):
            self.json.encoder.encode_basestring_ascii(b"xx\xff")

    def test_overflow(self):
        # A start index of sys.maxsize + 1 must be rejected with
        # OverflowError.
        self.assertRaises(OverflowError, self.json.decoder.scanstring,
                          b"xxx", sys.maxsize+1)
|
|
|
|
|
|
|
|
|
|
|
|
class TestPyScanstring(TestScanstring, PyTest):
    # Binds the shared TestScanstring cases to the PyTest mixin imported
    # from json.tests; no additional tests are defined here.
    pass
|
|
|
|
class TestCScanstring(TestScanstring, CTest):
    # Binds the shared TestScanstring cases to the CTest mixin imported
    # from json.tests; no additional tests are defined here.
    pass
|