1 import sys
2 from test.test_json import PyTest, CTest
3
4
5 class ESC[4;38;5;81mTestScanstring:
6 def test_scanstring(self):
7 scanstring = self.json.decoder.scanstring
8 self.assertEqual(
9 scanstring('"z\U0001d120x"', 1, True),
10 ('z\U0001d120x', 5))
11
12 self.assertEqual(
13 scanstring('"\\u007b"', 1, True),
14 ('{', 8))
15
16 self.assertEqual(
17 scanstring('"A JSON payload should be an object or array, not a string."', 1, True),
18 ('A JSON payload should be an object or array, not a string.', 60))
19
20 self.assertEqual(
21 scanstring('["Unclosed array"', 2, True),
22 ('Unclosed array', 17))
23
24 self.assertEqual(
25 scanstring('["extra comma",]', 2, True),
26 ('extra comma', 14))
27
28 self.assertEqual(
29 scanstring('["double extra comma",,]', 2, True),
30 ('double extra comma', 21))
31
32 self.assertEqual(
33 scanstring('["Comma after the close"],', 2, True),
34 ('Comma after the close', 24))
35
36 self.assertEqual(
37 scanstring('["Extra close"]]', 2, True),
38 ('Extra close', 14))
39
40 self.assertEqual(
41 scanstring('{"Extra comma": true,}', 2, True),
42 ('Extra comma', 14))
43
44 self.assertEqual(
45 scanstring('{"Extra value after close": true} "misplaced quoted value"', 2, True),
46 ('Extra value after close', 26))
47
48 self.assertEqual(
49 scanstring('{"Illegal expression": 1 + 2}', 2, True),
50 ('Illegal expression', 21))
51
52 self.assertEqual(
53 scanstring('{"Illegal invocation": alert()}', 2, True),
54 ('Illegal invocation', 21))
55
56 self.assertEqual(
57 scanstring('{"Numbers cannot have leading zeroes": 013}', 2, True),
58 ('Numbers cannot have leading zeroes', 37))
59
60 self.assertEqual(
61 scanstring('{"Numbers cannot be hex": 0x14}', 2, True),
62 ('Numbers cannot be hex', 24))
63
64 self.assertEqual(
65 scanstring('[[[[[[[[[[[[[[[[[[[["Too deep"]]]]]]]]]]]]]]]]]]]]', 21, True),
66 ('Too deep', 30))
67
68 self.assertEqual(
69 scanstring('{"Missing colon" null}', 2, True),
70 ('Missing colon', 16))
71
72 self.assertEqual(
73 scanstring('{"Double colon":: null}', 2, True),
74 ('Double colon', 15))
75
76 self.assertEqual(
77 scanstring('{"Comma instead of colon", null}', 2, True),
78 ('Comma instead of colon', 25))
79
80 self.assertEqual(
81 scanstring('["Colon instead of comma": false]', 2, True),
82 ('Colon instead of comma', 25))
83
84 self.assertEqual(
85 scanstring('["Bad value", truth]', 2, True),
86 ('Bad value', 12))
87
88 def test_surrogates(self):
89 scanstring = self.json.decoder.scanstring
90 def assertScan(given, expect):
91 self.assertEqual(scanstring(given, 1, True),
92 (expect, len(given)))
93
94 assertScan('"z\\ud834\\u0079x"', 'z\ud834yx')
95 assertScan('"z\\ud834\\udd20x"', 'z\U0001d120x')
96 assertScan('"z\\ud834\\ud834\\udd20x"', 'z\ud834\U0001d120x')
97 assertScan('"z\\ud834x"', 'z\ud834x')
98 assertScan('"z\\ud834\udd20x12345"', 'z\ud834\udd20x12345')
99 assertScan('"z\\udd20x"', 'z\udd20x')
100 assertScan('"z\ud834\udd20x"', 'z\ud834\udd20x')
101 assertScan('"z\ud834\\udd20x"', 'z\ud834\udd20x')
102 assertScan('"z\ud834x"', 'z\ud834x')
103
104 def test_bad_escapes(self):
105 scanstring = self.json.decoder.scanstring
106 bad_escapes = [
107 '"\\"',
108 '"\\x"',
109 '"\\u"',
110 '"\\u0"',
111 '"\\u01"',
112 '"\\u012"',
113 '"\\uz012"',
114 '"\\u0z12"',
115 '"\\u01z2"',
116 '"\\u012z"',
117 '"\\u0x12"',
118 '"\\u0X12"',
119 '"\\ud834\\"',
120 '"\\ud834\\u"',
121 '"\\ud834\\ud"',
122 '"\\ud834\\udd"',
123 '"\\ud834\\udd2"',
124 '"\\ud834\\uzdd2"',
125 '"\\ud834\\udzd2"',
126 '"\\ud834\\uddz2"',
127 '"\\ud834\\udd2z"',
128 '"\\ud834\\u0x20"',
129 '"\\ud834\\u0X20"',
130 ]
131 for s in bad_escapes:
132 with self.assertRaises(self.JSONDecodeError, msg=s):
133 scanstring(s, 1, True)
134
135 def test_overflow(self):
136 with self.assertRaises(OverflowError):
137 self.json.decoder.scanstring(b"xxx", sys.maxsize+1)
138
139
140 class ESC[4;38;5;81mTestPyScanstring(ESC[4;38;5;149mTestScanstring, ESC[4;38;5;149mPyTest): pass
141 class ESC[4;38;5;81mTestCScanstring(ESC[4;38;5;149mTestScanstring, ESC[4;38;5;149mCTest): pass