OLD | NEW |
| (Empty) |
1 {"tests": [ | |
2 | |
3 {"description": "Undefined named entity in attribute value ending in semicolon a
nd whose name starts with a known entity name.", | |
4 "input":"<h a='&noti;'>", | |
5 "output": ["ParseError", ["StartTag", "h", {"a": "&noti;"}]]}, | |
6 | |
7 {"description": "Entity name followed by the equals sign in an attribute value."
, | |
8 "input":"<h a='&lang='>", | |
9 "output": ["ParseError", ["StartTag", "h", {"a": "&lang="}]]}, | |
10 | |
11 {"description": "CR as numeric entity", | |
12 "input":"&#013;", | |
13 "output": ["ParseError", ["Character", "\r"]]}, | |
14 | |
15 {"description": "CR as hexadecimal numeric entity", | |
16 "input":"&#x00D;", | |
17 "output": ["ParseError", ["Character", "\r"]]}, | |
18 | |
19 {"description": "Windows-1252 EURO SIGN numeric entity.", | |
20 "input":"€", | |
21 "output": ["ParseError", ["Character", "\u20AC"]]}, | |
22 | |
23 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
24 "input":"", | |
25 "output": ["ParseError", ["Character", "\u0081"]]}, | |
26 | |
27 {"description": "Windows-1252 SINGLE LOW-9 QUOTATION MARK numeric entity.", | |
28 "input":"‚", | |
29 "output": ["ParseError", ["Character", "\u201A"]]}, | |
30 | |
31 {"description": "Windows-1252 LATIN SMALL LETTER F WITH HOOK numeric entity.", | |
32 "input":"ƒ", | |
33 "output": ["ParseError", ["Character", "\u0192"]]}, | |
34 | |
35 {"description": "Windows-1252 DOUBLE LOW-9 QUOTATION MARK numeric entity.", | |
36 "input":"„", | |
37 "output": ["ParseError", ["Character", "\u201E"]]}, | |
38 | |
39 {"description": "Windows-1252 HORIZONTAL ELLIPSIS numeric entity.", | |
40 "input":"…", | |
41 "output": ["ParseError", ["Character", "\u2026"]]}, | |
42 | |
43 {"description": "Windows-1252 DAGGER numeric entity.", | |
44 "input":"†", | |
45 "output": ["ParseError", ["Character", "\u2020"]]}, | |
46 | |
47 {"description": "Windows-1252 DOUBLE DAGGER numeric entity.", | |
48 "input":"‡", | |
49 "output": ["ParseError", ["Character", "\u2021"]]}, | |
50 | |
51 {"description": "Windows-1252 MODIFIER LETTER CIRCUMFLEX ACCENT numeric entity."
, | |
52 "input":"ˆ", | |
53 "output": ["ParseError", ["Character", "\u02C6"]]}, | |
54 | |
55 {"description": "Windows-1252 PER MILLE SIGN numeric entity.", | |
56 "input":"‰", | |
57 "output": ["ParseError", ["Character", "\u2030"]]}, | |
58 | |
59 {"description": "Windows-1252 LATIN CAPITAL LETTER S WITH CARON numeric entity."
, | |
60 "input":"Š", | |
61 "output": ["ParseError", ["Character", "\u0160"]]}, | |
62 | |
63 {"description": "Windows-1252 SINGLE LEFT-POINTING ANGLE QUOTATION MARK numeric
entity.", | |
64 "input":"‹", | |
65 "output": ["ParseError", ["Character", "\u2039"]]}, | |
66 | |
67 {"description": "Windows-1252 LATIN CAPITAL LIGATURE OE numeric entity.", | |
68 "input":"Œ", | |
69 "output": ["ParseError", ["Character", "\u0152"]]}, | |
70 | |
71 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
72 "input":"", | |
73 "output": ["ParseError", ["Character", "\u008D"]]}, | |
74 | |
75 {"description": "Windows-1252 LATIN CAPITAL LETTER Z WITH CARON numeric entity."
, | |
76 "input":"Ž", | |
77 "output": ["ParseError", ["Character", "\u017D"]]}, | |
78 | |
79 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
80 "input":"", | |
81 "output": ["ParseError", ["Character", "\u008F"]]}, | |
82 | |
83 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
84 "input":"", | |
85 "output": ["ParseError", ["Character", "\u0090"]]}, | |
86 | |
87 {"description": "Windows-1252 LEFT SINGLE QUOTATION MARK numeric entity.", | |
88 "input":"‘", | |
89 "output": ["ParseError", ["Character", "\u2018"]]}, | |
90 | |
91 {"description": "Windows-1252 RIGHT SINGLE QUOTATION MARK numeric entity.", | |
92 "input":"’", | |
93 "output": ["ParseError", ["Character", "\u2019"]]}, | |
94 | |
95 {"description": "Windows-1252 LEFT DOUBLE QUOTATION MARK numeric entity.", | |
96 "input":"“", | |
97 "output": ["ParseError", ["Character", "\u201C"]]}, | |
98 | |
99 {"description": "Windows-1252 RIGHT DOUBLE QUOTATION MARK numeric entity.", | |
100 "input":"”", | |
101 "output": ["ParseError", ["Character", "\u201D"]]}, | |
102 | |
103 {"description": "Windows-1252 BULLET numeric entity.", | |
104 "input":"•", | |
105 "output": ["ParseError", ["Character", "\u2022"]]}, | |
106 | |
107 {"description": "Windows-1252 EN DASH numeric entity.", | |
108 "input":"–", | |
109 "output": ["ParseError", ["Character", "\u2013"]]}, | |
110 | |
111 {"description": "Windows-1252 EM DASH numeric entity.", | |
112 "input":"—", | |
113 "output": ["ParseError", ["Character", "\u2014"]]}, | |
114 | |
115 {"description": "Windows-1252 SMALL TILDE numeric entity.", | |
116 "input":"˜", | |
117 "output": ["ParseError", ["Character", "\u02DC"]]}, | |
118 | |
119 {"description": "Windows-1252 TRADE MARK SIGN numeric entity.", | |
120 "input":"™", | |
121 "output": ["ParseError", ["Character", "\u2122"]]}, | |
122 | |
123 {"description": "Windows-1252 LATIN SMALL LETTER S WITH CARON numeric entity.", | |
124 "input":"š", | |
125 "output": ["ParseError", ["Character", "\u0161"]]}, | |
126 | |
127 {"description": "Windows-1252 SINGLE RIGHT-POINTING ANGLE QUOTATION MARK numeric
entity.", | |
128 "input":"›", | |
129 "output": ["ParseError", ["Character", "\u203A"]]}, | |
130 | |
131 {"description": "Windows-1252 LATIN SMALL LIGATURE OE numeric entity.", | |
132 "input":"œ", | |
133 "output": ["ParseError", ["Character", "\u0153"]]}, | |
134 | |
135 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
136 "input":"", | |
137 "output": ["ParseError", ["Character", "\u009D"]]}, | |
138 | |
139 {"description": "Windows-1252 EURO SIGN hexadecimal numeric entity.", | |
140 "input":"€", | |
141 "output": ["ParseError", ["Character", "\u20AC"]]}, | |
142 | |
143 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
144 "input":"", | |
145 "output": ["ParseError", ["Character", "\u0081"]]}, | |
146 | |
147 {"description": "Windows-1252 SINGLE LOW-9 QUOTATION MARK hexadecimal numeric en
tity.", | |
148 "input":"‚", | |
149 "output": ["ParseError", ["Character", "\u201A"]]}, | |
150 | |
151 {"description": "Windows-1252 LATIN SMALL LETTER F WITH HOOK hexadecimal numeric
entity.", | |
152 "input":"ƒ", | |
153 "output": ["ParseError", ["Character", "\u0192"]]}, | |
154 | |
155 {"description": "Windows-1252 DOUBLE LOW-9 QUOTATION MARK hexadecimal numeric en
tity.", | |
156 "input":"„", | |
157 "output": ["ParseError", ["Character", "\u201E"]]}, | |
158 | |
159 {"description": "Windows-1252 HORIZONTAL ELLIPSIS hexadecimal numeric entity.", | |
160 "input":"…", | |
161 "output": ["ParseError", ["Character", "\u2026"]]}, | |
162 | |
163 {"description": "Windows-1252 DAGGER hexadecimal numeric entity.", | |
164 "input":"†", | |
165 "output": ["ParseError", ["Character", "\u2020"]]}, | |
166 | |
167 {"description": "Windows-1252 DOUBLE DAGGER hexadecimal numeric entity.", | |
168 "input":"‡", | |
169 "output": ["ParseError", ["Character", "\u2021"]]}, | |
170 | |
171 {"description": "Windows-1252 MODIFIER LETTER CIRCUMFLEX ACCENT hexadecimal nume
ric entity.", | |
172 "input":"ˆ", | |
173 "output": ["ParseError", ["Character", "\u02C6"]]}, | |
174 | |
175 {"description": "Windows-1252 PER MILLE SIGN hexadecimal numeric entity.", | |
176 "input":"‰", | |
177 "output": ["ParseError", ["Character", "\u2030"]]}, | |
178 | |
179 {"description": "Windows-1252 LATIN CAPITAL LETTER S WITH CARON hexadecimal nume
ric entity.", | |
180 "input":"Š", | |
181 "output": ["ParseError", ["Character", "\u0160"]]}, | |
182 | |
183 {"description": "Windows-1252 SINGLE LEFT-POINTING ANGLE QUOTATION MARK hexadeci
mal numeric entity.", | |
184 "input":"‹", | |
185 "output": ["ParseError", ["Character", "\u2039"]]}, | |
186 | |
187 {"description": "Windows-1252 LATIN CAPITAL LIGATURE OE hexadecimal numeric enti
ty.", | |
188 "input":"Œ", | |
189 "output": ["ParseError", ["Character", "\u0152"]]}, | |
190 | |
191 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
192 "input":"", | |
193 "output": ["ParseError", ["Character", "\u008D"]]}, | |
194 | |
195 {"description": "Windows-1252 LATIN CAPITAL LETTER Z WITH CARON hexadecimal nume
ric entity.", | |
196 "input":"Ž", | |
197 "output": ["ParseError", ["Character", "\u017D"]]}, | |
198 | |
199 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
200 "input":"", | |
201 "output": ["ParseError", ["Character", "\u008F"]]}, | |
202 | |
203 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
204 "input":"", | |
205 "output": ["ParseError", ["Character", "\u0090"]]}, | |
206 | |
207 {"description": "Windows-1252 LEFT SINGLE QUOTATION MARK hexadecimal numeric ent
ity.", | |
208 "input":"‘", | |
209 "output": ["ParseError", ["Character", "\u2018"]]}, | |
210 | |
211 {"description": "Windows-1252 RIGHT SINGLE QUOTATION MARK hexadecimal numeric en
tity.", | |
212 "input":"’", | |
213 "output": ["ParseError", ["Character", "\u2019"]]}, | |
214 | |
215 {"description": "Windows-1252 LEFT DOUBLE QUOTATION MARK hexadecimal numeric ent
ity.", | |
216 "input":"“", | |
217 "output": ["ParseError", ["Character", "\u201C"]]}, | |
218 | |
219 {"description": "Windows-1252 RIGHT DOUBLE QUOTATION MARK hexadecimal numeric en
tity.", | |
220 "input":"”", | |
221 "output": ["ParseError", ["Character", "\u201D"]]}, | |
222 | |
223 {"description": "Windows-1252 BULLET hexadecimal numeric entity.", | |
224 "input":"•", | |
225 "output": ["ParseError", ["Character", "\u2022"]]}, | |
226 | |
227 {"description": "Windows-1252 EN DASH hexadecimal numeric entity.", | |
228 "input":"–", | |
229 "output": ["ParseError", ["Character", "\u2013"]]}, | |
230 | |
231 {"description": "Windows-1252 EM DASH hexadecimal numeric entity.", | |
232 "input":"—", | |
233 "output": ["ParseError", ["Character", "\u2014"]]}, | |
234 | |
235 {"description": "Windows-1252 SMALL TILDE hexadecimal numeric entity.", | |
236 "input":"˜", | |
237 "output": ["ParseError", ["Character", "\u02DC"]]}, | |
238 | |
239 {"description": "Windows-1252 TRADE MARK SIGN hexadecimal numeric entity.", | |
240 "input":"™", | |
241 "output": ["ParseError", ["Character", "\u2122"]]}, | |
242 | |
243 {"description": "Windows-1252 LATIN SMALL LETTER S WITH CARON hexadecimal numeri
c entity.", | |
244 "input":"š", | |
245 "output": ["ParseError", ["Character", "\u0161"]]}, | |
246 | |
247 {"description": "Windows-1252 SINGLE RIGHT-POINTING ANGLE QUOTATION MARK hexadec
imal numeric entity.", | |
248 "input":"›", | |
249 "output": ["ParseError", ["Character", "\u203A"]]}, | |
250 | |
251 {"description": "Windows-1252 LATIN SMALL LIGATURE OE hexadecimal numeric entity
.", | |
252 "input":"œ", | |
253 "output": ["ParseError", ["Character", "\u0153"]]}, | |
254 | |
255 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
256 "input":"", | |
257 "output": ["ParseError", ["Character", "\u009D"]]}, | |
258 | |
259 {"description": "Windows-1252 LATIN SMALL LETTER Z WITH CARON hexadecimal numeri
c entity.", | |
260 "input":"ž", | |
261 "output": ["ParseError", ["Character", "\u017E"]]}, | |
262 | |
263 {"description": "Windows-1252 LATIN CAPITAL LETTER Y WITH DIAERESIS hexadecimal
numeric entity.", | |
264 "input":"Ÿ", | |
265 "output": ["ParseError", ["Character", "\u0178"]]}, | |
266 | |
267 {"description": "Decimal numeric entity followed by hex character a.", | |
268 "input":"&#97;a", | |
269 "output": ["ParseError", ["Character", "aa"]]}, | |
270 | |
271 {"description": "Decimal numeric entity followed by hex character A.", | |
272 "input":"&#97;A", | |
273 "output": ["ParseError", ["Character", "aA"]]}, | |
274 | |
275 {"description": "Decimal numeric entity followed by hex character f.", | |
276 "input":"&#97;f", | |
277 "output": ["ParseError", ["Character", "af"]]}, | |
278 | |
279 {"description": "Decimal numeric entity followed by hex character F.", | |
280 "input":"&#97;F", | |
281 "output": ["ParseError", ["Character", "aF"]]} | |
282 | |
283 ]} | |
OLD | NEW |