| OLD | NEW |
| (Empty) |
| 1 {"tests": [ | |
| 2 | |
| 3 {"description": "Undefined named entity in attribute value ending in semicolon and whose name starts with a known entity name.", | |
| 4 "input":"<h a='&noti;'>", | |
| 5 "output": ["ParseError", ["StartTag", "h", {"a": "&noti;"}]]}, | |
| 6 | |
| 7 {"description": "Entity name followed by the equals sign in an attribute value.", | |
| 8 "input":"<h a='&lang='>", | |
| 9 "output": ["ParseError", ["StartTag", "h", {"a": "&lang="}]]}, | |
| 10 | |
| 11 {"description": "CR as numeric entity", | |
| 12 "input":"&#013;", | |
| 13 "output": ["ParseError", ["Character", "\r"]]}, | |
| 14 | |
| 15 {"description": "CR as hexadecimal numeric entity", | |
| 16 "input":"&#x00D;", | |
| 17 "output": ["ParseError", ["Character", "\r"]]}, | |
| 18 | |
| 19 {"description": "Windows-1252 EURO SIGN numeric entity.", | |
| 20 "input":"&#0128;", | |
| 21 "output": ["ParseError", ["Character", "\u20AC"]]}, | |
| 22 | |
| 23 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
| 24 "input":"&#0129;", | |
| 25 "output": ["ParseError", ["Character", "\u0081"]]}, | |
| 26 | |
| 27 {"description": "Windows-1252 SINGLE LOW-9 QUOTATION MARK numeric entity.", | |
| 28 "input":"&#0130;", | |
| 29 "output": ["ParseError", ["Character", "\u201A"]]}, | |
| 30 | |
| 31 {"description": "Windows-1252 LATIN SMALL LETTER F WITH HOOK numeric entity.", | |
| 32 "input":"&#0131;", | |
| 33 "output": ["ParseError", ["Character", "\u0192"]]}, | |
| 34 | |
| 35 {"description": "Windows-1252 DOUBLE LOW-9 QUOTATION MARK numeric entity.", | |
| 36 "input":"&#0132;", | |
| 37 "output": ["ParseError", ["Character", "\u201E"]]}, | |
| 38 | |
| 39 {"description": "Windows-1252 HORIZONTAL ELLIPSIS numeric entity.", | |
| 40 "input":"&#0133;", | |
| 41 "output": ["ParseError", ["Character", "\u2026"]]}, | |
| 42 | |
| 43 {"description": "Windows-1252 DAGGER numeric entity.", | |
| 44 "input":"&#0134;", | |
| 45 "output": ["ParseError", ["Character", "\u2020"]]}, | |
| 46 | |
| 47 {"description": "Windows-1252 DOUBLE DAGGER numeric entity.", | |
| 48 "input":"&#0135;", | |
| 49 "output": ["ParseError", ["Character", "\u2021"]]}, | |
| 50 | |
| 51 {"description": "Windows-1252 MODIFIER LETTER CIRCUMFLEX ACCENT numeric entity.", | |
| 52 "input":"&#0136;", | |
| 53 "output": ["ParseError", ["Character", "\u02C6"]]}, | |
| 54 | |
| 55 {"description": "Windows-1252 PER MILLE SIGN numeric entity.", | |
| 56 "input":"&#0137;", | |
| 57 "output": ["ParseError", ["Character", "\u2030"]]}, | |
| 58 | |
| 59 {"description": "Windows-1252 LATIN CAPITAL LETTER S WITH CARON numeric entity.", | |
| 60 "input":"&#0138;", | |
| 61 "output": ["ParseError", ["Character", "\u0160"]]}, | |
| 62 | |
| 63 {"description": "Windows-1252 SINGLE LEFT-POINTING ANGLE QUOTATION MARK numeric entity.", | |
| 64 "input":"&#0139;", | |
| 65 "output": ["ParseError", ["Character", "\u2039"]]}, | |
| 66 | |
| 67 {"description": "Windows-1252 LATIN CAPITAL LIGATURE OE numeric entity.", | |
| 68 "input":"&#0140;", | |
| 69 "output": ["ParseError", ["Character", "\u0152"]]}, | |
| 70 | |
| 71 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
| 72 "input":"&#0141;", | |
| 73 "output": ["ParseError", ["Character", "\u008D"]]}, | |
| 74 | |
| 75 {"description": "Windows-1252 LATIN CAPITAL LETTER Z WITH CARON numeric entity.", | |
| 76 "input":"&#0142;", | |
| 77 "output": ["ParseError", ["Character", "\u017D"]]}, | |
| 78 | |
| 79 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
| 80 "input":"&#0143;", | |
| 81 "output": ["ParseError", ["Character", "\u008F"]]}, | |
| 82 | |
| 83 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
| 84 "input":"&#0144;", | |
| 85 "output": ["ParseError", ["Character", "\u0090"]]}, | |
| 86 | |
| 87 {"description": "Windows-1252 LEFT SINGLE QUOTATION MARK numeric entity.", | |
| 88 "input":"&#0145;", | |
| 89 "output": ["ParseError", ["Character", "\u2018"]]}, | |
| 90 | |
| 91 {"description": "Windows-1252 RIGHT SINGLE QUOTATION MARK numeric entity.", | |
| 92 "input":"&#0146;", | |
| 93 "output": ["ParseError", ["Character", "\u2019"]]}, | |
| 94 | |
| 95 {"description": "Windows-1252 LEFT DOUBLE QUOTATION MARK numeric entity.", | |
| 96 "input":"&#0147;", | |
| 97 "output": ["ParseError", ["Character", "\u201C"]]}, | |
| 98 | |
| 99 {"description": "Windows-1252 RIGHT DOUBLE QUOTATION MARK numeric entity.", | |
| 100 "input":"&#0148;", | |
| 101 "output": ["ParseError", ["Character", "\u201D"]]}, | |
| 102 | |
| 103 {"description": "Windows-1252 BULLET numeric entity.", | |
| 104 "input":"&#0149;", | |
| 105 "output": ["ParseError", ["Character", "\u2022"]]}, | |
| 106 | |
| 107 {"description": "Windows-1252 EN DASH numeric entity.", | |
| 108 "input":"&#0150;", | |
| 109 "output": ["ParseError", ["Character", "\u2013"]]}, | |
| 110 | |
| 111 {"description": "Windows-1252 EM DASH numeric entity.", | |
| 112 "input":"&#0151;", | |
| 113 "output": ["ParseError", ["Character", "\u2014"]]}, | |
| 114 | |
| 115 {"description": "Windows-1252 SMALL TILDE numeric entity.", | |
| 116 "input":"&#0152;", | |
| 117 "output": ["ParseError", ["Character", "\u02DC"]]}, | |
| 118 | |
| 119 {"description": "Windows-1252 TRADE MARK SIGN numeric entity.", | |
| 120 "input":"&#0153;", | |
| 121 "output": ["ParseError", ["Character", "\u2122"]]}, | |
| 122 | |
| 123 {"description": "Windows-1252 LATIN SMALL LETTER S WITH CARON numeric entity.", | |
| 124 "input":"&#0154;", | |
| 125 "output": ["ParseError", ["Character", "\u0161"]]}, | |
| 126 | |
| 127 {"description": "Windows-1252 SINGLE RIGHT-POINTING ANGLE QUOTATION MARK numeric entity.", | |
| 128 "input":"&#0155;", | |
| 129 "output": ["ParseError", ["Character", "\u203A"]]}, | |
| 130 | |
| 131 {"description": "Windows-1252 LATIN SMALL LIGATURE OE numeric entity.", | |
| 132 "input":"&#0156;", | |
| 133 "output": ["ParseError", ["Character", "\u0153"]]}, | |
| 134 | |
| 135 {"description": "Windows-1252 REPLACEMENT CHAR numeric entity.", | |
| 136 "input":"&#0157;", | |
| 137 "output": ["ParseError", ["Character", "\u009D"]]}, | |
| 138 | |
| 139 {"description": "Windows-1252 EURO SIGN hexadecimal numeric entity.", | |
| 140 "input":"&#x080;", | |
| 141 "output": ["ParseError", ["Character", "\u20AC"]]}, | |
| 142 | |
| 143 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
| 144 "input":"&#x081;", | |
| 145 "output": ["ParseError", ["Character", "\u0081"]]}, | |
| 146 | |
| 147 {"description": "Windows-1252 SINGLE LOW-9 QUOTATION MARK hexadecimal numeric entity.", | |
| 148 "input":"&#x082;", | |
| 149 "output": ["ParseError", ["Character", "\u201A"]]}, | |
| 150 | |
| 151 {"description": "Windows-1252 LATIN SMALL LETTER F WITH HOOK hexadecimal numeric entity.", | |
| 152 "input":"&#x083;", | |
| 153 "output": ["ParseError", ["Character", "\u0192"]]}, | |
| 154 | |
| 155 {"description": "Windows-1252 DOUBLE LOW-9 QUOTATION MARK hexadecimal numeric entity.", | |
| 156 "input":"&#x084;", | |
| 157 "output": ["ParseError", ["Character", "\u201E"]]}, | |
| 158 | |
| 159 {"description": "Windows-1252 HORIZONTAL ELLIPSIS hexadecimal numeric entity.", | |
| 160 "input":"&#x085;", | |
| 161 "output": ["ParseError", ["Character", "\u2026"]]}, | |
| 162 | |
| 163 {"description": "Windows-1252 DAGGER hexadecimal numeric entity.", | |
| 164 "input":"&#x086;", | |
| 165 "output": ["ParseError", ["Character", "\u2020"]]}, | |
| 166 | |
| 167 {"description": "Windows-1252 DOUBLE DAGGER hexadecimal numeric entity.", | |
| 168 "input":"&#x087;", | |
| 169 "output": ["ParseError", ["Character", "\u2021"]]}, | |
| 170 | |
| 171 {"description": "Windows-1252 MODIFIER LETTER CIRCUMFLEX ACCENT hexadecimal numeric entity.", | |
| 172 "input":"&#x088;", | |
| 173 "output": ["ParseError", ["Character", "\u02C6"]]}, | |
| 174 | |
| 175 {"description": "Windows-1252 PER MILLE SIGN hexadecimal numeric entity.", | |
| 176 "input":"&#x089;", | |
| 177 "output": ["ParseError", ["Character", "\u2030"]]}, | |
| 178 | |
| 179 {"description": "Windows-1252 LATIN CAPITAL LETTER S WITH CARON hexadecimal numeric entity.", | |
| 180 "input":"&#x08A;", | |
| 181 "output": ["ParseError", ["Character", "\u0160"]]}, | |
| 182 | |
| 183 {"description": "Windows-1252 SINGLE LEFT-POINTING ANGLE QUOTATION MARK hexadecimal numeric entity.", | |
| 184 "input":"&#x08B;", | |
| 185 "output": ["ParseError", ["Character", "\u2039"]]}, | |
| 186 | |
| 187 {"description": "Windows-1252 LATIN CAPITAL LIGATURE OE hexadecimal numeric entity.", | |
| 188 "input":"&#x08C;", | |
| 189 "output": ["ParseError", ["Character", "\u0152"]]}, | |
| 190 | |
| 191 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
| 192 "input":"&#x08D;", | |
| 193 "output": ["ParseError", ["Character", "\u008D"]]}, | |
| 194 | |
| 195 {"description": "Windows-1252 LATIN CAPITAL LETTER Z WITH CARON hexadecimal numeric entity.", | |
| 196 "input":"&#x08E;", | |
| 197 "output": ["ParseError", ["Character", "\u017D"]]}, | |
| 198 | |
| 199 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
| 200 "input":"&#x08F;", | |
| 201 "output": ["ParseError", ["Character", "\u008F"]]}, | |
| 202 | |
| 203 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
| 204 "input":"&#x090;", | |
| 205 "output": ["ParseError", ["Character", "\u0090"]]}, | |
| 206 | |
| 207 {"description": "Windows-1252 LEFT SINGLE QUOTATION MARK hexadecimal numeric entity.", | |
| 208 "input":"&#x091;", | |
| 209 "output": ["ParseError", ["Character", "\u2018"]]}, | |
| 210 | |
| 211 {"description": "Windows-1252 RIGHT SINGLE QUOTATION MARK hexadecimal numeric entity.", | |
| 212 "input":"&#x092;", | |
| 213 "output": ["ParseError", ["Character", "\u2019"]]}, | |
| 214 | |
| 215 {"description": "Windows-1252 LEFT DOUBLE QUOTATION MARK hexadecimal numeric entity.", | |
| 216 "input":"&#x093;", | |
| 217 "output": ["ParseError", ["Character", "\u201C"]]}, | |
| 218 | |
| 219 {"description": "Windows-1252 RIGHT DOUBLE QUOTATION MARK hexadecimal numeric entity.", | |
| 220 "input":"&#x094;", | |
| 221 "output": ["ParseError", ["Character", "\u201D"]]}, | |
| 222 | |
| 223 {"description": "Windows-1252 BULLET hexadecimal numeric entity.", | |
| 224 "input":"&#x095;", | |
| 225 "output": ["ParseError", ["Character", "\u2022"]]}, | |
| 226 | |
| 227 {"description": "Windows-1252 EN DASH hexadecimal numeric entity.", | |
| 228 "input":"&#x096;", | |
| 229 "output": ["ParseError", ["Character", "\u2013"]]}, | |
| 230 | |
| 231 {"description": "Windows-1252 EM DASH hexadecimal numeric entity.", | |
| 232 "input":"&#x097;", | |
| 233 "output": ["ParseError", ["Character", "\u2014"]]}, | |
| 234 | |
| 235 {"description": "Windows-1252 SMALL TILDE hexadecimal numeric entity.", | |
| 236 "input":"&#x098;", | |
| 237 "output": ["ParseError", ["Character", "\u02DC"]]}, | |
| 238 | |
| 239 {"description": "Windows-1252 TRADE MARK SIGN hexadecimal numeric entity.", | |
| 240 "input":"&#x099;", | |
| 241 "output": ["ParseError", ["Character", "\u2122"]]}, | |
| 242 | |
| 243 {"description": "Windows-1252 LATIN SMALL LETTER S WITH CARON hexadecimal numeric entity.", | |
| 244 "input":"&#x09A;", | |
| 245 "output": ["ParseError", ["Character", "\u0161"]]}, | |
| 246 | |
| 247 {"description": "Windows-1252 SINGLE RIGHT-POINTING ANGLE QUOTATION MARK hexadecimal numeric entity.", | |
| 248 "input":"&#x09B;", | |
| 249 "output": ["ParseError", ["Character", "\u203A"]]}, | |
| 250 | |
| 251 {"description": "Windows-1252 LATIN SMALL LIGATURE OE hexadecimal numeric entity.", | |
| 252 "input":"&#x09C;", | |
| 253 "output": ["ParseError", ["Character", "\u0153"]]}, | |
| 254 | |
| 255 {"description": "Windows-1252 REPLACEMENT CHAR hexadecimal numeric entity.", | |
| 256 "input":"&#x09D;", | |
| 257 "output": ["ParseError", ["Character", "\u009D"]]}, | |
| 258 | |
| 259 {"description": "Windows-1252 LATIN SMALL LETTER Z WITH CARON hexadecimal numeric entity.", | |
| 260 "input":"&#x09E;", | |
| 261 "output": ["ParseError", ["Character", "\u017E"]]}, | |
| 262 | |
| 263 {"description": "Windows-1252 LATIN CAPITAL LETTER Y WITH DIAERESIS hexadecimal numeric entity.", | |
| 264 "input":"&#x09F;", | |
| 265 "output": ["ParseError", ["Character", "\u0178"]]}, | |
| 266 | |
| 267 {"description": "Decimal numeric entity followed by hex character a.", | |
| 268 "input":"&#97a", | |
| 269 "output": ["ParseError", ["Character", "aa"]]}, | |
| 270 | |
| 271 {"description": "Decimal numeric entity followed by hex character A.", | |
| 272 "input":"&#97A", | |
| 273 "output": ["ParseError", ["Character", "aA"]]}, | |
| 274 | |
| 275 {"description": "Decimal numeric entity followed by hex character f.", | |
| 276 "input":"&#97f", | |
| 277 "output": ["ParseError", ["Character", "af"]]}, | |
| 278 | |
| 279 {"description": "Decimal numeric entity followed by hex character F.", | |
| 280 "input":"&#97F", | |
| 281 "output": ["ParseError", ["Character", "aF"]]} | |
| 282 | |
| 283 ]} | |
| OLD | NEW |