| OLD | NEW |
| 1 //******************************************************************************* | 1 //******************************************************************************* |
| 2 // | 2 // |
| 3 // Copyright (C) 2003-2007, International Business Machines | 3 // Copyright (C) 2003-2008, International Business Machines |
| 4 // Corporation and others. All Rights Reserved. | 4 // Corporation and others. All Rights Reserved. |
| 5 // | 5 // |
| 6 // file name: conversion.txt | 6 // file name: conversion.txt |
| 7 // encoding: US-ASCII | 7 // encoding: US-ASCII |
| 8 // tab size: 8 (not used) | 8 // tab size: 8 (not used) |
| 9 // indentation:4 | 9 // indentation:4 |
| 10 // | 10 // |
| 11 // created on: 2003jul15 | 11 // created on: 2003jul15 |
| 12 // created by: Markus W. Scherer | 12 // created by: Markus W. Scherer |
| 13 // | 13 // |
| (...skipping 141 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 155 :intvector{ 0,1,1,1,1,2,3,8,11,13,14,14,14,14,15,16 }, | 155 :intvector{ 0,1,1,1,1,2,3,8,11,13,14,14,14,14,15,16 }, |
| 156 :int{1}, :int{0}, "", "&C", :bin{""} | 156 :int{1}, :int{0}, "", "&C", :bin{""} |
| 157 } | 157 } |
| 158 { | 158 { |
| 159 "ISO-2022-CN-EXT", | 159 "ISO-2022-CN-EXT", |
| 160 :bin{ 4f1b4f4f1b242b494f1b4f4f4f4f1b204f }, | 160 :bin{ 4f1b4f4f1b242b494f1b4f4f4f4f1b204f }, |
| 161 "O\\x1BOOO\u492bO\\x1B O", | 161 "O\\x1BOOO\u492bO\\x1B O", |
| 162 :intvector{ 0,1,1,1,1,2,3,8,11,13,14,14,14,14,15,16 }, | 162 :intvector{ 0,1,1,1,1,2,3,8,11,13,14,14,14,14,15,16 }, |
| 163 :int{1}, :int{0}, "", "&C", :bin{""} | 163 :int{1}, :int{0}, "", "&C", :bin{""} |
| 164 } | 164 } |
| 165 // Test ticket 5691: HZ with illegal tilde sequences. |
| 166 { |
| 167 "HZ", |
| 168 :bin{ 417e20427e21437e80447e7b41417e207e41427e7f41437e7d5a }, |
| 169 "A\\x7E B\\x7E!C\\x7E\\x80D\u4eae\\x7E\\x20\\x7E\u8c05\\x7E\\x7F\u64a9
Z", |
| 170 :intvector{ 0,1,1,1,1,2,3,4,4,4,4,5,6,7,7,7,7,7,7,7,7,9,
// SBCS |
| 171 12,14,14,14,14,14,14,14,14,16,16,16,16,17,19,19,19,19,19,1
9,19,19,21, // DBCS |
| 172 25 },
// SBCS |
| 173 :int{1}, :int{0}, "", "&C", :bin{""} |
| 174 } |
| 165 // Test ticket 5691: Example from Peter Edberg. | 175 // Test ticket 5691: Example from Peter Edberg. |
| 166 { | 176 { |
| 167 "ISO-2022-JP", | 177 "ISO-2022-JP", |
| 168 :bin{ 1b244230212f7e742630801b284a621b2458631b2842648061 }, | 178 :bin{ 1b244230212f7e742630801b284a621b2458631b2842648061 }, |
| 169 "\u4e9c\ufffd\u7199\ufffdb\ufffd$Xcd\ufffda", | 179 "\u4e9c\ufffd\u7199\ufffdb\ufffd$Xcd\ufffda", |
| 170 :intvector{ 3,5,7,9,14,15,16,17,18,22,23,24 }, | 180 :intvector{ 3,5,7,9,14,15,16,17,18,22,23,24 }, |
| 171 :int{1}, :int{0}, "", "?", :bin{""} | 181 :int{1}, :int{0}, "", "?", :bin{""} |
| 172 } | 182 } |
| 183 // Test bug 6071 (2:1 Unicode:charset SBCS mapping). |
| 184 { |
| 185 "*test1bmp", |
| 186 :bin{ 050008 }, |
| 187 "e@uv", |
| 188 :intvector{ 0,1,2,2 }, |
| 189 :int{1}, :int{1}, "", "?", :bin{""} |
| 190 } |
| 191 // test that HZ limits its byte values to lead bytes 21..7d and trail bytes 21..7e |
| 192 { |
| 193 "HZ", |
| 194 :bin{ 7e7b21212120217e217f772100007e217e7e7d207e7e807e0a2b }, |
| 195 "\u3000\ufffd\u3013\ufffd\u9ccc\ufffd\ufffd\u3013 ~\ufffd+", |
| 196 :intvector{ 2,4,6,8,10,12,14,15,19,20,22,25 }, |
| 197 :int{1}, :int{1}, "", "?", :bin{""} |
| 198 } |
| 173 // improve coverage of ISO-2022-JP converter with hardcoded JIS X 0201 and | 199 // improve coverage of ISO-2022-JP converter with hardcoded JIS X 0201 and |
| 174 // using the Shift-JIS table for JIS X 0208 (ticket #5797) | 200 // using the Shift-JIS table for JIS X 0208 (ticket #5797) |
| 175 { | 201 { |
| 176 "ISO-2022-JP", | 202 "ISO-2022-JP", |
| 177 :bin{ 1b284a7d7e801b2442306c20217f7e21202160217f22202225227f5f211b2842
}, | 203 :bin{ 1b284a7d7e801b2442306c20217f7e21202160217f22202225227f5f211b2842
}, |
| 178 "}\u203e\ufffd\u4e00\ufffd\ufffd\ufffd\ufffd\xf7\ufffd\ufffd\u25b2\uff
fd\u6f3e", | 204 "}\u203e\ufffd\u4e00\ufffd\ufffd\ufffd\ufffd\xf7\ufffd\ufffd\u25b2\uff
fd\u6f3e", |
| 179 :intvector{ 3,4,5,9,11,12,14,16,17,19,21,23,25,27 }, | 205 :intvector{ 3,4,5,9,11,12,14,16,17,19,21,23,25,27 }, |
| 180 :int{1}, :int{1}, "", "?", :bin{""} | 206 :int{1}, :int{1}, "", "?", :bin{""} |
| 181 } | 207 } |
| 182 // improve coverage of unrolled loops in ucnvmbcs.c/ucnv_MBCSSingleToBMPWithOffsets() | 208 // improve coverage of unrolled loops in ucnvmbcs.c/ucnv_MBCSSingleToBMPWithOffsets() |
| (...skipping 123 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 306 :int{1}, :int{1}, "", ".", :bin{""} | 332 :int{1}, :int{1}, "", ".", :bin{""} |
| 307 } | 333 } |
| 308 // more complicated example | 334 // more complicated example |
| 309 { | 335 { |
| 310 "ISO-2022-KR", | 336 "ISO-2022-KR", |
| 311 :bin{ 411b242943420e4141affe0f43 }, | 337 :bin{ 411b242943420e4141affe0f43 }, |
| 312 "AB\uc88b%XAF%XFEC", | 338 "AB\uc88b%XAF%XFEC", |
| 313 :intvector{ 0, 5, 7, 9, 9, 9, 9, 9, 9, 9, 9, 12 }, | 339 :intvector{ 0, 5, 7, 9, 9, 9, 9, 9, 9, 9, 9, 12 }, |
| 314 :int{1}, :int{1}, "", "&", :bin{""} | 340 :int{1}, :int{1}, "", "&", :bin{""} |
| 315 } | 341 } |
| 342 // empty segment (using substitution and stop) |
| 343 { |
| 344 "ISO-2022-KR", |
| 345 :bin{ 1b242943610e0f620d0a }, |
| 346 "a\uFFFDb\u000D\u000A", |
| 347 :intvector{ 4, 6, 7, 8, 9 }, |
| 348 :int{1}, :int{1}, "", "?", :bin{""} |
| 349 } |
| 350 { |
| 351 "ISO-2022-KR", |
| 352 :bin{ 1b242943610e0f620d0a }, |
| 353 "a", |
| 354 :intvector{ 4 }, |
| 355 :int{1}, :int{1}, "illesc", ".", :bin{"0f"} |
| 356 } |
| 316 | 357 |
| 317 // ISO-2022-JP | 358 // ISO-2022-JP |
| 318 | 359 |
| 319 // truncated, partial escape sequence | 360 // truncated, partial escape sequence |
| 320 { | 361 { |
| 321 "ISO-2022-JP", | 362 "ISO-2022-JP", |
| 322 :bin{ 1b }, "", :intvector{}, | 363 :bin{ 1b }, "", :intvector{}, |
| 323 :int{1}, :int{1}, "truncated", ".", :bin{ 1b } | 364 :int{1}, :int{1}, "truncated", ".", :bin{ 1b } |
| 324 } | 365 } |
| 325 { | 366 { |
| (...skipping 30 matching lines...) Expand all Loading... |
| 356 "JIS7", | 397 "JIS7", |
| 357 :bin{ 41420e41420f4142 }, "AB\uff81\uff82AB", :intvector{ 0, 1, 3, 4,
6, 7 }, | 398 :bin{ 41420e41420f4142 }, "AB\uff81\uff82AB", :intvector{ 0, 1, 3, 4,
6, 7 }, |
| 358 :int{1}, :int{1}, "", ".", :bin{""} | 399 :int{1}, :int{1}, "", ".", :bin{""} |
| 359 } | 400 } |
| 360 // JIS8 with Katakana | 401 // JIS8 with Katakana |
| 361 { | 402 { |
| 362 "JIS8", | 403 "JIS8", |
| 363 :bin{ 41c15c1b284a5cc242 }, "A\uff81\\\xa5\uff82B", :intvector{ 0, 1,
2, 6, 7, 8 }, | 404 :bin{ 41c15c1b284a5cc242 }, "A\uff81\\\xa5\uff82B", :intvector{ 0, 1,
2, 6, 7, 8 }, |
| 364 :int{1}, :int{1}, "", ".", :bin{""} | 405 :int{1}, :int{1}, "", ".", :bin{""} |
| 365 } | 406 } |
| 407 // empty segment (using substitution and stop) |
| 408 { |
| 409 "ISO-2022-JP", |
| 410 :bin{ 61621b24421b284263640d0a }, |
| 411 "ab\uFFFDcd\u000D\u000A", |
| 412 :intvector{ 0, 1, 5, 8, 9, 10, 11 }, |
| 413 :int{1}, :int{1}, "", "?", :bin{""} |
| 414 } |
| 415 { |
| 416 "ISO-2022-JP", |
| 417 :bin{ 61621b24421b284263640d0a }, |
| 418 "ab", |
| 419 :intvector{ 0, 1 }, |
| 420 :int{1}, :int{1}, "illesc", ".", :bin{"1b2842"} |
| 421 } |
| 366 | 422 |
| 367 // ISO-2022-CN | 423 // ISO-2022-CN |
| 368 | 424 |
| 369 // truncated, partial escape sequence | 425 // truncated, partial escape sequence |
| 370 { | 426 { |
| 371 "ISO_2022,locale=zh,version=1", | 427 "ISO_2022,locale=zh,version=1", |
| 372 :bin{ 1b }, "", :intvector{}, | 428 :bin{ 1b }, "", :intvector{}, |
| 373 :int{1}, :int{1}, "truncated", ".", :bin{ 1b } | 429 :int{1}, :int{1}, "truncated", ".", :bin{ 1b } |
| 374 } | 430 } |
| 375 { | 431 { |
| (...skipping 50 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 426 "ISO-2022-CN-EXT", | 482 "ISO-2022-CN-EXT", |
| 427 :bin{ 411b4e2121 }, "\x41", :intvector{ 0 }, | 483 :bin{ 411b4e2121 }, "\x41", :intvector{ 0 }, |
| 428 :int{1}, :int{1}, "illesc", ".", :bin{ 1b } | 484 :int{1}, :int{1}, "illesc", ".", :bin{ 1b } |
| 429 } | 485 } |
| 430 // G3 designator: recognized, but not supported for -CN (only for -CN-EXT) | 486 // G3 designator: recognized, but not supported for -CN (only for -CN-EXT) |
| 431 { | 487 { |
| 432 "ISO-2022-CN", | 488 "ISO-2022-CN", |
| 433 :bin{ 411b242b491b4f2121 }, "\x41", :intvector{ 0 }, | 489 :bin{ 411b242b491b4f2121 }, "\x41", :intvector{ 0 }, |
| 434 :int{1}, :int{1}, "unsuppesc", ".", :bin{ 1b242b49 } | 490 :int{1}, :int{1}, "unsuppesc", ".", :bin{ 1b242b49 } |
| 435 } | 491 } |
| 492 // empty segment 1 (using substitution and stop) |
| 493 { |
| 494 "ISO-2022-CN", |
| 495 :bin{ 611b242941620e0f1b242a481b4e6a65630d0a }, |
| 496 "ab\uFFFD\u994Cc\u000D\u000A", |
| 497 :intvector{ 0, 5, 7, 14, 16, 17, 18 }, |
| 498 :int{1}, :int{1}, "", "?", :bin{""} |
| 499 } |
| 500 { |
| 501 "ISO-2022-CN", |
| 502 :bin{ 611b242941620e0f1b242a481b4e6a65630d0a }, |
| 503 "ab", |
| 504 :intvector{ 0, 5 }, |
| 505 :int{1}, :int{1}, "illesc", ".", :bin{"0f"} |
| 506 } |
| 507 // empty segment 2 (using substitution and stop) |
| 508 { |
| 509 "ISO-2022-CN", |
| 510 :bin{ 611b242941620e1b24294768640f630d0a }, |
| 511 "ab\uFFFD\u5F70c\u000D\u000A", |
| 512 :intvector{ 0, 5, 7, 11, 14, 15, 16 }, |
| 513 :int{1}, :int{1}, "", "?", :bin{""} |
| 514 } |
| 515 { |
| 516 "ISO-2022-CN", |
| 517 :bin{ 611b242941620e1b24294768640f630d0a }, |
| 518 "ab", |
| 519 :intvector{ 0, 5 }, |
| 520 :int{1}, :int{1}, "illesc", ".", :bin{"1b242947"} |
| 521 } |
| 436 | 522 |
| 437 // ISO-2022 SBCS | 523 // ISO-2022 SBCS |
| 438 // [U_ENABLE_GENERIC_ISO_2022] | 524 // [U_ENABLE_GENERIC_ISO_2022] |
| 439 // The _generic_ ISO-2022 converter is disabled starting 2003-dec-03 (ICU 2.8). | 525 // The _generic_ ISO-2022 converter is disabled starting 2003-dec-03 (ICU 2.8). |
| 440 // For details see the icu mailing list from 2003-dec-01 and the ucnv2022.c file. | 526 // For details see the icu mailing list from 2003-dec-01 and the ucnv2022.c file. |
| 441 // Language-specific variants of ISO-2022 continue to be available as listed below. | 527 // Language-specific variants of ISO-2022 continue to be available as listed below. |
| 442 //{ | 528 //{ |
| 443 // "ISO_2022", | 529 // "ISO_2022", |
| 444 // :bin{ 0008090a0d1a1c1f203f415c7d7e7f }, | 530 // :bin{ 0008090a0d1a1c1f203f415c7d7e7f }, |
| 445 // "\x00\x08\t\n\r\x1a\x1c\x1f ?A\\}~\x7f", | 531 // "\x00\x08\t\n\r\x1a\x1c\x1f ?A\\}~\x7f", |
| 446 // :intvector{ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14 }, | 532 // :intvector{ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14 }, |
| 447 // :int{1}, :int{1}, "", ".", :bin{""} | 533 // :int{1}, :int{1}, "", ".", :bin{""} |
| 448 //} | 534 //} |
| 449 | 535 |
| 536 // HZ-GB-2312 |
| 537 |
| 538 // empty segment 1 (using substitution and stop) |
| 539 { |
| 540 "HZ-GB-2312", |
| 541 :bin{ 61627e7b7e7d6364 }, |
| 542 "ab\uFFFDcd", |
| 543 :intvector{ 0, 1, 4, 6, 7 }, |
| 544 :int{1}, :int{1}, "", "?", :bin{""} |
| 545 } |
| 546 { |
| 547 "HZ-GB-2312", |
| 548 :bin{ 61627e7b7e7d63640d0a }, |
| 549 "ab", |
| 550 :intvector{ 0, 1 }, |
| 551 :int{1}, :int{1}, "illesc", ".", :bin{"7e7d"} |
| 552 } |
| 553 // empty segment 2 & legal redundant switches (using substitution and stop) |
| 554 { |
| 555 "HZ-GB-2312", |
| 556 :bin{ 61627e7b323b3f557e7b7e7b523b7e7d63647e7d65667e7d7e7d }, |
| 557 "ab\u4E0D\u7A7A\uFFFD\u4E00cdef\uFFFD", |
| 558 :intvector{ 0, 1, 4, 6, 10, 12, 16, 17, 20, 21, 24 }, |
| 559 :int{1}, :int{1}, "", "?", :bin{""} |
| 560 } |
| 561 { |
| 562 "HZ-GB-2312", |
| 563 :bin{ 61627e7b323b3f557e7b7e7b523b7e7d63647e7d65667e7d7e7d }, |
| 564 "ab\u4E0D\u7A7A", |
| 565 :intvector{ 0, 1, 4, 6 }, |
| 566 :int{1}, :int{1}, "illesc", ".", :bin{"7e7b"} |
| 567 } |
| 568 |
| 450 // DBCS-only extensions | 569 // DBCS-only extensions |
| 451 { | 570 { |
| 452 "ibm-970", | 571 "ibm-970", |
| 453 :bin{ 617eece9b2eb }, | 572 :bin{ 617eece9b2eb }, |
| 454 "\x61\x7e\u4e00\ub000", | 573 "\x61\x7e\u4e00\ub000", |
| 455 :intvector{ 0, 1, 2, 4 }, | 574 :intvector{ 0, 1, 2, 4 }, |
| 456 :int{1}, :int{1}, "", "?", :bin{""} | 575 :int{1}, :int{1}, "", "?", :bin{""} |
| 457 } | 576 } |
| 458 | 577 |
| 459 { | 578 { |
| (...skipping 151 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 611 :intvector{ 0, 2 }, | 730 :intvector{ 0, 2 }, |
| 612 :int{1}, :int{0}, "", "?", :bin{""} | 731 :int{1}, :int{0}, "", "?", :bin{""} |
| 613 } | 732 } |
| 614 { // Verify gb18030 enumeration | 733 { // Verify gb18030 enumeration |
| 615 "gb18030", | 734 "gb18030", |
| 616 :bin{ 8130D2398130D3308136A5318136A532 }, | 735 :bin{ 8130D2398130D3308136A5318136A532 }, |
| 617 "\u0450\u0452\u200F\u2011", | 736 "\u0450\u0452\u200F\u2011", |
| 618 :intvector{ 0, 4, 8, 12 }, | 737 :intvector{ 0, 4, 8, 12 }, |
| 619 :int{1}, :int{0}, "", "?", :bin{""} | 738 :int{1}, :int{0}, "", "?", :bin{""} |
| 620 } | 739 } |
| 740 // Test iso-2022-jp-2 miscellaneous symbols |
| 741 { |
| 742 "iso-2022-jp-2", |
| 743 :bin{ 1b242843224f224e1b2842 }, |
| 744 "\u260E\u260F", |
| 745 :intvector{ 4, 6 }, |
| 746 :int{1}, :int{0}, "", ".", :bin{""} |
| 747 } |
| 621 } | 748 } |
| 622 } | 749 } |
| 623 | 750 |
| 624 // --------------------------------------------------------------------- *** | 751 // --------------------------------------------------------------------- *** |
| 625 | 752 |
| 626 fromUnicode { | 753 fromUnicode { |
| 627 Headers { "charset", "unicode", "bytes", "offsets", "flush", "fallbacks",
"errorCode", "callback", "invalidUChars" } | 754 Headers { "charset", "unicode", "bytes", "offsets", "flush", "fallbacks",
"errorCode", "callback", "invalidUChars" } |
| 628 Cases { | 755 Cases { |
| 756 // Test bug 6071 (1:2 Unicode:charset SBCS mapping). |
| 757 { |
| 758 "*test1bmp", |
| 759 "e@t", |
| 760 :bin{ 05000709 }, |
| 761 :intvector{ 0,1,2,2 }, |
| 762 :int{1}, :int{0}, "", "?", "" |
| 763 } |
| 629 // improve coverage of ISO-2022-JP converter with hardcoded JIS X 0201 and | 764 // improve coverage of ISO-2022-JP converter with hardcoded JIS X 0201 and |
| 630 // using the Shift-JIS table for JIS X 0208 (ticket #5797) | 765 // using the Shift-JIS table for JIS X 0208 (ticket #5797) |
| 631 { | 766 { |
| 632 "ISO-2022-JP", | 767 "ISO-2022-JP", |
| 633 "\u203e\xa5\u4e00\ufa10\u6f3e\u0391", | 768 "\u203e\xa5\u4e00\ufa10\u6f3e\u0391", |
| 634 :bin{ 1b284a7e5c1b2442306c222e5f2126211b2842 }, | 769 :bin{ 1b284a7e5c1b2442306c222e5f2126211b2842 }, |
| 635 :intvector{ 0,0,0,0,1,2,2,2,2,2,3,3,4,4,5,5,5,5,5 }, | 770 :intvector{ 0,0,0,0,1,2,2,2,2,2,3,3,4,4,5,5,5,5,5 }, |
| 636 :int{1}, :int{0}, "", "?=\u3013", "" // U+3013 Geta Mark converts to
222e | 771 :int{1}, :int{0}, "", "?=\u3013", "" // U+3013 Geta Mark converts to
222e |
| 637 } | 772 } |
| 638 // Verify that mappings that would result in byte values outside 20..7F (for SBCS) | 773 // Verify that mappings that would result in byte values outside 20..7F (for SBCS) |
| (...skipping 787 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 1426 { | 1561 { |
| 1427 "ibm-25546", | 1562 "ibm-25546", |
| 1428 "[\x00-\x0d\x10-\x1a\x1c-\x7f\xa1\xa4\xfe\u0111\u4e00\u4e01\uac00-\uac
01\uffe6]", | 1563 "[\x00-\x0d\x10-\x1a\x1c-\x7f\xa1\xa4\xfe\u0111\u4e00\u4e01\uac00-\uac
01\uffe6]", |
| 1429 "[\x0e\x0f\x1b\x80-\xa0\xa3\xa5\xff-\u0110\uac02\uffe7-\U0010ffff]", | 1564 "[\x0e\x0f\x1b\x80-\xa0\xa3\xa5\xff-\u0110\uac02\uffe7-\U0010ffff]", |
| 1430 :int{0} | 1565 :int{0} |
| 1431 } | 1566 } |
| 1432 | 1567 |
| 1433 // versions of ISO-2022-JP | 1568 // versions of ISO-2022-JP |
| 1434 { | 1569 { |
| 1435 "ISO-2022-JP", | 1570 "ISO-2022-JP", |
| 1436 "[\x00-\x0d\x10-\x1a\x1c-\x7f\xa5\u0391-\u03a1\u203e\uff61-\uff9f\u4e0
0\u4e01\uffe5]", | 1571 "[\x00-\x0d\x10-\x1a\x1c-\x7f\xa5\u0391-\u03a1\u2015\u203e\u4e00\u4e01
\uffe5]", |
| 1437 "[\x0e\x0f\x1b\u0100-\u0113\u0385-\u038a\u4e02\u4e27-\u4e29\ufa0e-\ufa
2d\uffe6-\U0010ffff]", | 1572 "[\x0e\x0f\x1b\u0100-\u0113\u0385-\u038a\u2014\u301c\u4e02\u4e27-\u4e2
9\u4fe0\u663b\u9eb5\ufa0e-\ufa2d\uff61-\uff9f\uffe4\uffe6-\U0010ffff]", |
| 1438 :int{0} | 1573 :int{0} |
| 1439 } | 1574 } |
| 1440 { | 1575 { |
| 1441 "ISO-2022-JP-2", | 1576 "ISO-2022-JP-2", |
| 1442 "[\x00-\x0d\x10-\x1a\x1c-\u0113\u0384-\u0386\u0388-\u038a\u0390-\u03a1
\u203e\uff61-\uff9f\u4e00-\u4e05\uffe6]", | 1577 "[\x00-\x0d\x10-\x1a\x1c-\x7f\xa0-\u0113\u0384-\u0386\u0388-\u038a\u03
90-\u03a1\u203e\u4e00-\u4e05\u4fe0\u663b\uffe6]", |
| 1443 "[\x0e\x0f\x1b\uffe7-\U0010ffff]", | 1578 "[\x0e\x0f\x1b\uff61-\uff9f\uffe4\uffe7-\U0010ffff]", |
| 1444 :int{0} | 1579 :int{0} |
| 1445 } | 1580 } |
| 1581 { |
| 1582 "JIS7", |
| 1583 "[\x00-\x0d\x10-\x1a\x1c-\x7f\xa0-\u0113\u0384-\u0386\u0388-\u038a\u03
90-\u03a1\u203e\u4e00-\u4e05\u4fe0\u663b\uff61-\uff9f\uffe6]", |
| 1584 "[\x0e\x0f\x1b\uffe4\uffe7-\U0010ffff]", |
| 1585 :int{0} |
| 1586 } |
| 1587 // with fallbacks |
| 1588 { |
| 1589 "ISO-2022-JP", |
| 1590 "[\x00-\x0d\x10-\x1a\x1c-\x7f\xa5\u0391-\u03a1\u2014\u2015\u203e\u301c
\u4e00\u4e01\u4fe0\u9eb5\uff61-\uff9f\uffe5]", |
| 1591 "[\x0e\x0f\x1b\xa6\u0100-\u0113\u0385-\u038a\u4e02\u4e27-\u4e29\u663b\
ufa0e-\ufa2d\uffe4\uffe6-\U0010ffff]", |
| 1592 :int{1} |
| 1593 } |
| 1446 | 1594 |
| 1447 // versions of ISO-2022-CN | 1595 // versions of ISO-2022-CN |
| 1448 { | 1596 { |
| 1449 "ISO-2022-CN", | 1597 "ISO-2022-CN", |
| 1450 "[\x00-\x0d\x10-\x1a\x1c-\x7f\u4e00\u4e01\u9f98\ufe6b]", | 1598 "[\x00-\x0d\x10-\x1a\x1c-\x7f\u4e00\u4e01\u9f98\ufe6b]", |
| 1451 "[\x0e\x0f\x1b\u4e29\uffe6-\U0010ffff]", | 1599 "[\x0e\x0f\x1b\u4e29\uffe6-\U0010ffff]", |
| 1452 :int{0} | 1600 :int{0} |
| 1453 } | 1601 } |
| 1454 { | 1602 { |
| 1455 "ISO-2022-CN-EXT", | 1603 "ISO-2022-CN-EXT", |
| 1456 "[\x00-\x0d\x10-\x1a\x1c-\x7f\u4e00-\u4e05\u9f98\ufe6b\u4e28-\u4e2b\U0
0020000\U00020003-\U00020005\U00029664]", | 1604 "[\x00-\x0d\x10-\x1a\x1c-\x7f\u4e00-\u4e05\u9f98\ufe6b\u4e28-\u4e2b\U0
0020000\U00020003-\U00020005\U00029664]", |
| 1457 "[\x0e\x0f\x1b\U00020001\U00020002\U0002a6d7-\U0010ffff]", | 1605 "[\x0e\x0f\x1b\U00020001\U00020002\U0002a6d7-\U0010ffff]", |
| 1458 :int{0} | 1606 :int{0} |
| 1459 } | 1607 } |
| 1460 | 1608 |
| 1609 // HZ |
| 1610 { |
| 1611 "HZ", |
| 1612 "[\u0410-\u044f\u4e00\u4e01\u4e03]", |
| 1613 "[\u4e02\u4e04-\u4e06\uac00-\ud7ff]", |
| 1614 :int{0} |
| 1615 } |
| 1616 |
| 1617 // LMBCS |
| 1618 { |
| 1619 "LMBCS", |
| 1620 "[\x00-\U0010ffff]", |
| 1621 "[]", |
| 1622 :int{0} |
| 1623 } |
| 1624 |
| 1461 // DBCS-only | 1625 // DBCS-only |
| 1462 { | 1626 { |
| 1463 "ibm-971", | 1627 "ibm-971", |
| 1464 "[\xa1\xa4\uac01\ub000]", | 1628 "[\xa1\xa4\uac01\ub000]", |
| 1465 "[\x00-\x9f\u2015]", | 1629 "[\x00-\x9f\u2015]", |
| 1466 :int{0} | 1630 :int{0} |
| 1467 } | 1631 } |
| 1468 | 1632 |
| 1469 { | 1633 { |
| 1470 "ibm-16684", | 1634 "ibm-16684", |
| (...skipping 16 matching lines...) Expand all Loading... |
| 1487 "*test3", | 1651 "*test3", |
| 1488 "[\x05\x0b\xc0\u20ac\U00023456\U00101234" | 1652 "[\x05\x0b\xc0\u20ac\U00023456\U00101234" |
| 1489 "{\U00101234\U00050005\U00060006}{\U00101234\U00050005}{\U00101234
\U00060006}{\xc4\xc4\U00101234\x05}]", | 1653 "{\U00101234\U00050005\U00060006}{\U00101234\U00050005}{\U00101234
\U00060006}{\xc4\xc4\U00101234\x05}]", |
| 1490 "[\x06\x0e\U00034567\U000febcd{\U00101234\U00070007}]", | 1654 "[\x06\x0e\U00034567\U000febcd{\U00101234\U00070007}]", |
| 1491 :int{0} | 1655 :int{0} |
| 1492 } | 1656 } |
| 1493 } | 1657 } |
| 1494 } | 1658 } |
| 1495 } | 1659 } |
| 1496 } | 1660 } |
| OLD | NEW |