| OLD | NEW |
| 1 /* | 1 /* |
| 2 ********************************************************************** | 2 ********************************************************************** |
| 3 * Copyright (C) 2005-2013, International Business Machines | 3 * Copyright (C) 2005-2015, International Business Machines |
| 4 * Corporation and others. All Rights Reserved. | 4 * Corporation and others. All Rights Reserved. |
| 5 ********************************************************************** | 5 ********************************************************************** |
| 6 */ | 6 */ |
| 7 | 7 |
| 8 | 8 |
| 9 #include "unicode/utypes.h" | 9 #include "unicode/utypes.h" |
| 10 #include "unicode/ucsdet.h" | 10 #include "unicode/ucsdet.h" |
| 11 #include "unicode/ucnv.h" | 11 #include "unicode/ucnv.h" |
| 12 #include "unicode/unistr.h" | 12 #include "unicode/unistr.h" |
| 13 #include "unicode/putil.h" | 13 #include "unicode/putil.h" |
| (...skipping 563 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 577 } | 577 } |
| 578 } | 578 } |
| 579 | 579 |
| 580 delete root; | 580 delete root; |
| 581 delete parser; | 581 delete parser; |
| 582 #endif | 582 #endif |
| 583 } | 583 } |
| 584 | 584 |
| 585 void CharsetDetectionTest::IBM424Test() | 585 void CharsetDetectionTest::IBM424Test() |
| 586 { | 586 { |
| 587 #if !UCONFIG_ONLY_HTML_CONVERSION |
| 587 UErrorCode status = U_ZERO_ERROR; | 588 UErrorCode status = U_ZERO_ERROR; |
| 588 | 589 |
| 589 static const UChar chars[] = { | 590 static const UChar chars[] = { |
| 590 0x05D4, 0x05E4, 0x05E8, 0x05E7, 0x05DC, 0x05D9, 0x05D8, 0x0020, 0x05
D4, 0x05E6, 0x05D1, 0x05D0, 0x05D9, 0x0020, 0x05D4, 0x05E8, | 591 0x05D4, 0x05E4, 0x05E8, 0x05E7, 0x05DC, 0x05D9, 0x05D8, 0x0020, 0x05
D4, 0x05E6, 0x05D1, 0x05D0, 0x05D9, 0x0020, 0x05D4, 0x05E8, |
| 591 0x05D0, 0x05E9, 0x05D9, 0x002C, 0x0020, 0x05EA, 0x05EA, 0x0020, 0x05
D0, 0x05DC, 0x05D5, 0x05E3, 0x0020, 0x05D0, 0x05D1, 0x05D9, | 592 0x05D0, 0x05E9, 0x05D9, 0x002C, 0x0020, 0x05EA, 0x05EA, 0x0020, 0x05
D0, 0x05DC, 0x05D5, 0x05E3, 0x0020, 0x05D0, 0x05D1, 0x05D9, |
| 592 0x05D7, 0x05D9, 0x0020, 0x05DE, 0x05E0, 0x05D3, 0x05DC, 0x05D1, 0x05
DC, 0x05D9, 0x05D8, 0x002C, 0x0020, 0x05D4, 0x05D5, 0x05E8, | 593 0x05D7, 0x05D9, 0x0020, 0x05DE, 0x05E0, 0x05D3, 0x05DC, 0x05D1, 0x05
DC, 0x05D9, 0x05D8, 0x002C, 0x0020, 0x05D4, 0x05D5, 0x05E8, |
| 593 0x05D4, 0x0020, 0x05E2, 0x05DC, 0x0020, 0x05E4, 0x05EA, 0x05D9, 0x05
D7, 0x05EA, 0x0020, 0x05D7, 0x05E7, 0x05D9, 0x05E8, 0x05EA, | 594 0x05D4, 0x0020, 0x05E2, 0x05DC, 0x0020, 0x05E4, 0x05EA, 0x05D9, 0x05
D7, 0x05EA, 0x0020, 0x05D7, 0x05E7, 0x05D9, 0x05E8, 0x05EA, |
| 594 0x0020, 0x05DE, 0x05E6, 0x0022, 0x05D7, 0x0020, 0x05D1, 0x05E2, 0x05
E7, 0x05D1, 0x05D5, 0x05EA, 0x0020, 0x05E2, 0x05D3, 0x05D5, | 595 0x0020, 0x05DE, 0x05E6, 0x0022, 0x05D7, 0x0020, 0x05D1, 0x05E2, 0x05
E7, 0x05D1, 0x05D5, 0x05EA, 0x0020, 0x05E2, 0x05D3, 0x05D5, |
| 595 0x05D9, 0x05D5, 0x05EA, 0x0020, 0x05D7, 0x05D9, 0x05D9, 0x05DC, 0x05
D9, 0x0020, 0x05E6, 0x05D4, 0x0022, 0x05DC, 0x0020, 0x05DE, | 596 0x05D9, 0x05D5, 0x05EA, 0x0020, 0x05D7, 0x05D9, 0x05D9, 0x05DC, 0x05
D9, 0x0020, 0x05E6, 0x05D4, 0x0022, 0x05DC, 0x0020, 0x05DE, |
| 596 0x05DE, 0x05D1, 0x05E6, 0x05E2, 0x0020, 0x05E2, 0x05D5, 0x05E4, 0x05
E8, 0x05EA, 0x0020, 0x05D9, 0x05E6, 0x05D5, 0x05E7, 0x05D4, | 597 0x05DE, 0x05D1, 0x05E6, 0x05E2, 0x0020, 0x05E2, 0x05D5, 0x05E4, 0x05
E8, 0x05EA, 0x0020, 0x05D9, 0x05E6, 0x05D5, 0x05E7, 0x05D4, |
| (...skipping 72 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 669 | 670 |
| 670 name = ucsdet_getName(match, &status); | 671 name = ucsdet_getName(match, &status); |
| 671 if (strcmp(name, "IBM424_ltr") != 0) { | 672 if (strcmp(name, "IBM424_ltr") != 0) { |
| 672 errln("Encoding detection failure for IBM424_ltr: got %s", name); | 673 errln("Encoding detection failure for IBM424_ltr: got %s", name); |
| 673 } | 674 } |
| 674 | 675 |
| 675 bail: | 676 bail: |
| 676 freeBytes(bytes); | 677 freeBytes(bytes); |
| 677 freeBytes(bytes_r); | 678 freeBytes(bytes_r); |
| 678 ucsdet_close(csd); | 679 ucsdet_close(csd); |
| 680 #endif |
| 679 } | 681 } |
| 680 | 682 |
| 681 void CharsetDetectionTest::IBM420Test() | 683 void CharsetDetectionTest::IBM420Test() |
| 682 { | 684 { |
| 685 #if !UCONFIG_ONLY_HTML_CONVERSION |
| 683 UErrorCode status = U_ZERO_ERROR; | 686 UErrorCode status = U_ZERO_ERROR; |
| 684 | 687 |
| 685 static const UChar chars[] = { | 688 static const UChar chars[] = { |
| 686 0x0648, 0x064F, 0x0636, 0x0639, 0x062A, 0x0020, 0x0648, 0x0646, 0x064F,
0x0641, 0x0630, 0x062A, 0x0020, 0x0628, 0x0631, 0x0627, | 689 0x0648, 0x064F, 0x0636, 0x0639, 0x062A, 0x0020, 0x0648, 0x0646, 0x064F,
0x0641, 0x0630, 0x062A, 0x0020, 0x0628, 0x0631, 0x0627, |
| 687 0x0645, 0x062C, 0x0020, 0x062A, 0x0623, 0x0645, 0x064A, 0x0646, 0x0020,
0x0639, 0x062F, 0x064A, 0x062F, 0x0629, 0x0020, 0x0641, | 690 0x0645, 0x062C, 0x0020, 0x062A, 0x0623, 0x0645, 0x064A, 0x0646, 0x0020,
0x0639, 0x062F, 0x064A, 0x062F, 0x0629, 0x0020, 0x0641, |
| 688 0x064A, 0x0020, 0x0645, 0x0624, 0x0633, 0x0633, 0x0629, 0x0020, 0x0627,
0x0644, 0x062A, 0x0623, 0x0645, 0x064A, 0x0646, 0x0020, | 691 0x064A, 0x0020, 0x0645, 0x0624, 0x0633, 0x0633, 0x0629, 0x0020, 0x0627,
0x0644, 0x062A, 0x0623, 0x0645, 0x064A, 0x0646, 0x0020, |
| 689 0x0627, 0x0644, 0x0648, 0x0637, 0x0646, 0x064A, 0x002C, 0x0020, 0x0645,
0x0639, 0x0020, 0x0645, 0x0644, 0x0627, 0x0626, 0x0645, | 692 0x0627, 0x0644, 0x0648, 0x0637, 0x0646, 0x064A, 0x002C, 0x0020, 0x0645,
0x0639, 0x0020, 0x0645, 0x0644, 0x0627, 0x0626, 0x0645, |
| 690 0x062A, 0x0647, 0x0627, 0x0020, 0x062F, 0x0627, 0x0626, 0x0645, 0x0627,
0x064B, 0x0020, 0x0644, 0x0644, 0x0627, 0x062D, 0x062A, | 693 0x062A, 0x0647, 0x0627, 0x0020, 0x062F, 0x0627, 0x0626, 0x0645, 0x0627,
0x064B, 0x0020, 0x0644, 0x0644, 0x0627, 0x062D, 0x062A, |
| 691 0x064A, 0x0627, 0x062C, 0x0627, 0x062A, 0x0020, 0x0627, 0x0644, 0x0645,
0x062A, 0x063A, 0x064A, 0x0631, 0x0629, 0x0020, 0x0644, | 694 0x064A, 0x0627, 0x062C, 0x0627, 0x062A, 0x0020, 0x0627, 0x0644, 0x0645,
0x062A, 0x063A, 0x064A, 0x0631, 0x0629, 0x0020, 0x0644, |
| 692 0x0644, 0x0645, 0x062C, 0x062A, 0x0645, 0x0639, 0x0020, 0x0648, 0x0644,
0x0644, 0x062F, 0x0648, 0x0644, 0x0629, 0x002E, 0x0020, | 695 0x0644, 0x0645, 0x062C, 0x062A, 0x0645, 0x0639, 0x0020, 0x0648, 0x0644,
0x0644, 0x062F, 0x0648, 0x0644, 0x0629, 0x002E, 0x0020, |
| (...skipping 64 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 757 | 760 |
| 758 name = ucsdet_getName(match, &status); | 761 name = ucsdet_getName(match, &status); |
| 759 if (strcmp(name, "IBM420_ltr") != 0) { | 762 if (strcmp(name, "IBM420_ltr") != 0) { |
| 760 errln("Encoding detection failure for IBM420_ltr: got %s\n", name); | 763 errln("Encoding detection failure for IBM420_ltr: got %s\n", name); |
| 761 } | 764 } |
| 762 | 765 |
| 763 bail: | 766 bail: |
| 764 freeBytes(bytes); | 767 freeBytes(bytes); |
| 765 freeBytes(bytes_r); | 768 freeBytes(bytes_r); |
| 766 ucsdet_close(csd); | 769 ucsdet_close(csd); |
| 770 #endif |
| 767 } | 771 } |
| 768 | 772 |
| 769 | 773 |
| 770 void CharsetDetectionTest::Ticket6394Test() { | 774 void CharsetDetectionTest::Ticket6394Test() { |
| 771 #if !UCONFIG_NO_CONVERSION | 775 #if !UCONFIG_NO_CONVERSION |
| 772 const char charText[] = "Here is some random English text that should be de
tected as ISO-8859-1." | 776 const char charText[] = "Here is some random English text that should be de
tected as ISO-8859-1." |
| 773 "Ticket 6394 claims that ISO-8859-1 will appear in
the array of detected " | 777 "Ticket 6394 claims that ISO-8859-1 will appear in
the array of detected " |
| 774 "encodings more than once. The hop through Unicode
String is for platforms " | 778 "encodings more than once. The hop through Unicode
String is for platforms " |
| 775 "where this char * string is be EBCDIC and needs co
nversion to Latin1."; | 779 "where this char * string is be EBCDIC and needs co
nversion to Latin1."; |
| 776 char latin1Text[sizeof(charText)]; | 780 char latin1Text[sizeof(charText)]; |
| (...skipping 71 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 848 name1 = ucsdet_getName(match1, &status); | 852 name1 = ucsdet_getName(match1, &status); |
| 849 TEST_ASSERT_SUCCESS(status); | 853 TEST_ASSERT_SUCCESS(status); |
| 850 TEST_ASSERT(strcmp(name1, "windows-1252")==0); | 854 TEST_ASSERT(strcmp(name1, "windows-1252")==0); |
| 851 | 855 |
| 852 ucsdet_close(csd1); | 856 ucsdet_close(csd1); |
| 853 ucsdet_close(csd2); | 857 ucsdet_close(csd2); |
| 854 freeBytes(bISO); | 858 freeBytes(bISO); |
| 855 freeBytes(bWindows); | 859 freeBytes(bWindows); |
| 856 #endif | 860 #endif |
| 857 } | 861 } |
| OLD | NEW |