Index: icu46/source/test/intltest/jamotest.cpp |
=================================================================== |
--- icu46/source/test/intltest/jamotest.cpp (revision 0) |
+++ icu46/source/test/intltest/jamotest.cpp (revision 0) |
@@ -0,0 +1,553 @@ |
+/******************************************************************** |
+ * COPYRIGHT: |
+ * Copyright (c) 1997-2010, International Business Machines Corporation and |
+ * others. All Rights Reserved. |
+ ******************************************************************** |
+************************************************************************ |
+* Date Name Description |
+* 02/28/2001 aliu Creation |
+* 03/01/2001 George port to HP/UX |
+************************************************************************/ |
+ |
+#include "unicode/utypes.h" |
+ |
+#if !UCONFIG_NO_TRANSLITERATION |
+ |
+#include "jamotest.h" |
+#include "unicode/utypes.h" |
+#include "unicode/translit.h" |
+#include "cpdtrans.h" |
+ |
+// SEP is the disambiguation separator used by Latin-Jamo and Jamo-Latin |
+#define SEP "-" |
+ |
+JamoTest::JamoTest() |
+{ |
+ UParseError parseError; |
+ UErrorCode status = U_ZERO_ERROR; |
+ NAME_JAMO = Transliterator::createFromRules("Name-Jamo", |
+ UnicodeString(JAMO_NAMES_RULES, -1, US_INV), |
+ UTRANS_FORWARD, parseError, status); |
+ |
+ if (U_FAILURE(status)) { |
+ delete NAME_JAMO; |
+ NAME_JAMO = NULL; |
+ } |
+ status = U_ZERO_ERROR; |
+ JAMO_NAME = Transliterator::createFromRules("Jamo-Name", |
+ UnicodeString(JAMO_NAMES_RULES, -1, US_INV), |
+ UTRANS_REVERSE, parseError, status); |
+ if (U_FAILURE(status)) { |
+ delete JAMO_NAME; |
+ JAMO_NAME = NULL; |
+ } |
+} |
+ |
+JamoTest::~JamoTest() |
+{ |
+ delete NAME_JAMO; |
+ delete JAMO_NAME; |
+} |
+ |
+void |
+JamoTest::runIndexedTest(int32_t index, UBool exec, |
+ const char* &name, char* /*par*/) { |
+ switch (index) { |
+ TESTCASE(0,TestJamo); |
+ TESTCASE(1,TestRealText); |
+ TESTCASE(2,TestPiecemeal); |
+ default: name = ""; break; |
+ } |
+} |
+ |
+void |
+JamoTest::TestJamo() { |
+ UParseError parseError; |
+ UErrorCode status = U_ZERO_ERROR; |
+ Transliterator* latinJamo = Transliterator::createInstance("Latin-Jamo", UTRANS_FORWARD, parseError, status); |
+ |
+ if (latinJamo == 0 || U_FAILURE(status)) { |
+ dataerrln("FAIL: createInstance() returned 0 - %s", u_errorName(status)); |
+ return; |
+ } |
+ |
+ Transliterator* jamoLatin = latinJamo->createInverse(status); |
+ |
+ if (jamoLatin == 0) { |
+ delete latinJamo; |
+ errln("FAIL: createInverse() returned 0"); |
+ return; |
+ } |
+ |
+ static const char* CASE[] = { |
+ // Column 1 is the latin text L1 to be fed to Latin-Jamo |
+ // to yield output J. |
+ |
+ // Column 2 is expected value of J. J is fed to |
+ // Jamo-Latin to yield output L2. |
+ |
+ // Column 3 is expected value of L2. If the expected |
+ // value of L2 is L1, then L2 is NULL. |
+ |
+ // add tests for the update to fix problems where it didn't follow the standard |
+ // see also http://www.unicode.org/cldr/data/charts/transforms/Latin-Hangul.html |
+ "gach", "(Gi)(A)(Cf)", NULL, |
+ "geumhui", "(Gi)(EU)(Mf)(Hi)(YI)", NULL, |
+ "choe", "(Ci)(OE)", NULL, |
+ "wo", "(IEUNG)(WEO)", NULL, |
+ "Wonpil", "(IEUNG)(WEO)(Nf)(Pi)(I)(L)", "wonpil", |
+ "GIPPEUM", "(Gi)(I)(BB)(EU)(Mf)", "gippeum", |
+ "EUTTEUM", "(IEUNG)(EU)(DD)(EU)(Mf)", "eutteum", |
+ "KKOTNAE", "(GGi)(O)(Tf)(Ni)(AE)", "kkotnae", |
+ "gaga", "(Gi)(A)(Gi)(A)", NULL, |
+ "gag-a", "(Gi)(A)(Gf)(IEUNG)(A)", NULL, |
+ "gak-ka", "(Gi)(A)(Kf)(Ki)(A)", NULL, |
+ "gakka", "(Gi)(A)(GGi)(A)", NULL, |
+ "gakk-a", "(Gi)(A)(GGf)(IEUNG)(A)", NULL, |
+ "gakkka", "(Gi)(A)(GGf)(Ki)(A)", NULL, |
+ "gak-kka", "(Gi)(A)(Kf)(GGi)(A)", NULL, |
+ |
+ "bab", "(Bi)(A)(Bf)", NULL, |
+ "babb", "(Bi)(A)(Bf)(Bi)(EU)", "babbeu", |
+ "babbba", "(Bi)(A)(Bf)(Bi)(EU)(Bi)(A)", "babbeuba", |
+ "bagg", "(Bi)(A)(Gf)(Gi)(EU)", "baggeu", |
+ "baggga", "(Bi)(A)(Gf)(Gi)(EU)(Gi)(A)", "baggeuga", |
+ //"bag" SEP "gga", "(Bi)(A)(Gf)" SEP "(Gi)(EU)(Gi)(A)", "bag" SEP "geuga", |
+ "kabsa", "(Ki)(A)(Bf)(Si)(A)", NULL, |
+ "kabska", "(Ki)(A)(BS)(Ki)(A)", NULL, |
+ "gabsbka", "(Gi)(A)(BS)(Bi)(EU)(Ki)(A)", "gabsbeuka", // not (Kf) |
+ "gga", "(Gi)(EU)(Gi)(A)", "geuga", |
+ "bsa", "(Bi)(EU)(Si)(A)", "beusa", |
+ "agg", "(IEUNG)(A)(Gf)(Gi)(EU)", "aggeu", |
+ "agga", "(IEUNG)(A)(Gf)(Gi)(A)", NULL, |
+ "la", "(R)(A)", NULL, |
+ "bs", "(Bi)(EU)(Sf)", "beus", |
+ "kalgga", "(Ki)(A)(L)(Gi)(EU)(Gi)(A)", "kalgeuga", |
+ |
+ // 'r' in a final position is treated like 'l' |
+ "karka", "(Ki)(A)(L)(Ki)(A)", "kalka", |
+ }; |
+ |
+ enum { CASE_length = sizeof(CASE) / sizeof(CASE[0]) }; |
+ |
+ int32_t i; |
+ for (i=0; i<CASE_length; i+=3) { |
+ UnicodeString jamo = nameToJamo(CASE[i+1]); |
+ if (CASE[i+2] == NULL) { |
+ expect(*latinJamo, CASE[i], jamo, *jamoLatin); |
+ } else { |
+ // Handle case where round-trip is expected to fail |
+ expect(*latinJamo, CASE[i], jamo); |
+ expect(*jamoLatin, jamo, CASE[i+2]); |
+ } |
+ } |
+ |
+ delete latinJamo; |
+ delete jamoLatin; |
+} |
+ |
+/** |
+ * Test various step-at-a-time transformation of hangul to jamo to |
+ * latin and back. |
+ */ |
+void JamoTest::TestPiecemeal(void) { |
+ UnicodeString hangul; hangul.append((UChar)0xBC0F); |
+ UnicodeString jamo = nameToJamo("(Mi)(I)(Cf)"); |
+ UnicodeString latin("mic"); |
+ UnicodeString latin2("mich"); |
+ |
+ Transliterator *t = NULL; |
+ UErrorCode status = U_ZERO_ERROR; |
+ |
+ t = Transliterator::createInstance("NFD", UTRANS_FORWARD, status); // was Hangul-Jamo |
+ if (U_FAILURE(status) || t == 0) { |
+ dataerrln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, hangul, jamo); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("NFC", UTRANS_FORWARD, status); // was Jamo-Hangul |
+ if (U_FAILURE(status) || t == 0) { |
+ errln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, jamo, hangul); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("Latin-Jamo", UTRANS_FORWARD, status); |
+ if (U_FAILURE(status) || t == 0) { |
+ dataerrln("FAIL: createInstance failed - %s", u_errorName(status)); |
+ return; |
+ } |
+ expect(*t, latin, jamo); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("Jamo-Latin", UTRANS_FORWARD, status); |
+ if (U_FAILURE(status) || t == 0) { |
+ errln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, jamo, latin2); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("Hangul-Latin", UTRANS_FORWARD, status); |
+ if (U_FAILURE(status) || t == 0) { |
+ errln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, hangul, latin2); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("Latin-Hangul", UTRANS_FORWARD, status); |
+ if (U_FAILURE(status) || t == 0) { |
+ errln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, latin, hangul); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("Hangul-Latin; Latin-Jamo", UTRANS_FORWARD, status); |
+ if (U_FAILURE(status) || t == 0) { |
+ errln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, hangul, jamo); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("Jamo-Latin; Latin-Hangul", UTRANS_FORWARD, status); |
+ if (U_FAILURE(status) || t == 0) { |
+ errln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, jamo, hangul); |
+ delete t; |
+ |
+ t = Transliterator::createInstance("Hangul-Latin; Latin-Hangul", UTRANS_FORWARD, status); |
+ if (U_FAILURE(status) || t == 0) { |
+ errln("FAIL: createInstance failed"); |
+ return; |
+ } |
+ expect(*t, hangul, hangul); |
+ delete t; |
+} |
+ |
+void |
+JamoTest::TestRealText() { |
+ // Test text taken from the Unicode web site |
+ static const char* const WHAT_IS_UNICODE[] = { |
+ "\\uc720\\ub2c8\\ucf54\\ub4dc\\uc5d0", "\\ub300\\ud574", "?", |
+ |
+ "\\uc5b4\\ub5a4", "\\ud50c\\ub7ab\\ud3fc,", "\\uc5b4\\ub5a4", |
+ "\\ud504\\ub85c\\uadf8\\ub7a8,", "\\uc5b4\\ub5a4", "\\uc5b8\\uc5b4\\uc5d0\\ub3c4", |
+ "\\uc0c1\\uad00\\uc5c6\\uc774", "\\uc720\\ub2c8\\ucf54\\ub4dc\\ub294", "\\ubaa8\\ub4e0", |
+ "\\ubb38\\uc790\\uc5d0", "\\ub300\\ud574", "\\uace0\\uc720", "\\ubc88\\ud638\\ub97c", |
+ "\\uc81c\\uacf5\\ud569\\ub2c8\\ub2e4.", |
+ |
+ "\\uae30\\ubcf8\\uc801\\uc73c\\ub85c", "\\ucef4\\ud4e8\\ud130\\ub294", |
+ "\\uc22b\\uc790\\ub9cc", "\\ucc98\\ub9ac\\ud569\\ub2c8\\ub2e4.", "\\uae00\\uc790\\ub098", |
+ "\\ub2e4\\ub978", "\\ubb38\\uc790\\uc5d0\\ub3c4", "\\uc22b\\uc790\\ub97c", |
+ "\\uc9c0\\uc815\\ud558\\uc5ec", |
+ "\\uc800\\uc7a5\\ud569\\ub2c8\\ub2e4.", "\\uc720\\ub2c8\\ucf54\\ub4dc\\uac00", |
+ "\\uac1c\\ubc1c\\ub418\\uae30", "\\uc804\\uc5d0\\ub294", "\\uc774\\ub7ec\\ud55c", |
+ "\\uc22b\\uc790\\ub97c", "\\uc9c0\\uc815\\ud558\\uae30", "\\uc704\\ud574", "\\uc218\\ubc31", |
+ "\\uac00\\uc9c0\\uc758", "\\ub2e4\\ub978", "\\uae30\\ud638\\ud654", |
+ "\\uc2dc\\uc2a4\\ud15c\\uc744", |
+ "\\uc0ac\\uc6a9\\ud588\\uc2b5\\ub2c8\\ub2e4.", "\\ub2e8\\uc77c", "\\uae30\\ud638\\ud654", |
+ "\\ubc29\\ubc95\\uc73c\\ub85c\\ub294", "\\ubaa8\\ub4e0", "\\ubb38\\uc790\\ub97c", |
+ "\\ud3ec\\ud568\\ud560", "\\uc218", "\\uc5c6\\uc5c8\\uc2b5\\ub2c8\\ub2e4.", "\\uc608\\ub97c", |
+ "\\ub4e4\\uc5b4", "\\uc720\\ub7fd", "\\uc5f0\\ud569\\uc5d0\\uc11c\\ub9cc", |
+ "\\ubcf4\\ub354\\ub77c\\ub3c4", "\\ubaa8\\ub4e0", "\\uac01", "\\ub098\\ub77c\\ubcc4", |
+ "\\uc5b8\\uc5b4\\ub97c", "\\ucc98\\ub9ac\\ud558\\ub824\\uba74", "\\uc5ec\\ub7ec", |
+ "\\uac1c\\uc758", "\\ub2e4\\ub978", "\\uae30\\ud638\\ud654", "\\ubc29\\ubc95\\uc774", |
+ "\\ud544\\uc694\\ud569\\ub2c8\\ub2e4.", "\\uc601\\uc5b4\\uc640", "\\uac19\\uc740", |
+ "\\ub2e8\\uc77c", "\\uc5b8\\uc5b4\\uc758", "\\uacbd\\uc6b0\\ub3c4", |
+ "\\uacf5\\ud1b5\\uc801\\uc73c\\ub85c", "\\uc0ac\\uc6a9\\ub418\\ub294", "\\ubaa8\\ub4e0", |
+ "\\uae00\\uc790,", "\\ubb38\\uc7a5", "\\ubd80\\ud638", "\\ubc0f", |
+ "\\ud14c\\ud06c\\ub2c8\\uceec", "\\uae30\\ud638\\uc5d0", "\\ub9de\\ub294", "\\ub2e8\\uc77c", |
+ "\\uae30\\ud638\\ud654", "\\ubc29\\ubc95\\uc744", "\\uac16\\uace0", "\\uc788\\uc9c0", |
+ "\\ubabb\\ud558\\uc600\\uc2b5\\ub2c8\\ub2e4.", |
+ |
+ "\\uc774\\ub7ec\\ud55c", "\\uae30\\ud638\\ud654", "\\uc2dc\\uc2a4\\ud15c\\uc740", |
+ "\\ub610\\ud55c", "\\ub2e4\\ub978", "\\uae30\\ud638\\ud654", "\\uc2dc\\uc2a4\\ud15c\\uacfc", |
+ "\\ucda9\\ub3cc\\ud569\\ub2c8\\ub2e4.", "\\uc989", "\\ub450", "\\uac00\\uc9c0", |
+ "\\uae30\\ud638\\ud654", "\\ubc29\\ubc95\\uc774", "\\ub450", "\\uac1c\\uc758", "\\ub2e4\\ub978", |
+ "\\ubb38\\uc790\\uc5d0", "\\ub300\\ud574", "\\uac19\\uc740", "\\ubc88\\ud638\\ub97c", |
+ "\\uc0ac\\uc6a9\\ud558\\uac70\\ub098", "\\uac19\\uc740", "\\ubb38\\uc790\\uc5d0", |
+ "\\ub300\\ud574", "\\ub2e4\\ub978", "\\ubc88\\ud638\\ub97c", "\\uc0ac\\uc6a9\\ud560", "\\uc218", |
+ "\\uc788\\uc2b5\\ub2c8\\ub2e4.", "\\uc8fc\\uc5b4\\uc9c4", "\\ubaa8\\ub4e0", |
+ "\\ucef4\\ud4e8\\ud130(\\ud2b9\\ud788", "\\uc11c\\ubc84)\\ub294", "\\uc11c\\ub85c", |
+ "\\ub2e4\\ub978", "\\uc5ec\\ub7ec", "\\uac00\\uc9c0", "\\uae30\\ud638\\ud654", |
+ "\\ubc29\\ubc95\\uc744", "\\uc9c0\\uc6d0\\ud574\\uc57c", |
+ "\\ud569\\ub2c8\\ub2e4.", "\\uadf8\\ub7ec\\ub098,", "\\ub370\\uc774\\ud130\\ub97c", |
+ "\\uc11c\\ub85c", "\\ub2e4\\ub978", "\\uae30\\ud638\\ud654", "\\ubc29\\ubc95\\uc774\\ub098", |
+ "\\ud50c\\ub7ab\\ud3fc", "\\uac04\\uc5d0", "\\uc804\\ub2ec\\ud560", "\\ub54c\\ub9c8\\ub2e4", |
+ "\\uadf8", "\\ub370\\uc774\\ud130\\ub294", "\\ud56d\\uc0c1", "\\uc190\\uc0c1\\uc758", |
+ "\\uc704\\ud5d8\\uc744", "\\uacaa\\uac8c", "\\ub429\\ub2c8\\ub2e4.", |
+ |
+ "\\uc720\\ub2c8\\ucf54\\ub4dc\\ub85c", "\\ubaa8\\ub4e0", "\\uac83\\uc744", |
+ "\\ud574\\uacb0\\ud560", "\\uc218", "\\uc788\\uc2b5\\ub2c8\\ub2e4!", |
+ "\\uc720\\ub2c8\\ucf54\\ub4dc\\ub294", "\\uc0ac\\uc6a9", "\\uc911\\uc778", |
+ "\\ud50c\\ub7ab\\ud3fc,", "\\ud504\\ub85c\\uadf8\\ub7a8,", "\\uc5b8\\uc5b4\\uc5d0", |
+ "\\uad00\\uacc4\\uc5c6\\uc774", "\\ubb38\\uc790\\ub9c8\\ub2e4", "\\uace0\\uc720\\ud55c", |
+ "\\uc22b\\uc790\\ub97c", |
+ "\\uc81c\\uacf5\\ud569\\ub2c8\\ub2e4.", "\\uc720\\ub2c8\\ucf54\\ub4dc", |
+ "\\ud45c\\uc900\\uc740", // "Apple, HP, IBM, JustSystem, Microsoft, Oracle, SAP, " |
+ // "Sun, Sybase, Unisys " |
+ "\\ubc0f", "\\uae30\\ud0c0", "\\uc5ec\\ub7ec", |
+ "\\ud68c\\uc0ac\\uc640", "\\uac19\\uc740", "\\uc5c5\\uacc4", |
+ "\\uc120\\ub450\\uc8fc\\uc790\\uc5d0", "\\uc758\\ud574", |
+ "\\ucc44\\ud0dd\\ub418\\uc5c8\\uc2b5\\ub2c8\\ub2e4.", "\\uc720\\ub2c8\\ucf54\\ub4dc\\ub294", |
+ // "XML, Java, ECMAScript(JavaScript), LDAP, CORBA 3.0, WML " |
+ "\\ub4f1\\uacfc", |
+ "\\uac19\\uc774", "\\ud604\\uc7ac", "\\ub110\\ub9ac", "\\uc0ac\\uc6a9\\ub418\\ub294", |
+ "\\ud45c\\uc900\\uc5d0\\uc11c", "\\ud544\\uc694\\ud558\\uba70", "\\uc774\\ub294", // "ISO/IEC", |
+ "10646\\uc744", "\\uad6c\\ud604\\ud558\\ub294", "\\uacf5\\uc2dd\\uc801\\uc778", |
+ "\\ubc29\\ubc95\\uc785\\ub2c8\\ub2e4.", "\\uc774\\ub294", "\\ub9ce\\uc740", "\\uc6b4\\uc601", |
+ "\\uccb4\\uc81c,", "\\uc694\\uc998", "\\uc0ac\\uc6a9\\ub418\\ub294", "\\ubaa8\\ub4e0", |
+ "\\ube0c\\ub77c\\uc6b0\\uc800", "\\ubc0f", "\\uae30\\ud0c0", "\\ub9ce\\uc740", |
+ "\\uc81c\\ud488\\uc5d0\\uc11c", |
+ "\\uc9c0\\uc6d0\\ub429\\ub2c8\\ub2e4.", "\\uc720\\ub2c8\\ucf54\\ub4dc", |
+ "\\ud45c\\uc900\\uc758", "\\ubd80\\uc0c1\\uacfc", "\\uc774\\ub97c", |
+ "\\uc9c0\\uc6d0\\ud558\\ub294", "\\ub3c4\\uad6c\\uc758", "\\uac00\\uc6a9\\uc131\\uc740", |
+ "\\ucd5c\\uadfc", "\\uc804", "\\uc138\\uacc4\\uc5d0", "\\ubd88\\uace0", "\\uc788\\ub294", |
+ "\\uae30\\uc220", "\\uacbd\\ud5a5\\uc5d0\\uc11c", "\\uac00\\uc7a5", "\\uc911\\uc694\\ud55c", |
+ "\\ubd80\\ubd84\\uc744", "\\ucc28\\uc9c0\\ud558\\uace0", "\\uc788\\uc2b5\\ub2c8\\ub2e4.", |
+ |
+ "\\uc720\\ub2c8\\ucf54\\ub4dc\\ub97c", |
+ // Replaced a hyphen with a space to make the test case work with CLDR1.5 |
+ //"\\ud074\\ub77c\\uc774\\uc5b8\\ud2b8-\\uc11c\\ubc84", "\\ub610\\ub294", |
+ "\\ud074\\ub77c\\uc774\\uc5b8\\ud2b8 \\uc11c\\ubc84", "\\ub610\\ub294", |
+ // Replaced a hyphen with a space. |
+ //"\\ub2e4\\uc911-\\uc5f0\\uacb0", "\\uc751\\uc6a9", "\\ud504\\ub85c\\uadf8\\ub7a8\\uacfc", |
+ "\\ub2e4\\uc911 \\uc5f0\\uacb0", "\\uc751\\uc6a9", "\\ud504\\ub85c\\uadf8\\ub7a8\\uacfc", |
+ "\\uc6f9", "\\uc0ac\\uc774\\ud2b8\\uc5d0", "\\ud1b5\\ud569\\ud558\\uba74", |
+ "\\ub808\\uac70\\uc2dc", "\\ubb38\\uc790", "\\uc138\\ud2b8", "\\uc0ac\\uc6a9\\uc5d0", |
+ "\\uc788\\uc5b4\\uc11c", "\\uc0c1\\ub2f9\\ud55c", "\\ube44\\uc6a9", "\\uc808\\uac10", |
+ "\\ud6a8\\uacfc\\uac00", |
+ "\\ub098\\ud0c0\\ub0a9\\ub2c8\\ub2e4.", "\\uc720\\ub2c8\\ucf54\\ub4dc\\ub97c", |
+ "\\ud1b5\\ud574", "\\ub9ac\\uc5d4\\uc9c0\\ub2c8\\uc5b4\\ub9c1", "\\uc5c6\\uc774", |
+ "\\ub2e4\\uc911", "\\ud50c\\ub7ab\\ud3fc,", "\\uc5b8\\uc5b4", "\\ubc0f", "\\uad6d\\uac00", |
+ "\\uac04\\uc5d0", "\\ub2e8\\uc77c", "\\uc18c\\ud504\\ud2b8\\uc6e8\\uc5b4", |
+ "\\ud50c\\ub7ab\\ud3fc", "\\ub610\\ub294", "\\ub2e8\\uc77c", "\\uc6f9", |
+ "\\uc0ac\\uc774\\ud2b8\\ub97c", "\\ubaa9\\ud45c\\ub85c", "\\uc0bc\\uc744", "\\uc218", |
+ "\\uc788\\uc2b5\\ub2c8\\ub2e4.", "\\uc774\\ub97c", "\\uc0ac\\uc6a9\\ud558\\uba74", |
+ "\\ub370\\uc774\\ud130\\ub97c", "\\uc190\\uc0c1", "\\uc5c6\\uc774", "\\uc5ec\\ub7ec", |
+ "\\uc2dc\\uc2a4\\ud15c\\uc744", "\\ud1b5\\ud574", "\\uc804\\uc1a1\\ud560", "\\uc218", |
+ "\\uc788\\uc2b5\\ub2c8\\ub2e4.", |
+ |
+ "\\uc720\\ub2c8\\ucf54\\ub4dc", "\\ucf58\\uc18c\\uc2dc\\uc5c4\\uc5d0", "\\ub300\\ud574", |
+ "\\uc720\\ub2c8\\ucf54\\ub4dc", "\\ucf58\\uc18c\\uc2dc\\uc5c4\\uc740", |
+ "\\ube44\\uc601\\ub9ac", "\\uc870\\uc9c1\\uc73c\\ub85c\\uc11c", "\\ud604\\ub300", |
+ "\\uc18c\\ud504\\ud2b8\\uc6e8\\uc5b4", "\\uc81c\\ud488\\uacfc", |
+ "\\ud45c\\uc900\\uc5d0\\uc11c", "\\ud14d\\uc2a4\\ud2b8\\uc758", "\\ud45c\\ud604\\uc744", |
+ "\\uc9c0\\uc815\\ud558\\ub294", "\\uc720\\ub2c8\\ucf54\\ub4dc", "\\ud45c\\uc900\\uc758", |
+ "\\uc0ac\\uc6a9\\uc744", "\\uac1c\\ubc1c\\ud558\\uace0", "\\ud655\\uc7a5\\ud558\\uba70", |
+ "\\uc7a5\\ub824\\ud558\\uae30", "\\uc704\\ud574", |
+ "\\uc138\\uc6cc\\uc84c\\uc2b5\\ub2c8\\ub2e4.", "\\ucf58\\uc18c\\uc2dc\\uc5c4", |
+ "\\uba64\\ubc84\\uc27d\\uc740", "\\ucef4\\ud4e8\\ud130\\uc640", "\\uc815\\ubcf4", |
+ "\\ucc98\\ub9ac", "\\uc0b0\\uc5c5\\uc5d0", "\\uc885\\uc0ac\\ud558\\uace0", "\\uc788\\ub294", |
+ "\\uad11\\ubc94\\uc704\\ud55c", "\\ud68c\\uc0ac", "\\ubc0f", "\\uc870\\uc9c1\\uc758", |
+ "\\ubc94\\uc704\\ub97c", |
+ "\\ub098\\ud0c0\\ub0c5\\ub2c8\\ub2e4.", "\\ucf58\\uc18c\\uc2dc\\uc5c4\\uc758", |
+ "\\uc7ac\\uc815\\uc740", "\\uc804\\uc801\\uc73c\\ub85c", "\\ud68c\\ube44\\uc5d0", |
+ "\\uc758\\ud574", "\\ucda9\\ub2f9\\ub429\\ub2c8\\ub2e4.", "\\uc720\\ub2c8\\ucf54\\ub4dc", |
+ "\\ucee8\\uc18c\\uc2dc\\uc5c4\\uc5d0\\uc11c\\uc758", "\\uba64\\ubc84\\uc27d\\uc740", |
+ "\\uc804", "\\uc138\\uacc4", "\\uc5b4\\ub290", "\\uacf3\\uc5d0\\uc11c\\ub098", |
+ "\\uc720\\ub2c8\\ucf54\\ub4dc", "\\ud45c\\uc900\\uc744", "\\uc9c0\\uc6d0\\ud558\\uace0", |
+ "\\uadf8", "\\ud655\\uc7a5\\uacfc", "\\uad6c\\ud604\\uc744", |
+ "\\uc9c0\\uc6d0\\ud558\\uace0\\uc790\\ud558\\ub294", "\\uc870\\uc9c1\\uacfc", |
+ "\\uac1c\\uc778\\uc5d0\\uac8c", "\\uac1c\\ubc29\\ub418\\uc5b4", |
+ "\\uc788\\uc2b5\\ub2c8\\ub2e4.", |
+ |
+ "\\ub354", "\\uc790\\uc138\\ud55c", "\\ub0b4\\uc6a9\\uc740", "\\uc6a9\\uc5b4\\uc9d1,", |
+ "\\uc608\\uc81c", "\\uc720\\ub2c8\\ucf54\\ub4dc", "\\uc0ac\\uc6a9", "\\uac00\\ub2a5", |
+ "\\uc81c\\ud488,", "\\uae30\\uc220", "\\uc815\\ubcf4", "\\ubc0f", "\\uae30\\ud0c0", |
+ "\\uc720\\uc6a9\\ud55c", "\\uc815\\ubcf4\\ub97c", |
+ "\\ucc38\\uc870\\ud558\\uc2ed\\uc2dc\\uc624." |
+ }; |
+ |
+ enum { WHAT_IS_UNICODE_length = sizeof(WHAT_IS_UNICODE) / sizeof(WHAT_IS_UNICODE[0]) }; |
+ |
+ UParseError parseError; |
+ UErrorCode status = U_ZERO_ERROR; |
+ Transliterator* latinJamo = Transliterator::createInstance("Latin-Jamo", UTRANS_FORWARD, parseError, status); |
+ Transliterator* jamoHangul = Transliterator::createInstance("NFC(NFD)", UTRANS_FORWARD, parseError, status); |
+ if (latinJamo == 0 || jamoHangul == 0 || U_FAILURE(status)) { |
+ delete latinJamo; |
+ delete jamoHangul; |
+ dataerrln("FAIL: createInstance returned NULL - %s", u_errorName(status)); |
+ return; |
+ } |
+ Transliterator* jamoLatin = latinJamo->createInverse(status); |
+ Transliterator* hangulJamo = jamoHangul->createInverse(status); |
+ if (jamoLatin == 0 || hangulJamo == 0) { |
+ errln("FAIL: createInverse returned NULL"); |
+ delete latinJamo; |
+ delete jamoLatin; |
+ delete jamoHangul; |
+ delete hangulJamo; |
+ return; |
+ } |
+ |
+ Transliterator* tarray[4] = |
+ { hangulJamo, jamoLatin, latinJamo, jamoHangul }; |
+ CompoundTransliterator rt(tarray, 4); |
+ |
+ UnicodeString buf; |
+ int32_t total = 0; |
+ int32_t errors = 0; |
+ int32_t i; |
+ for (i=0; i < WHAT_IS_UNICODE_length; ++i) { |
+ ++total; |
+ UnicodeString hangul = UnicodeString(WHAT_IS_UNICODE[i], -1, US_INV); |
+ hangul = hangul.unescape(); // Parse backslash-u escapes |
+ UnicodeString hangulX = hangul; |
+ rt.transliterate(hangulX); |
+ if (hangul != hangulX) { |
+ ++errors; |
+ UnicodeString jamo = hangul; hangulJamo->transliterate(jamo); |
+ UnicodeString latin = jamo; jamoLatin->transliterate(latin); |
+ UnicodeString jamo2 = latin; latinJamo->transliterate(jamo2); |
+ UnicodeString hangul2 = jamo2; jamoHangul->transliterate(hangul2); |
+ |
+ buf.remove(0); |
+ buf.append("FAIL: "); |
+ if (hangul2 != hangulX) { |
+ buf.append((UnicodeString)"(Weird: " + hangulX + " != " + hangul2 + ")"); |
+ } |
+ // The Hangul-Jamo conversion is not usually the |
+ // bug here, so we hide it from display. |
+ // Uncomment lines to see the Hangul. |
+ buf.append(//hangul + " => " + |
+ jamoToName(jamo) + " => " + |
+ latin + " => " + jamoToName(jamo2) |
+ //+ " => " + hangul2 |
+ ); |
+ errln(prettify(buf)); |
+ } |
+ } |
+ if (errors != 0) { |
+ errln((UnicodeString)"Test word failures: " + errors + " out of " + total); |
+ } else { |
+ logln((UnicodeString)"All " + total + " test words passed"); |
+ } |
+ |
+ delete latinJamo; |
+ delete jamoLatin; |
+ delete jamoHangul; |
+ delete hangulJamo; |
+} |
+ |
+// Override TransliteratorTest |
+void |
+JamoTest::expectAux(const UnicodeString& tag, |
+ const UnicodeString& summary, UBool pass, |
+ const UnicodeString& expectedResult) { |
+ UnicodeString jsum = jamoToName(summary); |
+ UnicodeString jexp = jamoToName(expectedResult); |
+ TransliteratorTest::expectAux(tag, jsum, pass, jexp); |
+} |
+ |
+const char* JamoTest::JAMO_NAMES_RULES = |
+ "'(Gi)' <> \\u1100;" |
+ "'(GGi)' <> \\u1101;" |
+ "'(Ni)' <> \\u1102;" |
+ "'(Di)' <> \\u1103;" |
+ "'(DD)' <> \\u1104;" |
+ "'(R)' <> \\u1105;" |
+ "'(Mi)' <> \\u1106;" |
+ "'(Bi)' <> \\u1107;" |
+ "'(BB)' <> \\u1108;" |
+ "'(Si)' <> \\u1109;" |
+ "'(SSi)' <> \\u110A;" |
+ "'(IEUNG)' <> \\u110B;" |
+ "'(Ji)' <> \\u110C;" |
+ "'(JJ)' <> \\u110D;" |
+ "'(Ci)' <> \\u110E;" |
+ "'(Ki)' <> \\u110F;" |
+ "'(Ti)' <> \\u1110;" |
+ "'(Pi)' <> \\u1111;" |
+ "'(Hi)' <> \\u1112;" |
+ |
+ "'(A)' <> \\u1161;" |
+ "'(AE)' <> \\u1162;" |
+ "'(YA)' <> \\u1163;" |
+ "'(YAE)' <> \\u1164;" |
+ "'(EO)' <> \\u1165;" |
+ "'(E)' <> \\u1166;" |
+ "'(YEO)' <> \\u1167;" |
+ "'(YE)' <> \\u1168;" |
+ "'(O)' <> \\u1169;" |
+ "'(WA)' <> \\u116A;" |
+ "'(WAE)' <> \\u116B;" |
+ "'(OE)' <> \\u116C;" |
+ "'(YO)' <> \\u116D;" |
+ "'(U)' <> \\u116E;" |
+ "'(WEO)' <> \\u116F;" |
+ "'(WE)' <> \\u1170;" |
+ "'(WI)' <> \\u1171;" |
+ "'(YU)' <> \\u1172;" |
+ "'(EU)' <> \\u1173;" |
+ "'(YI)' <> \\u1174;" |
+ "'(I)' <> \\u1175;" |
+ |
+ "'(Gf)' <> \\u11A8;" |
+ "'(GGf)' <> \\u11A9;" |
+ "'(GS)' <> \\u11AA;" |
+ "'(Nf)' <> \\u11AB;" |
+ "'(NJ)' <> \\u11AC;" |
+ "'(NH)' <> \\u11AD;" |
+ "'(Df)' <> \\u11AE;" |
+ "'(L)' <> \\u11AF;" |
+ "'(LG)' <> \\u11B0;" |
+ "'(LM)' <> \\u11B1;" |
+ "'(LB)' <> \\u11B2;" |
+ "'(LS)' <> \\u11B3;" |
+ "'(LT)' <> \\u11B4;" |
+ "'(LP)' <> \\u11B5;" |
+ "'(LH)' <> \\u11B6;" |
+ "'(Mf)' <> \\u11B7;" |
+ "'(Bf)' <> \\u11B8;" |
+ "'(BS)' <> \\u11B9;" |
+ "'(Sf)' <> \\u11BA;" |
+ "'(SSf)' <> \\u11BB;" |
+ "'(NG)' <> \\u11BC;" |
+ "'(Jf)' <> \\u11BD;" |
+ "'(Cf)' <> \\u11BE;" |
+ "'(Kf)' <> \\u11BF;" |
+ "'(Tf)' <> \\u11C0;" |
+ "'(Pf)' <> \\u11C1;" |
+ "'(Hf)' <> \\u11C2;"; |
+ |
+/** |
+ * Convert short names to actual jamo. E.g., "x(LG)y" returns |
+ * "x\u11B0y". See JAMO_NAMES for table of names. |
+ */ |
+UnicodeString |
+JamoTest::nameToJamo(const UnicodeString& input) { |
+ if (NAME_JAMO == 0) { |
+ errln("Failed to create NAME_JAMO"); |
+ return input; /* failure! */ |
+ } |
+ UnicodeString result(input); |
+ NAME_JAMO->transliterate(result); |
+ return result; |
+} |
+ |
+/** |
+ * Convert jamo to short names. E.g., "x\u11B0y" returns |
+ * "x(LG)y". See JAMO_NAMES for table of names. |
+ */ |
+UnicodeString |
+JamoTest::jamoToName(const UnicodeString& input) { |
+ if (NAME_JAMO == 0) { |
+ errln("Failed to create NAME_JAMO"); |
+ return input; /* failure! */ |
+ } |
+ UnicodeString result(input); |
+ JAMO_NAME->transliterate(result); |
+ return result; |
+} |
+ |
+#endif /* #if !UCONFIG_NO_TRANSLITERATION */ |
Property changes on: icu46/source/test/intltest/jamotest.cpp |
___________________________________________________________________ |
Added: svn:eol-style |
+ LF |