| OLD | NEW |
| (Empty) |
| 1 //*****************************************************************************
** | |
| 2 //* | |
| 3 //* Copyright (C) 2002-2010, International Business Machines | |
| 4 //* Corporation and others. All Rights Reserved. | |
| 5 //* | |
| 6 //******************************************************************************
* | |
| 7 | |
| 8 casing:table(nofallback) { | |
| 9 Info { | |
| 10 Description { "This is test data file for string casing." } | |
| 11 | |
| 12 LongDescription { | |
| 13 "each item is an array with\n" | |
| 14 "input string, result string, locale ID[, break iterator]\n" | |
| 15 "the break iterator (only for titlecasing) is specified as an int, s
ame as in UBreakIteratorType:\n" | |
| 16 "0=UBRK_CHARACTER 1=UBRK_WORD 2=UBRK_LINE 3=UBRK_SENTENCE 4=UBRK
_TITLE -1=default (NULL=words) -2=no breaks (.*)\n" | |
| 17 "options: T=U_FOLD_CASE_EXCLUDE_SPECIAL_I L=U_TITLECASE_NO_LOWERCAS
E A=U_TITLECASE_NO_BREAK_ADJUSTMENT\n" | |
| 18 } | |
| 19 } | |
| 20 TestData { | |
| 21 lowercasing { | |
| 22 Headers { "Input", "Output", "Locale" } | |
| 23 Cases { | |
| 24 { " tHe QUIcK bRoWn", " the quick brown", "" }, | |
| 25 { "aBIΣßΣ/𐐅", "abiσßς/𐐭", "" }, | |
| 26 { "aBIΣßΣ/𐐅", "abıσßς/𐐭", "tur" } // tur: 3-letter code for Turkis
h | |
| 27 } | |
| 28 } | |
| 29 uppercasing { | |
| 30 Headers { "Input", "Output", "Locale" } | |
| 31 Cases { | |
| 32 { " tHe QUIcK bRoWn", " THE QUICK BROWN", "" }, | |
| 33 { "aBiσßς/ffi𐐭", "ABIΣSSΣ/FFI𐐅", "" }, | |
| 34 { "aBiσßς/ffi𐐭", "ABİΣSSΣ/FFI𐐅", "az" } // az same casing as tr | |
| 35 } | |
| 36 } | |
| 37 titlecasing { | |
| 38 Headers { "Input", "Output", "Locale", "Type", "Options" } | |
| 39 Cases { | |
| 40 { "ʻaMeLikA huI Pū ʻʻʻiA", "ʻAmelika Hui Pū ʻʻʻIa", "", "-1", "" },
// titlecase first _cased_ letter, j4933 | |
| 41 { " tHe QUIcK bRoWn", " The Quick Brown", "", "4", "" }, | |
| 42 { "DŽDždžLJLjljNJNjnj", "DžDžDžLjLjLjNjNjNj", "", "0", "" }, // UBRK_CHARACTER | |
| 43 { "ljubav ljubav", "Ljubav Ljubav", "", "-1", "" }, // Lj vs. L+j | |
| 44 { "ijssel igloo IJMUIDEN", "Ijssel Igloo Ijmuiden", "", "1", "" }, /
/ Dutch titlecasing default | |
| 45 { "ijssel igloo IJMUIDEN", "IJssel Igloo IJmuiden", "nl", "1", "" },
// Dutch titlecasing | |
| 46 { "'oH dOn'T tItLeCaSe AfTeR lEtTeR+'", "'Oh Don't Titlecase After L
etter+'", "", "-1", "" }, | |
| 47 | |
| 48 { "a ʻCaT. A ʻdOg! ʻeTc.", "A ʻCat. A ʻDog! ʻEtc.", "", "-1", "" },
// default | |
| 49 { "a ʻCaT. A ʻdOg! ʻeTc.", "A ʻcat. A ʻdog! ʻetc.", "", "-1", "A" },
// U_TITLECASE_NO_BREAK_ADJUSTMENT | |
| 50 { "a ʻCaT. A ʻdOg! ʻeTc.", "A ʻCaT. A ʻdOg! ʻETc.", "", "3", "L" },
// UBRK_SENTENCE and U_TITLECASE_NO_LOWERCASE | |
| 51 | |
| 52 { "ʻcAt! ʻeTc.", "ʻCat! ʻetc.", "", "-2", "" }, // -2=Trivial break
iterator | |
| 53 { "ʻcAt! ʻeTc.", "ʻcat! ʻetc.", "", "-2", "A" }, // U_TITLECASE_NO_B
REAK_ADJUSTMENT | |
| 54 { "ʻcAt! ʻeTc.", "ʻCAt! ʻeTc.", "", "-2", "L" }, // U_TITLECASE_NO_L
OWERCASE | |
| 55 { "ʻcAt! ʻeTc.", "ʻcAt! ʻeTc.", "", "-2", "AL" }, // Both options | |
| 56 | |
| 57 // Test case for ticket #7251: UCharacter.toTitleCase() throws OutOf
MemoryError | |
| 58 // when TITLECASE_NO_LOWERCASE encounters a single-letter word | |
| 59 { "a b c", "A B C", "", "1", "L" } // U_TITLECASE_NO_LOWERCASE | |
| 60 } | |
| 61 } | |
| 62 casefolding { | |
| 63 Headers { "Input", "Output", "Options" } | |
| 64 Cases { | |
| 65 { "aBİIıϐßffi", "abi̇iıβssffi", "" }, | |
| 66 { "aBİIıϐßffi", "abiııβssffi", "T" } // U_FOLD_CASE_EXCLUDE_SPECIAL_
I | |
| 67 } | |
| 68 } | |
| 69 } | |
| 70 } | |
| OLD | NEW |