Chromium Code Reviews

| OLD | NEW |
|---|---|
| (Empty) | |
| 1 // Copyright 2016 the V8 project authors. All rights reserved. | |
| 2 // Use of this source code is governed by a BSD-style license that can be | |
| 3 // found in the LICENSE file. | |
| 4 | |
| 5 // Flags: --icu_case_mapping | |
|
jungshik at Google
2016/04/29 06:23:16
This does not work. --icu_case_mapping is not used
| |
| 6 | |
| 7 // Some edge cases that unibrow got wrong | |
| 8 | |
| 9 assertEquals("𐐘", "𐑀".toUpperCase()); | |
| 10 assertEquals("𐑀", "𐐘".toLowerCase()); | |
| 11 assertEquals("σ", "Σ".toLowerCase()); | |
| 12 | |
| 13 // Some different paths in the ICU case conversion fastpath | |
| 14 | |
| 15 assertEquals("σς", "\u03A3\u03A3".toLowerCase()); | |
| 16 // Expand sharp s in latin1 fastpath | |
| 17 assertEquals("ASSB", "A\u00DFB".toUpperCase()); | |
| 18 assertEquals("AB", "Ab".toUpperCase()); | |
| 19 // Find first upper case in fastpath | |
| 20 assertEquals("ab", "aB".toLowerCase()); | |
| 21 assertEquals("AÜ", "aü".toUpperCase()); | |
| 22 assertEquals("AÜ", "AÜ".toUpperCase()); | |
| 23 assertEquals("aü", "aü".toLowerCase()); | |
| 24 assertEquals("aü", "AÜ".toLowerCase()); | |
| 25 assertEquals("aü", "AÜ".toLowerCase()); | |
| 26 | |
| 27 // Starts with fastpath, but switches to full Unicode path | |
| 28 // U+00FF is uppercased to U+0178. | |
| 29 assertEquals("AŸ", "aÿ".toUpperCase()); | |
| 30 // U+00B5 (µ) is uppercased to U+039C (Μ) | |
| 31 assertEquals("AΜ", "aµ".toUpperCase()); | |
| 32 | |
| 33 // Buffer size increase | |
| 34 assertEquals("CSSBẶ", "cßbặ".toUpperCase()); | |
| 35 assertEquals("FIFLFFIFFL", "\uFB01\uFB02\uFB03\uFB04".toUpperCase()); | |
| 36 | |
| 37 // More comprehensive tests for "tr", "az" and "lt" are in | |
| 38 // test262/intl402/String/* | |
| 39 | |
| 40 // Buffer size decrease with a single locale or locale list. | |
| 41 // In Turkic (tr, az), U+0307 preceded by Capital Letter I is dropped. | |
| 42 assertEquals("abci", "aBcI\u0307".toLocaleLowerCase("tr")); | |
| 43 assertEquals("abci", "aBcI\u0307".toLocaleLowerCase("az")); | |
| 44 assertEquals("abci", "aBcI\u0307".toLocaleLowerCase(["tr", "en"])); | |
| 45 | |
| 46 // Cons string | |
| 47 assertEquals("abcijkl", ("aBcI" + "\u0307jkl").toLocaleLowerCase("tr")); | |
| 48 assertEquals("abcijkl", | |
| 49 ("aB" + "cI" + "\u0307j" + "kl").toLocaleLowerCase("tr")); | |
| 50 assertEquals("abci\u0307jkl", ("aBcI" + "\u0307jkl").toLocaleLowerCase("en")); | |
| 51 assertEquals("abci\u0307jkl", | |
| 52 ("aB" + "cI" + "\u0307j" + "kl").toLocaleLowerCase("en")); | |
| 53 assertEquals("abci\u0307jkl", ("aBcI" + "\u0307jkl").toLowerCase()); | |
| 54 assertEquals("abci\u0307jkl", | |
| 55 ("aB" + "cI" + "\u0307j" + "kl").toLowerCase()); | |
| 56 | |
| 57 // "tr" and "az" should behave identically. | |
| 58 assertEquals("aBcI\u0307".toLocaleLowerCase("tr"), | |
| 59 "aBcI\u0307".toLocaleLowerCase("az")); | |
| 60 // What matters is the first locale in the locale list. | |
| 61 assertEquals("aBcI\u0307".toLocaleLowerCase(["tr", "en", "fr"]), | |
| 62 "aBcI\u0307".toLocaleLowerCase("tr")); | |
| 63 assertEquals("aBcI\u0307".toLocaleLowerCase(["en", "tr", "az"]), | |
| 64 "aBcI\u0307".toLocaleLowerCase("en")); | |
| 65 assertEquals("aBcI\u0307".toLocaleLowerCase(["en", "tr", "az"]), | |
| 66 "aBcI\u0307".toLowerCase()); | |
| 67 | |
| 68 // An empty locale list is the same as the default locale. Try these tests | |
| 69 // under Turkish and Greek locales. | |
| 70 assertEquals("aBcI\u0307".toLocaleLowerCase([]), | |
| 71 "aBcI\u0307".toLocaleLowerCase()); | |
| 72 assertEquals("aBcI\u0307".toLocaleLowerCase([]), | |
| 73 "aBcI\u0307".toLocaleLowerCase(Intl.GetDefaultLocale)); | |
| 74 assertEquals("άόύώ".toLocaleUpperCase([]), "άόύώ".toLocaleUpperCase()); | |
| 75 assertEquals("άόύώ".toLocaleUpperCase([]), | |
| 76 "άόύώ".toLocaleUpperCase(Intl.GetDefaultLocale)); | |
| 77 | |
| 78 | |
| 79 // English/root locale keeps U+0307 (combining dot above). | |
| 80 assertEquals("abci\u0307", "aBcI\u0307".toLocaleLowerCase("en")); | |
| 81 assertEquals("abci\u0307", "aBcI\u0307".toLocaleLowerCase(["en", "tr"])); | |
| 82 assertEquals("abci\u0307", "aBcI\u0307".toLowerCase()); | |
| 83 | |
| 84 // Greek uppercasing: not yet covered by intl402/String/*. Tonos (U+0301) and | |
| 85 // other diacritic marks are dropped. This rule is based on the current CLDR's | |
| 86 // el-Upper transformation, but Greek uppercasing rules are more sophisticated | |
| 87 // than this. See http://bugs.icu-project.org/trac/ticket/10582 and | |
| 88 // http://unicode.org/cldr/trac/ticket/7905 . | |
| 89 assertEquals("Α", "α\u0301".toLocaleUpperCase("el")); | |
| 90 assertEquals("Α", "α\u0301".toLocaleUpperCase("el-GR")); | |
| 91 assertEquals("Α", "α\u0301".toLocaleUpperCase("el-Grek")); | |
| 92 assertEquals("Α", "α\u0301".toLocaleUpperCase("el-Grek-GR")); | |
| 93 assertEquals("Α", "ά".toLocaleUpperCase("el")); | |
| 94 assertEquals("ΑΟΥΩ", "άόύώ".toLocaleUpperCase("el")); | |
| 95 assertEquals("ΑΟΥΩ", "α\u0301ο\u0301υ\u0301ω\u0301".toLocaleUpperCase("el")); | |
| 96 assertEquals("ΑΟΥΩ", "άόύώ".toLocaleUpperCase("el")); | |
| 97 assertEquals("ΟΕ", "Ό\u1f15".toLocaleUpperCase("el")); | |
| 98 assertEquals("ΟΕ", "Ο\u0301ε\u0314\u0301".toLocaleUpperCase("el")); | |
| 99 | |
| 100 // In other locales, U+0301 is preserved. | |
| 101 assertEquals("Α\u0301Ο\u0301Υ\u0301Ω\u0301", | |
| 102 "α\u0301ο\u0301υ\u0301ω\u0301".toLocaleUpperCase("en")); | |
| 103 assertEquals("Α\u0301Ο\u0301Υ\u0301Ω\u0301", | |
| 104 "α\u0301ο\u0301υ\u0301ω\u0301".toUpperCase()); | |
| 105 | |
| 106 // Plane 1; Deseret and Warang Citi Script. | |
| 107 assertEquals("\u{10400}\u{118A0}", "\u{10428}\u{118C0}".toUpperCase()); | |
| 108 assertEquals("\u{10428}\u{118C0}", "\u{10400}\u{118A0}".toLowerCase()); | |
| 109 // Mathematical Bold {Capital, Small} Letter A do not change. | |
| 110 assertEquals("\u{1D400}\u{1D41A}", "\u{1D400}\u{1D41A}".toUpperCase()); | |
| 111 assertEquals("\u{1D400}\u{1D41A}", "\u{1D400}\u{1D41A}".toLowerCase()); | |
| 112 // Plane 1; New characters in Unicode 8.0 | |
| 113 assertEquals("\u{10C80}", "\u{10CC0}".toUpperCase()); | |
| 114 assertEquals("\u{10CC0}", "\u{10C80}".toLowerCase()); | |
| 115 assertEquals("\u{10C80}", "\u{10CC0}".toLocaleUpperCase()); | |
| 116 assertEquals("\u{10CC0}", "\u{10C80}".toLocaleLowerCase()); | |
| 117 assertEquals("\u{10C80}", "\u{10CC0}".toLocaleUpperCase(["tr"])); | |
| 118 assertEquals("\u{10C80}", "\u{10CC0}".toLocaleUpperCase(["tr"])); | |
| 119 assertEquals("\u{10CC0}", "\u{10C80}".toLocaleLowerCase()); | |
| OLD | NEW |