Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(141)

Side by Side Diff: test/intl/general/case-mapping.js

Issue 1812673005: Use ICU case conversion/transliterator for case conversion behind a flag (Closed) Base URL: https://chromium.googlesource.com/v8/v8.git@master
Patch Set: trivial change: unnecessary line dropped Created 4 years, 8 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
(Empty)
1 // Copyright 2016 the V8 project authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
// Edge cases that the unibrow-based implementation got wrong: a letter pair
// written with non-BMP characters, and a lone capital sigma.
// Each row is [method, expected, input]; rows are checked in order.
{
  const edgeCases = [
    ["toUpperCase", "𐐘", "𐑀"],
    ["toLowerCase", "𐑀", "𐐘"],
    ["toLowerCase", "σ", "Σ"],
  ];
  for (const [method, expected, input] of edgeCases) {
    assertEquals(expected, input[method]());
  }
}
10
// Exercise the different paths of the ICU case conversion fastpath.
// Each row is [method, expected, input]; rows are checked in order.
{
  const fastpathCases = [
    ["toLowerCase", "σς", "\u03A3\u03A3"],
    // Sharp s is expanded in the latin1 fastpath.
    ["toUpperCase", "ASSB", "A\u00DFB"],
    ["toUpperCase", "AB", "Ab"],
    // The fastpath has to locate the first upper case character.
    ["toLowerCase", "ab", "aB"],
    ["toUpperCase", "AÜ", "aü"],
    ["toUpperCase", "AÜ", "AÜ"],
    ["toLowerCase", "aü", "aü"],
    ["toLowerCase", "aü", "AÜ"],
    ["toLowerCase", "aü", "AÜ"],
  ];
  for (const [method, expected, input] of fastpathCases) {
    assertEquals(expected, input[method]());
  }
}
24
// Upper-casing cases whose result leaves the fastpath or needs a larger
// output buffer. Each row is [expected, input]; rows are checked in order.
{
  const upperCases = [
    // Starts with fastpath, but switches to the full Unicode path:
    // U+00FF is uppercased to U+0178.
    ["AŸ", "aÿ"],
    // U+00B5 (µ) is uppercased to U+039C (Μ).
    ["AΜ", "aµ"],
    // Buffer size increase: the result is longer than the input.
    ["CSSBẶ", "cßbặ"],
    ["FIFLFFIFFL", "\uFB01\uFB02\uFB03\uFB04"],
  ];
  for (const [expected, input] of upperCases) {
    assertEquals(expected, input.toUpperCase());
  }
}
34
// More comprehensive tests for "tr", "az" and "lt" are in
// test262/intl402/Strings/*
{
  const dottedCapitalI = "aBcI\u0307";
  const lowerIn = (locales) => dottedCapitalI.toLocaleLowerCase(locales);

  // Buffer size decrease with a single locale or a locale list.
  // In Turkic (tr, az), U+0307 preceded by Capital Letter I is dropped.
  for (const locales of ["tr", "az", ["tr", "en"]]) {
    assertEquals("abci", lowerIn(locales));
  }

  // "tr" and "az" should behave identically.
  assertEquals(lowerIn("tr"), lowerIn("az"));

  // What matters is the first locale in the locale list.
  assertEquals(lowerIn(["tr", "en", "fr"]), lowerIn("tr"));
  assertEquals(lowerIn(["en", "tr", "az"]), lowerIn("en"));
  assertEquals(lowerIn(["en", "tr", "az"]), dottedCapitalI.toLowerCase());
}
55
// An empty locale list is the same as the default locale. Try these tests
// under Turkish and Greek locale.
{
  // Resolve the default locale explicitly. `Intl` has no `GetDefaultLocale`
  // property, so passing it would hand `undefined` to the method and merely
  // repeat the no-argument checks instead of testing an explicit locale tag.
  const defaultLocale = new Intl.NumberFormat().resolvedOptions().locale;

  assertEquals("aBcI\u0307".toLocaleLowerCase([]),
               "aBcI\u0307".toLocaleLowerCase());
  assertEquals("aBcI\u0307".toLocaleLowerCase([]),
               "aBcI\u0307".toLocaleLowerCase(defaultLocale));
  assertEquals("άόύώ".toLocaleUpperCase([]), "άόύώ".toLocaleUpperCase());
  assertEquals("άόύώ".toLocaleUpperCase([]),
               "άόύώ".toLocaleUpperCase(defaultLocale));
}
65
66
// English/root locale keeps U+0307 (combining dot above), whether the locale
// is given as a tag, as the head of a locale list, or not at all.
{
  const conversions = [
    (text) => text.toLocaleLowerCase("en"),
    (text) => text.toLocaleLowerCase(["en", "tr"]),
    (text) => text.toLowerCase(),
  ];
  for (const convert of conversions) {
    assertEquals("abci\u0307", convert("aBcI\u0307"));
  }
}
71
// Greek uppercasing: not covered by intl402/String/*, yet. Tonos (U+0301) and
// other diacritic marks are dropped. This rule is based on the current CLDR's
// el-Upper transformation, but Greek uppercasing rules are more sophisticated
// than this. See http://bugs.icu-project.org/trac/ticket/10582 and
// http://unicode.org/cldr/trac/ticket/7905 .
{
  // The same result is expected for every spelling of the Greek locale tag.
  for (const greekTag of ["el", "el-GR", "el-Grek", "el-Grek-GR"]) {
    assertEquals("Α", "α\u0301".toLocaleUpperCase(greekTag));
  }

  // Each row is [expected, input], upper-cased under "el" in order.
  const greekCases = [
    ["Α", "ά"],
    ["ΑΟΥΩ", "άόύώ"],
    ["ΑΟΥΩ", "α\u0301ο\u0301υ\u0301ω\u0301"],
    ["ΑΟΥΩ", "άόύώ"],
    ["ΟΕ", "Ό\u1f15"],
    ["ΟΕ", "Ο\u0301ε\u0314\u0301"],
  ];
  for (const [expected, input] of greekCases) {
    assertEquals(expected, input.toLocaleUpperCase("el"));
  }

  // In other locales, U+0301 is preserved.
  const accented = "α\u0301ο\u0301υ\u0301ω\u0301";
  const accentedUpper = "Α\u0301Ο\u0301Υ\u0301Ω\u0301";
  assertEquals(accentedUpper, accented.toLocaleUpperCase("en"));
  assertEquals(accentedUpper, accented.toUpperCase());
}
93
// Plane 1; Deseret and Warang Citi Script.
assertEquals("\u{10400}\u{118A0}", "\u{10428}\u{118C0}".toUpperCase());
assertEquals("\u{10428}\u{118C0}", "\u{10400}\u{118A0}".toLowerCase());
// Mathematical Bold {Capital, Small} Letter A do not change.
assertEquals("\u{1D400}\u{1D41A}", "\u{1D400}\u{1D41A}".toUpperCase());
assertEquals("\u{1D400}\u{1D41A}", "\u{1D400}\u{1D41A}".toLowerCase());
// Plane 1; New characters in Unicode 8.0
assertEquals("\u{10C80}", "\u{10CC0}".toUpperCase());
assertEquals("\u{10CC0}", "\u{10C80}".toLowerCase());
// Same pair through the locale-sensitive methods with no locale argument.
assertEquals("\u{10C80}", "\u{10CC0}".toLocaleUpperCase());
assertEquals("\u{10CC0}", "\u{10C80}".toLocaleLowerCase());
// Same pair with an explicit locale list, covering both directions (the
// lower-casing direction was previously missing because of repeated lines).
assertEquals("\u{10C80}", "\u{10CC0}".toLocaleUpperCase(["tr"]));
assertEquals("\u{10CC0}", "\u{10C80}".toLocaleLowerCase(["tr"]));
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698